1 | //
|
---|
2 | // Cforall Version 1.0.0 Copyright (C) 2016 University of Waterloo
|
---|
3 | //
|
---|
4 | // The contents of this file are covered under the licence agreement in the
|
---|
5 | // file "LICENCE" distributed with Cforall.
|
---|
6 | //
|
---|
7 | // string -- variable-length, mutable run of text, with value semantics
|
---|
8 | //
|
---|
9 | // Author : Michael L. Brooks
|
---|
10 | // Created On : Fri Sep 03 11:00:00 2021
|
---|
11 | // Last Modified By : Peter A. Buhr
|
---|
12 | // Last Modified On : Wed Apr 9 22:27:41 2025
|
---|
13 | // Update Count : 259
|
---|
14 | //
|
---|
15 |
|
---|
16 | #pragma once
|
---|
17 |
|
---|
18 | #include <iostream.hfa>
|
---|
19 | #include <string_res.hfa>
|
---|
20 |
|
---|
21 | static struct __cfa_string_preference_boost_t {} __cfa_string_preference_boost;
|
---|
22 | #define PBOOST forall ( | { __cfa_string_preference_boost_t __cfa_string_preference_boost; } )
|
---|
23 |
|
---|
24 | struct string {
|
---|
25 | string_res * inner;
|
---|
26 | };
|
---|
27 |
|
---|
28 | // RAII, assignment
|
---|
29 | void ^?{}( string & s );
|
---|
30 |
|
---|
31 | void ?{}( string & s ); // empty string
|
---|
32 | void ?{}( string & s, string s2, size_t maxlen );
|
---|
33 | PBOOST void ?{}( string & s, string s2 );
|
---|
34 | void ?{}( string & s, char );
|
---|
35 | void ?{}( string & s, const char * c ); // copy from string literal (NULL-terminated)
|
---|
36 | void ?{}( string & s, const char * c, size_t size ); // copy specific length from buffer
|
---|
37 |
|
---|
38 | void ?{}( string & s, signed long int rhs );
|
---|
39 | void ?{}( string & s, size_t rhs );
|
---|
40 | void ?{}( string & s, double rhs );
|
---|
41 | void ?{}( string & s, long double rhs );
|
---|
42 | void ?{}( string & s, double _Complex rhs );
|
---|
43 | void ?{}( string & s, long double _Complex rhs );
|
---|
44 | static inline void ?{}( string & s, int rhs ) { (s){(signed long int) rhs}; }
|
---|
45 |
|
---|
46 | // string str( ssize_t rhs );
|
---|
47 | // string str( size_t rhs );
|
---|
48 | // string str( double rhs );
|
---|
49 | // string str( long double rhs );
|
---|
50 | // string str( double _Complex rhs );
|
---|
51 | // string str( long double _Complex rhs );
|
---|
52 |
|
---|
53 | PBOOST string & ?=?( string & s, string c );
|
---|
54 | string & ?=?( string & s, const char * c ); // copy from "literal"
|
---|
55 | string & ?=?( string & s, char c ); // copy from 'l'
|
---|
56 | string & assign( string & s, const string & c, size_t n );
|
---|
57 | string & assign( string & s, const char * c, size_t n );
|
---|
58 | string & ?=?( string & s, signed long int rhs );
|
---|
59 | string & ?=?( string & s, size_t rhs );
|
---|
60 | string & ?=?( string & s, double rhs );
|
---|
61 | string & ?=?( string & s, long double rhs );
|
---|
62 | string & ?=?( string & s, double _Complex rhs );
|
---|
63 | string & ?=?( string & s, long double _Complex rhs );
|
---|
64 | static inline string & ?=?( string & s, int rhs ) { return s = ((signed long int) rhs); } // to match cost of (char * int): int
|
---|
65 |
|
---|
66 | static inline string & strcpy( string & s, const char * c ) { s = c; return s; }
|
---|
67 | static inline string & strncpy( string & s, const char * c, size_t n ) { assign( s, c, n ); return s; }
|
---|
68 | static inline string & strcpy( string & s, const string & c ) { s = c; return s; }
|
---|
69 | static inline string & strncpy( string & s, const string & c, size_t n ) { assign( s, c, n ); return s; }
|
---|
70 |
|
---|
71 | // Alternate construction: request shared edits
|
---|
72 | struct string_Share {
|
---|
73 | string * s;
|
---|
74 | };
|
---|
75 | string_Share ?`share( string & s );
|
---|
76 | void ?{}( string & s, string_Share src );
|
---|
77 |
|
---|
78 | // Getters
|
---|
79 | static inline size_t len( const string & s ) { return len( *s.inner ); }
|
---|
80 | static inline size_t len( const char * cs ) { return strlen( cs ); };
|
---|
81 | static inline size_t strlen( const string & s ) { return len( s ); }
|
---|
82 |
|
---|
83 | // IO Operator
|
---|
84 | forall( ostype & | basic_ostream( ostype ) ) {
|
---|
85 | ostype & ?|?( ostype & out, string s );
|
---|
86 | void ?|?( ostype & out, string s );
|
---|
87 | }
|
---|
88 | forall( istype & | basic_istream( istype ) )
|
---|
89 | istype & ?|?( istype & in, string & s );
|
---|
90 |
|
---|
91 | static inline {
|
---|
92 | _Ostream_Manip(string) bin( string s ) { return (_Ostream_Manip(string))@{ s, 1, 0, 'b', { .all = 0 } }; }
|
---|
93 | _Ostream_Manip(string) oct( string s ) { return (_Ostream_Manip(string))@{ s, 1, 0, 'o', { .all = 0 } }; }
|
---|
94 | _Ostream_Manip(string) hex( string s ) { return (_Ostream_Manip(string))@{ s, 1, 0, 'x', { .all = 0 } }; }
|
---|
95 | _Ostream_Manip(string) wd( unsigned int w, string s ) { return (_Ostream_Manip(string))@{ s, w, 0, 's', { .all = 0 } }; }
|
---|
96 | _Ostream_Manip(string) wd( unsigned int w, unsigned int pc, string s ) { return (_Ostream_Manip(string))@{ s, w, pc, 's', { .flags.pc = true } }; }
|
---|
97 | _Ostream_Manip(string) & wd( unsigned int w, _Ostream_Manip(string) & fmt ) { fmt.wd = w; return fmt; }
|
---|
98 | _Ostream_Manip(string) & wd( unsigned int w, unsigned int pc, _Ostream_Manip(string) & fmt ) { fmt.wd = w; fmt.pc = pc; fmt.flags.pc = true; return fmt; }
|
---|
99 | _Ostream_Manip(string) & left( _Ostream_Manip(string) & fmt ) { fmt.flags.left = true; return fmt; }
|
---|
100 | _Ostream_Manip(string) & nobase( _Ostream_Manip(string) & fmt ) { fmt.flags.nobsdp = true; return fmt; }
|
---|
101 | } // distribution
|
---|
102 | forall( ostype & | basic_ostream( ostype ) ) {
|
---|
103 | ostype & ?|?( ostype & os, _Ostream_Manip(string) f );
|
---|
104 | void ?|?( ostype & os, _Ostream_Manip(string) );
|
---|
105 | }
|
---|
106 |
|
---|
107 | struct _Istream_Swidth {
|
---|
108 | string & s;
|
---|
109 | inline _Istream_str_base;
|
---|
110 | }; // _Istream_Swidth
|
---|
111 |
|
---|
112 | struct _Istream_Squoted {
|
---|
113 | _Istream_Swidth sstr;
|
---|
114 | }; // _Istream_Squoted
|
---|
115 |
|
---|
116 | struct _Istream_Sstr {
|
---|
117 | string & s;
|
---|
118 | inline _Istream_str_base;
|
---|
119 | // _Istream_Swidth sstr;
|
---|
120 | }; // _Istream_Sstr
|
---|
121 |
|
---|
122 | static inline {
|
---|
123 | // read width does not include null terminator
|
---|
124 | _Istream_Swidth wdi( unsigned int rwd, string & s ) { return (_Istream_Swidth)@{ .s = s, { {.scanset = 0p}, .wd = rwd, {.flags.rwd = true} } }; }
|
---|
125 | _Istream_Sstr getline( string & s, const char delimiter = '\n' ) {
|
---|
126 | // return (_Istream_Sstr)@{ { .s = s, { {.delimiters = { delimiter, '\0' } }, .wd = -1, {.flags.delimiter = true} } } };
|
---|
127 | return (_Istream_Sstr)@{ .s = s, { {.delimiters = { delimiter, '\0' } }, .wd = -1, {.flags.delimiter = true} } };
|
---|
128 | }
|
---|
129 | _Istream_Sstr & getline( _Istream_Swidth & f, const char delimiter = '\n' ) {
|
---|
130 | f.delimiters[0] = delimiter; f.delimiters[1] = '\0'; f.flags.delimiter = true; return (_Istream_Sstr &)f;
|
---|
131 | }
|
---|
132 | _Istream_Squoted quoted( string & s, const char Ldelimiter = '\"', const char Rdelimiter = '\0' ) {
|
---|
133 | return (_Istream_Squoted)@{ { .s = s, { {.delimiters = { Ldelimiter, Rdelimiter, '\0' }}, .wd = -1, {.flags.rwd = true} } } };
|
---|
134 | }
|
---|
135 | _Istream_Squoted & quoted( _Istream_Swidth & f, const char Ldelimiter = '"', const char Rdelimiter = '\0' ) {
|
---|
136 | f.delimiters[0] = Ldelimiter; f.delimiters[1] = Rdelimiter; f.delimiters[2] = '\0';
|
---|
137 | return (_Istream_Squoted &)f;
|
---|
138 | }
|
---|
139 | // _Istream_Sstr incl( const char scanset[], string & s ) { return (_Istream_Sstr)@{ { .s = s, { {.scanset = scanset}, .wd = -1, {.flags.inex = false} } } }; }
|
---|
140 | _Istream_Sstr incl( const char scanset[], string & s ) { return (_Istream_Sstr)@{ .s = s, { {.scanset = scanset}, .wd = -1, {.flags.inex = false} } }; }
|
---|
141 | _Istream_Sstr & incl( const char scanset[], _Istream_Swidth & f ) { f.scanset = scanset; f.flags.inex = false; return (_Istream_Sstr &)f; }
|
---|
142 | // _Istream_Sstr excl( const char scanset[], string & s ) { return (_Istream_Sstr)@{ { .s = s, { {.scanset = scanset}, .wd = -1, {.flags.inex = true} } } }; }
|
---|
143 | _Istream_Sstr excl( const char scanset[], string & s ) { return (_Istream_Sstr)@{ .s = s, { {.scanset = scanset}, .wd = -1, {.flags.inex = true} } }; }
|
---|
144 | _Istream_Sstr & excl( const char scanset[], _Istream_Swidth & f ) { f.scanset = scanset; f.flags.inex = true; return (_Istream_Sstr &)f; }
|
---|
145 | // _Istream_Sstr ignore( string & s ) { return (_Istream_Sstr)@{ { .s = s, { {.scanset = 0p}, .wd = -1, {.flags.ignore = true} } } }; }
|
---|
146 | _Istream_Sstr ignore( string & s ) { return (_Istream_Sstr)@{ .s = s, { {.scanset = 0p}, .wd = -1, {.flags.ignore = true} } }; }
|
---|
147 | _Istream_Sstr & ignore( _Istream_Swidth & f ) { f.flags.ignore = true; return (_Istream_Sstr &)f; }
|
---|
148 | _Istream_Squoted & ignore( _Istream_Squoted & f ) { f.sstr.flags.ignore = true; return (_Istream_Squoted &)f; }
|
---|
149 | // _Istream_Sstr & ignore( _Istream_Sstr & f ) { f.sstr.flags.ignore = true; return (_Istream_Sstr &)f; }
|
---|
150 | _Istream_Sstr & ignore( _Istream_Sstr & f ) { f.flags.ignore = true; return (_Istream_Sstr &)f; }
|
---|
151 | } // distribution
|
---|
152 | forall( istype & | basic_istream( istype ) ) {
|
---|
153 | istype & ?|?( istype & is, _Istream_Squoted f );
|
---|
154 | istype & ?|?( istype & is, _Istream_Sstr f );
|
---|
155 | static inline istype & ?|?( istype & is, _Istream_Swidth f ) { return is | *(_Istream_Sstr *)&f; }
|
---|
156 | }
|
---|
157 |
|
---|
158 | // Concatenation
|
---|
159 | void ?+=?( string & s, char c );
|
---|
160 | void ?+=?( string & s, const string & s2 );
|
---|
161 | void append( string & s, const string & s2, size_t maxlen );
|
---|
162 | void ?+=?( string & s, const char * s2 );
|
---|
163 | void append( string & s, const char * buffer, size_t bsize );
|
---|
164 |
|
---|
165 | string ?+?( string s, char c );
|
---|
166 | string ?+?( char c, string s );
|
---|
167 | PBOOST string ?+?( string s, string s2 );
|
---|
168 | string ?+?( const char * s, char c ); // not backwards compatible
|
---|
169 | string ?+?( char c, const char * s );
|
---|
170 | string ?+?( const char * c, const char * s );
|
---|
171 | string ?+?( const char * c, string s );
|
---|
172 | string ?+?( string s, const char * c );
|
---|
173 | string ?+?( char, char ); // not being called 8-(
|
---|
174 |
|
---|
175 | static inline string & strcat( string & s, const string & s2 ) { s += s2; return s; }
|
---|
176 | static inline string & strcat( string & s, const char * c ) { s += c; return s; }
|
---|
177 | static inline string & strncat( string & s, const string & s2, size_t maxlen ) { append( s, s2, maxlen ); return s; }
|
---|
178 | static inline string & strncat( string & s, const char * buffer, size_t bsize ) { append( s, buffer, bsize ); return s; }
|
---|
179 |
|
---|
180 | // Repetition
|
---|
181 |
|
---|
182 | // Type `signed long long int` chosen for `factor` argument to achieve cost detente.
|
---|
183 | // This way, the call `'a' * 3` gets the same safe conversion cost calling here as for
|
---|
184 | // the built-in definition `int * int`.
|
---|
185 | typedef signed long long int strmul_factor_t;
|
---|
186 |
|
---|
187 | void ?*=?( string & s, strmul_factor_t factor );
|
---|
188 | string ?*?( char c, strmul_factor_t factor ); // not backwards compatible
|
---|
189 | PBOOST string ?*?( string s, strmul_factor_t factor );
|
---|
190 | string ?*?( const char * s, strmul_factor_t factor );
|
---|
191 | static inline string ?*?( strmul_factor_t factor, char s ) { return s * factor; }
|
---|
192 | PBOOST static inline string ?*?( strmul_factor_t factor, string s ) { return s * factor; }
|
---|
193 | static inline string ?*?( strmul_factor_t factor, const char * s ) { return s * factor; }
|
---|
194 |
|
---|
195 | // Character access
|
---|
196 | char ?[?]( const string & s, size_t index );
|
---|
197 | string ?[?]( string & s, size_t index ); // mutable length-1 slice of original
|
---|
198 | //char codePointAt(const string & s, size_t index ); // to revisit under Unicode
|
---|
199 |
|
---|
200 | // Comparisons
|
---|
201 | int strcmp ( const string &, const string & );
|
---|
202 | bool ?==?( const string &, const string & );
|
---|
203 | bool ?!=?( const string &, const string & );
|
---|
204 | bool ?>? ( const string &, const string & );
|
---|
205 | bool ?>=?( const string &, const string & );
|
---|
206 | bool ?<=?( const string &, const string & );
|
---|
207 | bool ?<? ( const string &, const string & );
|
---|
208 |
|
---|
209 | int strcmp( const string &, const char * );
|
---|
210 | bool ?==?( const string &, const char * );
|
---|
211 | bool ?!=?( const string &, const char * );
|
---|
212 | bool ?>? ( const string &, const char * );
|
---|
213 | bool ?>=?( const string &, const char * );
|
---|
214 | bool ?<=?( const string &, const char * );
|
---|
215 | bool ?<? ( const string &, const char * );
|
---|
216 |
|
---|
217 | int strcmp( const char *, const string & );
|
---|
218 | bool ?==?( const char *, const string & );
|
---|
219 | bool ?!=?( const char *, const string & );
|
---|
220 | bool ?>? ( const char *, const string & );
|
---|
221 | bool ?>=?( const char *, const string & );
|
---|
222 | bool ?<=?( const char *, const string & );
|
---|
223 | bool ?<? ( const char *, const string & );
|
---|
224 |
|
---|
225 | // String search
|
---|
226 | bool contains( const string & s, char ch ); // single character
|
---|
227 |
|
---|
228 | //int find( const string & s, size_t start, size_t len, const string & key, size_t kstart, size_t klen );
|
---|
229 | size_t find$( const string_res & s, size_t start, size_t len, const string & key_res, size_t kstart, size_t klen );
|
---|
230 |
|
---|
231 | size_t find( const string & s, char key );
|
---|
232 | size_t find( const string & s, const char * key );
|
---|
233 | size_t find( const string & s, const string & key );
|
---|
234 | size_t find( const string & s, const char * key, size_t keysize );
|
---|
235 |
|
---|
236 | size_t find( const string & s, size_t start, char key );
|
---|
237 | size_t find( const string & s, size_t start, const string & key );
|
---|
238 | size_t find( const string & s, size_t start, const char * key );
|
---|
239 | size_t find( const string & s, size_t start, const char * key, size_t keysize );
|
---|
240 | static inline ?^?( const string & key, const string & s ) { return find( s, key ); }
|
---|
241 | static inline ?^?( const char * key, const string & s ) { return find( s, key ); }
|
---|
242 |
|
---|
243 | bool includes( const string & s, const string & mask );
|
---|
244 | bool includes( const string & s, const char * mask );
|
---|
245 | bool includes( const string & s, const char * mask, size_t masksize );
|
---|
246 |
|
---|
247 | bool startsWith( const string & s, const string & prefix );
|
---|
248 | bool startsWith( const string & s, const char * prefix );
|
---|
249 | bool startsWith( const string & s, const char * prefix, size_t prefixsize );
|
---|
250 |
|
---|
251 | bool endsWith( const string & s, const string & suffix );
|
---|
252 | bool endsWith( const string & s, const char * suffix );
|
---|
253 | bool endsWith( const string & s, const char * suffix, size_t suffixsize );
|
---|
254 |
|
---|
255 | // Slicing
|
---|
256 | string ?()( string & s, ssize_t start, ssize_t len );
|
---|
257 | static inline string ?()( const string & s, ssize_t start, ssize_t len ) { string & w = (string &)s; return w( start, len ); } // FIX ME
|
---|
258 | string ?()( string & s, ssize_t start );
|
---|
259 | static inline string ?()( const string & s, ssize_t start ) { string & w = (string &)s; return w( start ); } // FIX ME
|
---|
260 | static inline string ?()( string & s, char m ) { return s( find( s, m ), 1 )`share; }
|
---|
261 | static inline string ?()( const string & s, char m ) { string & w = (string &)s; return w( find( s, m ), 1 )`share; } // FIX ME
|
---|
262 | static inline string ?()( string & s, const char * m ) { return s( find( s, m ), len( m ) )`share; }
|
---|
263 | static inline string ?()( const string & s, const char * m ) { string & w = (string &)s; return w( find( s, m ), len( m ) )`share; } // FIX ME
|
---|
264 | static inline string ?()( string & s, const string & m ) { return s( find( s, m ), len( m ) )`share; }
|
---|
265 | static inline string ?()( const string & s, const string & m ) { string & w = (string &)s; return w( find( s, m ), len( m ) )`share; } // FIX ME
|
---|
266 |
|
---|
267 | struct charclass {
|
---|
268 | charclass_res * inner;
|
---|
269 | };
|
---|
270 |
|
---|
271 | void ?{}( charclass & ) = void;
|
---|
272 | void ?{}( charclass &, charclass ) = void;
|
---|
273 | charclass ?=?( charclass &, charclass ) = void;
|
---|
274 |
|
---|
275 | void ?{}( charclass &, const string & chars );
|
---|
276 | void ?{}( charclass &, const char * chars );
|
---|
277 | void ?{}( charclass &, const char * chars, size_t charssize );
|
---|
278 | void ^?{}( charclass & );
|
---|
279 |
|
---|
280 | size_t include( const string & s, const charclass & mask );
|
---|
281 | static inline size_t include( const char * s, const charclass & mask ) { string temp = s; return include( temp, mask ); }
|
---|
282 | static inline string include( const string & s, const charclass & mask ) { ssize_t i = include( s, mask ); return s( 0, i )`share; }
|
---|
283 | static inline string include( const char * s, const charclass & mask ) { string temp = s; ssize_t i = include( temp, mask ); return temp( 0, i ); }
|
---|
284 |
|
---|
285 | size_t exclude( const string & s, const charclass & mask );
|
---|
286 | static inline size_t exclude( const char * s, const charclass & mask ) { string temp = s; return exclude( temp, mask ); }
|
---|
287 | static inline string exclude( const string & s, const charclass & mask ) { ssize_t i = exclude( s, mask ); return s( 0, i )`share; }
|
---|
288 | static inline string exclude( const char * s, const charclass & mask ) { string temp = s; ssize_t i = exclude( temp, mask ); return temp( 0, i ); }
|
---|
289 |
|
---|
290 | size_t test( const string & s, int (*f)( int ) );
|
---|
291 | static inline size_t test( const char * c, int (*f)( int ) ) {
|
---|
292 | const string S = c;
|
---|
293 | return test( S, f );
|
---|
294 | }
|
---|
295 |
|
---|
296 | string replace( string & s, const string & from, const string & to );
|
---|
297 | static inline string replace( const char * s, const char * from, const char * to ) {
|
---|
298 | string S = s, From = from, To = to;
|
---|
299 | return replace( S, From, To );
|
---|
300 | }
|
---|
301 | static inline string replace( string & s, const char * from, const char * to ) {
|
---|
302 | string From = from, To = to;
|
---|
303 | return replace( s, From, To );
|
---|
304 | }
|
---|
305 | static inline string replace( string & s, const char * from, const string & to ) {
|
---|
306 | string From = from;
|
---|
307 | return replace( s, From, to );
|
---|
308 | }
|
---|
309 | static inline string replace( string & s, string & from, const char * to ) {
|
---|
310 | string To = to;
|
---|
311 | return replace( s, from, To );
|
---|
312 | }
|
---|
313 |
|
---|
314 | string translate( const string & s, int (*f)( int ) );
|
---|
315 | static inline string translate( const char * c, int (*f)( int ) ) {
|
---|
316 | const string S = c;
|
---|
317 | return translate( S, f );
|
---|
318 | }
|
---|
319 |
|
---|
320 | #ifndef _COMPILING_STRING_CFA_
|
---|
321 | #undef PBOOST
|
---|
322 | #endif
|
---|