source: libcfa/src/collections/string.hfa@ d8a2f98

Last change on this file since d8a2f98 was d8a2f98, checked in by Peter A. Buhr <pabuhr@…>, 5 days ago

formatting, add some tostr conversion routines

  • Property mode set to 100644
File size: 20.8 KB
Line 
1//
2// Cforall Version 1.0.0 Copyright (C) 2016 University of Waterloo
3//
4// The contents of this file are covered under the licence agreement in the
5// file "LICENCE" distributed with Cforall.
6//
7// string -- variable-length, mutable run of text, with value semantics
8//
9// Author : Michael L. Brooks
10// Created On : Fri Sep 03 11:00:00 2021
11// Last Modified By : Peter A. Buhr
12// Last Modified On : Mon May 4 21:54:23 2026
13// Update Count : 332
14//
15
16#pragma once
17
18#include <iostream.hfa>
19#include <string_res.hfa>
20
21static struct __cfa_string_preference_boost_t {} __cfa_string_preference_boost; // empty tag type and its single object; the PBOOST clause on the next line asserts that this object is visible, and PBOOST prefixes selected overloads in this header (presumably to bias overload resolution toward them -- TODO confirm)
22#define PBOOST forall ( | { __cfa_string_preference_boost_t __cfa_string_preference_boost; } )
23
24struct string { // user-facing string handle; its only member is a pointer to a string_res
25 string_res * inner; // underlying representation (string_res presumably comes from <string_res.hfa> -- confirm)
26};
27
28// RAII, assignment
29void ^?{}( string & s ); // destructor
30
31void ?{}( string & s ); // empty string
32void ?{}( string & s, string s2, size_t maxlen ); // copy from s2, limited by maxlen (exact truncation rule is in the implementation, not visible here)
33PBOOST void ?{}( string & s, string s2 ); // copy constructor
34void ?{}( string & s, char ); // construct from a single character
35void ?{}( string & s, const char * cs ); // copy from string literal (NUL-terminated)
36void ?{}( string & s, const char * cs, size_t size ); // copy specific length from buffer
37
38void ?{}( string & s, signed long int rhs ); // numeric constructors: build the text from rhs (formatting is decided by the implementation, not visible here)
39void ?{}( string & s, size_t rhs );
40void ?{}( string & s, double rhs );
41void ?{}( string & s, long double rhs );
42void ?{}( string & s, double _Complex rhs );
43void ?{}( string & s, long double _Complex rhs );
44static inline void ?{}( string & s, int rhs ) { (s){(signed long int) rhs}; } // int forwards to the signed long int constructor via an explicit cast
45
46PBOOST string & ?=?( string & s, string c ); // assignment from another string
47string & ?=?( string & s, const char * cs ); // copy from "literal"
48string & ?=?( string & s, char c ); // copy from a character, e.g. 'l'
49string & assign( string & s, const string & c, size_t n ); // bounded assignment from a string; n limits how much of c is taken (exact rule is in the implementation)
50string & assign( string & s, const char * cs, size_t n ); // bounded assignment from a character buffer
51string & ?=?( string & s, signed long int rhs ); // numeric assignments: same parameter types as the numeric constructors
52string & ?=?( string & s, size_t rhs );
53string & ?=?( string & s, double rhs );
54string & ?=?( string & s, long double rhs );
55string & ?=?( string & s, double _Complex rhs );
56string & ?=?( string & s, long double _Complex rhs );
57static inline string & ?=?( string & s, int rhs ) { return s = ((signed long int) rhs); } // int forwards to the signed long int overload; kept to match cost of (char * int): int
58
59static inline string tostr( char c ) { string s = c; return s; } // tostr: return a new string initialised from the argument; one overload per supported argument type
60static inline string tostr( const char * cs ) { string s = cs; return s; }
61static inline string tostr( signed long int v ) { string s = v; return s; }
62static inline string tostr( size_t v ) { string s = v; return s; }
63static inline string tostr( double v ) { string s = v; return s; }
64static inline string tostr( long double v ) { string s = v; return s; }
65static inline string tostr( long double _Complex v ) { string s = v; return s; } // NOTE(review): no tostr overload for double _Complex or int, although string has constructors for both -- confirm whether that is intended
66
67static inline string & strcpy( string & s, const char * cs ) { s = cs; return s; } // C-style spelling of assignment: assign cs to s, return s
68static inline string & strncpy( string & s, const char * cs, size_t n ) { assign( s, cs, n ); return s; } // bounded form, implemented with assign
69static inline string & strcpy( string & s1, const string & s2 ) { s1 = s2; return s1; } // string-to-string form
70static inline string & strncpy( string & s, const string & cs, size_t n ) { assign( s, cs, n ); return s; } // bounded string-to-string form
71char * strncpy( char * dst, string & src, size_t n ); // opposite direction: copy from a string into a char buffer, limited by n (termination behaviour is in the implementation -- check before relying on it)
72char * ?=?( char *& dst, string & src ); // assign a string to a char * variable; dst is passed by reference, so the pointer itself may be replaced (storage ownership is not visible here)
73void ?{}( char *& dst, string & src ); // constructor counterpart of the assignment above
74
75// Alternate construction: request shared edits
76struct string_Share { // request object: carries a pointer to the string to be shared
77 string * s;
78};
79string_Share ?`share( string & s ); // postfix form s`share produces a string_Share for s
80void ?{}( string & s, string_Share src ); // construct s from a share request
81
82// Getters
83static inline size_t len( const string & s ) { return len( *s.inner ); } // length of s, delegated to len on the underlying string_res
84static inline size_t len( const char * cs ) { return strlen( cs ); } // length of a NUL-terminated C string (stray ';' after the body removed)
85static inline size_t strlen( const string & s ) { return len( s ); } // C-style spelling of len for string
86size_t strnlen( const string & s, size_t maxlen ); // length of s bounded by maxlen (presumably min( len( s ), maxlen ), as for C strnlen -- confirm)
87
88// IO Operator
89forall( ostype & | basic_ostream( ostype ) ) {
90 ostype & ?|?( ostype & out, string s ); // write s to out; returns the stream
91 void ?|?( ostype & out, string s ); // void-returning form of the same output operator (presumably the statement-terminating variant used by the stream library -- confirm)
92}
93forall( istype & | basic_istream( istype ) )
94istype & ?|?( istype & in, string & s ); // read from in into s; returns the stream
95
96static inline { // output manipulators for string: each builds or adjusts an _Ostream_Manip(string)
97 _Ostream_Manip(string) bin( string s ) { return (_Ostream_Manip(string))@{ .val = s, .wd = 1, .pc = 0, .base = 'b', { .all = 0 } }; } // base code 'b'
98 _Ostream_Manip(string) oct( string s ) { return (_Ostream_Manip(string))@{ .val = s, .wd = 1, .pc = 0, .base = 'o', { .all = 0 } }; } // base code 'o'
99 _Ostream_Manip(string) hex( string s ) { return (_Ostream_Manip(string))@{ .val = s, .wd = 1, .pc = 0, .base = 'x', { .all = 0 } }; } // base code 'x'
100 _Ostream_Manip(string) quote( string s, const char qleft = '"', const char qright = '\0' ) { // quoted output with the given left/right quote characters
101 return (_Ostream_Manip(string))@{ .val = s, .wd = 1, .pc = 0, .base = 's', { .flags.quote = true }, .qleft = qleft, .qright = qright }; }
102 _Ostream_Manip(string) wd( unsigned int wd, string s ) { return (_Ostream_Manip(string))@{ .val = s, .wd = wd, .pc = 0, .base = 's', { .all = 0 } }; } // field width only
103 _Ostream_Manip(string) wd( unsigned int wd, unsigned int pc, string s ) { return (_Ostream_Manip(string))@{ .val = s, .wd = wd, .pc = pc, .base = 's', { .flags.pc = true } }; } // field width and precision; sets flags.pc
104 _Ostream_Manip(string) & wd( unsigned int wd, _Ostream_Manip(string) & fmt ) { fmt.wd = wd; return fmt; } // the forms below modify an existing manipulator in place and return it
105 _Ostream_Manip(string) & wd( unsigned int wd, unsigned int pc, _Ostream_Manip(string) & fmt ) { fmt.wd = wd; fmt.pc = pc; fmt.flags.pc = true; return fmt; }
106 _Ostream_Manip(string) & left( _Ostream_Manip(string) & fmt ) { fmt.flags.left = true; return fmt; } // sets flags.left
107 _Ostream_Manip(string) & nobase( _Ostream_Manip(string) & fmt ) { fmt.flags.nobsdp = true; return fmt; } // sets flags.nobsdp
108 _Ostream_Manip(string) & upcase( _Ostream_Manip(string) & fmt ) { if ( fmt.base == 'x' || fmt.base == 'b' ) fmt.base -= 32; /* upper case */ return fmt; } // 'x' -> 'X', 'b' -> 'B'; other base codes are left unchanged
109 _Ostream_Manip(string) & quote( _Ostream_Manip(string) & fmt, const char qleft = '"', const char qright = '\0' ) { // add quoting to an existing manipulator
110 fmt.flags.quote = true; fmt.qleft = qleft; fmt.qright = qright; return fmt; }
111} // distribution
112
113forall( ostype & | basic_ostream( ostype ) ) {
114 ostype & ?|?( ostype & os, _Ostream_Manip(string) f ); // write a string through manipulator f; returns the stream
115 void ?|?( ostype & os, _Ostream_Manip(string) ); // void-returning form of the same operator
116}
117
118struct _Istream_Swidth { // input-manipulator state for a string: the target plus the shared _Istream_str_base fields
119 string & s; // string that the manipulator refers to
120 inline _Istream_str_base; // base fields (wd, flags, scanset, delimiters) are accessed directly on this struct by the manipulators in this header
121}; // _Istream_Swidth
122
123struct _Istream_Squote { // distinct type for quoted input so it selects its own ?|? overload; wraps an _Istream_Swidth
124 _Istream_Swidth sstr;
125}; // _Istream_Squote
126
127struct _Istream_Sstr { // same members as _Istream_Swidth; manipulators in this header reinterpret an _Istream_Swidth as this type by cast
128 string & s;
129 inline _Istream_str_base;
130// _Istream_Swidth sstr;
131}; // _Istream_Sstr
132
133static inline { // input manipulators for string: each builds a manipulator from a string, or adjusts an existing _Istream_Swidth
134 // read width does not include null terminator
135 _Istream_Swidth wdi( unsigned int rwd, string & s ) { return (_Istream_Swidth)@{ .s = s, { {.scanset = 0p}, .wd = rwd, {.flags.rwd = true} } }; } // read into s with read width rwd; sets flags.rwd
136 _Istream_Sstr getline( string & s, const char delimiter = '\n' ) { // read into s using a single delimiter character (default newline); sets flags.delimiter
137 return (_Istream_Sstr)@{ .s = s, { {.delimiters = { delimiter, '\0' } }, .wd = -1, {.flags.delimiter = true} } };
138 }
139 _Istream_Sstr & getline( _Istream_Swidth & f, const char delimiter = '\n' ) { // add a delimiter to an existing width manipulator; returns f viewed as _Istream_Sstr
140 f.delimiters[0] = delimiter; f.delimiters[1] = '\0'; f.flags.delimiter = true; return (_Istream_Sstr &)f;
141 }
142 _Istream_Squote quote( string & s, const char Ldelimiter = '\"', const char Rdelimiter = '\0' ) { // quoted read into s; NOTE(review): sets flags.rwd together with wd = -1, unlike the other string-taking forms here -- confirm intended
143 return (_Istream_Squote)@{ { .s = s, { {.delimiters = { Ldelimiter, Rdelimiter, '\0' }}, .wd = -1, {.flags.rwd = true} } } };
144 }
145 _Istream_Squote & quote( _Istream_Swidth & f, const char Ldelimiter = '"', const char Rdelimiter = '\0' ) { // store quote delimiters in an existing width manipulator; returns f viewed as _Istream_Squote
146 f.delimiters[0] = Ldelimiter; f.delimiters[1] = Rdelimiter; f.delimiters[2] = '\0';
147 return (_Istream_Squote &)f;
148 }
149 _Istream_Sstr incl( const char scanset[], string & s ) { return (_Istream_Sstr)@{ .s = s, { {.scanset = scanset}, .wd = -1, {.flags.inex = false} } }; } // scanset read with flags.inex = false
150 _Istream_Sstr & incl( const char scanset[], _Istream_Swidth & f ) { f.scanset = scanset; f.flags.inex = false; return (_Istream_Sstr &)f; }
151 _Istream_Sstr excl( const char scanset[], string & s ) { return (_Istream_Sstr)@{ .s = s, { {.scanset = scanset}, .wd = -1, {.flags.inex = true} } }; } // scanset read with flags.inex = true
152 _Istream_Sstr & excl( const char scanset[], _Istream_Swidth & f ) { f.scanset = scanset; f.flags.inex = true; return (_Istream_Sstr &)f; }
153 _Istream_Sstr ignore( string & s ) { return (_Istream_Sstr)@{ .s = s, { {.scanset = 0p}, .wd = -1, {.flags.ignore = true} } }; } // sets flags.ignore
154 _Istream_Sstr & ignore( _Istream_Swidth & f ) { f.flags.ignore = true; return (_Istream_Sstr &)f; } // the remaining forms set flags.ignore on an existing manipulator
155 _Istream_Squote & ignore( _Istream_Squote & f ) { f.sstr.flags.ignore = true; return (_Istream_Squote &)f; }
156 _Istream_Sstr & ignore( _Istream_Sstr & f ) { f.flags.ignore = true; return (_Istream_Sstr &)f; }
157} // distribution
158
159forall( istype & | basic_istream( istype ) ) {
160 istype & ?|?( istype & is, _Istream_Squote f ); // read using a quoted-input manipulator; returns the stream
161 istype & ?|?( istype & is, _Istream_Sstr f ); // read using a general string-input manipulator; returns the stream
162 static inline istype & ?|?( istype & is, _Istream_Swidth f ) { return is | *(_Istream_Sstr *)&f; } // width form reuses the _Istream_Sstr reader by reinterpreting f through a pointer cast
163}
164
165// Concatenation
166void ?+=?( string & s, char c ); // append in place; these forms return void
167PBOOST void ?+=?( string & s, string );
168void append( string & s, const string & s2, size_t maxlen ); // append from s2, limited by maxlen
169void ?+=?( string & s, const char * cs );
170void append( string & s, const char * buffer, size_t bsize ); // append from a character buffer, limited by bsize
171
172string ?+?( string s, char c ); // binary + returns a new string for each operand combination below
173string ?+?( char c, string s );
174PBOOST string ?+?( string s, string s2 );
175string ?+?( const char * cs, char c ); // not backwards compatible with C, where pointer + char is pointer arithmetic
176string ?+?( char c, const char * cs );
177string ?+?( const char * cs1 , const char * cs2 );
178string ?+?( const char * cs , string s );
179string ?+?( string s, const char * cs );
180string ?+?( char, char ); // not being called 8-( (presumably char + char resolves to the built-in integer addition instead -- confirm)
181
182static inline string & strcat( string & s1, const string & s2 ) { s1 += s2; return s1; } // C-style spelling of +=; returns the modified left operand
183static inline string & strcat( string & s, const char * cs ) { s += cs; return s; }
184static inline string & strncat( string & s1, const string & s2, size_t maxlen ) { append( s1, s2, maxlen ); return s1; } // bounded form, implemented with append
185static inline string & strncat( string & s, const char * buffer, size_t bsize ) { append( s, buffer, bsize ); return s; }
186
187// Repetition
188
189// Type `signed long long int` chosen for `factor` argument to achieve cost detente.
190// This way, the call `'a' * 3` gets the same safe conversion cost calling here as for
191// the built-in definition `int * int`.
192typedef signed long long int strmul_factor_t;
193
194void ?*=?( string & s, strmul_factor_t factor ); // repeat s in place
195string ?*?( char c, strmul_factor_t factor ); // not backwards compatible with C, where char * integer is integer multiplication
196PBOOST string ?*?( string s, strmul_factor_t factor );
197string ?*?( const char * cs, strmul_factor_t factor );
198static inline string ?*?( strmul_factor_t factor, char c ) { return c * factor; } // factor-first forms forward to the text-first overloads by swapping the operands
199PBOOST static inline string ?*?( strmul_factor_t factor, string s ) { return s * factor; }
200static inline string ?*?( strmul_factor_t factor, const char * cs ) { return cs * factor; }
201
202// Character access
203char ?[?]( const string & s, size_t index ); // read-only access: the character at index, returned by value
204string ?[?]( string & s, size_t index ); // mutable length-1 slice of original
205//char codePointAt(const string & s, size_t index ); // to revisit under Unicode
206
207// Comparisons
208static inline int strcmp( const string & s1, const string & s2 ) { return strcmp( *s1.inner, *s2.inner ); } // string vs string: every inline form forwards to the same operation on the underlying string_res
209int strncmp( const string & s1, const string & s2, size_t maxlen ); // bounded comparison (sign convention presumably as for C strncmp -- confirm)
210static inline bool ?==?( const string & s1, const string & s2 ) { return *s1.inner == *s2.inner; }
211static inline bool ?!=?( const string & s1, const string & s2 ) { return *s1.inner != *s2.inner; }
212static inline bool ?>? ( const string & s1, const string & s2 ) { return *s1.inner > *s2.inner; }
213static inline bool ?>=?( const string & s1, const string & s2 ) { return *s1.inner >= *s2.inner; }
214static inline bool ?<=?( const string & s1, const string & s2 ) { return *s1.inner <= *s2.inner; }
215static inline bool ?<? ( const string & s1, const string & s2 ) { return *s1.inner < *s2.inner; }
216
217static inline int strcmp( const string & s1, const char * s2 ) { return strcmp( *s1.inner, s2 ); } // string vs C string: left operand unwrapped to its string_res
218int strncmp( const string & s1, const char * s2, size_t maxlen );
219static inline bool ?==?( const string & s1, const char * s2 ) { return *s1.inner == s2; }
220static inline bool ?!=?( const string & s1, const char * s2 ) { return *s1.inner != s2; }
221static inline bool ?>? ( const string & s1, const char * s2 ) { return *s1.inner > s2; }
222static inline bool ?>=?( const string & s1, const char * s2 ) { return *s1.inner >= s2; }
223static inline bool ?<=?( const string & s1, const char * s2 ) { return *s1.inner <= s2; }
224static inline bool ?<? ( const string & s1, const char * s2 ) { return *s1.inner < s2; }
225
226static inline int strcmp( const char * s1, const string & s2 ) { return strcmp( s1, *s2.inner ); } // C string vs string: right operand unwrapped to its string_res
227int strncmp( const char * s1, const string & s2, size_t maxlen );
228static inline bool ?==?( const char * s1, const string & s2 ) { return s1 == *s2.inner; }
229static inline bool ?!=?( const char * s1, const string & s2 ) { return s1 != *s2.inner; }
230static inline bool ?>? ( const char * s1, const string & s2 ) { return s1 > *s2.inner; }
231static inline bool ?>=?( const char * s1, const string & s2 ) { return s1 >= *s2.inner; }
232static inline bool ?<=?( const char * s1, const string & s2 ) { return s1 <= *s2.inner; }
233static inline bool ?<? ( const char * s1, const string & s2 ) { return s1 < *s2.inner; }
234
235// String search
236bool contains( const string & s, char ch ); // single character
237
238//int find( const string & s, size_t start, size_t len, const string & key, size_t kstart, size_t klen );
239size_t find$( const string_res & s, size_t start, size_t len, const string & key_res, size_t kstart, size_t klen ); // internal helper ('$' name); NOTE(review): s is a string_res but key_res is declared as string despite its name -- confirm which type is intended
240
241size_t find( const string & s, char key ); // find: search s for key and return a size_t position; the value returned when key is absent is decided by the implementation (not visible here)
242size_t find( const string & s, const char * key );
243size_t find( const string & s, const string & key );
244size_t find( const string & s, const char * key, size_t keysize ); // key given as buffer plus explicit size
245
246size_t find( const string & s, size_t start, char key ); // same searches with an explicit start position
247size_t find( const string & s, size_t start, const string & key );
248size_t find( const string & s, size_t start, const char * key );
249size_t find( const string & s, size_t start, const char * key, size_t keysize );
250
251bool includes( const string & s, const string & mask ); // membership test of mask against s (exact meaning is in the implementation -- confirm before relying on it)
252bool includes( const string & s, const char * mask );
253bool includes( const string & s, const char * mask, size_t masksize );
254
255bool startsWith( const string & s, const string & prefix ); // prefix test, with the same three argument forms
256bool startsWith( const string & s, const char * prefix );
257bool startsWith( const string & s, const char * prefix, size_t prefixsize );
258
259bool endsWith( const string & s, const string & suffix ); // suffix test, with the same three argument forms
260bool endsWith( const string & s, const char * suffix );
261bool endsWith( const string & s, const char * suffix, size_t suffixsize );
262
263// Slicing
264string ?()( string & s, ssize_t start, ssize_t len ); // slice of s selected by start and len (both signed; treatment of negative values is in the implementation)
265static inline string ?()( const string & s, ssize_t start, ssize_t len ) { string & w = (string &)s; return w( start, len ); } // FIX ME: casts away const to reuse the non-const overload
266string ?()( string & s, ssize_t start ); // slice selected by start only
267static inline string ?()( const string & s, ssize_t start ) { string & w = (string &)s; return w( start ); } // FIX ME: casts away const to reuse the non-const overload
268static inline string ?()( string & s, char m ) { return s( find( s, m ), 1 )`share; } // slice by search: length-1 slice at find( s, m ), passed through `share; result when m is absent depends on what find returns (not visible here)
269static inline string ?()( const string & s, char m ) { string & w = (string &)s; return w( find( s, m ), 1 )`share; } // FIX ME: casts away const to reuse the non-const overload
270static inline string ?()( string & s, const char * m ) { return s( find( s, m ), len( m ) )`share; } // slice by search for a C string: len( m ) characters at find( s, m )
271static inline string ?()( const string & s, const char * m ) { string & w = (string &)s; return w( find( s, m ), len( m ) )`share; } // FIX ME: casts away const to reuse the non-const overload
272static inline string ?()( string & s, const string & m ) { return s( find( s, m ), len( m ) )`share; } // slice by search for a string
273static inline string ?()( const string & s, const string & m ) { string & w = (string &)s; return w( find( s, m ), len( m ) )`share; } // FIX ME: casts away const to reuse the non-const overload
274
275struct charclass { // handle for a set of characters; its only member is a pointer to a charclass_res
276 charclass_res * inner;
277};
278
279void ?{}( charclass & ) = void; // default construction is deleted
280void ?{}( charclass &, charclass ) = void; // copy construction is deleted
281charclass ?=?( charclass &, charclass ) = void; // assignment is deleted
282
283void ?{}( charclass &, const string & chars ); // build the class from the characters of a string
284void ?{}( charclass &, const char * chars ); // build from a C string
285void ?{}( charclass &, const char * chars, size_t charssize ); // build from a buffer with explicit size
286void ^?{}( charclass & ); // destructor
287
288size_t include( const string & s, const charclass & mask ); // primitive: returns a size_t computed from s and mask (presumably the length of the leading run of s drawn from mask, cf. strspn -- confirm)
289static inline size_t include( const string & s, const char * mask ) { return include( s, (charclass){ mask } ); } // convenience forms: build a temporary charclass and/or string, then call the primitive
290static inline size_t include( const string & s, const string & mask ) { return include( s, (charclass){ mask } ); }
291static inline size_t include( const char * cs, const charclass & mask ) { return include( (string){ cs }, mask ); }
292static inline size_t include( const char * cs, const char * mask ) { return include( (string){ cs }, (charclass){ mask } ); }
293static inline size_t include( const char * cs, const string & mask ) { return include( (string){ cs }, (charclass){ mask } ); }
294
295static inline string include( const string & s, const charclass & mask ) { return s( 0, include( s, mask ) ); } // string-returning forms (overloaded on return type): the slice of s starting at 0 whose length is the include result
296static inline string include( const string & s, const char * mask ) { return s( 0, include( s, (charclass){ mask } ) ); }
297static inline string include( const string & s, const string & mask ) { return s( 0, include( s, (charclass){ mask } ) ); }
298static inline string include( const char * cs, const charclass & mask ) { const string s = cs; return s( 0, include( s, mask ) ); } // C-string forms copy cs into a local string first
299static inline string include( const char * cs, const char * mask ) { const string s = cs; return s( 0, include( s, (charclass){ mask } ) ); }
300static inline string include( const char * cs, const string & mask ) { const string s = cs; return s( 0, include( s, (charclass){ mask } ) ); }
301
302size_t exclude( const string & s, const charclass & mask ); // primitive counterpart of include (presumably the length of the leading run of s NOT in mask, cf. strcspn -- confirm)
303static inline size_t exclude( const string & s, const char * mask ) { return exclude( s, (charclass){ mask } ); } // convenience forms mirror those of include
304static inline size_t exclude( const string & s, const string & mask ) { return exclude( s, (charclass){ mask } ); }
305static inline size_t exclude( const char * cs, const charclass & mask ) { return exclude( (string){ cs }, mask ); }
306static inline size_t exclude( const char * cs, const string & mask ) { return exclude( (string){ cs }, (charclass){ mask } ); }
307static inline size_t exclude( const char * cs, const char * mask ) { return exclude( (string){ cs }, (charclass){ mask } ); }
308
309static inline string exclude( const string & s, const charclass & mask ) { return s( 0, exclude( s, mask ) ); } // string-returning forms: the slice of s starting at 0 whose length is the exclude result
310static inline string exclude( const string & s, const char * mask ) { return s( 0, exclude( s, (charclass){ mask } ) ); }
311static inline string exclude( const string & s, const string & mask ) { return s( 0, exclude( s, (charclass){ mask } ) ); }
312static inline string exclude( const char * cs, const charclass & mask ) { const string s = cs; return s( 0, exclude( s, mask ) ); }
313static inline string exclude( const char * cs, const string & mask ) { const string s = cs; return s( 0, exclude( s, (charclass){ mask } ) ); }
314static inline string exclude( const char * cs, const char * mask ) { const string s = cs; return s( 0, exclude( s, (charclass){ mask } ) ); }
315
316size_t include( const string & s, int (* f)( int ) ); // for C character-class functions, e.g., isdigit
317static inline size_t include( const char * cs, int (* f)( int ) ) { return include( (string){ cs }, f ); } // C-string form: wrap cs in a temporary string
318static inline string include( const string & s, int (* f)( int ) ) { return s( 0, include( s, f ) ); } // string-returning form: slice of s from 0 with the length given by the size_t result
319static inline string include( const char * cs, int (* f)( int ) ) { const string s = cs; return s( 0, include( s, f ) ); }
320
321static inline size_t include( const string & s, bool (* f)( char ) ) { return include( s, (int (*)( int ))f ); } // NOTE(review): reinterprets bool (*)( char ) as int (*)( int ); if the callee invokes f through that type, this relies on the two signatures being ABI-compatible (undefined behaviour in ISO C) -- confirm
322static inline size_t include( const char * cs, bool (* f)( char ) ) { return include( (string){ cs }, f ); }
323static inline string include( const string & s, bool (* f)( char ) ) { return s( 0, include( s, f ) ); }
324static inline string include( const char * cs, bool (* f)( char ) ) { const string s = cs; return s( 0, include( s, f ) ); }
325
326size_t exclude( const string & s, int (* f)( int ) ); // for C character-class functions, e.g., isdigit
327static inline size_t exclude( const char * cs, int (* f)( int ) ) { return exclude( (string){ cs }, f ); } // the exclude forms mirror the include forms one for one
328static inline string exclude( const string & s, int (* f)( int ) ) { return s( 0, exclude( s, f ) ); }
329static inline string exclude( const char * cs, int (* f)( int ) ) { const string s = cs; return s( 0, exclude( s, f ) ); }
330
331static inline size_t exclude( const string & s, bool (* f)( char ) ) { return exclude( s, (int (*)( int ))f ); } // NOTE(review): same function-pointer reinterpretation as the bool (*)( char ) include form -- confirm
332static inline size_t exclude( const char * cs, bool (* f)( char ) ) { return exclude( (string){ cs }, f ); }
333static inline string exclude( const string & s, bool (* f)( char ) ) { return s( 0, exclude( s, f ) ); }
334static inline string exclude( const char * cs, bool (* f)( char ) ) { const string s = cs; return s( 0, exclude( s, f ) ); }
335
336string replace( const string & s, const string & from, const string & to ); // primitive: returns a new string built from s with `from` replaced by `to` (first-only vs. all occurrences is decided by the implementation -- confirm)
337static inline string replace( const char * cs, const char * from, const char * to ) { return replace( (string){ cs }, (string){ from }, (string){ to } ); } // convenience forms: wrap each C-string argument in a temporary string and call the primitive
338static inline string replace( const string & s, const char * from, const char * to ) { return replace( s, (string){ from }, (string){ to } ); }
339static inline string replace( const string & s, const char * from, const string & to ) { return replace( s, (string){ from }, to ); }
340static inline string replace( const string & s, const string & from, const char * to ) { return replace( s, from, (string){ to } ); } // `from` is now const, matching the primitive, so const strings are accepted
341
342string translate( const string & s, int (* f)( int ) ); // for C character-class functions, e.g., isdigit
343static inline string translate( const char * cs, int (* f)( int ) ) { return translate( (string){ cs }, f ); } // C-string form: wrap cs in a temporary string
344
345static inline string translate( const string & s, bool (* f)( char ) ) { return translate( s, (int (*)( int ))f ); } // NOTE(review): reinterprets bool (*)( char ) as int (*)( int ); relies on the two signatures being ABI-compatible if f is invoked through that type -- confirm
346static inline string translate( const char * cs, bool (* f)( char ) ) { return translate( (string){ cs }, f ); }
347
348#ifndef _COMPILING_STRING_CFA_ // PBOOST stays defined only when _COMPILING_STRING_CFA_ is defined (presumably by the implementation file -- confirm)
349#undef PBOOST
350#endif // _COMPILING_STRING_CFA_
Note: See TracBrowser for help on using the repository browser.