source: libcfa/src/collections/string.hfa@ 2f16569

Last change on this file since 2f16569 was 2f16569, checked in by Peter A. Buhr <pabuhr@…>, 19 hours ago

remove string 'contains' function and replace with 'includes', make string 'includes' inline

  • Property mode set to 100644
File size: 20.6 KB
Line 
1//
2// Cforall Version 1.0.0 Copyright (C) 2016 University of Waterloo
3//
4// The contents of this file are covered under the licence agreement in the
5// file "LICENCE" distributed with Cforall.
6//
7// string -- variable-length, mutable run of text, with value semantics
8//
9// Author : Michael L. Brooks
10// Created On : Fri Sep 03 11:00:00 2021
11// Last Modified By : Peter A. Buhr
12// Last Modified On : Fri May 8 07:40:57 2026
13// Update Count : 353
14//
15
16#pragma once
17
18#include <iostream.hfa>
19#include <string_res.hfa>
20
// Empty tag type plus one static object of that type; referenced only by the PBOOST assertion below.
21static struct __cfa_string_preference_boost_t {} __cfa_string_preference_boost;
// PBOOST prefixes a declaration with a forall clause whose only assertion is that the tag object is visible.
// NOTE(review): the name suggests the extra assertion exists to tilt overload-resolution cost for the
// string-by-value overloads it decorates -- confirm against the resolver's cost model.
22#define PBOOST forall ( | { __cfa_string_preference_boost_t __cfa_string_preference_boost; } )
23
// A string is a single pointer to a string_res (declared in string_res.hfa).
24struct string {
25 string_res * inner; // the inline operations in this header forward to *inner (see len, strcmp, ?==?)
26};
27
28// RAII, assignment
29void ^?{}( string & s ); // destructor
30
// Constructors: one overload per source type.
31void ?{}( string & s ); // empty string
32void ?{}( string & s, string s2, size_t maxlen ); // NOTE(review): presumably copies at most maxlen characters of s2 -- confirm in string.cfa
33PBOOST void ?{}( string & s, string s2 ); // copy constructor
34void ?{}( string & s, char ); // from a single character
35void ?{}( string & s, const char * cs ); // copy from string literal (NULL-terminated)
36void ?{}( string & s, const char * cs, size_t size ); // copy specific length from buffer
// Numeric sources. NOTE(review): the text format produced for each value is chosen in string.cfa, not here.
37void ?{}( string & s, size_t rhs );
38void ?{}( string & s, ssize_t rhs );
39void ?{}( string & s, double rhs );
40void ?{}( string & s, long double rhs );
41void ?{}( string & s, double _Complex rhs );
42void ?{}( string & s, long double _Complex rhs );
43
// Assignment: the same source types as the constructors. Every overload returns string &
// (NOTE(review): presumably s itself, so assignments can be chained -- confirm in string.cfa).
44PBOOST string & ?=?( string & s, string rhs );
45string & ?=?( string & s, char rhs ); // copy from 'l'
46string & ?=?( string & s, const char * rhs ); // copy from "literal"
// assign is the length-limited form; the C-compatibility strncpy overloads forward to it with the same n.
47string & assign( string & s, const string & rhs, size_t n );
48string & assign( string & s, const char * rhs, size_t n );
49string & ?=?( string & s, size_t rhs );
50string & ?=?( string & s, ssize_t rhs );
51string & ?=?( string & s, double rhs );
52string & ?=?( string & s, long double rhs );
53string & ?=?( string & s, double _Complex rhs );
54string & ?=?( string & s, long double _Complex rhs );
55
56// Conversion
// tostr: build and return a string from a value by initializing a local string with the
// constructor for the argument's type. There is one overload per constructible source type.
static inline string tostr( char c ) { string s = c; return s; }
static inline string tostr( const char * cs ) { string s = cs; return s; }
static inline string tostr( size_t v ) { string s = v; return s; }
static inline string tostr( ssize_t v ) { string s = v; return s; }
static inline string tostr( double v ) { string s = v; return s; }
static inline string tostr( long double v ) { string s = v; return s; }
// double _Complex was the only constructible numeric type without a tostr overload.
static inline string tostr( double _Complex v ) { string s = v; return s; }
static inline string tostr( long double _Complex v ) { string s = v; return s; }
64
65// C compatibility
// Overloads of the C copy routines whose destination is a string; each returns the destination.
66static inline string & strcpy( string & s, const char * cs ) { s = cs; return s; } // plain assignment from a C string
67static inline string & strncpy( string & s, const char * cs, size_t n ) { assign( s, cs, n ); return s; } // length-limited: forwards n to assign
68static inline string & strcpy( string & s1, const string & s2 ) { s1 = s2; return s1; }
69static inline string & strncpy( string & s, const string & cs, size_t n ) { assign( s, cs, n ); return s; }
// Copies from a string into C character storage.
// NOTE(review): NUL termination and any allocation done for dst are decided in string.cfa -- not visible here.
70char * strncpy( char * dst, string & src, size_t n );
71char * ?=?( char *& dst, string & src );
72void ?{}( char *& dst, string & src );
73
74// Alternate construction: request shared edits
// Wrapper holding a pointer to a string; its distinct type selects the string_Share constructor below.
75struct string_Share {
76 string * s;
77};
78string_Share ?`share( string & s ); // postfix form: s`share
// NOTE(review): per the section heading, a string built from a string_Share shares edits with *src.s -- confirm in string.cfa.
79void ?{}( string & s, string_Share src );
80
81// Getters
// Length of s, taken from the underlying string_res.
82static inline size_t len( const string & s ) { return len( *s.inner ); }
// Length of a NUL-terminated C string, so len() can be applied to char * and string arguments alike.
// cs must not be a null pointer: it is passed straight to strlen.
static inline size_t len( const char * cs ) { return strlen( cs ); }
84static inline size_t strlen( const string & s ) { return len( s ); } // C-named alias of len( s )
85size_t strnlen( const string & s, size_t maxlen ); // NOTE(review): presumably min( len( s ), maxlen ) as for C strnlen -- confirm in string.cfa
86
87// IO Operator
// Output of a string to any stream type that satisfies basic_ostream.
88forall( ostype & | basic_ostream( ostype ) ) {
89 ostype & ?|?( ostype & out, string s ); // form that yields the stream type, usable inside a longer | expression
90 void ?|?( ostype & out, string s ); // void form; NOTE(review): how the two forms are chosen is defined by iostream.hfa
91}
// Input into a string from any stream type that satisfies basic_istream.
92forall( istype & | basic_istream( istype ) )
93istype & ?|?( istype & in, string & s );
94
// Output manipulators. The by-value forms build an _Ostream_Manip(string) for a string; the by-reference
// forms adjust an existing manipulator and return it, so manipulators can be nested.
95static inline {
 // bin/oct/hex: width 1, precision 0, all flags clear, base code 'b' / 'o' / 'x'.
96 _Ostream_Manip(string) bin( string s ) { return (_Ostream_Manip(string))@{ .val = s, .wd = 1, .pc = 0, .base = 'b', { .all = 0 } }; }
97 _Ostream_Manip(string) oct( string s ) { return (_Ostream_Manip(string))@{ .val = s, .wd = 1, .pc = 0, .base = 'o', { .all = 0 } }; }
98 _Ostream_Manip(string) hex( string s ) { return (_Ostream_Manip(string))@{ .val = s, .wd = 1, .pc = 0, .base = 'x', { .all = 0 } }; }
 // quote: base code 's' with the quote flag set and the two delimiter characters recorded.
 // NOTE(review): qright defaults to '\0'; how the output code treats that value is decided in string.cfa / iostream.
99 _Ostream_Manip(string) quote( string s, const char qleft = '"', const char qright = '\0' ) {
100 return (_Ostream_Manip(string))@{ .val = s, .wd = 1, .pc = 0, .base = 's', { .flags.quote = true }, .qleft = qleft, .qright = qright }; }
 // wd: set the field width; the three-argument form also sets the precision and raises the pc flag.
101 _Ostream_Manip(string) wd( unsigned int wd, string s ) { return (_Ostream_Manip(string))@{ .val = s, .wd = wd, .pc = 0, .base = 's', { .all = 0 } }; }
102 _Ostream_Manip(string) wd( unsigned int wd, unsigned int pc, string s ) { return (_Ostream_Manip(string))@{ .val = s, .wd = wd, .pc = pc, .base = 's', { .flags.pc = true } }; }
103 _Ostream_Manip(string) & wd( unsigned int wd, _Ostream_Manip(string) & fmt ) { fmt.wd = wd; return fmt; }
104 _Ostream_Manip(string) & wd( unsigned int wd, unsigned int pc, _Ostream_Manip(string) & fmt ) { fmt.wd = wd; fmt.pc = pc; fmt.flags.pc = true; return fmt; }
105 _Ostream_Manip(string) & left( _Ostream_Manip(string) & fmt ) { fmt.flags.left = true; return fmt; }
106 _Ostream_Manip(string) & nobase( _Ostream_Manip(string) & fmt ) { fmt.flags.nobsdp = true; return fmt; }
 // upcase: only base codes 'x' and 'b' are changed; subtracting 32 turns the ASCII lower-case letter into upper case.
107 _Ostream_Manip(string) & upcase( _Ostream_Manip(string) & fmt ) { if ( fmt.base == 'x' || fmt.base == 'b' ) fmt.base -= 32; /* upper case */ return fmt; }
 // quote on an existing manipulator: raises the quote flag and stores both delimiters (the comma joins two assignments).
108 _Ostream_Manip(string) & quote( _Ostream_Manip(string) & fmt, const char qleft = '"', const char qright = '\0' ) {
109 fmt.flags.quote = true; fmt.qleft = qleft, fmt.qright = qright; return fmt; }
110} // distribution
111
// Output of a string manipulator to any stream type that satisfies basic_ostream (stream-returning and void forms).
112forall( ostype & | basic_ostream( ostype ) ) {
113 ostype & ?|?( ostype & os, _Ostream_Manip(string) f );
114 void ?|?( ostype & os, _Ostream_Manip(string) );
115}
116
// Input manipulator produced by wdi(): the destination string plus the shared input settings.
117struct _Istream_Swidth {
118 string & s; // destination of the read
119 inline _Istream_str_base; // embedded settings; its members (scanset, delimiters, wd, flags) are accessed directly on this struct
120}; // _Istream_Swidth
121
// Input manipulator for quoted reads. It holds exactly one _Istream_Swidth, and quote( _Istream_Swidth & )
// reinterprets an _Istream_Swidth as this type, so no further members may be added ahead of sstr.
122struct _Istream_Squote {
123 _Istream_Swidth sstr;
124}; // _Istream_Squote
125
// General string input manipulator. Its members repeat those of _Istream_Swidth in the same order; the
// manipulator functions cast an _Istream_Swidth reference/pointer to this type, so the two layouts must stay in step.
126struct _Istream_Sstr {
127 string & s; // destination of the read
128 inline _Istream_str_base; // embedded settings, accessed directly on this struct
129// _Istream_Swidth sstr;
130}; // _Istream_Sstr
131
// Input manipulators. Forms taking a string build a fresh manipulator (wd = -1 unless wdi supplies a width);
// forms taking an _Istream_Swidth & modify the manipulator made by wdi() and return it viewed as the result type.
132static inline {
133 // read width does not include null terminator
134 _Istream_Swidth wdi( unsigned int rwd, string & s ) { return (_Istream_Swidth)@{ .s = s, { {.scanset = 0p}, .wd = rwd, {.flags.rwd = true} } }; }
 // getline: stores the delimiter as a one-character, NUL-terminated list and raises the delimiter flag.
135 _Istream_Sstr getline( string & s, const char delimiter = '\n' ) {
136 return (_Istream_Sstr)@{ .s = s, { {.delimiters = { delimiter, '\0' } }, .wd = -1, {.flags.delimiter = true} } };
137 }
138 _Istream_Sstr & getline( _Istream_Swidth & f, const char delimiter = '\n' ) {
139 f.delimiters[0] = delimiter; f.delimiters[1] = '\0'; f.flags.delimiter = true; return (_Istream_Sstr &)f;
140 }
 // quote: stores left and right delimiters followed by NUL.
 // NOTE(review): the string form raises flags.rwd while the _Istream_Swidth form sets no flag -- confirm this asymmetry is intended.
141 _Istream_Squote quote( string & s, const char Ldelimiter = '\"', const char Rdelimiter = '\0' ) {
142 return (_Istream_Squote)@{ { .s = s, { {.delimiters = { Ldelimiter, Rdelimiter, '\0' }}, .wd = -1, {.flags.rwd = true} } } };
143 }
144 _Istream_Squote & quote( _Istream_Swidth & f, const char Ldelimiter = '"', const char Rdelimiter = '\0' ) {
145 f.delimiters[0] = Ldelimiter; f.delimiters[1] = Rdelimiter; f.delimiters[2] = '\0';
146 return (_Istream_Squote &)f;
147 }
 // incl / excl: record the scanset; flags.inex is false for incl and true for excl.
148 _Istream_Sstr incl( const char scanset[], string & s ) { return (_Istream_Sstr)@{ .s = s, { {.scanset = scanset}, .wd = -1, {.flags.inex = false} } }; }
149 _Istream_Sstr & incl( const char scanset[], _Istream_Swidth & f ) { f.scanset = scanset; f.flags.inex = false; return (_Istream_Sstr &)f; }
150 _Istream_Sstr excl( const char scanset[], string & s ) { return (_Istream_Sstr)@{ .s = s, { {.scanset = scanset}, .wd = -1, {.flags.inex = true} } }; }
151 _Istream_Sstr & excl( const char scanset[], _Istream_Swidth & f ) { f.scanset = scanset; f.flags.inex = true; return (_Istream_Sstr &)f; }
 // ignore: raises flags.ignore on a new or existing manipulator of each kind.
152 _Istream_Sstr ignore( string & s ) { return (_Istream_Sstr)@{ .s = s, { {.scanset = 0p}, .wd = -1, {.flags.ignore = true} } }; }
153 _Istream_Sstr & ignore( _Istream_Swidth & f ) { f.flags.ignore = true; return (_Istream_Sstr &)f; }
154 _Istream_Squote & ignore( _Istream_Squote & f ) { f.sstr.flags.ignore = true; return (_Istream_Squote &)f; }
155 _Istream_Sstr & ignore( _Istream_Sstr & f ) { f.flags.ignore = true; return (_Istream_Sstr &)f; }
156} // distribution
157
// Input through a string manipulator from any stream type that satisfies basic_istream.
158forall( istype & | basic_istream( istype ) ) {
159 istype & ?|?( istype & is, _Istream_Squote f );
160 istype & ?|?( istype & is, _Istream_Sstr f );
 // A width-only manipulator is read by viewing it as an _Istream_Sstr and using the operator above.
161 static inline istype & ?|?( istype & is, _Istream_Swidth f ) { return is | *(_Istream_Sstr *)&f; }
162}
163
164// Concatenation
// In-place append: ?+=? and append modify s and return nothing.
165void ?+=?( string & s, char c );
166PBOOST void ?+=?( string & s, string );
167void append( string & s, const string & s2, size_t maxlen ); // NOTE(review): presumably appends at most maxlen characters of s2 -- confirm in string.cfa
168void ?+=?( string & s, const char * cs );
169void append( string & s, const char * buffer, size_t bsize );
170
// Concatenation yielding a new string, for the combinations of string, char and const char * operands.
171string ?+?( string s, char c );
172string ?+?( char c, string s );
173PBOOST string ?+?( string s, string s2 );
174string ?+?( const char * cs, char c ); // not backwards compatible
175string ?+?( char c, const char * cs );
176string ?+?( const char * cs1 , const char * cs2 );
177string ?+?( const char * cs , string s );
178string ?+?( string s, const char * cs );
179string ?+?( char, char ); // not being called 8-(
180
// C-named append routines: strcat uses ?+=?, strncat forwards its limit to append; each returns the destination.
181static inline string & strcat( string & s1, const string & s2 ) { s1 += s2; return s1; }
182static inline string & strcat( string & s, const char * cs ) { s += cs; return s; }
183static inline string & strncat( string & s1, const string & s2, size_t maxlen ) { append( s1, s2, maxlen ); return s1; }
184static inline string & strncat( string & s, const char * buffer, size_t bsize ) { append( s, buffer, bsize ); return s; }
185
186// Repetition
187
188// Type `signed long long int` chosen for `factor` argument to achieve cost detente.
189// This way, the call `'a' * 3` gets the same safe conversion cost calling here as for
190// the built-in definition `int * int`.
191typedef signed long long int strmul_factor_t;
192
// NOTE(review): factor is a signed type; the result for zero or negative factors is defined in string.cfa.
193void ?*=?( string & s, strmul_factor_t factor );
194string ?*?( char c, strmul_factor_t factor ); // not backwards compatible
195PBOOST string ?*?( string s, strmul_factor_t factor );
196string ?*?( const char * cs, strmul_factor_t factor );
// Factor-first forms simply swap the operands and call the value-first forms above.
197static inline string ?*?( strmul_factor_t factor, char c ) { return c * factor; }
198PBOOST static inline string ?*?( strmul_factor_t factor, string s ) { return s * factor; }
199static inline string ?*?( strmul_factor_t factor, const char * cs ) { return cs * factor; }
200
201// Character access
// Two subscript forms distinguished by constness of s and by return type.
// NOTE(review): behaviour for index >= len( s ) is defined in string.cfa -- not visible here.
202char ?[?]( const string & s, size_t index );
203string ?[?]( string & s, size_t index ); // mutable length-1 slice of original
204//char codePointAt(const string & s, size_t index ); // to revisit under Unicode
205
206// Comparisons
// string vs string: every comparison forwards to the same operation on the two underlying string_res objects.
207static inline int strcmp( const string & s1, const string & s2 ) { return strcmp( *s1.inner, *s2.inner ); }
208int strncmp( const string & s1, const string & s2, size_t maxlen );
209static inline bool ?==?( const string & s1, const string & s2 ) { return *s1.inner == *s2.inner; }
210static inline bool ?!=?( const string & s1, const string & s2 ) { return *s1.inner != *s2.inner; }
211static inline bool ?>? ( const string & s1, const string & s2 ) { return *s1.inner > *s2.inner; }
212static inline bool ?>=?( const string & s1, const string & s2 ) { return *s1.inner >= *s2.inner; }
213static inline bool ?<=?( const string & s1, const string & s2 ) { return *s1.inner <= *s2.inner; }
214static inline bool ?<? ( const string & s1, const string & s2 ) { return *s1.inner < *s2.inner; }
215
// string vs C string: forwards to the string_res / const char * operations (content comparison is done by
// those overloads, declared in string_res.hfa).
216static inline int strcmp( const string & s1, const char * s2 ) { return strcmp( *s1.inner, s2 ); }
217int strncmp( const string & s1, const char * s2, size_t maxlen );
218static inline bool ?==?( const string & s1, const char * s2 ) { return *s1.inner == s2; }
219static inline bool ?!=?( const string & s1, const char * s2 ) { return *s1.inner != s2; }
220static inline bool ?>? ( const string & s1, const char * s2 ) { return *s1.inner > s2; }
221static inline bool ?>=?( const string & s1, const char * s2 ) { return *s1.inner >= s2; }
222static inline bool ?<=?( const string & s1, const char * s2 ) { return *s1.inner <= s2; }
223static inline bool ?<? ( const string & s1, const char * s2 ) { return *s1.inner < s2; }
224
// C string vs string: mirror image of the previous group, forwarding to the const char * / string_res operations.
225static inline int strcmp( const char * s1, const string & s2 ) { return strcmp( s1, *s2.inner ); }
226int strncmp( const char * s1, const string & s2, size_t maxlen );
227static inline bool ?==?( const char * s1, const string & s2 ) { return s1 == *s2.inner; }
228static inline bool ?!=?( const char * s1, const string & s2 ) { return s1 != *s2.inner; }
229static inline bool ?>? ( const char * s1, const string & s2 ) { return s1 > *s2.inner; }
230static inline bool ?>=?( const char * s1, const string & s2 ) { return s1 >= *s2.inner; }
231static inline bool ?<=?( const char * s1, const string & s2 ) { return s1 <= *s2.inner; }
232static inline bool ?<? ( const char * s1, const string & s2 ) { return s1 < *s2.inner; }
233
234// String search
235
// Search s for key and return a position as size_t.
// NOTE(review): the includes() wrappers in this header treat any result >= len( s ) as "not found";
// the exact not-found value is produced in string.cfa.
236size_t find( const string & s, char key );
237size_t find( const string & s, const char * key );
238size_t find( const string & s, const string & key );
239size_t find( const string & s, const char * key, size_t keysize );
240
// Same searches with an explicit start position. NOTE(review): presumably the search begins at index start -- confirm in string.cfa.
241size_t find( const string & s, size_t start, char key );
242size_t find( const string & s, size_t start, const string & key );
243size_t find( const string & s, size_t start, const char * key );
244size_t find( const string & s, size_t start, const char * key, size_t keysize );
245
// includes: true exactly when find() reports a position inside s, i.e. a result strictly below len( s ).
// Consequence of the unsigned comparison: for an empty s the result is always false, whatever the key
// (including an empty key), because no size_t value is below 0.
246static inline bool includes( const string & s, char key ) { return find( s, key ) < len( s ); }
247static inline bool includes( const string & s, const char * key ) { return find( s, key ) < len( s ); }
248static inline bool includes( const string & s, const string & key ) { return find( s, key ) < len( s ); }
249static inline bool includes( const string & s, const char * key, size_t keysize ){ return find( s, key, keysize ) < len( s ); }
250
// Prefix test for a string, C-string, or (buffer, size) prefix.
251bool startsWith( const string & s, const string & prefix );
252bool startsWith( const string & s, const char * prefix );
253bool startsWith( const string & s, const char * prefix, size_t prefixsize );
254
// Suffix test for a string, C-string, or (buffer, size) suffix.
255bool endsWith( const string & s, const string & suffix );
256bool endsWith( const string & s, const char * suffix );
257bool endsWith( const string & s, const char * suffix, size_t suffixsize );
258
259// Slicing
// Slicing via the call operator. start and len are signed.
// NOTE(review): the meaning of negative or out-of-range values is defined in string.cfa.
// Every const overload below casts away const and reuses the mutable overload (the reason for the FIX ME tags).
260string ?()( string & s, ssize_t start, ssize_t len );
261static inline string ?()( const string & s, ssize_t start, ssize_t len ) { string & w = (string &)s; return w( start, len ); } // FIX ME
262string ?()( string & s, ssize_t start );
263static inline string ?()( const string & s, ssize_t start ) { string & w = (string &)s; return w( start ); } // FIX ME
// Slice by match: find() locates m, the slice has the length of m (1 for a char), and `share is applied to the result.
// NOTE(review): nothing here checks for a failed find(); the slice operator then receives the not-found position.
264static inline string ?()( string & s, char m ) { return s( find( s, m ), 1 )`share; }
265static inline string ?()( const string & s, char m ) { string & w = (string &)s; return w( find( s, m ), 1 )`share; } // FIX ME
266static inline string ?()( string & s, const char * m ) { return s( find( s, m ), len( m ) )`share; }
267static inline string ?()( const string & s, const char * m ) { string & w = (string &)s; return w( find( s, m ), len( m ) )`share; } // FIX ME
268static inline string ?()( string & s, const string & m ) { return s( find( s, m ), len( m ) )`share; }
269static inline string ?()( const string & s, const string & m ) { string & w = (string &)s; return w( find( s, m ), len( m ) )`share; } // FIX ME
270
// A charclass is a single pointer to a charclass_res; it is used as the mask argument of include / exclude.
271struct charclass {
272 charclass_res * inner;
273};
274
// Default construction, copy construction and assignment are deleted (= void).
275void ?{}( charclass & ) = void;
276void ?{}( charclass &, charclass ) = void;
277charclass ?=?( charclass &, charclass ) = void;
278
// A charclass can only be built from a set of characters given as a string, C string, or (buffer, size).
279void ?{}( charclass &, const string & chars );
280void ?{}( charclass &, const char * chars );
281void ?{}( charclass &, const char * chars, size_t charssize );
282void ^?{}( charclass & ); // destructor
283
// include, size_t form: the first declaration does the work; the wrappers build a temporary string and/or
// charclass from C-string arguments and forward to it.
// NOTE(review): the result is presumably the length of the leading run of s whose characters are in mask -- confirm in string.cfa.
284size_t include( const string & s, const charclass & mask );
285static inline size_t include( const string & s, const char * mask ) { return include( s, (charclass){ mask } ); }
286static inline size_t include( const string & s, const string & mask ) { return include( s, (charclass){ mask } ); }
287static inline size_t include( const char * cs, const charclass & mask ) { return include( (string){ cs }, mask ); }
288static inline size_t include( const char * cs, const char * mask ) { return include( (string){ cs }, (charclass){ mask } ); }
289static inline size_t include( const char * cs, const string & mask ) { return include( (string){ cs }, (charclass){ mask } ); }
290
// include, string form (same name, selected by return type): the slice of s starting at 0 whose length is the
// size_t result above. The inner include() call is used as a slice length.
291static inline string include( const string & s, const charclass & mask ) { return s( 0, include( s, mask ) ); }
292static inline string include( const string & s, const char * mask ) { return s( 0, include( s, (charclass){ mask } ) ); }
293static inline string include( const string & s, const string & mask ) { return s( 0, include( s, (charclass){ mask } ) ); }
294static inline string include( const char * cs, const charclass & mask ) { const string s = cs; return s( 0, include( s, mask ) ); }
295static inline string include( const char * cs, const char * mask ) { const string s = cs; return s( 0, include( s, (charclass){ mask } ) ); }
296static inline string include( const char * cs, const string & mask ) { const string s = cs; return s( 0, include( s, (charclass){ mask } ) ); }
297
// exclude, size_t form: the first declaration does the work; the wrappers build a temporary string and/or
// charclass from C-string arguments and forward to it.
// NOTE(review): the result is presumably the length of the leading run of s whose characters are NOT in mask -- confirm in string.cfa.
298size_t exclude( const string & s, const charclass & mask );
299static inline size_t exclude( const string & s, const char * mask ) { return exclude( s, (charclass){ mask } ); }
300static inline size_t exclude( const string & s, const string & mask ) { return exclude( s, (charclass){ mask } ); }
301static inline size_t exclude( const char * cs, const charclass & mask ) { return exclude( (string){ cs }, mask ); }
302static inline size_t exclude( const char * cs, const string & mask ) { return exclude( (string){ cs }, (charclass){ mask } ); }
303static inline size_t exclude( const char * cs, const char * mask ) { return exclude( (string){ cs }, (charclass){ mask } ); }
304
// exclude, string form (same name, selected by return type): the slice of s starting at 0 whose length is the
// size_t result above.
305static inline string exclude( const string & s, const charclass & mask ) { return s( 0, exclude( s, mask ) ); }
306static inline string exclude( const string & s, const char * mask ) { return s( 0, exclude( s, (charclass){ mask } ) ); }
307static inline string exclude( const string & s, const string & mask ) { return s( 0, exclude( s, (charclass){ mask } ) ); }
308static inline string exclude( const char * cs, const charclass & mask ) { const string s = cs; return s( 0, exclude( s, mask ) ); }
309static inline string exclude( const char * cs, const string & mask ) { const string s = cs; return s( 0, exclude( s, (charclass){ mask } ) ); }
310static inline string exclude( const char * cs, const char * mask ) { const string s = cs; return s( 0, exclude( s, (charclass){ mask } ) ); }
311
// include driven by a predicate function instead of a charclass; size_t and string forms as for the charclass versions.
312size_t include( const string & s, int (* f)( int ) ); // for C character-class functions, e.g., isdigit
313static inline size_t include( const char * cs, int (* f)( int ) ) { return include( (string){ cs }, f ); }
314static inline string include( const string & s, int (* f)( int ) ) { return s( 0, include( s, f ) ); }
315static inline string include( const char * cs, int (* f)( int ) ) { const string s = cs; return s( 0, include( s, f ) ); }
316
// bool (*)( char ) predicates are passed on by casting the pointer to int (*)( int ).
// NOTE(review): ISO C leaves a call through a function pointer of incompatible type undefined (C11 6.3.2.3p8);
// this relies on bool/char and int being passed and returned compatibly on the supported ABIs -- confirm.
317static inline size_t include( const string & s, bool (* f)( char ) ) { return include( s, (int (*)( int ))f ); }
318static inline size_t include( const char * cs, bool (* f)( char ) ) { return include( (string){ cs }, f ); }
319static inline string include( const string & s, bool (* f)( char ) ) { return s( 0, include( s, f ) ); }
320static inline string include( const char * cs, bool (* f)( char ) ) { const string s = cs; return s( 0, include( s, f ) ); }
321
// exclude driven by a predicate function instead of a charclass; size_t and string forms as for the charclass versions.
322size_t exclude( const string & s, int (* f)( int ) ); // for C character-class functions, e.g., isdigit
323static inline size_t exclude( const char * cs, int (* f)( int ) ) { return exclude( (string){ cs }, f ); }
324static inline string exclude( const string & s, int (* f)( int ) ) { return s( 0, exclude( s, f ) ); }
325static inline string exclude( const char * cs, int (* f)( int ) ) { const string s = cs; return s( 0, exclude( s, f ) ); }
326
// bool (*)( char ) predicates are passed on by casting the pointer to int (*)( int ).
// NOTE(review): ISO C leaves a call through a function pointer of incompatible type undefined (C11 6.3.2.3p8);
// this relies on bool/char and int being passed and returned compatibly on the supported ABIs -- confirm.
327static inline size_t exclude( const string & s, bool (* f)( char ) ) { return exclude( s, (int (*)( int ))f ); }
328static inline size_t exclude( const char * cs, bool (* f)( char ) ) { return exclude( (string){ cs }, f ); }
329static inline string exclude( const string & s, bool (* f)( char ) ) { return s( 0, exclude( s, f ) ); }
330static inline string exclude( const char * cs, bool (* f)( char ) ) { const string s = cs; return s( 0, exclude( s, f ) ); }
331
// replace: the all-string declaration does the work and returns a new string (s is const).
// NOTE(review): whether one or every occurrence of from is replaced is decided in string.cfa.
332string replace( const string & s, const string & from, const string & to );
// Wrappers: each const char * argument is wrapped in a temporary string before forwarding.
333static inline string replace( const char * cs, const char * from, const char * to ) { return replace( (string){ cs }, (string){ from }, (string){ to } ); }
334static inline string replace( const string & s, const char * from, const char * to ) { return replace( s, (string){ from }, (string){ to } ); }
335static inline string replace( const string & s, const char * from, const string & to ) { return replace( s, (string){ from }, to ); }
// replace with a string `from` and a C-string `to`: `to` is wrapped in a temporary string and the call is
// forwarded to the all-string replace. `from` is only read, so it is taken by const reference like every other
// string parameter of the replace family; this also lets callers pass a const string.
static inline string replace( const string & s, const string & from, const char * to ) { return replace( s, from, (string){ to } ); }
337
// translate: returns a new string produced from s and the function f.
// NOTE(review): presumably f is applied to each character -- confirm in string.cfa.
338string translate( const string & s, int (* f)( int ) ); // for C character-class functions, e.g., isdigit
339static inline string translate( const char * cs, int (* f)( int ) ) { return translate( (string){ cs }, f ); }
340
// bool (*)( char ) functions are passed on by casting the pointer to int (*)( int ).
// NOTE(review): ISO C leaves a call through a function pointer of incompatible type undefined (C11 6.3.2.3p8) -- confirm this is safe on the supported ABIs.
341static inline string translate( const string & s, bool (* f)( char ) ) { return translate( s, (int (*)( int ))f ); }
342static inline string translate( const char * cs, bool (* f)( char ) ) { return translate( (string){ cs }, f ); }
343
// PBOOST is private to this header: it is undefined again for every includer, except a translation unit that
// defines _COMPILING_STRING_CFA_ before including it (NOTE(review): presumably string.cfa, which needs the macro for its definitions).
344#ifndef _COMPILING_STRING_CFA_
345#undef PBOOST
346#endif
Note: See TracBrowser for help on using the repository browser.