source: libcfa/src/collections/string.hfa@ 2572add

Last change on this file since 2572add was ed5023d1, checked in by Peter A. Buhr <pabuhr@…>, 9 months ago

fix substring error being outside of string, simplify comparison operations, start refactoring string search operations

  • Property mode set to 100644
File size: 12.4 KB
Line 
1//
2// Cforall Version 1.0.0 Copyright (C) 2016 University of Waterloo
3//
4// The contents of this file are covered under the licence agreement in the
5// file "LICENCE" distributed with Cforall.
6//
7// string -- variable-length, mutable run of text, with value semantics
8//
9// Author : Michael L. Brooks
10// Created On : Fri Sep 03 11:00:00 2021
11// Last Modified By : Peter A. Buhr
12// Last Modified On : Sat Apr 5 15:16:23 2025
13// Update Count : 180
14//
15
16#pragma once
17
18#include <fstream.hfa>
19
20
21// in string_res.hfa
22struct string_res;
23struct charclass_res;
24
// Handle type for a string.  Its only member is a pointer to a string_res, a type that is
// merely forward-declared in this header (the comment above places it in string_res.hfa).
25struct string {
26 string_res * inner; // underlying resource; opaque from this header
27};
28
29// Getters
// Getter for C strings: number of characters before the terminating '\0', as computed by
// the C library strlen.  cs must point to a NUL-terminated array; strlen does not accept
// a null pointer.
static inline size_t len( const char * cs ) {
	return strlen( cs );
} // len
// Length getter for a string; only declared here, the definition is not in this header.
size_t len( const string & s );

// C-library-style spelling of the same query: simply forwards to len( s ).
static inline size_t strlen( const string & s ) {
	return len( s );
} // strlen
33
34// RAII, assignment
// Constructors (?{}): each overload initializes s from the remaining arguments.
35void ?{}( string & s ); // empty string
36void ?{}( string & s, const string & s2 ); // from another string
// NOTE(review): presumably takes at most maxlen characters of s2 -- confirm in the implementation.
37void ?{}( string & s, const string & s2, size_t maxlen );
38void ?{}( string & s, string & s2 ); // overload for a non-const source string
39
40void ?{}( string & s, char ); // from a single character
41void ?{}( string & s, const char * c ); // copy from string literal (NUL-terminated)
42void ?{}( string & s, const char * c, size_t size ); // copy specific length from buffer
43
// Construction from numeric values, one overload per type.
// NOTE(review): the text format produced for each type is decided by the implementation, not visible here.
44void ?{}( string & s, ssize_t rhs );
45void ?{}( string & s, size_t rhs );
46void ?{}( string & s, double rhs );
47void ?{}( string & s, long double rhs );
48void ?{}( string & s, double _Complex rhs );
49void ?{}( string & s, long double _Complex rhs );
50
51// string str( ssize_t rhs );
52// string str( size_t rhs );
53// string str( double rhs );
54// string str( long double rhs );
55// string str( double _Complex rhs );
56// string str( long double _Complex rhs );
57
// Assignment operators.  Every overload returns a string reference, so by signature the
// result can be used in a larger expression.
58string & ?=?( string & s, const string & c );
59string & ?=?( string & s, string & c ); // overload for a non-const source string
60string & ?=?( string & s, const char * c ); // copy from "literal"
61string & ?=?( string & s, char c ); // copy from 'l'
// Assignment with an explicit count n.
// NOTE(review): presumably n bounds how many characters of c are copied -- confirm in the implementation.
62string & assign( string & s, const string & c, size_t n );
63string & assign( string & s, const char * c, size_t n );
64
// C-library-style copy functions layered on string assignment.  Each one performs the
// assignment (operator = for strcpy, assign() for strncpy) and then returns its first
// argument by reference.
static inline {
	// Source is a C string.
	string & strcpy( string & s, const char * c ) {
		s = c;
		return s;
	}
	string & strncpy( string & s, const char * c, size_t n ) {
		assign( s, c, n );
		return s;
	}

	// Source is another string.
	string & strcpy( string & s, const string & c ) {
		s = c;
		return s;
	}
	string & strncpy( string & s, const string & c, size_t n ) {
		assign( s, c, n );
		return s;
	}
} // distribution
69
// Assignment from numeric values, one overload per type; each returns a string reference.
// NOTE(review): the text format produced for each type is decided by the implementation, not visible here.
70string & ?=?( string & s, ssize_t rhs );
71string & ?=?( string & s, size_t rhs );
72string & ?=?( string & s, double rhs );
73string & ?=?( string & s, long double rhs );
74string & ?=?( string & s, double _Complex rhs );
75string & ?=?( string & s, long double _Complex rhs );
76
// Destructor (^?{}) for string.
77void ^?{}( string & s );
78
79// Alternate construction: request shared edits
// Wrapper holding a pointer to a string.  It is produced by the `share postfix operator
// and consumed by a dedicated string constructor.
// NOTE(review): what "shared edits" means at run time is defined by the implementation -- confirm there.
80struct string_Share {
81 string * s;
82};
83string_Share ?`share( string & s ); // postfix operator, written s`share
84void ?{}( string & s, string_Share src ); // construct s from a string_Share
85
86// IO Operator
// Stream operators for string on ofstream / ifstream.
87ofstream & ?|?( ofstream & out, const string & s ); // output; returns the stream
88void ?|?( ofstream & out, const string & s ); // output; void-returning overload
89ifstream & ?|?( ifstream & in, string & s ); // input into the non-const s; returns the stream
90
// Output manipulators for string, all of type _Ostream_Manip(string).
// The by-value forms build a new manipulator with a positional initializer.
// NOTE(review): judging from the by-reference overloads below, the positions are value, wd (width),
// pc (precision), a format-code character, and a flags member (.all / .flags) -- confirm
// against the declaration of _Ostream_Manip, which is not in this header.
91static inline {
	// bin / oct / hex: format codes 'b' / 'o' / 'x', second position 1, third 0, all flag bits 0.
92 _Ostream_Manip(string) bin( string s ) { return (_Ostream_Manip(string))@{ s, 1, 0, 'b', { .all = 0 } }; }
93 _Ostream_Manip(string) oct( string s ) { return (_Ostream_Manip(string))@{ s, 1, 0, 'o', { .all = 0 } }; }
94 _Ostream_Manip(string) hex( string s ) { return (_Ostream_Manip(string))@{ s, 1, 0, 'x', { .all = 0 } }; }
	// wd( w, s ): format code 's' with w in the second position, all flag bits 0.
95 _Ostream_Manip(string) wd( unsigned int w, string s ) { return (_Ostream_Manip(string))@{ s, w, 0, 's', { .all = 0 } }; }
	// wd( w, pc, s ): as above plus pc in the third position and flags.pc set.
96 _Ostream_Manip(string) wd( unsigned int w, unsigned int pc, string s ) { return (_Ostream_Manip(string))@{ s, w, pc, 's', { .flags.pc = true } }; }
	// By-reference forms: update an existing manipulator in place and return it.
97 _Ostream_Manip(string) & wd( unsigned int w, _Ostream_Manip(string) & fmt ) { fmt.wd = w; return fmt; }
98 _Ostream_Manip(string) & wd( unsigned int w, unsigned int pc, _Ostream_Manip(string) & fmt ) { fmt.wd = w; fmt.pc = pc; fmt.flags.pc = true; return fmt; }
99 _Ostream_Manip(string) & left( _Ostream_Manip(string) & fmt ) { fmt.flags.left = true; return fmt; } // sets flags.left
100 _Ostream_Manip(string) & nobase( _Ostream_Manip(string) & fmt ) { fmt.flags.nobsdp = true; return fmt; } // sets flags.nobsdp
101} // distribution
// Output operators accepting a string manipulator: stream-returning and void-returning overloads.
102ofstream & ?|?( ofstream & os, _Ostream_Manip(string) f );
103void ?|?( ofstream & os, _Ostream_Manip(string) );
104
// Input-manipulator records for string.
// _Istream_Swidth and _Istream_Sstr declare the same members in the same order: a reference
// to the target string followed by an inlined _Istream_str_base (declared elsewhere).  The
// inline manipulator functions later in this header cast references between the two types.
105struct _Istream_Swidth {
106 string & s; // string that receives the input
107 inline _Istream_str_base;
108}; // _Istream_Swidth
109
// Record for quoted input: wraps an _Istream_Swidth as member sstr.
110struct _Istream_Squoted {
111 _Istream_Swidth sstr;
112}; // _Istream_Squoted
113
114struct _Istream_Sstr {
115 string & s; // string that receives the input
116 inline _Istream_str_base;
117// _Istream_Swidth sstr;
118}; // _Istream_Sstr
119
// Input manipulators for string.  The forms taking a string build a new record targeting
// that string; the forms taking an existing manipulator by reference update its fields and
// return the same object viewed as the result type.
120static inline {
121 // read width does not include null terminator
	// wdi: width manipulator with wd = rwd, flags.rwd set, and a null scanset.
122 _Istream_Swidth wdi( unsigned int rwd, string & s ) { return (_Istream_Swidth)@{ .s = s, { {.scanset = 0p}, .wd = rwd, {.flags.rwd = true} } }; }
	// getline: delimiters = { delimiter, '\0' }, wd = -1, flags.delimiter set.
123 _Istream_Sstr getline( string & s, const char delimiter = '\n' ) {
124// return (_Istream_Sstr)@{ { .s = s, { {.delimiters = { delimiter, '\0' } }, .wd = -1, {.flags.delimiter = true} } } };
125 return (_Istream_Sstr)@{ .s = s, { {.delimiters = { delimiter, '\0' } }, .wd = -1, {.flags.delimiter = true} } };
126 }
	// getline on an existing width manipulator: stores the delimiter, sets flags.delimiter.
127 _Istream_Sstr & getline( _Istream_Swidth & f, const char delimiter = '\n' ) {
128 f.delimiters[0] = delimiter; f.delimiters[1] = '\0'; f.flags.delimiter = true; return (_Istream_Sstr &)f;
129 }
	// quoted: delimiters = { Ldelimiter, Rdelimiter, '\0' }, wd = -1, flags.rwd set.
	// NOTE(review): how a '\0' Rdelimiter (the default) is interpreted is decided by the reader, not visible here.
130 _Istream_Squoted quoted( string & s, const char Ldelimiter = '\"', const char Rdelimiter = '\0' ) {
131 return (_Istream_Squoted)@{ { .s = s, { {.delimiters = { Ldelimiter, Rdelimiter, '\0' }}, .wd = -1, {.flags.rwd = true} } } };
132 }
	// quoted on an existing width manipulator: stores the three delimiter slots only.
133 _Istream_Squoted & quoted( _Istream_Swidth & f, const char Ldelimiter = '"', const char Rdelimiter = '\0' ) {
134 f.delimiters[0] = Ldelimiter; f.delimiters[1] = Rdelimiter; f.delimiters[2] = '\0';
135 return (_Istream_Squoted &)f;
136 }
	// incl / excl: store the scanset; flags.inex is false for incl and true for excl.
137// _Istream_Sstr incl( const char scanset[], string & s ) { return (_Istream_Sstr)@{ { .s = s, { {.scanset = scanset}, .wd = -1, {.flags.inex = false} } } }; }
138 _Istream_Sstr incl( const char scanset[], string & s ) { return (_Istream_Sstr)@{ .s = s, { {.scanset = scanset}, .wd = -1, {.flags.inex = false} } }; }
139 _Istream_Sstr & incl( const char scanset[], _Istream_Swidth & f ) { f.scanset = scanset; f.flags.inex = false; return (_Istream_Sstr &)f; }
140// _Istream_Sstr excl( const char scanset[], string & s ) { return (_Istream_Sstr)@{ { .s = s, { {.scanset = scanset}, .wd = -1, {.flags.inex = true} } } }; }
141 _Istream_Sstr excl( const char scanset[], string & s ) { return (_Istream_Sstr)@{ .s = s, { {.scanset = scanset}, .wd = -1, {.flags.inex = true} } }; }
142 _Istream_Sstr & excl( const char scanset[], _Istream_Swidth & f ) { f.scanset = scanset; f.flags.inex = true; return (_Istream_Sstr &)f; }
	// ignore: sets flags.ignore; overloads exist for each manipulator record type.
143// _Istream_Sstr ignore( string & s ) { return (_Istream_Sstr)@{ { .s = s, { {.scanset = 0p}, .wd = -1, {.flags.ignore = true} } } }; }
144 _Istream_Sstr ignore( string & s ) { return (_Istream_Sstr)@{ .s = s, { {.scanset = 0p}, .wd = -1, {.flags.ignore = true} } }; }
145 _Istream_Sstr & ignore( _Istream_Swidth & f ) { f.flags.ignore = true; return (_Istream_Sstr &)f; }
146 _Istream_Squoted & ignore( _Istream_Squoted & f ) { f.sstr.flags.ignore = true; return (_Istream_Squoted &)f; }
147// _Istream_Sstr & ignore( _Istream_Sstr & f ) { f.sstr.flags.ignore = true; return (_Istream_Sstr &)f; }
148 _Istream_Sstr & ignore( _Istream_Sstr & f ) { f.flags.ignore = true; return (_Istream_Sstr &)f; }
149} // distribution
// Input operators for the string manipulator records.  The quoted and general forms are
// only declared here.
ifstream & ?|?( ifstream & is, _Istream_Squoted f );
ifstream & ?|?( ifstream & is, _Istream_Sstr f );

// A width manipulator is read through the _Istream_Sstr operator above: f is viewed as an
// _Istream_Sstr through a pointer cast (both structs declare the same members).
static inline ifstream & ?|?( ifstream & is, _Istream_Swidth f ) {
	_Istream_Sstr * view = (_Istream_Sstr *)&f;
	return is | *view;
}
153
154// Concatenation
// Compound-assignment / append forms: operate on s through a non-const reference, return nothing.
155void ?+=?( string & s, char c );
156void ?+=?( string & s, const string & s2 );
// NOTE(review): presumably appends at most maxlen characters of s2 -- confirm in the implementation.
157void append( string & s, const string & s2, size_t maxlen );
158void ?+=?( string & s, const char * s2 );
159void append( string & s, const char * buffer, size_t bsize ); // buffer with an explicit size
160
// Binary + returning a new string by value, for combinations of string, const char * and char operands.
161string ?+?( const string & s, char c );
162string ?+?( char c, const string & s );
163string ?+?( const string & s, const string & s2 );
164string ?+?( const char * s, char c ); // not backwards compatible
165string ?+?( char c, const char * s );
166string ?+?( const char * c, const char * s );
167string ?+?( const char * c, const string & s );
168string ?+?( const string & s, const char * c );
169string ?+?( char, char ); // not being called 8-(
170
// C-library-style concatenation functions layered on the append operations.  Each one
// appends to s (operator += for strcat, append() for strncat) and returns s by reference.
static inline {
	string & strcat( string & s, const string & s2 ) {
		s += s2;
		return s;
	}
	string & strcat( string & s, const char * c ) {
		s += c;
		return s;
	}
	string & strncat( string & s, const string & s2, size_t maxlen ) {
		append( s, s2, maxlen );
		return s;
	}
	string & strncat( string & s, const char * buffer, size_t bsize ) {
		append( s, buffer, bsize );
		return s;
	}
} // distribution
175
176// Repetition
// Repetition operators taking a size_t factor.
void ?*=?( string & s, size_t factor );			// in-place form
string ?*?( char c, size_t factor );			// not backwards compatible
string ?*?( const string & s, size_t factor );

// Factor-on-the-left spelling: swaps the operands and calls the form declared just above.
static inline string ?*?( size_t factor, const string & s ) {
	return ?*?( s, factor );
}

string ?*?( const char * s, size_t factor );

// Factor-on-the-left spelling for a C-string operand.
static inline string ?*?( size_t factor, const char * s ) {
	return ?*?( s, factor );
}
183
184// Character access
// Subscript operators.  On a const string the result is a char by value; on a non-const
// string the result is a string.
185char ?[?]( const string & s, size_t index );
186string ?[?]( string & s, size_t index ); // mutable length-1 slice of original
187//char codePointAt(const string & s, size_t index ); // to revisit under Unicode
188
189// Comparisons
// Comparison between two strings: an int-returning strcmp plus the six relational operators.
// NOTE(review): strcmp presumably follows the C library sign convention -- confirm in the implementation.
190int strcmp ( const string &, const string & );
191bool ?==?( const string &, const string & );
192bool ?!=?( const string &, const string & );
193bool ?>? ( const string &, const string & );
194bool ?>=?( const string &, const string & );
195bool ?<=?( const string &, const string & );
196bool ?<? ( const string &, const string & );
197
// Same set with a C string as the right operand.
198int strcmp( const string &, const char * );
199bool ?==?( const string &, const char * );
200bool ?!=?( const string &, const char * );
201bool ?>? ( const string &, const char * );
202bool ?>=?( const string &, const char * );
203bool ?<=?( const string &, const char * );
204bool ?<? ( const string &, const char * );
205
// Same set with a C string as the left operand.
206int strcmp( const char *, const string & );
207bool ?==?( const char *, const string & );
208bool ?!=?( const char *, const string & );
209bool ?>? ( const char *, const string & );
210bool ?>=?( const char *, const string & );
211bool ?<=?( const char *, const string & );
212bool ?<? ( const char *, const string & );
213
214// String search
// Membership test for one character.
bool contains( const string & s, char ch );					// single character

// find: search s for a key given as a char, a C string, a string, or a buffer with an
// explicit size.  The result is an int.
// NOTE(review): the value returned when the key is absent is defined by the implementation, not visible here.
int find( const string & s, char key );
int find( const string & s, const char * key );
int find( const string & s, const string & key );
int find( const string & s, const char * key, size_t keysize );

// Overloads taking an additional start argument.
// NOTE(review): presumably the position at which the search begins -- confirm in the implementation.
int find( const string & s, size_t start, char key );
int find( const string & s, size_t start, const string & key );
int find( const string & s, size_t start, const char * key );
int find( const string & s, size_t start, const char * key, size_t keysize );

// Operator spelling of the two-argument find: s ^ key forwards to find( s, key ).
static inline {
	int ?^? ( const string & s, char key ) {
		return find( s, key );
	}
	int ?^? ( const string & s, const char * key ) {
		return find( s, key );
	}
	int ?^? ( const string & s, const string & key ) {
		return find( s, key );
	}
} // distribution
229
// Boolean predicates on s.  Each comes in three forms: second operand as a string, as a
// C string, and as a character buffer with an explicit size.
// NOTE(review): the exact meaning of "mask" for includes is defined by the implementation, not visible here.
230bool includes( const string & s, const string & mask );
231bool includes( const string & s, const char * mask );
232bool includes( const string & s, const char * mask, size_t masksize );
233
// Prefix tests.
234bool startsWith( const string & s, const string & prefix );
235bool startsWith( const string & s, const char * prefix );
236bool startsWith( const string & s, const char * prefix, size_t prefixsize );
237
// Suffix tests.
238bool endsWith( const string & s, const string & suffix );
239bool endsWith( const string & s, const char * suffix );
240bool endsWith( const string & s, const char * suffix, size_t suffixsize );
241
242// Slicing
// Slicing through the call operator: s( start, len ) and s( start ).  Both take signed
// (ssize_t) arguments and return a string.
// NOTE(review): the treatment of negative or out-of-range arguments is defined by the implementation.
243string ?()( string & s, ssize_t start, ssize_t len ); // TODO const?
244string ?()( string & s, ssize_t start );
// Slices selected by searching: the start is find( s, m ) and the length is 1 for a char or
// len( m ) otherwise; the resulting slice is passed through `share before being returned.
// NOTE(review): behaviour when m does not occur in s depends on what find returns in that case -- confirm.
245static inline string ?()( string & s, char m ) { return s( find( s, m ), 1 )`share; }
246static inline string ?()( string & s, const char * m ) { return s( find( s, m ), len( m ) )`share; }
247static inline string ?()( string & s, const string & m ) { return s( find( s, m ), len( m ) )`share; }
248
249// Modifiers
// Padding modifiers: operate on s through a non-const reference and return nothing.
// NOTE(review): n is presumably the target length, and the overloads without `padding`
// presumably use a default pad character -- confirm both in the implementation.
250void padStart( string & s, size_t n );
251void padStart( string & s, size_t n, char padding );
252void padEnd( string & s, size_t n );
253void padEnd( string & s, size_t n, char padding );
254
255
// Character-class handle.  Like string, its only member points at a resource type
// (charclass_res) that is merely forward-declared in this header.
256struct charclass {
257 charclass_res * inner;
258};
259
// Default construction, copy construction and assignment are declared "= void" (Cforall's
// marker for a deleted declaration), so a charclass must be built from characters via the
// constructors below.
260void ?{}( charclass & ) = void;
261void ?{}( charclass &, charclass ) = void;
262charclass ?=?( charclass &, charclass ) = void;
263
// Constructors from a set of characters given as a string, a C string, or a buffer with an
// explicit size; followed by the destructor.
264void ?{}( charclass &, const string & chars );
265void ?{}( charclass &, const char * chars );
266void ?{}( charclass &, const char * chars, size_t charssize );
267void ^?{}( charclass & );
268
// Queries of a string against a charclass; both return an int.
// NOTE(review): presumably the result measures the leading run of s made of characters in
// (include) or not in (exclude) mask -- confirm in the implementation.
269int include( const string & s, const charclass & mask );
270
271int exclude( const string & s, const charclass & mask );
272
273/*
274What to do with?
275StrRet include( string & s, const charclass & mask );
276StrRet exclude( string & s, const charclass & mask );
277*/
Note: See TracBrowser for help on using the repository browser.