//
// Cforall Version 1.0.0 Copyright (C) 2016 University of Waterloo
//
// The contents of this file are covered under the licence agreement in the
// file "LICENCE" distributed with Cforall.
//
// string_res -- variable-length, mutable run of text, with resource semantics
//
// Author           : Michael L. Brooks
// Created On       : Fri Sep 03 11:00:00 2021
// Last Modified By : Peter A. Buhr
// Last Modified On : Sat Aug 12 15:45:47 2023
// Update Count     : 2
//
| 15 | |
---|
| 16 | #pragma once |
---|
| 17 | |
---|
| 18 | #include <fstream.hfa> |
---|
[4e8df745] | 19 | #include <string.h> // e.g. strlen |
---|
[f450f2f] | 20 | |
---|
| 21 | |
---|
//######################### HandleNode #########################
// private

// Only pointers to VbyteHeap appear in this header, so a forward declaration suffices.
struct VbyteHeap;

// Handle onto one byte string: where its bytes are, how many there are, and the
// links that tie this handle to neighbouring handles and to a VbyteHeap.
struct HandleNode {
	HandleNode * flink;  // forward link (next handle)
	HandleNode * blink;  // backward link (previous handle)
	VbyteHeap * ulink;  // upward link (to a heap)

	char * s;  // pointer to the byte string
	unsigned int lnth;  // length of the byte string
}; // HandleNode
| 35 | |
---|
// Debugging hooks onto the string heap.  Going by the names only (definitions are
// not in this header): obtain a heap, then query its bytes in use, the bytes
// still available before a garbage collection, and its start address.
VbyteHeap * DEBUG_string_heap();
size_t DEBUG_string_bytes_in_heap( VbyteHeap * heap );
size_t DEBUG_string_bytes_avail_until_gc( VbyteHeap * heap );
const char * DEBUG_string_heap_start( VbyteHeap * heap );

// Tuning hook: sets the string heap's liveness threshold to val.
// NOTE(review): the valid range and meaning of val are defined by the implementation -- confirm there.
void TUNING_set_string_heap_liveness_threshold( double val );
[f450f2f] | 42 | |
---|
//######################### String #########################

// A dynamically-sized string.
// Handle holds the text pointer and length plus the links to neighbouring handles.
// The shareEditSet_* fields chain this string to other string_res objects.
// NOTE(review): presumably the chain is the set of strings that share edits with this one
// (compare the SHARE_EDITS initialization mode) -- confirm against the implementation.
struct string_res {
	HandleNode Handle;  // chars, start, end, global neighbours
	bool shareEditSet_owns_ulink;
	string_res * shareEditSet_prev;
	string_res * shareEditSet_next;
};
| 52 | |
---|
| 53 | |
---|
//######################### charclass_res #########################

// A character class, represented by a string_res holding its characters.
struct charclass_res {
	string_res chars;
};
| 59 | |
---|
// Default construction, copy construction and assignment are deleted (= void).
void ?{}( charclass_res & ) = void;
void ?{}( charclass_res &, charclass_res ) = void;
charclass_res ?=?( charclass_res &, charclass_res ) = void;

// A charclass_res is built from its member characters: a string_res, a C string,
// or a buffer with an explicit length.
void ?{}( charclass_res &, const string_res & chars );
void ?{}( charclass_res &, const char * chars );
void ?{}( charclass_res &, const char * chars, size_t charssize );

// Destructor.
void ^?{}( charclass_res & );
| 67 | |
---|
| 68 | |
---|
//######################### String #########################

// Getters
size_t size( const string_res & s );

// Constructors, Assignment Operators, Destructor
void ?{}( string_res & s );  // empty string
void ?{}( string_res & s, const char * buffer, size_t bsize );  // copy specific length from buffer
// Construct from a NUL-terminated C string.  The length is measured with strlen and
// the (buffer, length) constructor does the work; rhs must therefore be non-null.
static inline void ?{}( string_res & s, const char * rhs ) {
	?{}( s, rhs, strlen( rhs ) );
}
[f450f2f] | 80 | |
---|
// Plain copy construction is deleted (= void): constructing one string_res from
// another requires an explicit StrResInitMode.
void ?{}( string_res & s, const string_res & s2 ) = void;
void ?{}( string_res & s, string_res & s2 ) = void;

// Mode selector for constructing a string_res from another string_res.
enum StrResInitMode { COPY_VALUE, SHARE_EDITS };

// Construct s from the part of src delimited by start and end, under the given mode.
// The whole-string overload passes start = 0 and end = size(src).
void ?{}( string_res & s, const string_res & src, StrResInitMode, size_t start, size_t end );
// Whole-string form of the mode constructor: delegates with the range 0 .. size(src).
static inline void ?{}( string_res & s, const string_res & src, StrResInitMode mode ) {
	(s){ src, mode, 0, size( src ) };
}
| 89 | |
---|
// Assign to s by copying bsize characters from buffer; returns a string_res reference.
string_res & assign( string_res & s, const char * buffer, size_t bsize );
// Assign from a NUL-terminated C string: measure it with strlen, then hand the
// (buffer, length) pair to assign.  other must be non-null.
static inline string_res & ?=?( string_res & s, const char * other ) {
	size_t len = strlen( other );
	return assign( s, other, len );
}
// Assignment from another string_res (const and non-const source) and from a single character.
string_res & ?=?( string_res & s, const string_res & other );
string_res & ?=?( string_res & s, string_res & other );
string_res & ?=?( string_res & s, char other );

// Destructor.
void ^?{}( string_res & s );
| 99 | |
---|
// IO Operator
// Each direction comes as a pair: one overload returning the stream and one returning void.
ofstream & ?|?( ofstream & out, const string_res & s );
void ?|?( ofstream & out, const string_res & s );
ifstream & ?|?( ifstream & in, string_res & s );
void ?|?( ifstream & in, string_res & this );
| 105 | |
---|
// Input manipulator for string_res: the destination string plus the fields of
// _Istream_str_base, which are embedded through the inline member.
struct _Istream_Rstr {
	string_res * s;  // string that receives the input
	inline _Istream_str_base;
}; // _Istream_Rstr
| 110 | |
---|
// Manipulator builders for reading into a string_res.  Overloads taking a string_res
// create a new _Istream_Rstr; overloads taking an _Istream_Rstr update it and return it.
static inline {
	// read width does not include null terminator
	_Istream_Rstr wdi( unsigned int rwd, string_res & s ) {
		return (_Istream_Rstr)@{ &s, {{0p}, rwd, {.flags.rwd : true}} };
	}

	// Delimiter-based read: stores the delimiter (default '\n') and sets the delimiter and inex flags.
	// NOTE(review): the -1 occupies the position wdi fills with the read width -- presumably "no width given"; confirm.
	_Istream_Rstr getline( string_res & s, const char delimiter = '\n' ) {
		return (_Istream_Rstr)@{ &s, {{.delimiter : { delimiter, '\0' } }, -1, {.flags.delimiter : true, .flags.inex : true}} };
	}

	// Same settings applied to an existing manipulator.
	_Istream_Rstr & getline( _Istream_Rstr & fmt, const char delimiter = '\n' ) {
		fmt.delimiter[0] = delimiter;
		fmt.delimiter[1] = '\0';
		fmt.flags.delimiter = true;
		fmt.flags.inex = true;
		return fmt;
	}

	// Scanset read with the inex flag cleared.
	_Istream_Rstr incl( const char scanset[], string_res & s ) {
		return (_Istream_Rstr)@{ &s, {{scanset}, -1, {.flags.inex : false}} };
	}

	_Istream_Rstr & incl( const char scanset[], _Istream_Rstr & fmt ) {
		fmt.scanset = scanset;
		fmt.flags.inex = false;
		return fmt;
	}

	// Scanset read with the inex flag set.
	_Istream_Rstr excl( const char scanset[], string_res & s ) {
		return (_Istream_Rstr)@{ &s, {{scanset}, -1, {.flags.inex : true}} };
	}

	_Istream_Rstr & excl( const char scanset[], _Istream_Rstr & fmt ) {
		fmt.scanset = scanset;
		fmt.flags.inex = true;
		return fmt;
	}

	// Sets the ignore flag.
	_Istream_Rstr ignore( string_res & s ) {
		return (_Istream_Rstr)@{ &s, {{0p}, -1, {.flags.ignore : true}} };
	}

	_Istream_Rstr & ignore( _Istream_Rstr & fmt ) {
		fmt.flags.ignore = true;
		return fmt;
	}
} // distribution
// Read from an input stream as directed by an _Istream_Rstr manipulator
// (stream-returning and void-returning forms).
ifstream & ?|?( ifstream & is, _Istream_Rstr f );
void ?|?( ifstream & is, _Istream_Rstr t );
[f450f2f] | 129 | |
---|
// Concatenation
void append( string_res & s, const char * buffer, size_t bsize );  // append bsize characters from buffer
void ?+=?( string_res & s, char other );  // append a character
void ?+=?( string_res & s, const string_res & s2 );  // append-concatenate to first string
// Append a NUL-terminated C string: measure it with strlen and forward the
// (buffer, length) pair to append.  other must be non-null.
static inline void ?+=?( string_res & s, const char * other ) {
	size_t len = strlen( other );
	append( s, other, len );
}
[f450f2f] | 137 | |
---|
// Character access
// NOTE(review): assignAt takes s as const although its name suggests it writes a character
// into the string -- confirm this is intended before relying on const here.
void assignAt( const string_res & s, size_t index, char val );
char ?[?]( const string_res & s, size_t index );  // Mike changed to ret by val from Sunjay's ref, to match Peter's
//char codePointAt(const string_res &s, size_t index); // revisit under Unicode
| 142 | |
---|
// Comparisons
// The same set (cmp plus the six relational operators) is declared for each operand pairing.
// NOTE(review): cmp presumably follows the strcmp sign convention -- confirm in the implementation.

// string_res with string_res
int cmp( const string_res &, const string_res & );
bool ?==?( const string_res &, const string_res & );
bool ?!=?( const string_res &, const string_res & );
bool ?>?( const string_res &, const string_res & );
bool ?>=?( const string_res &, const string_res & );
bool ?<=?( const string_res &, const string_res & );
bool ?<?( const string_res &, const string_res & );

// string_res with C string
int cmp( const string_res &, const char * );
bool ?==?( const string_res &, const char * );
bool ?!=?( const string_res &, const char * );
bool ?>?( const string_res &, const char * );
bool ?>=?( const string_res &, const char * );
bool ?<=?( const string_res &, const char * );
bool ?<?( const string_res &, const char * );

// C string with string_res
int cmp( const char *, const string_res & );
bool ?==?( const char *, const string_res & );
bool ?!=?( const char *, const string_res & );
bool ?>?( const char *, const string_res & );
bool ?>=?( const char *, const string_res & );
bool ?<=?( const char *, const string_res & );
bool ?<?( const char *, const string_res & );
[f450f2f] | 167 | |
---|
// String search
bool contains( const string_res & s, char ch );  // single character

// find: the search key may be a character, a string_res, a C string, or a buffer with explicit length.
int find( const string_res & s, char search );
int find( const string_res & s, const string_res & search );
int find( const string_res & s, const char * search );
int find( const string_res & s, const char * search, size_t searchsize );

// findFrom: same key forms as find, with an additional fromPos argument.
int findFrom( const string_res & s, size_t fromPos, char search );
int findFrom( const string_res & s, size_t fromPos, const string_res & search );
int findFrom( const string_res & s, size_t fromPos, const char * search );
int findFrom( const string_res & s, size_t fromPos, const char * search, size_t searchsize );

bool includes( const string_res & s, const string_res & search );
bool includes( const string_res & s, const char * search );
bool includes( const string_res & s, const char * search, size_t searchsize );

bool startsWith( const string_res & s, const string_res & prefix );
bool startsWith( const string_res & s, const char * prefix );
bool startsWith( const string_res & s, const char * prefix, size_t prefixsize );

bool endsWith( const string_res & s, const string_res & suffix );
bool endsWith( const string_res & s, const char * suffix );
bool endsWith( const string_res & s, const char * suffix, size_t suffixsize );

// Character-class scans over s using mask.
int include( const string_res & s, const charclass_res & mask );
int exclude( const string_res & s, const charclass_res & mask );
| 195 | |
---|
// Modifiers
// Padding at the start or the end of s; each comes with and without an explicit padding character.
void padStart( string_res & s, size_t n );
void padStart( string_res & s, size_t n, char padding );
void padEnd( string_res & s, size_t n );
void padEnd( string_res & s, size_t n, char padding );
| 201 | |
---|