P4C
The P4 Compiler
All Classes Namespaces Functions Variables Typedefs Enumerations Enumerator Friends Modules Pages
cstring.h
1/*
2Copyright 2013-present Barefoot Networks, Inc.
3
4Licensed under the Apache License, Version 2.0 (the "License");
5you may not use this file except in compliance with the License.
6You may obtain a copy of the License at
7
8 http://www.apache.org/licenses/LICENSE-2.0
9
10Unless required by applicable law or agreed to in writing, software
11distributed under the License is distributed on an "AS IS" BASIS,
12WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13See the License for the specific language governing permissions and
14limitations under the License.
15*/
16
17#ifndef LIB_CSTRING_H_
18#define LIB_CSTRING_H_
19
20#include <cstddef>
21#include <cstring>
22#include <functional>
23#include <sstream>
24#include <string>
25#include <string_view>
26
27#include "hash.h"
28
74class cstring;
75
76namespace P4::literals {
77inline cstring operator""_cs(const char *str, std::size_t len);
78}
79
80class cstring {
81 const char *str = nullptr;
82
83 public:
84 cstring() = default;
85
86 cstring(std::nullptr_t) {} // NOLINT(runtime/explicit)
87
88 // Copy and assignment from other kinds of strings
89
90 // Owner of string is someone else, but we know size of string.
91 // Do not use if possible, this is linear time operation if string
92 // not exists in table, because the underlying string must be copied.
93 cstring(const char *string, std::size_t length) { // NOLINT(runtime/explicit)
94 if (string != nullptr) {
95 construct_from_shared(string, length);
96 }
97 }
98
99 // Owner of string is someone else, we do not know size of string.
100 // Do not use if possible, this is linear time operation if string
101 // not exists in table, because the underlying string must be copied.
102 explicit cstring(const char *string) {
103 if (string != nullptr) {
104 construct_from_shared(string, std::strlen(string));
105 }
106 }
107
108 // construct cstring from std::string. Do not use if possible, this is linear
109 // time operation if string not exists in table, because the underlying string must be copied.
110 cstring(const std::string &string) { // NOLINT(runtime/explicit)
111 construct_from_shared(string.data(), string.length());
112 }
113
114 // construct cstring from std::string_view. Do not use if possible, this is linear
115 // time operation if string not exists in table, because the underlying string must be copied.
116 explicit cstring(std::string_view string) { // NOLINT(runtime/explicit)
117 construct_from_shared(string.data(), string.length());
118 }
119
120 // TODO (DanilLutsenko): Make special case for r-value std::string?
121
122 // Just helper function, for lazies, who do not like to write .str()
123 // Do not use it, implicit std::string construction with implicit overhead
124 // TODO (DanilLutsenko): Remove it?
125 cstring(const std::stringstream &stream) // NOLINT(runtime/explicit)
126 : cstring(stream.str()) {}
127
128 // TODO (DanilLutsenko): Construct from StringRef?
129
130 // String was created outside and cstring is unique owner of it.
131 // cstring will control lifetime of passed object
132 static cstring own(const char *string, std::size_t length) {
133 if (string == nullptr) {
134 return {};
135 }
136
137 cstring result;
138 result.construct_from_unique(string, length);
139 return result;
140 }
141
142 // construct cstring wrapper for literal
143 template <typename T, std::size_t N,
144 typename = typename std::enable_if<std::is_same<T, const char>::value>::type>
145 static cstring literal(T (&string)[N]) { // NOLINT(runtime/explicit)
146 cstring result;
147 result.construct_from_literal(string, N - 1 /* String length without null terminator */);
148 return result;
149 }
150
152 static bool is_cached(std::string_view s);
154 static cstring get_cached(std::string_view s);
155
156 private:
157 // passed string is shared, we not unique owners
158 void construct_from_shared(const char *string, std::size_t length);
159
160 // we are unique owners of passed string
161 void construct_from_unique(const char *string, std::size_t length);
162
163 // string is literal
164 void construct_from_literal(const char *string, std::size_t length);
165
166 friend cstring P4::literals::operator""_cs(const char *str, std::size_t len);
167
168 public:
172 cstring escapeJson() const;
173
174 template <typename Iter>
175 cstring(Iter begin, Iter end) {
176 *this = std::string(begin, end);
177 }
178
179 char get(unsigned index) const { return (index < size()) ? str[index] : 0; }
180 const char *c_str() const { return str; }
181 operator const char *() const { return str; }
182
183 std::string string() const { return str ? std::string(str) : std::string(""); }
184 explicit operator std::string() const { return string(); }
185
186 std::string_view string_view() const {
187 return str ? std::string_view(str) : std::string_view("");
188 }
189 explicit operator std::string_view() const { return string_view(); }
190
191 // Size tests. Constant time except for size(), which is linear time.
192 size_t size() const {
193 // TODO (DanilLutsenko): We store size of string in table on object construction,
194 // compiler cannot optimize strlen if str not points to string literal.
195 // Probably better fetch size from table or store it to cstring on construction.
196 return str ? strlen(str) : 0;
197 }
198 bool isNull() const { return str == nullptr; }
199 bool isNullOrEmpty() const { return str == nullptr ? true : str[0] == 0; }
200
201 // iterate over characters
202 const char *begin() const { return str; }
203 const char *end() const { return str ? str + strlen(str) : str; }
204
205 // Search for characters. Linear time.
206 const char *find(int c) const { return str ? strchr(str, c) : nullptr; }
207 const char *findlast(int c) const { return str ? strrchr(str, c) : str; }
208
209 // Search for substring
210 const char *find(const char *s) const { return str ? strstr(str, s) : nullptr; }
211
212 // Equality tests with other cstrings. Constant time.
213 bool operator==(cstring a) const { return str == a.str; }
214 bool operator!=(cstring a) const { return str != a.str; }
215
216 bool operator==(std::nullptr_t) const { return str == nullptr; }
217 bool operator!=(std::nullptr_t) const { return str != nullptr; }
218
219 // Other comparisons and tests. Linear time.
220 bool operator==(const char *a) const { return str ? a && !strcmp(str, a) : !a; }
221 bool operator!=(const char *a) const { return str ? !a || !!strcmp(str, a) : !!a; }
222 bool operator<(cstring a) const { return *this < a.str; }
223 bool operator<(const char *a) const { return str ? a && strcmp(str, a) < 0 : !!a; }
224 bool operator<=(cstring a) const { return *this <= a.str; }
225 bool operator<=(const char *a) const { return str ? a && strcmp(str, a) <= 0 : true; }
226 bool operator>(cstring a) const { return *this > a.str; }
227 bool operator>(const char *a) const { return str ? !a || strcmp(str, a) > 0 : false; }
228 bool operator>=(cstring a) const { return *this >= a.str; }
229 bool operator>=(const char *a) const { return str ? !a || strcmp(str, a) >= 0 : !a; }
230 bool operator==(std::string_view a) const { return str ? a.compare(str) == 0 : a.empty(); }
231 bool operator!=(std::string_view a) const { return str ? a.compare(str) != 0 : !a.empty(); }
232
233 bool operator==(const std::string &a) const { return *this == a.c_str(); }
234 bool operator!=(const std::string &a) const { return *this != a.c_str(); }
235 bool operator<(const std::string &a) const { return *this < a.c_str(); }
236 bool operator<=(const std::string &a) const { return *this <= a.c_str(); }
237 bool operator>(const std::string &a) const { return *this > a.c_str(); }
238 bool operator>=(const std::string &a) const { return *this >= a.c_str(); }
239
240 bool startsWith(std::string_view prefix) const;
241 bool endsWith(std::string_view suffix) const;
242
243 // FIXME (DanilLutsenko): We really need mutations for immutable string?
244 // Probably better do transformation in std::string-like containter and
245 // then place result to cstring if needed.
246
247 // Mutation operations. These are linear time and always trigger a copy,
248 // since the underlying string is immutable. (Note that this is true even
249 // for substr(); cstrings are always null-terminated, so a copy is
250 // required.)
251 cstring operator+=(cstring a);
252 cstring operator+=(const char *a);
253 cstring operator+=(std::string a);
254 cstring operator+=(char a);
255
256 cstring before(const char *at) const;
257 cstring substr(size_t start) const {
258 return (start >= size()) ? cstring::literal("") : substr(start, size() - start);
259 }
260 cstring substr(size_t start, size_t length) const;
261 cstring replace(char find, char replace) const;
262 cstring replace(std::string_view find, std::string_view replace) const;
263 cstring exceptLast(size_t count) { return substr(0, size() - count); }
264
265 // trim leading and trailing whitespace (or other)
266 cstring trim(const char *ws = " \t\r\n") const;
267
268 // Useful singletons.
269 static cstring newline;
270 static cstring empty;
271
272 // Static factory functions.
273 template <typename T>
274 static cstring to_cstring(const T &t) {
275 std::stringstream ss;
276 ss << t;
277 return cstring(ss.str());
278 }
279 template <typename Iterator>
280 static cstring join(Iterator begin, Iterator end, const char *delim = ", ") {
281 std::stringstream ss;
282 for (auto current = begin; current != end; ++current) {
283 if (begin != current) ss << delim;
284 ss << *current;
285 }
286 return cstring(ss.str());
287 }
288 template <class T>
289 static cstring make_unique(const T &inuse, cstring base, char sep = '.');
290 template <class T>
291 static cstring make_unique(const T &inuse, cstring base, int &counter, char sep = '.');
292
295 static size_t cache_size(size_t &count);
296
298 cstring toUpper() const;
300 cstring toLower() const;
302 cstring capitalize() const;
304 cstring indent(size_t amount) const;
305};
306
307inline bool operator==(const char *a, cstring b) { return b == a; }
308inline bool operator!=(const char *a, cstring b) { return b != a; }
309inline bool operator==(const std::string &a, cstring b) { return b == a; }
310inline bool operator!=(const std::string &a, cstring b) { return b != a; }
311
312inline std::string operator+(cstring a, cstring b) {
313 std::string rv(a);
314 rv += b;
315 return rv;
316}
317inline std::string operator+(cstring a, const char *b) {
318 std::string rv(a);
319 rv += b;
320 return rv;
321}
322inline std::string operator+(cstring a, const std::string &b) {
323 std::string rv(a);
324 rv += b;
325 return rv;
326}
327inline std::string operator+(cstring a, char b) {
328 std::string rv(a);
329 rv += b;
330 return rv;
331}
332inline std::string operator+(const char *a, cstring b) {
333 std::string rv(a);
334 rv += b;
335 return rv;
336}
337inline std::string operator+(std::string a, cstring b) {
338 a += b;
339 return a;
340}
341inline std::string operator+(char a, cstring b) {
342 std::string rv(1, a);
343 rv += b;
344 return rv;
345}
346
347inline cstring cstring::operator+=(cstring a) {
348 *this = *this + a;
349 return *this;
350}
351inline cstring cstring::operator+=(const char *a) {
352 *this = *this + a;
353 return *this;
354}
355inline cstring cstring::operator+=(std::string a) {
356 *this = *this + a;
357 return *this;
358}
359inline cstring cstring::operator+=(char a) {
360 *this = *this + a;
361 return *this;
362}
363
364inline std::string &operator+=(std::string &a, cstring b) {
365 a.append(b.c_str());
366 return a;
367}
368
369template <class T>
370cstring cstring::make_unique(const T &inuse, cstring base, int &counter, char sep) {
371 if (!inuse.count(base)) return base;
372
373 char suffix[12];
374 cstring rv = base;
375 do {
376 snprintf(suffix, sizeof(suffix) / sizeof(suffix[0]), "%c%d", sep, counter++);
377 rv = base + suffix;
378 } while (inuse.count(rv));
379 return rv;
380}
381
382template <class T>
383cstring cstring::make_unique(const T &inuse, cstring base, char sep) {
384 int counter = 0;
385 return make_unique(inuse, base, counter, sep);
386}
387
388inline std::ostream &operator<<(std::ostream &out, cstring s) {
389 return out << (s ? s.c_str() : "<null>");
390}
391
394namespace P4::literals {
395
399inline cstring operator""_cs(const char *str, std::size_t len) {
400 cstring result;
401 result.construct_from_literal(str, len);
402 return result;
403}
404} // namespace P4::literals
405
406namespace std {
407template <>
408struct hash<cstring> {
409 std::size_t operator()(const cstring &c) const {
410 // cstrings are internalized, therefore their addresses are unique; we
411 // can just use their address to produce hash.
412 return Util::Hash{}(c.c_str());
413 }
414};
415} // namespace std
416
417namespace Util {
418template <>
420 size_t operator()(const cstring &c) const { return Util::Hash{}(c.c_str()); }
421};
422
423} // namespace Util
424
425#endif /* LIB_CSTRING_H_ */
Definition cstring.h:80
cstring toLower() const
Convert the cstring to lowercase.
Definition cstring.cpp:314
cstring escapeJson() const
Definition cstring.cpp:269
cstring toUpper() const
Convert the cstring to uppercase.
Definition cstring.cpp:308
static size_t cache_size(size_t &count)
Definition cstring.cpp:211
static cstring get_cached(std::string_view s)
Definition cstring.cpp:188
cstring capitalize() const
Capitalize the first symbol.
Definition cstring.cpp:320
cstring indent(size_t amount) const
Append this many spaces after each newline (and before the first string).
Definition cstring.cpp:262
static bool is_cached(std::string_view s)
Definition cstring.cpp:186
Definition cstring.h:76
STL namespace.
Definition hash.h:125
Definition hash.h:123