ustring.h 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447
  1. /*************************************************************************/
  2. /* ustring.h */
  3. /*************************************************************************/
  4. /* This file is part of: */
  5. /* GODOT ENGINE */
  6. /* https://godotengine.org */
  7. /*************************************************************************/
  8. /* Copyright (c) 2007-2021 Juan Linietsky, Ariel Manzur. */
  9. /* Copyright (c) 2014-2021 Godot Engine contributors (cf. AUTHORS.md). */
  10. /* */
  11. /* Permission is hereby granted, free of charge, to any person obtaining */
  12. /* a copy of this software and associated documentation files (the */
  13. /* "Software"), to deal in the Software without restriction, including */
  14. /* without limitation the rights to use, copy, modify, merge, publish, */
  15. /* distribute, sublicense, and/or sell copies of the Software, and to */
  16. /* permit persons to whom the Software is furnished to do so, subject to */
  17. /* the following conditions: */
  18. /* */
  19. /* The above copyright notice and this permission notice shall be */
  20. /* included in all copies or substantial portions of the Software. */
  21. /* */
  22. /* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, */
  23. /* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF */
  24. /* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.*/
  25. /* IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY */
  26. /* CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, */
  27. /* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE */
  28. /* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */
  29. /*************************************************************************/
  30. #ifndef USTRING_H
  31. #define USTRING_H
  32. #include "core/array.h"
  33. #include "core/cowdata.h"
  34. #include "core/typedefs.h"
  35. #include "core/vector.h"
  36. template <class T>
  37. class CharProxy {
  38. friend class CharString;
  39. friend class String;
  40. const int _index;
  41. CowData<T> &_cowdata;
  42. static const T _null = 0;
  43. _FORCE_INLINE_ CharProxy(const int &p_index, CowData<T> &cowdata) :
  44. _index(p_index),
  45. _cowdata(cowdata) {}
  46. public:
  47. _FORCE_INLINE_ operator T() const {
  48. if (unlikely(_index == _cowdata.size()))
  49. return _null;
  50. return _cowdata.get(_index);
  51. }
  52. _FORCE_INLINE_ const T *operator&() const {
  53. return _cowdata.ptr() + _index;
  54. }
  55. _FORCE_INLINE_ void operator=(const T &other) const {
  56. _cowdata.set(_index, other);
  57. }
  58. _FORCE_INLINE_ void operator=(const CharProxy<T> &other) const {
  59. _cowdata.set(_index, other.operator T());
  60. }
  61. };
  62. class CharString {
  63. CowData<char> _cowdata;
  64. static const char _null;
  65. public:
  66. _FORCE_INLINE_ char *ptrw() { return _cowdata.ptrw(); }
  67. _FORCE_INLINE_ const char *ptr() const { return _cowdata.ptr(); }
  68. _FORCE_INLINE_ int size() const { return _cowdata.size(); }
  69. Error resize(int p_size) { return _cowdata.resize(p_size); }
  70. _FORCE_INLINE_ char get(int p_index) const { return _cowdata.get(p_index); }
  71. _FORCE_INLINE_ void set(int p_index, const char &p_elem) { _cowdata.set(p_index, p_elem); }
  72. _FORCE_INLINE_ const char &operator[](int p_index) const {
  73. if (unlikely(p_index == _cowdata.size()))
  74. return _null;
  75. return _cowdata.get(p_index);
  76. }
  77. _FORCE_INLINE_ CharProxy<char> operator[](int p_index) { return CharProxy<char>(p_index, _cowdata); }
  78. _FORCE_INLINE_ CharString() {}
  79. _FORCE_INLINE_ CharString(const CharString &p_str) { _cowdata._ref(p_str._cowdata); }
  80. _FORCE_INLINE_ CharString operator=(const CharString &p_str) {
  81. _cowdata._ref(p_str._cowdata);
  82. return *this;
  83. }
  84. _FORCE_INLINE_ CharString(const char *p_cstr) { copy_from(p_cstr); }
  85. CharString &operator=(const char *p_cstr);
  86. bool operator<(const CharString &p_right) const;
  87. CharString &operator+=(char p_char);
  88. int length() const { return size() ? size() - 1 : 0; }
  89. const char *get_data() const;
  90. operator const char *() const { return get_data(); };
  91. protected:
  92. void copy_from(const char *p_cstr);
  93. };
  // Character type used by String and StrRange.
  typedef wchar_t CharType;

  /**
   * Plain pointer/length pair describing a run of CharType characters.
   *
   * The struct only stores the two values it is given; it defines no
   * destructor and never touches the memory c_str points to.
   */
  struct StrRange {
      const CharType *c_str; // first character of the range (NULL by default)
      int len; // number of characters in the range (0 by default)

      StrRange(const CharType *p_c_str = NULL, int p_len = 0) :
              c_str(p_c_str),
              len(p_len) {}
  };
  103. class String {
  104. CowData<CharType> _cowdata;
  105. static const CharType _null;
  106. void copy_from(const char *p_cstr);
  107. void copy_from(const CharType *p_cstr, const int p_clip_to = -1);
  108. void copy_from(const CharType &p_char);
  109. void copy_from_unchecked(const CharType *p_char, const int p_length);
  110. bool _base_is_subsequence_of(const String &p_string, bool case_insensitive) const;
  111. int _count(const String &p_string, int p_from, int p_to, bool p_case_insensitive) const;
  112. public:
  113. enum {
  114. npos = -1 ///<for "some" compatibility with std::string (npos is a huge value in std::string)
  115. };
  116. _FORCE_INLINE_ CharType *ptrw() { return _cowdata.ptrw(); }
  117. _FORCE_INLINE_ const CharType *ptr() const { return _cowdata.ptr(); }
  118. void remove(int p_index) { _cowdata.remove(p_index); }
  119. _FORCE_INLINE_ void clear() { resize(0); }
  120. _FORCE_INLINE_ CharType get(int p_index) const { return _cowdata.get(p_index); }
  121. _FORCE_INLINE_ void set(int p_index, const CharType &p_elem) { _cowdata.set(p_index, p_elem); }
  122. _FORCE_INLINE_ int size() const { return _cowdata.size(); }
  123. Error resize(int p_size) { return _cowdata.resize(p_size); }
  124. _FORCE_INLINE_ const CharType &operator[](int p_index) const {
  125. if (unlikely(p_index == _cowdata.size()))
  126. return _null;
  127. return _cowdata.get(p_index);
  128. }
  129. _FORCE_INLINE_ CharProxy<CharType> operator[](int p_index) { return CharProxy<CharType>(p_index, _cowdata); }
  130. bool operator==(const String &p_str) const;
  131. bool operator!=(const String &p_str) const;
  132. String operator+(const String &p_str) const;
  133. //String operator+(CharType p_char) const;
  134. String &operator+=(const String &);
  135. String &operator+=(CharType p_char);
  136. String &operator+=(const char *p_str);
  137. String &operator+=(const CharType *p_str);
  138. /* Compatibility Operators */
  139. void operator=(const char *p_str);
  140. void operator=(const CharType *p_str);
  141. bool operator==(const char *p_str) const;
  142. bool operator==(const CharType *p_str) const;
  143. bool operator==(const StrRange &p_str_range) const;
  144. bool operator!=(const char *p_str) const;
  145. bool operator!=(const CharType *p_str) const;
  146. bool operator<(const CharType *p_str) const;
  147. bool operator<(const char *p_str) const;
  148. bool operator<(const String &p_str) const;
  149. bool operator<=(const String &p_str) const;
  150. signed char casecmp_to(const String &p_str) const;
  151. signed char nocasecmp_to(const String &p_str) const;
  152. signed char naturalnocasecmp_to(const String &p_str) const;
  153. const CharType *c_str() const;
  154. /* standard size stuff */
  155. _FORCE_INLINE_ int length() const {
  156. int s = size();
  157. return s ? (s - 1) : 0; // length does not include zero
  158. }
  159. /* complex helpers */
  160. String substr(int p_from, int p_chars = -1) const;
  161. int find(const String &p_str, int p_from = 0) const; ///< return <0 if failed
  162. int find(const char *p_str, int p_from = 0) const; ///< return <0 if failed
  163. int find_char(const CharType &p_char, int p_from = 0) const; ///< return <0 if failed
  164. int find_last(const String &p_str) const; ///< return <0 if failed
  165. int findn(const String &p_str, int p_from = 0) const; ///< return <0 if failed, case insensitive
  166. int rfind(const String &p_str, int p_from = -1) const; ///< return <0 if failed
  167. int rfindn(const String &p_str, int p_from = -1) const; ///< return <0 if failed, case insensitive
  168. int findmk(const Vector<String> &p_keys, int p_from = 0, int *r_key = NULL) const; ///< return <0 if failed
  169. bool match(const String &p_wildcard) const;
  170. bool matchn(const String &p_wildcard) const;
  171. bool begins_with(const String &p_string) const;
  172. bool begins_with(const char *p_string) const;
  173. bool ends_with(const String &p_string) const;
  174. bool is_enclosed_in(const String &p_string) const;
  175. bool is_subsequence_of(const String &p_string) const;
  176. bool is_subsequence_ofi(const String &p_string) const;
  177. bool is_quoted() const;
  178. Vector<String> bigrams() const;
  179. float similarity(const String &p_string) const;
  180. String format(const Variant &values, String placeholder = "{_}") const;
  181. String replace_first(const String &p_key, const String &p_with) const;
  182. String replace(const String &p_key, const String &p_with) const;
  183. String replace(const char *p_key, const char *p_with) const;
  184. String replacen(const String &p_key, const String &p_with) const;
  185. String repeat(int p_count) const;
  186. String insert(int p_at_pos, const String &p_string) const;
  187. String pad_decimals(int p_digits) const;
  188. String pad_zeros(int p_digits) const;
  189. String trim_prefix(const String &p_prefix) const;
  190. String trim_suffix(const String &p_suffix) const;
  191. String lpad(int min_length, const String &character = " ") const;
  192. String rpad(int min_length, const String &character = " ") const;
  193. String sprintf(const Array &values, bool *error) const;
  194. String quote(String quotechar = "\"") const;
  195. String unquote() const;
  196. static String num(double p_num, int p_decimals = -1);
  197. static String num_scientific(double p_num);
  198. static String num_real(double p_num);
  199. static String num_int64(int64_t p_num, int base = 10, bool capitalize_hex = false);
  200. static String num_uint64(uint64_t p_num, int base = 10, bool capitalize_hex = false);
  201. static String chr(CharType p_char);
  202. static String md5(const uint8_t *p_md5);
  203. static String hex_encode_buffer(const uint8_t *p_buffer, int p_len);
  204. bool is_numeric() const;
  205. double to_double() const;
  206. float to_float() const;
  207. int hex_to_int(bool p_with_prefix = true) const;
  208. int to_int() const;
  209. int64_t hex_to_int64(bool p_with_prefix = true) const;
  210. int64_t bin_to_int64(bool p_with_prefix = true) const;
  211. int64_t to_int64() const;
  212. static int to_int(const char *p_str, int p_len = -1);
  213. static double to_double(const char *p_str);
  214. static double to_double(const CharType *p_str, const CharType **r_end = NULL);
  215. static int64_t to_int(const CharType *p_str, int p_len = -1);
  216. String capitalize() const;
  217. String camelcase_to_underscore(bool lowercase = true) const;
  218. int get_slice_count(String p_splitter) const;
  219. String get_slice(String p_splitter, int p_slice) const;
  220. String get_slicec(CharType p_splitter, int p_slice) const;
  221. Vector<String> split(const String &p_splitter, bool p_allow_empty = true, int p_maxsplit = 0) const;
  222. Vector<String> rsplit(const String &p_splitter, bool p_allow_empty = true, int p_maxsplit = 0) const;
  223. Vector<String> split_spaces() const;
  224. Vector<float> split_floats(const String &p_splitter, bool p_allow_empty = true) const;
  225. Vector<float> split_floats_mk(const Vector<String> &p_splitters, bool p_allow_empty = true) const;
  226. Vector<int> split_ints(const String &p_splitter, bool p_allow_empty = true) const;
  227. Vector<int> split_ints_mk(const Vector<String> &p_splitters, bool p_allow_empty = true) const;
  228. String join(Vector<String> parts);
  229. static CharType char_uppercase(CharType p_char);
  230. static CharType char_lowercase(CharType p_char);
  231. String to_upper() const;
  232. String to_lower() const;
  233. int count(const String &p_string, int p_from = 0, int p_to = 0) const;
  234. int countn(const String &p_string, int p_from = 0, int p_to = 0) const;
  235. String left(int p_pos) const;
  236. String right(int p_pos) const;
  237. String dedent() const;
  238. String strip_edges(bool left = true, bool right = true) const;
  239. String strip_escapes() const;
  240. String lstrip(const String &p_chars) const;
  241. String rstrip(const String &p_chars) const;
  242. String get_extension() const;
  243. String get_basename() const;
  244. String plus_file(const String &p_file) const;
  245. CharType ord_at(int p_idx) const;
  246. void erase(int p_pos, int p_chars);
  247. CharString ascii(bool p_allow_extended = false) const;
  248. CharString utf8() const;
  249. bool parse_utf8(const char *p_utf8, int p_len = -1); //return true on error
  250. static String utf8(const char *p_utf8, int p_len = -1);
  251. static uint32_t hash(const CharType *p_cstr, int p_len); /* hash the string */
  252. static uint32_t hash(const CharType *p_cstr); /* hash the string */
  253. static uint32_t hash(const char *p_cstr, int p_len); /* hash the string */
  254. static uint32_t hash(const char *p_cstr); /* hash the string */
  255. uint32_t hash() const; /* hash the string */
  256. uint64_t hash64() const; /* hash the string */
  257. String md5_text() const;
  258. String sha1_text() const;
  259. String sha256_text() const;
  260. Vector<uint8_t> md5_buffer() const;
  261. Vector<uint8_t> sha1_buffer() const;
  262. Vector<uint8_t> sha256_buffer() const;
  263. _FORCE_INLINE_ bool empty() const { return length() == 0; }
  264. // path functions
  265. bool is_abs_path() const;
  266. bool is_rel_path() const;
  267. bool is_resource_file() const;
  268. String path_to(const String &p_path) const;
  269. String path_to_file(const String &p_path) const;
  270. String get_base_dir() const;
  271. String get_file() const;
  272. static String humanize_size(uint64_t p_size);
  273. String simplify_path() const;
  274. String xml_escape(bool p_escape_quotes = false) const;
  275. String xml_unescape() const;
  276. String http_escape() const;
  277. String http_unescape() const;
  278. String c_escape() const;
  279. String c_escape_multiline() const;
  280. String c_unescape() const;
  281. String json_escape() const;
  282. String word_wrap(int p_chars_per_line) const;
  283. Error parse_url(String &r_scheme, String &r_host, int &r_port, String &r_path) const;
  284. String percent_encode() const;
  285. String percent_decode() const;
  286. String property_name_encode() const;
  287. // node functions
  288. static const String invalid_node_name_characters;
  289. String validate_node_name() const;
  290. bool is_valid_identifier() const;
  291. bool is_valid_integer() const;
  292. bool is_valid_float() const;
  293. bool is_valid_hex_number(bool p_with_prefix) const;
  294. bool is_valid_html_color() const;
  295. bool is_valid_ip_address() const;
  296. bool is_valid_filename() const;
  297. /**
  298. * The constructors must not depend on other overloads
  299. */
  300. /* String(CharType p_char);*/
  301. _FORCE_INLINE_ String() {}
  302. _FORCE_INLINE_ String(const String &p_str) { _cowdata._ref(p_str._cowdata); }
  303. String operator=(const String &p_str) {
  304. _cowdata._ref(p_str._cowdata);
  305. return *this;
  306. }
  307. String(const char *p_str);
  308. String(const CharType *p_str, int p_clip_to_len = -1);
  309. String(const StrRange &p_range);
  310. };
  // Free-function operators whose left operand is not a String
  // (a C string or a single CharType). Declared here, defined elsewhere.
  311. bool operator==(const char *p_chr, const String &p_str);
  312. String operator+(const char *p_chr, const String &p_str);
  313. String operator+(CharType p_chr, const String &p_str);
  // Number-to-String helpers; only the prototypes are visible in this header.
  // Presumably: itos = signed integer, uitos = unsigned integer, rtos = real
  // number -- confirm against the definitions.
  314. String itos(int64_t p_val);
  315. String uitos(uint64_t p_val);
  316. String rtos(double p_val);
  317. String rtoss(double p_val); // scientific version
  318. struct NoCaseComparator {
  319. bool operator()(const String &p_a, const String &p_b) const {
  320. return p_a.nocasecmp_to(p_b) < 0;
  321. }
  322. };
  323. struct NaturalNoCaseComparator {
  324. bool operator()(const String &p_a, const String &p_b) const {
  325. return p_a.naturalnocasecmp_to(p_b) < 0;
  326. }
  327. };
  328. template <typename L, typename R>
  329. _FORCE_INLINE_ bool is_str_less(const L *l_ptr, const R *r_ptr) {
  330. while (true) {
  331. if (*l_ptr == 0 && *r_ptr == 0)
  332. return false;
  333. else if (*l_ptr == 0)
  334. return true;
  335. else if (*r_ptr == 0)
  336. return false;
  337. else if (*l_ptr < *r_ptr)
  338. return true;
  339. else if (*l_ptr > *r_ptr)
  340. return false;
  341. l_ptr++;
  342. r_ptr++;
  343. }
  344. }
  345. /* end of namespace */
  // Translation helpers for tool builds. Which definitions are active depends
  // on whether TOOLS_ENABLED is defined.
  346. // tool translate
  347. #ifdef TOOLS_ENABLED
  // With TOOLS_ENABLED, TTR is a function; it is only declared in this header.
  348. // gets parsed
  349. String TTR(const String &);
  // TTRC expands to its argument unchanged.
  350. // use for C strings
  351. #define TTRC(m_value) (m_value)
  // TTRGET forwards its argument to TTR().
  352. // use to avoid parsing (for use later with C strings)
  353. #define TTRGET(m_value) TTR(m_value)
  354. #else
  // Without TOOLS_ENABLED, TTR(...) discards its argument and expands to a
  // default-constructed String, while TTRC and TTRGET expand to the argument
  // itself.
  355. #define TTR(m_value) (String())
  356. #define TTRC(m_value) (m_value)
  357. #define TTRGET(m_value) (m_value)
  358. #endif
  // Declared outside the TOOLS_ENABLED conditional, so RTR is available in
  // every build configuration. Only the prototype is visible here.
  359. // tool or regular translate
  360. String RTR(const String &);
  // Text helpers; only the prototypes are visible in this header.
  // is_symbol: presumably reports whether `c` is a symbol character -- confirm
  // against the definition.
  361. bool is_symbol(CharType c);
  // select_word: takes a string and a column and writes a begin/end pair
  // through r_beg / r_end; the bool result presumably signals whether a word
  // was found -- confirm against the definition.
  362. bool select_word(const String &p_s, int p_col, int &r_beg, int &r_end);
  363. #endif // USTRING_H