Mercurial > minori
annotate src/core/strings.cc @ 298:dec4d3c9a909
scripts/win32/deploy_build: be more verbose with libs
| author | Paper <paper@paper.us.eu.org> |
|---|---|
| date | Mon, 13 May 2024 03:28:42 -0400 |
| parents | f6a756c19bfb |
| children | 1b5c04268d6a |
| rev | line source |
|---|---|
| 9 | 1 /** |
| 2 * strings.cpp: Useful functions for manipulating strings | |
| 3 **/ | |
| 4 #include "core/strings.h" | |
|
187
9613d72b097e
*: multiple performance improvements
Paper <mrpapersonic@gmail.com>
parents:
120
diff
changeset
|
5 #include "core/session.h" // locale |
|
9613d72b097e
*: multiple performance improvements
Paper <mrpapersonic@gmail.com>
parents:
120
diff
changeset
|
6 |
| 64 | 7 #include <QByteArray> |
|
101
c537996cf67b
*: multitude of config changes
Paper <mrpapersonic@gmail.com>
parents:
100
diff
changeset
|
8 #include <QDebug> |
| 258 | 9 #include <QLocale> |
| 64 | 10 #include <QString> |
|
274
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
11 #include <QTextDocument> |
|
187
9613d72b097e
*: multiple performance improvements
Paper <mrpapersonic@gmail.com>
parents:
120
diff
changeset
|
12 |
| 15 | 13 #include <algorithm> |
| 14 #include <cctype> | |
| 62 | 15 #include <codecvt> |
| 258 | 16 #include <iostream> |
|
273
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
17 #include <iomanip> |
| 9 | 18 #include <locale> |
| 19 #include <string> | |
| 258 | 20 #include <unordered_map> |
| 9 | 21 #include <vector> |
| 22 | |
| 264 | 23 #include "utf8proc.h" |
| 24 | |
| 9 | 25 namespace Strings { |
| 26 | |
|
99
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
27 /* ew */ |
| 9 | 28 std::string Implode(const std::vector<std::string>& vector, const std::string& delimiter) { |
| 29 if (vector.size() < 1) | |
| 250 | 30 return ""; |
|
187
9613d72b097e
*: multiple performance improvements
Paper <mrpapersonic@gmail.com>
parents:
120
diff
changeset
|
31 |
|
221
53211cb1e7f5
library: add initial library stuff
Paper <paper@paper.us.eu.org>
parents:
211
diff
changeset
|
32 std::string out; |
|
187
9613d72b097e
*: multiple performance improvements
Paper <mrpapersonic@gmail.com>
parents:
120
diff
changeset
|
33 |
| 9 | 34 for (unsigned long long i = 0; i < vector.size(); i++) { |
| 35 out.append(vector.at(i)); | |
| 36 if (i < vector.size() - 1) | |
| 37 out.append(delimiter); | |
| 38 } | |
|
187
9613d72b097e
*: multiple performance improvements
Paper <mrpapersonic@gmail.com>
parents:
120
diff
changeset
|
39 |
| 9 | 40 return out; |
| 41 } | |
| 42 | |
| 226 | 43 std::string Implode(const std::set<std::string>& set, const std::string& delimiter) { |
| 44 if (set.size() < 1) | |
| 250 | 45 return ""; |
| 226 | 46 |
| 47 std::string out; | |
| 48 | |
| 49 for (auto it = set.cbegin(); it != set.cend(); it++) { | |
| 50 out.append(*it); | |
| 51 if (it != std::prev(set.cend(), 1)) | |
| 52 out.append(delimiter); | |
| 53 } | |
| 54 | |
| 55 return out; | |
| 56 } | |
| 57 | |
| 258 | 58 std::vector<std::string> Split(const std::string& text, const std::string& delimiter) { |
| 250 | 59 if (text.length() < 1) |
| 60 return {}; | |
| 61 | |
|
118
39521c47c7a3
*: another huge megacommit, SORRY
Paper <mrpapersonic@gmail.com>
parents:
116
diff
changeset
|
62 std::vector<std::string> tokens; |
|
39521c47c7a3
*: another huge megacommit, SORRY
Paper <mrpapersonic@gmail.com>
parents:
116
diff
changeset
|
63 |
|
39521c47c7a3
*: another huge megacommit, SORRY
Paper <mrpapersonic@gmail.com>
parents:
116
diff
changeset
|
64 std::size_t start = 0, end = 0; |
|
39521c47c7a3
*: another huge megacommit, SORRY
Paper <mrpapersonic@gmail.com>
parents:
116
diff
changeset
|
65 while ((end = text.find(delimiter, start)) != std::string::npos) { |
|
39521c47c7a3
*: another huge megacommit, SORRY
Paper <mrpapersonic@gmail.com>
parents:
116
diff
changeset
|
66 tokens.push_back(text.substr(start, end - start)); |
|
39521c47c7a3
*: another huge megacommit, SORRY
Paper <mrpapersonic@gmail.com>
parents:
116
diff
changeset
|
67 start = end + delimiter.length(); |
|
39521c47c7a3
*: another huge megacommit, SORRY
Paper <mrpapersonic@gmail.com>
parents:
116
diff
changeset
|
68 } |
|
39521c47c7a3
*: another huge megacommit, SORRY
Paper <mrpapersonic@gmail.com>
parents:
116
diff
changeset
|
69 tokens.push_back(text.substr(start)); |
|
39521c47c7a3
*: another huge megacommit, SORRY
Paper <mrpapersonic@gmail.com>
parents:
116
diff
changeset
|
70 |
|
39521c47c7a3
*: another huge megacommit, SORRY
Paper <mrpapersonic@gmail.com>
parents:
116
diff
changeset
|
71 return tokens; |
|
39521c47c7a3
*: another huge megacommit, SORRY
Paper <mrpapersonic@gmail.com>
parents:
116
diff
changeset
|
72 } |
|
39521c47c7a3
*: another huge megacommit, SORRY
Paper <mrpapersonic@gmail.com>
parents:
116
diff
changeset
|
73 |
|
99
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
74 /* This function is really only used for cleaning up the synopsis of |
|
221
53211cb1e7f5
library: add initial library stuff
Paper <paper@paper.us.eu.org>
parents:
211
diff
changeset
|
75 * horrible HTML debris from AniList :) |
| 258 | 76 */ |
|
260
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
77 void ReplaceAll(std::string& string, std::string_view find, std::string_view replace) { |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
78 size_t pos = 0; |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
79 while ((pos = string.find(find, pos)) != std::string::npos) { |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
80 string.replace(pos, find.length(), replace); |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
81 pos += replace.length(); |
| 9 | 82 } |
| 83 } | |
| 84 | |
|
260
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
85 void SanitizeLineEndings(std::string& string) { |
|
114
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
86 /* LOL */ |
|
260
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
87 ReplaceAll(string, "\r\n", "\n"); |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
88 ReplaceAll(string, "</p>", "\n"); |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
89 ReplaceAll(string, "<br>", "\n"); |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
90 ReplaceAll(string, "<br />", "\n"); |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
91 ReplaceAll(string, "\n\n\n", "\n\n"); |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
92 } |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
93 |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
94 void ConvertRomanNumerals(std::string& string) { |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
95 static const std::vector<std::pair<std::string_view, std::string_view>> vec = { |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
96 {"2", "II"}, {"3", "III"}, {"4", "IV"}, {"5", "V"}, {"6", "VI"}, |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
97 {"7", "VII"}, {"8", "VIII"}, {"9", "IX"}, {"11", "XI"}, {"12", "XII"}, |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
98 {"13", "XIII"} |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
99 }; |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
100 |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
101 for (const auto& item : vec) |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
102 ReplaceAll(string, item.second, item.first); |
| 9 | 103 } |
| 104 | |
| 264 | 105 /* this also performs case folding, so our string is lowercase after this */ |
| 106 void NormalizeUnicode(std::string& string) { | |
| 107 static constexpr utf8proc_option_t options = static_cast<utf8proc_option_t>( | |
| 108 UTF8PROC_COMPAT | UTF8PROC_COMPOSE | UTF8PROC_STABLE | | |
| 109 UTF8PROC_IGNORE | UTF8PROC_STRIPCC | UTF8PROC_STRIPMARK | | |
| 110 UTF8PROC_LUMP | UTF8PROC_CASEFOLD | UTF8PROC_NLF2LS | |
| 111 ); | |
| 112 | |
| 113 /* ack */ | |
| 114 utf8proc_uint8_t* buf = nullptr; | |
| 115 | |
| 116 const utf8proc_ssize_t size = utf8proc_map( | |
| 117 reinterpret_cast<const utf8proc_uint8_t*>(string.data()), | |
| 118 string.size(), | |
| 119 &buf, | |
| 120 options | |
| 121 ); | |
| 122 | |
| 123 if (size) | |
| 124 string = std::string(reinterpret_cast<const char*>(buf), size); | |
| 125 | |
| 126 if (buf) | |
| 127 free(buf); | |
| 128 } | |
| 129 | |
| 130 void NormalizeAnimeTitle(std::string& string) { | |
| 131 ConvertRomanNumerals(string); | |
| 132 NormalizeUnicode(string); | |
| 133 RemoveLeadingChars(string, ' '); | |
| 134 RemoveTrailingChars(string, ' '); | |
| 135 } | |
| 136 | |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
137 /* removes dumb HTML tags because anilist is aids and |
| 250 | 138 * gives us HTML for synopses :/ |
| 258 | 139 */ |
|
260
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
140 void RemoveHtmlTags(std::string& string) { |
|
99
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
141 while (string.find("<") != std::string::npos) { |
|
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
142 auto startpos = string.find("<"); |
|
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
143 auto endpos = string.find(">") + 1; |
| 9 | 144 |
|
99
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
145 if (endpos != std::string::npos) |
|
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
146 string.erase(startpos, endpos - startpos); |
| 9 | 147 } |
| 148 } | |
| 149 | |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
150 /* e.g. "<" for "<" */ |
|
260
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
151 void ParseHtmlEntities(std::string& string) { |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
152 const std::unordered_map<std::string, std::string> map = { |
|
274
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
153 {"<", "<"}, |
|
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
154 {"&rt;", ">"}, |
| 258 | 155 {" ", "\xA0"}, |
|
274
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
156 {"&", "&"}, |
|
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
157 {""", "\""}, |
|
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
158 {"'", "'"}, |
|
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
159 {"¢", "¢"}, |
|
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
160 {"£", "£"}, |
|
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
161 {"€", "€"}, |
|
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
162 {"¥", "Â¥"}, |
|
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
163 {"©", "©"}, |
|
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
164 {"®", "®"}, |
|
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
165 {"×", "×"}, |
| 258 | 166 {"’", "’" } // Haibane Renmei, AniList |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
167 }; |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
168 |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
169 for (const auto& item : map) |
|
260
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
170 ReplaceAll(string, item.first, item.second); |
| 9 | 171 } |
| 172 | |
|
99
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
173 /* removes stupid HTML stuff */ |
|
260
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
174 void TextifySynopsis(std::string& string) { |
|
274
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
175 #if 1 |
|
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
176 /* Just let Qt deal with it. */ |
|
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
177 QTextDocument text; |
|
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
178 text.setHtml(Strings::ToQString(string)); |
|
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
179 string = Strings::ToUtf8String(text.toPlainText()); |
|
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
180 #else |
|
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
181 /* old implementation here... beware of jankiness */ |
|
260
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
182 SanitizeLineEndings(string); |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
183 RemoveHtmlTags(string); |
|
dd211ff68b36
pages/seasons: add initial functionality
Paper <paper@paper.us.eu.org>
parents:
258
diff
changeset
|
184 ParseHtmlEntities(string); |
|
274
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
185 #endif |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
186 } |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
187 |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
188 /* let Qt handle the heavy lifting of locale shit |
|
221
53211cb1e7f5
library: add initial library stuff
Paper <paper@paper.us.eu.org>
parents:
211
diff
changeset
|
189 * I don't want to deal with |
| 258 | 190 */ |
| 15 | 191 std::string ToUpper(const std::string& string) { |
|
187
9613d72b097e
*: multiple performance improvements
Paper <mrpapersonic@gmail.com>
parents:
120
diff
changeset
|
192 return ToUtf8String(session.config.locale.GetLocale().toUpper(ToQString(string))); |
| 15 | 193 } |
| 194 | |
| 195 std::string ToLower(const std::string& string) { | |
|
187
9613d72b097e
*: multiple performance improvements
Paper <mrpapersonic@gmail.com>
parents:
120
diff
changeset
|
196 return ToUtf8String(session.config.locale.GetLocale().toLower(ToQString(string))); |
| 15 | 197 } |
| 198 | |
| 62 | 199 std::wstring ToWstring(const std::string& string) { |
|
230
2f5a9247e501
torrents: implement download button
Paper <paper@paper.us.eu.org>
parents:
221
diff
changeset
|
200 static std::wstring_convert<std::codecvt_utf8<wchar_t>> converter("", L""); |
|
2f5a9247e501
torrents: implement download button
Paper <paper@paper.us.eu.org>
parents:
221
diff
changeset
|
201 |
|
2f5a9247e501
torrents: implement download button
Paper <paper@paper.us.eu.org>
parents:
221
diff
changeset
|
202 std::wstring wstr; |
|
2f5a9247e501
torrents: implement download button
Paper <paper@paper.us.eu.org>
parents:
221
diff
changeset
|
203 try { |
|
2f5a9247e501
torrents: implement download button
Paper <paper@paper.us.eu.org>
parents:
221
diff
changeset
|
204 wstr = converter.from_bytes(string); |
|
2f5a9247e501
torrents: implement download button
Paper <paper@paper.us.eu.org>
parents:
221
diff
changeset
|
205 } catch (std::range_error const& ex) { |
|
2f5a9247e501
torrents: implement download button
Paper <paper@paper.us.eu.org>
parents:
221
diff
changeset
|
206 std::cerr << "Failed to convert UTF-8 to wide string!" << std::endl; |
|
2f5a9247e501
torrents: implement download button
Paper <paper@paper.us.eu.org>
parents:
221
diff
changeset
|
207 } |
|
2f5a9247e501
torrents: implement download button
Paper <paper@paper.us.eu.org>
parents:
221
diff
changeset
|
208 return wstr; |
| 62 | 209 } |
| 210 | |
| 64 | 211 std::wstring ToWstring(const QString& string) { |
| 212 std::wstring arr(string.size(), L'\0'); | |
| 213 string.toWCharArray(&arr.front()); | |
| 214 return arr; | |
| 215 } | |
| 216 | |
| 62 | 217 std::string ToUtf8String(const std::wstring& wstring) { |
|
230
2f5a9247e501
torrents: implement download button
Paper <paper@paper.us.eu.org>
parents:
221
diff
changeset
|
218 static std::wstring_convert<std::codecvt_utf8<wchar_t>> converter("", L""); |
| 62 | 219 return converter.to_bytes(wstring); |
| 220 } | |
| 221 | |
| 64 | 222 std::string ToUtf8String(const QString& string) { |
|
187
9613d72b097e
*: multiple performance improvements
Paper <mrpapersonic@gmail.com>
parents:
120
diff
changeset
|
223 const QByteArray ba = string.toUtf8(); |
| 77 | 224 return std::string(ba.constData(), ba.size()); |
| 225 } | |
| 226 | |
| 227 std::string ToUtf8String(const QByteArray& ba) { | |
| 228 return std::string(ba.constData(), ba.size()); | |
| 64 | 229 } |
| 230 | |
| 231 QString ToQString(const std::string& string) { | |
| 232 return QString::fromUtf8(string.c_str(), string.length()); | |
| 233 } | |
| 234 | |
| 235 QString ToQString(const std::wstring& wstring) { | |
| 236 return QString::fromWCharArray(wstring.c_str(), wstring.length()); | |
| 237 } | |
| 238 | |
|
211
7cf53145de11
strings: use templates for ToInt, std::to_string -> Strings::ToUtf8String
Paper <mrpapersonic@gmail.com>
parents:
187
diff
changeset
|
239 std::string ToUtf8String(const bool b) { |
|
7cf53145de11
strings: use templates for ToInt, std::to_string -> Strings::ToUtf8String
Paper <mrpapersonic@gmail.com>
parents:
187
diff
changeset
|
240 return b ? "true" : "false"; // lol |
|
101
c537996cf67b
*: multitude of config changes
Paper <mrpapersonic@gmail.com>
parents:
100
diff
changeset
|
241 } |
|
c537996cf67b
*: multitude of config changes
Paper <mrpapersonic@gmail.com>
parents:
100
diff
changeset
|
242 |
|
211
7cf53145de11
strings: use templates for ToInt, std::to_string -> Strings::ToUtf8String
Paper <mrpapersonic@gmail.com>
parents:
187
diff
changeset
|
243 bool ToBool(const std::string& str, bool def) { |
|
7cf53145de11
strings: use templates for ToInt, std::to_string -> Strings::ToUtf8String
Paper <mrpapersonic@gmail.com>
parents:
187
diff
changeset
|
244 std::istringstream s(Strings::ToLower(str)); |
|
7cf53145de11
strings: use templates for ToInt, std::to_string -> Strings::ToUtf8String
Paper <mrpapersonic@gmail.com>
parents:
187
diff
changeset
|
245 s >> std::boolalpha >> def; |
|
116
254b1d2b7096
settings: add torrents page, make rss feed configurable
Paper <mrpapersonic@gmail.com>
parents:
114
diff
changeset
|
246 return def; |
|
254b1d2b7096
settings: add torrents page, make rss feed configurable
Paper <mrpapersonic@gmail.com>
parents:
114
diff
changeset
|
247 } |
|
254b1d2b7096
settings: add torrents page, make rss feed configurable
Paper <mrpapersonic@gmail.com>
parents:
114
diff
changeset
|
248 |
|
211
7cf53145de11
strings: use templates for ToInt, std::to_string -> Strings::ToUtf8String
Paper <mrpapersonic@gmail.com>
parents:
187
diff
changeset
|
249 /* util funcs */ |
|
114
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
250 uint64_t HumanReadableSizeToBytes(const std::string& str) { |
|
187
9613d72b097e
*: multiple performance improvements
Paper <mrpapersonic@gmail.com>
parents:
120
diff
changeset
|
251 static const std::unordered_map<std::string, uint64_t> bytes_map = { |
|
273
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
252 {"KB", 1000ull}, |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
253 {"MB", 1000000ull}, |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
254 {"GB", 1000000000ull}, |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
255 {"TB", 1000000000000ull}, |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
256 {"PB", 1000000000000000ull}, |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
257 {"KiB", 1ull << 10}, |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
258 {"MiB", 1ull << 20}, |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
259 {"GiB", 1ull << 30}, |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
260 {"TiB", 1ull << 40}, |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
261 {"PiB", 1ull << 50} /* surely we won't need more than this */ |
|
114
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
262 }; |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
263 |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
264 for (const auto& suffix : bytes_map) { |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
265 if (str.find(suffix.first) != std::string::npos) { |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
266 try { |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
267 uint64_t size = std::stod(str) * suffix.second; |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
268 return size; |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
269 } catch (std::invalid_argument const& ex) { |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
270 continue; |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
271 } |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
272 } |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
273 } |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
274 |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
275 return ToInt(str, 0); |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
276 } |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
277 |
|
273
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
278 std::string BytesToHumanReadableSize(uint64_t bytes, int precision) { |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
279 #if QT_VERSION >= QT_VERSION_CHECK(5, 10, 0) |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
280 /* QLocale in Qt >= 5.10.0 has a function for this */ |
|
274
f6a756c19bfb
anime_list.cc: use mutexes so we don't sex the stack
Paper <paper@paper.us.eu.org>
parents:
273
diff
changeset
|
281 return Strings::ToUtf8String(session.config.locale.GetLocale().formattedDataSize(bytes, precision)); |
|
273
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
282 #else |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
283 static const std::unordered_map<uint64_t, std::string> map = { |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
284 {1ull << 10, "KiB"}, |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
285 {1ull << 20, "MiB"}, |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
286 {1ull << 30, "GiB"}, |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
287 {1ull << 40, "TiB"}, |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
288 {1ull << 50, "PiB"} |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
289 }; |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
290 |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
291 for (const auto& suffix : map) { |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
292 if (bytes / suffix.first < 1) |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
293 continue; |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
294 |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
295 std::stringstream ss; |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
296 ss << std::setprecision(precision) |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
297 << (static_cast<double>(bytes) / suffix.first) << " " |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
298 << suffix.second; |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
299 return ss.str(); |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
300 } |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
301 |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
302 /* better luck next time */ |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
303 return "0 bytes"; |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
304 #endif |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
305 } |
|
f31305b9f60a
*: various code safety changes
Paper <paper@paper.us.eu.org>
parents:
264
diff
changeset
|
306 |
| 264 | 307 void RemoveLeadingChars(std::string& s, const char c) { |
|
118
39521c47c7a3
*: another huge megacommit, SORRY
Paper <mrpapersonic@gmail.com>
parents:
116
diff
changeset
|
308 s.erase(0, std::min(s.find_first_not_of(c), s.size() - 1)); |
|
114
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
309 } |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
310 |
| 264 | 311 void RemoveTrailingChars(std::string& s, const char c) { |
|
114
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
312 s.erase(s.find_last_not_of(c) + 1, std::string::npos); |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
313 } |
|
ab191e28e69d
*: add initial torrent stuff
Paper <mrpapersonic@gmail.com>
parents:
102
diff
changeset
|
314 |
| 102 | 315 bool BeginningMatchesSubstring(const std::string& str, const std::string& sub) { |
| 316 for (unsigned long long i = 0; i < str.length() && i < sub.length(); i++) | |
| 317 if (str[i] != sub[i]) | |
| 318 return false; | |
|
187
9613d72b097e
*: multiple performance improvements
Paper <mrpapersonic@gmail.com>
parents:
120
diff
changeset
|
319 |
| 102 | 320 return true; |
| 321 } | |
| 322 | |
| 9 | 323 } // namespace Strings |
