Mercurial > minori
annotate src/core/strings.cc @ 102:b315f3759c56
*: big patch
1. use a wrapper for mINI that enables case sensitivity
(personal preference)
2. rename dark_theme.cc to theme.cc and change it to be
a class
3. include the "dep" folder so we don't have stupidity in
json.h or ini.h
4. I think the graph was also tweaked a lot in this, nothing
is constexpr and size is found at runtime...
| author | Paper <mrpapersonic@gmail.com> |
|---|---|
| date | Fri, 03 Nov 2023 21:32:52 -0400 |
| parents | c537996cf67b |
| children | ab191e28e69d |
| rev | line source |
|---|---|
| 9 | 1 /** |
| 2 * strings.cpp: Useful functions for manipulating strings | |
| 3 **/ | |
| 4 #include "core/strings.h" | |
| 64 | 5 #include <QByteArray> |
|
101
c537996cf67b
*: multitude of config changes
Paper <mrpapersonic@gmail.com>
parents:
100
diff
changeset
|
6 #include <QDebug> |
| 64 | 7 #include <QString> |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
8 #include <QLocale> |
| 15 | 9 #include <algorithm> |
| 10 #include <cctype> | |
| 62 | 11 #include <codecvt> |
| 9 | 12 #include <locale> |
| 13 #include <string> | |
| 14 #include <vector> | |
| 102 | 15 #include <unordered_map> |
| 9 | 16 |
| 17 namespace Strings { | |
| 18 | |
|
99
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
19 /* ew */ |
| 9 | 20 std::string Implode(const std::vector<std::string>& vector, const std::string& delimiter) { |
| 21 if (vector.size() < 1) | |
| 22 return "-"; | |
| 23 std::string out = ""; | |
| 24 for (unsigned long long i = 0; i < vector.size(); i++) { | |
| 25 out.append(vector.at(i)); | |
| 26 if (i < vector.size() - 1) | |
| 27 out.append(delimiter); | |
| 28 } | |
| 29 return out; | |
| 30 } | |
| 31 | |
|
99
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
32 /* This function is really only used for cleaning up the synopsis of |
|
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
33 horrible HTML debris from AniList :) */ |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
34 std::string ReplaceAll(std::string string, const std::string& find, const std::string& replace) { |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
35 size_t pos = 0; |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
36 while ((pos = string.find(find, pos)) != std::string::npos) { |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
37 string.replace(pos, find.length(), replace); |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
38 pos += replace.length(); |
| 9 | 39 } |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
40 return string; |
| 9 | 41 } |
| 42 | |
| 43 std::string SanitizeLineEndings(const std::string& string) { | |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
44 return ReplaceAll(ReplaceAll(ReplaceAll(string, "\r\n", "\n"), "<br>", "\n"), "\n\n\n", "\n\n"); |
| 9 | 45 } |
| 46 | |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
47 /* removes dumb HTML tags because anilist is aids and |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
48 gives us HTML for synopses :/ */ |
|
99
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
49 std::string RemoveHtmlTags(std::string string) { |
|
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
50 while (string.find("<") != std::string::npos) { |
|
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
51 auto startpos = string.find("<"); |
|
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
52 auto endpos = string.find(">") + 1; |
| 9 | 53 |
|
99
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
54 if (endpos != std::string::npos) |
|
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
55 string.erase(startpos, endpos - startpos); |
| 9 | 56 } |
|
99
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
57 return string; |
| 9 | 58 } |
| 59 | |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
60 /* e.g. "<" for "<" */ |
|
99
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
61 std::string ParseHtmlEntities(std::string string) { |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
62 const std::unordered_map<std::string, std::string> map = { |
|
99
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
63 /* The only one of these I can understand using are the first |
|
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
64 three. why do the rest of these exist? */ |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
65 {"<", "<"}, |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
66 {"&rt;", ">"}, |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
67 {" ", "\xA0"}, |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
68 {"&", "&"}, |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
69 {""", "\""}, |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
70 {"'", "'"}, |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
71 {"¢", "¢"}, |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
72 {"£", "£"}, |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
73 {"€", "€"}, |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
74 {"¥", "¥"}, |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
75 {"©", "©"}, |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
76 {"®", "®"}, |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
77 {"’", "’"} // Haibane Renmei, AniList |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
78 }; |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
79 |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
80 for (const auto& item : map) |
|
100
f5940a575d83
track/constants: add many more video formats
Paper <mrpapersonic@gmail.com>
parents:
99
diff
changeset
|
81 string = ReplaceAll(string, item.first, item.second); |
|
99
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
82 return string; |
| 9 | 83 } |
| 84 | |
|
99
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
85 /* removes stupid HTML stuff */ |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
86 std::string TextifySynopsis(const std::string& string) { |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
87 return ParseHtmlEntities(RemoveHtmlTags(SanitizeLineEndings(string))); |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
88 } |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
89 |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
90 /* let Qt handle the heavy lifting of locale shit |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
91 I don't want to deal with */ |
| 15 | 92 std::string ToUpper(const std::string& string) { |
|
99
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
93 /* todo: this "locale" will have to be moved to session.h |
|
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
94 it also defaults to en-US, which sucks very much for |
|
503bc1547d49
strings: clarify on some functions and make some of them miniscule
Paper <mrpapersonic@gmail.com>
parents:
98
diff
changeset
|
95 anyone who doesn't speak american english... */ |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
96 QLocale locale; |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
97 return ToUtf8String(locale.toUpper(ToQString(string))); |
| 15 | 98 } |
| 99 | |
| 100 std::string ToLower(const std::string& string) { | |
|
98
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
101 QLocale locale; |
|
582b2fca1561
strings: parse HTML entities when reading synopsis, make the
Paper <mrpapersonic@gmail.com>
parents:
81
diff
changeset
|
102 return ToUtf8String(locale.toLower(ToQString(string))); |
| 15 | 103 } |
| 104 | |
| 62 | 105 std::wstring ToWstring(const std::string& string) { |
| 106 std::wstring_convert<std::codecvt_utf8<wchar_t>, wchar_t> converter; | |
| 107 return converter.from_bytes(string); | |
| 108 } | |
| 109 | |
| 64 | 110 std::wstring ToWstring(const QString& string) { |
| 111 std::wstring arr(string.size(), L'\0'); | |
| 112 string.toWCharArray(&arr.front()); | |
| 113 return arr; | |
| 114 } | |
| 115 | |
| 62 | 116 std::string ToUtf8String(const std::wstring& wstring) { |
| 117 std::wstring_convert<std::codecvt_utf8<wchar_t>, wchar_t> converter; | |
| 118 return converter.to_bytes(wstring); | |
| 119 } | |
| 120 | |
| 64 | 121 std::string ToUtf8String(const QString& string) { |
| 122 QByteArray ba = string.toUtf8(); | |
| 77 | 123 return std::string(ba.constData(), ba.size()); |
| 124 } | |
| 125 | |
| 126 std::string ToUtf8String(const QByteArray& ba) { | |
| 127 return std::string(ba.constData(), ba.size()); | |
| 64 | 128 } |
| 129 | |
| 130 QString ToQString(const std::string& string) { | |
| 131 return QString::fromUtf8(string.c_str(), string.length()); | |
| 132 } | |
| 133 | |
| 134 QString ToQString(const std::wstring& wstring) { | |
| 135 return QString::fromWCharArray(wstring.c_str(), wstring.length()); | |
| 136 } | |
| 137 | |
|
101
c537996cf67b
*: multitude of config changes
Paper <mrpapersonic@gmail.com>
parents:
100
diff
changeset
|
138 int ToInt(const std::string& str, int def) { |
|
c537996cf67b
*: multitude of config changes
Paper <mrpapersonic@gmail.com>
parents:
100
diff
changeset
|
139 int tmp = 0; |
|
c537996cf67b
*: multitude of config changes
Paper <mrpapersonic@gmail.com>
parents:
100
diff
changeset
|
140 try { |
|
c537996cf67b
*: multitude of config changes
Paper <mrpapersonic@gmail.com>
parents:
100
diff
changeset
|
141 tmp = std::stoi(str); |
|
c537996cf67b
*: multitude of config changes
Paper <mrpapersonic@gmail.com>
parents:
100
diff
changeset
|
142 } catch (std::invalid_argument const& ex) { |
|
c537996cf67b
*: multitude of config changes
Paper <mrpapersonic@gmail.com>
parents:
100
diff
changeset
|
143 qDebug() << "Failed to parse int from std::string: no number found in " << ToQString(str) << " defaulting to " << def; |
|
c537996cf67b
*: multitude of config changes
Paper <mrpapersonic@gmail.com>
parents:
100
diff
changeset
|
144 tmp = def; |
|
c537996cf67b
*: multitude of config changes
Paper <mrpapersonic@gmail.com>
parents:
100
diff
changeset
|
145 } |
|
c537996cf67b
*: multitude of config changes
Paper <mrpapersonic@gmail.com>
parents:
100
diff
changeset
|
146 return tmp; |
|
c537996cf67b
*: multitude of config changes
Paper <mrpapersonic@gmail.com>
parents:
100
diff
changeset
|
147 } |
|
c537996cf67b
*: multitude of config changes
Paper <mrpapersonic@gmail.com>
parents:
100
diff
changeset
|
148 |
| 102 | 149 bool BeginningMatchesSubstring(const std::string& str, const std::string& sub) { |
| 150 for (unsigned long long i = 0; i < str.length() && i < sub.length(); i++) | |
| 151 if (str[i] != sub[i]) | |
| 152 return false; | |
| 153 return true; | |
| 154 } | |
| 155 | |
| 9 | 156 } // namespace Strings |
