Mercurial > minori
comparison dep/fmt/doc/html/_static/language_data.js @ 343:1faa72660932
*: transfer back to cmake from autotools
autotools just made lots of things more complicated than
they should have and many things broke (i.e. translations)
author | Paper <paper@paper.us.eu.org> |
---|---|
date | Thu, 20 Jun 2024 05:56:06 -0400 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
342:adb79bdde329 | 343:1faa72660932 |
---|---|
1 /* | |
2 * language_data.js | |
3 * ~~~~~~~~~~~~~~~~ | |
4 * | |
5 * This script contains the language-specific data used by searchtools.js, | |
6 * namely the list of stopwords, stemmer, scorer and splitter. | |
7 * | |
8 * :copyright: Copyright 2007-2020 by the Sphinx team, see AUTHORS. | |
9 * :license: BSD, see LICENSE for details. | |
10 * | |
11 */ | |
12 | |
13 var stopwords = ["a","and","are","as","at","be","but","by","for","if","in","into","is","it","near","no","not","of","on","or","such","that","the","their","then","there","these","they","this","to","was","will","with"]; | |
14 | |
15 | |
16 /* Non-minified version JS is _stemmer.js if file is provided */ | |
17 /** | |
18 * Porter Stemmer | |
19 */ | |
20 var Stemmer = function() { | |
21 | |
22 var step2list = { | |
23 ational: 'ate', | |
24 tional: 'tion', | |
25 enci: 'ence', | |
26 anci: 'ance', | |
27 izer: 'ize', | |
28 bli: 'ble', | |
29 alli: 'al', | |
30 entli: 'ent', | |
31 eli: 'e', | |
32 ousli: 'ous', | |
33 ization: 'ize', | |
34 ation: 'ate', | |
35 ator: 'ate', | |
36 alism: 'al', | |
37 iveness: 'ive', | |
38 fulness: 'ful', | |
39 ousness: 'ous', | |
40 aliti: 'al', | |
41 iviti: 'ive', | |
42 biliti: 'ble', | |
43 logi: 'log' | |
44 }; | |
45 | |
46 var step3list = { | |
47 icate: 'ic', | |
48 ative: '', | |
49 alize: 'al', | |
50 iciti: 'ic', | |
51 ical: 'ic', | |
52 ful: '', | |
53 ness: '' | |
54 }; | |
55 | |
56 var c = "[^aeiou]"; // consonant | |
57 var v = "[aeiouy]"; // vowel | |
58 var C = c + "[^aeiouy]*"; // consonant sequence | |
59 var V = v + "[aeiou]*"; // vowel sequence | |
60 | |
61 var mgr0 = "^(" + C + ")?" + V + C; // [C]VC... is m>0 | |
62 var meq1 = "^(" + C + ")?" + V + C + "(" + V + ")?$"; // [C]VC[V] is m=1 | |
63 var mgr1 = "^(" + C + ")?" + V + C + V + C; // [C]VCVC... is m>1 | |
64 var s_v = "^(" + C + ")?" + v; // vowel in stem | |
65 | |
66 this.stemWord = function (w) { | |
67 var stem; | |
68 var suffix; | |
69 var firstch; | |
70 var origword = w; | |
71 | |
72 if (w.length < 3) | |
73 return w; | |
74 | |
75 var re; | |
76 var re2; | |
77 var re3; | |
78 var re4; | |
79 | |
80 firstch = w.substr(0,1); | |
81 if (firstch == "y") | |
82 w = firstch.toUpperCase() + w.substr(1); | |
83 | |
84 // Step 1a | |
85 re = /^(.+?)(ss|i)es$/; | |
86 re2 = /^(.+?)([^s])s$/; | |
87 | |
88 if (re.test(w)) | |
89 w = w.replace(re,"$1$2"); | |
90 else if (re2.test(w)) | |
91 w = w.replace(re2,"$1$2"); | |
92 | |
93 // Step 1b | |
94 re = /^(.+?)eed$/; | |
95 re2 = /^(.+?)(ed|ing)$/; | |
96 if (re.test(w)) { | |
97 var fp = re.exec(w); | |
98 re = new RegExp(mgr0); | |
99 if (re.test(fp[1])) { | |
100 re = /.$/; | |
101 w = w.replace(re,""); | |
102 } | |
103 } | |
104 else if (re2.test(w)) { | |
105 var fp = re2.exec(w); | |
106 stem = fp[1]; | |
107 re2 = new RegExp(s_v); | |
108 if (re2.test(stem)) { | |
109 w = stem; | |
110 re2 = /(at|bl|iz)$/; | |
111 re3 = new RegExp("([^aeiouylsz])\\1$"); | |
112 re4 = new RegExp("^" + C + v + "[^aeiouwxy]$"); | |
113 if (re2.test(w)) | |
114 w = w + "e"; | |
115 else if (re3.test(w)) { | |
116 re = /.$/; | |
117 w = w.replace(re,""); | |
118 } | |
119 else if (re4.test(w)) | |
120 w = w + "e"; | |
121 } | |
122 } | |
123 | |
124 // Step 1c | |
125 re = /^(.+?)y$/; | |
126 if (re.test(w)) { | |
127 var fp = re.exec(w); | |
128 stem = fp[1]; | |
129 re = new RegExp(s_v); | |
130 if (re.test(stem)) | |
131 w = stem + "i"; | |
132 } | |
133 | |
134 // Step 2 | |
135 re = /^(.+?)(ational|tional|enci|anci|izer|bli|alli|entli|eli|ousli|ization|ation|ator|alism|iveness|fulness|ousness|aliti|iviti|biliti|logi)$/; | |
136 if (re.test(w)) { | |
137 var fp = re.exec(w); | |
138 stem = fp[1]; | |
139 suffix = fp[2]; | |
140 re = new RegExp(mgr0); | |
141 if (re.test(stem)) | |
142 w = stem + step2list[suffix]; | |
143 } | |
144 | |
145 // Step 3 | |
146 re = /^(.+?)(icate|ative|alize|iciti|ical|ful|ness)$/; | |
147 if (re.test(w)) { | |
148 var fp = re.exec(w); | |
149 stem = fp[1]; | |
150 suffix = fp[2]; | |
151 re = new RegExp(mgr0); | |
152 if (re.test(stem)) | |
153 w = stem + step3list[suffix]; | |
154 } | |
155 | |
156 // Step 4 | |
157 re = /^(.+?)(al|ance|ence|er|ic|able|ible|ant|ement|ment|ent|ou|ism|ate|iti|ous|ive|ize)$/; | |
158 re2 = /^(.+?)(s|t)(ion)$/; | |
159 if (re.test(w)) { | |
160 var fp = re.exec(w); | |
161 stem = fp[1]; | |
162 re = new RegExp(mgr1); | |
163 if (re.test(stem)) | |
164 w = stem; | |
165 } | |
166 else if (re2.test(w)) { | |
167 var fp = re2.exec(w); | |
168 stem = fp[1] + fp[2]; | |
169 re2 = new RegExp(mgr1); | |
170 if (re2.test(stem)) | |
171 w = stem; | |
172 } | |
173 | |
174 // Step 5 | |
175 re = /^(.+?)e$/; | |
176 if (re.test(w)) { | |
177 var fp = re.exec(w); | |
178 stem = fp[1]; | |
179 re = new RegExp(mgr1); | |
180 re2 = new RegExp(meq1); | |
181 re3 = new RegExp("^" + C + v + "[^aeiouwxy]$"); | |
182 if (re.test(stem) || (re2.test(stem) && !(re3.test(stem)))) | |
183 w = stem; | |
184 } | |
185 re = /ll$/; | |
186 re2 = new RegExp(mgr1); | |
187 if (re.test(w) && re2.test(w)) { | |
188 re = /.$/; | |
189 w = w.replace(re,""); | |
190 } | |
191 | |
192 // and turn initial Y back to y | |
193 if (firstch == "y") | |
194 w = firstch.toLowerCase() + w.substr(1); | |
195 return w; | |
196 } | |
197 } | |
198 | |
199 | |
200 | |
201 | |
202 | |
203 var splitChars = (function() { | |
204 var result = {}; | |
205 var singles = [96, 180, 187, 191, 215, 247, 749, 885, 903, 907, 909, 930, 1014, 1648, | |
206 1748, 1809, 2416, 2473, 2481, 2526, 2601, 2609, 2612, 2615, 2653, 2702, | |
207 2706, 2729, 2737, 2740, 2857, 2865, 2868, 2910, 2928, 2948, 2961, 2971, | |
208 2973, 3085, 3089, 3113, 3124, 3213, 3217, 3241, 3252, 3295, 3341, 3345, | |
209 3369, 3506, 3516, 3633, 3715, 3721, 3736, 3744, 3748, 3750, 3756, 3761, | |
210 3781, 3912, 4239, 4347, 4681, 4695, 4697, 4745, 4785, 4799, 4801, 4823, | |
211 4881, 5760, 5901, 5997, 6313, 7405, 8024, 8026, 8028, 8030, 8117, 8125, | |
212 8133, 8181, 8468, 8485, 8487, 8489, 8494, 8527, 11311, 11359, 11687, 11695, | |
213 11703, 11711, 11719, 11727, 11735, 12448, 12539, 43010, 43014, 43019, 43587, | |
214 43696, 43713, 64286, 64297, 64311, 64317, 64319, 64322, 64325, 65141]; | |
215 var i, j, start, end; | |
216 for (i = 0; i < singles.length; i++) { | |
217 result[singles[i]] = true; | |
218 } | |
219 var ranges = [[0, 47], [58, 64], [91, 94], [123, 169], [171, 177], [182, 184], [706, 709], | |
220 [722, 735], [741, 747], [751, 879], [888, 889], [894, 901], [1154, 1161], | |
221 [1318, 1328], [1367, 1368], [1370, 1376], [1416, 1487], [1515, 1519], [1523, 1568], | |
222 [1611, 1631], [1642, 1645], [1750, 1764], [1767, 1773], [1789, 1790], [1792, 1807], | |
223 [1840, 1868], [1958, 1968], [1970, 1983], [2027, 2035], [2038, 2041], [2043, 2047], | |
224 [2070, 2073], [2075, 2083], [2085, 2087], [2089, 2307], [2362, 2364], [2366, 2383], | |
225 [2385, 2391], [2402, 2405], [2419, 2424], [2432, 2436], [2445, 2446], [2449, 2450], | |
226 [2483, 2485], [2490, 2492], [2494, 2509], [2511, 2523], [2530, 2533], [2546, 2547], | |
227 [2554, 2564], [2571, 2574], [2577, 2578], [2618, 2648], [2655, 2661], [2672, 2673], | |
228 [2677, 2692], [2746, 2748], [2750, 2767], [2769, 2783], [2786, 2789], [2800, 2820], | |
229 [2829, 2830], [2833, 2834], [2874, 2876], [2878, 2907], [2914, 2917], [2930, 2946], | |
230 [2955, 2957], [2966, 2968], [2976, 2978], [2981, 2983], [2987, 2989], [3002, 3023], | |
231 [3025, 3045], [3059, 3076], [3130, 3132], [3134, 3159], [3162, 3167], [3170, 3173], | |
232 [3184, 3191], [3199, 3204], [3258, 3260], [3262, 3293], [3298, 3301], [3312, 3332], | |
233 [3386, 3388], [3390, 3423], [3426, 3429], [3446, 3449], [3456, 3460], [3479, 3481], | |
234 [3518, 3519], [3527, 3584], [3636, 3647], [3655, 3663], [3674, 3712], [3717, 3718], | |
235 [3723, 3724], [3726, 3731], [3752, 3753], [3764, 3772], [3774, 3775], [3783, 3791], | |
236 [3802, 3803], [3806, 3839], [3841, 3871], [3892, 3903], [3949, 3975], [3980, 4095], | |
237 [4139, 4158], [4170, 4175], [4182, 4185], [4190, 4192], [4194, 4196], [4199, 4205], | |
238 [4209, 4212], [4226, 4237], [4250, 4255], [4294, 4303], [4349, 4351], [4686, 4687], | |
239 [4702, 4703], [4750, 4751], [4790, 4791], [4806, 4807], [4886, 4887], [4955, 4968], | |
240 [4989, 4991], [5008, 5023], [5109, 5120], [5741, 5742], [5787, 5791], [5867, 5869], | |
241 [5873, 5887], [5906, 5919], [5938, 5951], [5970, 5983], [6001, 6015], [6068, 6102], | |
242 [6104, 6107], [6109, 6111], [6122, 6127], [6138, 6159], [6170, 6175], [6264, 6271], | |
243 [6315, 6319], [6390, 6399], [6429, 6469], [6510, 6511], [6517, 6527], [6572, 6592], | |
244 [6600, 6607], [6619, 6655], [6679, 6687], [6741, 6783], [6794, 6799], [6810, 6822], | |
245 [6824, 6916], [6964, 6980], [6988, 6991], [7002, 7042], [7073, 7085], [7098, 7167], | |
246 [7204, 7231], [7242, 7244], [7294, 7400], [7410, 7423], [7616, 7679], [7958, 7959], | |
247 [7966, 7967], [8006, 8007], [8014, 8015], [8062, 8063], [8127, 8129], [8141, 8143], | |
248 [8148, 8149], [8156, 8159], [8173, 8177], [8189, 8303], [8306, 8307], [8314, 8318], | |
249 [8330, 8335], [8341, 8449], [8451, 8454], [8456, 8457], [8470, 8472], [8478, 8483], | |
250 [8506, 8507], [8512, 8516], [8522, 8525], [8586, 9311], [9372, 9449], [9472, 10101], | |
251 [10132, 11263], [11493, 11498], [11503, 11516], [11518, 11519], [11558, 11567], | |
252 [11622, 11630], [11632, 11647], [11671, 11679], [11743, 11822], [11824, 12292], | |
253 [12296, 12320], [12330, 12336], [12342, 12343], [12349, 12352], [12439, 12444], | |
254 [12544, 12548], [12590, 12592], [12687, 12689], [12694, 12703], [12728, 12783], | |
255 [12800, 12831], [12842, 12880], [12896, 12927], [12938, 12976], [12992, 13311], | |
256 [19894, 19967], [40908, 40959], [42125, 42191], [42238, 42239], [42509, 42511], | |
257 [42540, 42559], [42592, 42593], [42607, 42622], [42648, 42655], [42736, 42774], | |
258 [42784, 42785], [42889, 42890], [42893, 43002], [43043, 43055], [43062, 43071], | |
259 [43124, 43137], [43188, 43215], [43226, 43249], [43256, 43258], [43260, 43263], | |
260 [43302, 43311], [43335, 43359], [43389, 43395], [43443, 43470], [43482, 43519], | |
261 [43561, 43583], [43596, 43599], [43610, 43615], [43639, 43641], [43643, 43647], | |
262 [43698, 43700], [43703, 43704], [43710, 43711], [43715, 43738], [43742, 43967], | |
263 [44003, 44015], [44026, 44031], [55204, 55215], [55239, 55242], [55292, 55295], | |
264 [57344, 63743], [64046, 64047], [64110, 64111], [64218, 64255], [64263, 64274], | |
265 [64280, 64284], [64434, 64466], [64830, 64847], [64912, 64913], [64968, 65007], | |
266 [65020, 65135], [65277, 65295], [65306, 65312], [65339, 65344], [65371, 65381], | |
267 [65471, 65473], [65480, 65481], [65488, 65489], [65496, 65497]]; | |
268 for (i = 0; i < ranges.length; i++) { | |
269 start = ranges[i][0]; | |
270 end = ranges[i][1]; | |
271 for (j = start; j <= end; j++) { | |
272 result[j] = true; | |
273 } | |
274 } | |
275 return result; | |
276 })(); | |
277 | |
278 function splitQuery(query) { | |
279 var result = []; | |
280 var start = -1; | |
281 for (var i = 0; i < query.length; i++) { | |
282 if (splitChars[query.charCodeAt(i)]) { | |
283 if (start !== -1) { | |
284 result.push(query.slice(start, i)); | |
285 start = -1; | |
286 } | |
287 } else if (start === -1) { | |
288 start = i; | |
289 } | |
290 } | |
291 if (start !== -1) { | |
292 result.push(query.slice(start)); | |
293 } | |
294 return result; | |
295 } | |
296 | |
297 |