[fix] make data.traits - partial revert of commit 30a8204

The entries in the catalog of search languages are built up from the "Engine
Traits" [1], and which entries are included in the catalog is controlled by two
threshold values [2].

If possible, the values should ensure that no languages or regions disappear
from the catalog of search languages [3].

The threshold values should have been adjusted in commit 30a8204:

- ``min_eng_per_region = 18``
- ``min_eng_per_lang = 22``

Because the threshold values were not adjusted, many entries were missing from
the search language catalog.  This patch fixes the bug: the threshold values
have been adjusted and the catalog of search languages is complete again.

[1] https://docs.searxng.org/dev/engines/enginelib.html#module-searx.enginelib.traits
[2] 96a6e3dcb2/searxng_extra/update/update_engine_traits.py (L104-L105)
[3] https://github.com/searxng/searxng/blob/master/searx/sxng_locales.py

Closes: https://github.com/searxng/searxng/issues/4519
Signed-off-by: Markus Heiser <markus.heiser@darmarit.de>
This commit is contained in:
Markus Heiser 2025-03-21 10:34:15 +01:00 committed by Markus Heiser
parent 7e680d8e8e
commit 5986629c6b
4 changed files with 91 additions and 5 deletions

View file

@ -6680,6 +6680,7 @@
"custom": {},
"data_type": "traits_v1",
"languages": {
"ar": "ar",
"ca": "ca",
"cs": "cs",
"de": "de",
@ -6688,17 +6689,30 @@
"eo": "eo",
"es": "es",
"eu": "eu",
"fa": "fa",
"fi": "fi",
"fr": "fr",
"gd": "gd",
"gl": "gl",
"hr": "hr",
"hu": "hu",
"is": "is",
"it": "it",
"ja": "ja",
"kab": "kab",
"nl": "nl",
"no": "no",
"pl": "pl",
"pt": "pt",
"ru": "ru",
"sk": "sk",
"sq": "sq",
"sv": "sv",
"zh": "zh",
"th": "th",
"tok": "tok",
"tr": "tr",
"uk": "uk",
"vi": "vi",
"zh_Hans": "zh",
"zh_Hant": "zh"
},
@ -6915,6 +6929,7 @@
"BQ",
"BR",
"BS",
"BT",
"BW",
"BY",
"BZ",
@ -6937,6 +6952,7 @@
"CY",
"CZ",
"DE",
"DJ",
"DK",
"DM",
"DO",
@ -6950,8 +6966,10 @@
"FI",
"FJ",
"FK",
"FM",
"FO",
"FR",
"GA",
"GB",
"GD",
"GE",
@ -6961,6 +6979,7 @@
"GI",
"GL",
"GM",
"GN",
"GP",
"GQ",
"GR",
@ -6989,6 +7008,7 @@
"KE",
"KG",
"KH",
"KI",
"KM",
"KN",
"KP",
@ -7001,6 +7021,7 @@
"LC",
"LI",
"LK",
"LR",
"LS",
"LT",
"LU",
@ -7011,15 +7032,18 @@
"MD",
"ME",
"MG",
"MH",
"MK",
"ML",
"MM",
"MN",
"MO",
"MQ",
"MR",
"MS",
"MT",
"MU",
"MV",
"MW",
"MX",
"MY",
@ -7032,6 +7056,7 @@
"NL",
"NO",
"NP",
"NR",
"NU",
"NZ",
"OM",
@ -7055,6 +7080,7 @@
"RU",
"RW",
"SA",
"SB",
"SC",
"SD",
"SE",
@ -7082,8 +7108,10 @@
"TL",
"TM",
"TN",
"TO",
"TR",
"TT",
"TV",
"TW",
"TZ",
"UA",
@ -7239,6 +7267,7 @@
"custom": {},
"data_type": "traits_v1",
"languages": {
"ar": "ar",
"ca": "ca",
"cs": "cs",
"de": "de",
@ -7247,17 +7276,30 @@
"eo": "eo",
"es": "es",
"eu": "eu",
"fa": "fa",
"fi": "fi",
"fr": "fr",
"gd": "gd",
"gl": "gl",
"hr": "hr",
"hu": "hu",
"is": "is",
"it": "it",
"ja": "ja",
"kab": "kab",
"nl": "nl",
"no": "no",
"pl": "pl",
"pt": "pt",
"ru": "ru",
"sk": "sk",
"sq": "sq",
"sv": "sv",
"zh": "zh",
"th": "th",
"tok": "tok",
"tr": "tr",
"uk": "uk",
"vi": "vi",
"zh_Hans": "zh",
"zh_Hant": "zh"
},