From 71c595f56b2376e189a73bd8ff25528005539e41 Mon Sep 17 00:00:00 2001
From: Thomas Mannay
Date: Mon, 13 Apr 2026 12:54:21 +0100
Subject: [PATCH] Use hbs to lemmatize Bosnian, Croatian, and Serbian

---
 vocabsieve/lemmatizer.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/vocabsieve/lemmatizer.py b/vocabsieve/lemmatizer.py
index a9a996f..b6d461e 100644
--- a/vocabsieve/lemmatizer.py
+++ b/vocabsieve/lemmatizer.py
@@ -89,6 +89,8 @@ def lemmatize(word, language, greedy=False):
             return morph[language].parse(word)[0].normal_form
         if language in simplemma_languages:
             return simplemma.lemmatize(word, lang=language, greedy=greedy) # pyright: ignore[reportPrivateImportUsage]
+        if language in ['bs', 'hr', 'sr']:
+            return simplemma.lemmatize(word, lang='hbs', greedy=greedy) # pyright: ignore[reportPrivateImportUsage]
         else:
             return word
     except ValueError as e: # pylint: disable=redefined-outer-name