diff --git a/test_uralicnlp.py b/test_uralicnlp.py index 7c3521f..7e0493d 100644 --- a/test_uralicnlp.py +++ b/test_uralicnlp.py @@ -82,7 +82,7 @@ #print(uralicApi.analyze("kissat", "fin")) #print(uralicApi.generate("koira+N+Pl+Nom", "fin")) -print(uralicApi.segment("kissanikin", "fin")) +print(uralicApi.segment("luutapiirinikin", "fin")) #print(uralicApi.analyze("on", ["fin","olo"])) #print(uralicApi.analyze("on", ["fin","olo"], language_flags=True)) diff --git a/uralicNLP/uralicApi.py b/uralicNLP/uralicApi.py index bce9864..105fa37 100644 --- a/uralicNLP/uralicApi.py +++ b/uralicNLP/uralicApi.py @@ -433,5 +433,5 @@ def _get_dictionary(language, backend=TinyDictionary): return dictionary def segment(query, language): - return [x[0].split(">") for x in analyze(query, language, segmentation=True)] + return [x[0].replace("#",">").split(">") for x in analyze(query, language, segmentation=True)]