Spaces:

robinhad
/

ukrainian-tts

Running

Yurii Paniv committed on Aug 28, 2023

Commit

17873e4

•

1 Parent(s): 6180416

Fix formatter

Files changed (2) hide show

tests/test_formatter.py CHANGED Viewed

@@ -1,6 +1,7 @@
 from ukrainian_tts.formatter import preprocess_text
 import pytest
 @pytest.mark.parametrize(
     "text,expected",
     [
@@ -40,6 +41,7 @@ import pytest
 def test_formatter(text, expected):
     assert preprocess_text(text) == expected
 # Purpose of these tests: to have a clearly separate list of issues
 # in the conversion. Once fixed, these cases should move to test_formatter.
 # We still want to make sure that no changes happen there, as any regressions

 from ukrainian_tts.formatter import preprocess_text
 import pytest
 @pytest.mark.parametrize(
     "text,expected",
     [
 def test_formatter(text, expected):
     assert preprocess_text(text) == expected
 # Purpose of these tests: to have a clearly separate list of issues
 # in the conversion. Once fixed, these cases should move to test_formatter.
 # We still want to make sure that no changes happen there, as any regressions

ukrainian_tts/formatter.py CHANGED Viewed

@@ -29,6 +29,7 @@ def replace_currency_with_words(text, currency, num_form):
         text = text.replace("€", CURRENCY[currency][num_form])
     return text
 def find_any_char(text: str, find: str, start: int):
     result = -1
     for c in find:
@@ -38,11 +39,12 @@ def find_any_char(text: str, find: str, start: int):
     return result
 # Have to check if I can use https://github.com/lang-uk/tokenize-uk
 def simple_tokenizer(text: str):
     start = 0
     index = find_any_char(text, " ,", start)
-    while (index >= 0):
         word = text[start:index]
         yield word
         separator = text[index]
@@ -52,6 +54,7 @@ def simple_tokenizer(text: str):
     yield text[start:]
 def preprocess_text(text):
     text = text.lower()
     # currencies

         text = text.replace("€", CURRENCY[currency][num_form])
     return text
 def find_any_char(text: str, find: str, start: int):
     result = -1
     for c in find:
     return result
 # Have to check if I can use https://github.com/lang-uk/tokenize-uk
 def simple_tokenizer(text: str):
     start = 0
     index = find_any_char(text, " ,", start)
+    while index >= 0:
         word = text[start:index]
         yield word
         separator = text[index]
     yield text[start:]
 def preprocess_text(text):
     text = text.lower()
     # currencies