diff --git a/etc/test_sentences/nl.txt b/etc/test_sentences/nl.txt new file mode 100644 index 0000000..cc3d499 --- /dev/null +++ b/etc/test_sentences/nl.txt @@ -0,0 +1,6 @@ +Een regenboog is een gekleurde cirkelboog die aan de hemel waargenomen kan worden als de, laagstaande, zon tegen een nevel van waterdruppeltjes aan schijnt en de zon zich achter de waarnemer bevindt. +Het is een optisch effect dat wordt veroorzaakt door de breking en weerspiegeling van licht in de waterdruppels. +Het middelpunt van de boog staat gezien vanuit de waarnemer lijnrecht tegenover de zon, en bevindt zich dus altijd onder de horizon. +Waarnemer en boog vormen samen een denkbeeldige kegel met de waarnemer op de punt van de kegel en de regenboog langs de boogrand van het grondvlak van de kegel. +De boog heeft binnen de kegel een halve tophoek van ongeveer 42 graden; de breedte van de kleurenband van rood tot violet is circa 2 graden. +Pa’s wijze lynx bezag vroom het fikse aquaduct. diff --git a/etc/test_sentences/no.txt b/etc/test_sentences/no.txt new file mode 100644 index 0000000..c6b34ee --- /dev/null +++ b/etc/test_sentences/no.txt @@ -0,0 +1,6 @@ +Regnbuen eller regnbogen er et optisk fenomen som oppstår når solen skinner gjennom regndråper i atmosfæren og betrakteren står med solen i ryggen. +Gulhvitt sollys består av alle synlige bølgelengder av lys. +Lysbrytningen er forskjellig avhengig av bølgelengden slik at sollyset spaltes til et spektrum av rødt ytterst og deretter oransje, gult, grønt, blått, indigo (blålilla) og fiolett. +En fullstendig regnbue har en tydelig hovedregnbue (primærbue) innerst og en svakere regnbue (sekundærbue) ytterst der fargene ligger i omvendt rekkefølge. +Vår sære Zulu fra badeøya spilte jo whist og quickstep i min taxi. +Høvdingens kjære squaw får litt pizza i Mexico by. diff --git a/etc/test_sentences/ru.txt b/etc/test_sentences/ru.txt index 6856f36..8f29717 100644 --- a/etc/test_sentences/ru.txt +++ b/etc/test_sentences/ru.txt @@ -1,4 +1,4 @@ -Ра́дуга, атмосферное, оптическое и метеорологическое явление, наблюдаемое при освещении ярким источником света множества водяных капель. +Радуга, атмосферное, оптическое и метеорологическое явление, наблюдаемое при освещении ярким источником света множества водяных капель. Радуга выглядит как разноцветная дуга или окружность, составленная из цветов спектра видимого излучения. Это те семь цветов, которые принято выделять в радуге в русской культуре, но следует иметь в виду, что на самом деле спектр непрерывен, и его цвета плавно переходят друг в друга через множество промежуточных оттенков. Широкая электрификация южных губерний даст мощный толчок подъёму сельского хозяйства. diff --git a/etc/test_sentences/test_nb.jsonl b/etc/test_sentences/test_nb.jsonl new file mode 100644 index 0000000..280b271 --- /dev/null +++ b/etc/test_sentences/test_nb.jsonl @@ -0,0 +1,6 @@ +{"phoneme_ids":[1,0,30,0,120,0,61,0,44,0,26,0,15,0,99,0,122,0,59,0,26,0,3,0,121,0,61,0,24,0,24,0,59,0,30,0,3,0,30,0,120,0,61,0,44,0,26,0,15,0,33,0,122,0,66,0,59,0,26,0,3,0,121,0,61,0,122,0,30,0,3,0,61,0,32,0,3,0,120,0,54,0,28,0,32,0,74,0,31,0,23,0,3,0,19,0,120,0,18,0,122,0,26,0,33,0,122,0,25,0,59,0,26,0,3,0,31,0,33,0,122,0,25,0,3,0,120,0,54,0,28,0,122,0,31,0,32,0,27,0,122,0,30,0,3,0,26,0,120,0,27,0,122,0,30,0,3,0,31,0,120,0,33,0,122,0,24,0,59,0,26,0,3,0,96,0,120,0,74,0,26,0,26,0,59,0,30,0,3,0,22,0,120,0,61,0,26,0,26,0,33,0,122,0,25,0,3,0,30,0,120,0,61,0,44,0,26,0,26,0,30,0,27,0,122,0,28,0,59,0,30,0,3,0,21,0,122,0,3,0,120,0,51,0,32,0,25,0,54,0,31,0,19,0,121,0,14,0,122,0,30,0,59,0,26,0,3,0,33,0,122,0,66,0,3,0,15,0,59,0,32,0,30,0,120,0,51,0,23,0,32,0,18,0,122,0,30,0,59,0,26,0,3,0,31,0,32,0,120,0,27,0,122,0,30,0,3,0,25,0,18,0,122,0,17,0,3,0,31,0,120,0,33,0,122,0,24,0,59,0,26,0,3,0,21,0,122,0,3,0,30,0,120,0,37,0,66,0,122,0,59,0,26,0,10,0,2],"phonemes":["r","ˈ","ɛ","ŋ","n","b","ʉ","ː","ə","n"," ","ˌ","ɛ","l","l","ə","r"," ","r","ˈ","ɛ","ŋ","n","b","u","ː","ɡ","ə","n"," ","ˌ","ɛ","ː","r"," ","ɛ","t"," ","ˈ","ɔ","p","t","ɪ","s","k"," ","f","ˈ","e","ː","n","u","ː","m","ə","n"," ","s","u","ː","m"," ","ˈ","ɔ","p","ː","s","t","o","ː","r"," ","n","ˈ","o","ː","r"," ","s","ˈ","u","ː","l","ə","n"," ","ʃ","ˈ","ɪ","n","n","ə","r"," ","j","ˈ","ɛ","n","n","u","ː","m"," ","r","ˈ","ɛ","ŋ","n","n","r","o","ː","p","ə","r"," ","i","ː"," ","ˈ","ɑ","t","m","ɔ","s","f","ˌ","a","ː","r","ə","n"," ","u","ː","ɡ"," ","b","ə","t","r","ˈ","ɑ","k","t","e","ː","r","ə","n"," ","s","t","ˈ","o","ː","r"," ","m","e","ː","d"," ","s","ˈ","u","ː","l","ə","n"," ","i","ː"," ","r","ˈ","y","ɡ","ː","ə","n","."],"processed_text":"Regnbuen eller regnbogen er et optisk fenomen som oppstår når solen skinner gjennom regndråper i atmosfæren og betrakteren står med solen i ryggen.","text":"Regnbuen eller regnbogen er et optisk fenomen som oppstår når solen skinner gjennom regndråper i atmosfæren og betrakteren står med solen i ryggen."} +{"phoneme_ids":[1,0,66,0,120,0,99,0,24,0,34,0,74,0,32,0,122,0,3,0,31,0,120,0,54,0,24,0,24,0,37,0,122,0,31,0,3,0,15,0,59,0,31,0,32,0,120,0,27,0,122,0,30,0,3,0,14,0,34,0,3,0,120,0,51,0,24,0,24,0,14,0,3,0,31,0,120,0,37,0,26,0,24,0,21,0,122,0,66,0,14,0,3,0,15,0,120,0,45,0,24,0,66,0,18,0,122,0,24,0,121,0,61,0,44,0,17,0,59,0,30,0,3,0,14,0,34,0,3,0,24,0,120,0,37,0,122,0,31,0,10,0,2],"phonemes":["ɡ","ˈ","ʉ","l","v","ɪ","t","ː"," ","s","ˈ","ɔ","l","l","y","ː","s"," ","b","ə","s","t","ˈ","o","ː","r"," ","a","v"," ","ˈ","ɑ","l","l","a"," ","s","ˈ","y","n","l","i","ː","ɡ","a"," ","b","ˈ","œ","l","ɡ","e","ː","l","ˌ","ɛ","ŋ","d","ə","r"," ","a","v"," ","l","ˈ","y","ː","s","."],"processed_text":"Gulhvitt sollys består av alle synlige bølgelengder av lys.","text":"Gulhvitt sollys består av alle synlige bølgelengder av lys."} +{"phoneme_ids":[1,0,24,0,120,0,37,0,31,0,15,0,30,0,37,0,32,0,26,0,121,0,74,0,44,0,59,0,26,0,3,0,121,0,61,0,122,0,30,0,3,0,19,0,120,0,54,0,30,0,96,0,59,0,24,0,24,0,121,0,74,0,3,0,120,0,51,0,34,0,20,0,59,0,44,0,121,0,74,0,3,0,14,0,34,0,3,0,15,0,120,0,45,0,24,0,66,0,18,0,122,0,24,0,121,0,61,0,44,0,17,0,59,0,26,0,3,0,96,0,24,0,120,0,21,0,122,0,23,0,3,0,14,0,32,0,3,0,31,0,120,0,54,0,24,0,24,0,37,0,122,0,31,0,59,0,32,0,3,0,31,0,28,0,120,0,51,0,24,0,32,0,59,0,31,0,3,0,32,0,21,0,122,0,24,0,3,0,61,0,32,0,3,0,31,0,28,0,120,0,61,0,23,0,32,0,30,0,99,0,122,0,25,0,3,0,14,0,34,0,3,0,30,0,120,0,45,0,17,0,32,0,3,0,120,0,37,0,32,0,122,0,14,0,30,0,96,0,32,0,3,0,33,0,122,0,66,0,3,0,17,0,120,0,18,0,122,0,30,0,61,0,32,0,122,0,59,0,30,0,3,0,120,0,33,0,122,0,30,0,51,0,26,0,96,0,14,0,8,0,66,0,120,0,99,0,24,0,32,0,8,0,66,0,30,0,120,0,45,0,26,0,32,0,8,0,15,0,24,0,120,0,54,0,32,0,122,0,8,0,120,0,74,0,26,0,26,0,21,0,122,0,66,0,121,0,33,0,122,0,3,0,15,0,24,0,120,0,27,0,122,0,24,0,74,0,24,0,24,0,121,0,51,0,3,0,33,0,122,0,66,0,3,0,19,0,120,0,21,0,122,0,33,0,122,0,24,0,121,0,61,0,32,0,122,0,10,0,2],"phonemes":["l","ˈ","y","s","b","r","y","t","n","ˌ","ɪ","ŋ","ə","n"," ","ˌ","ɛ","ː","r"," ","f","ˈ","ɔ","r","ʃ","ə","l","l","ˌ","ɪ"," ","ˈ","ɑ","v","h","ə","ŋ","ˌ","ɪ"," ","a","v"," ","b","ˈ","œ","l","ɡ","e","ː","l","ˌ","ɛ","ŋ","d","ə","n"," ","ʃ","l","ˈ","i","ː","k"," ","a","t"," ","s","ˈ","ɔ","l","l","y","ː","s","ə","t"," ","s","p","ˈ","ɑ","l","t","ə","s"," ","t","i","ː","l"," ","ɛ","t"," ","s","p","ˈ","ɛ","k","t","r","ʉ","ː","m"," ","a","v"," ","r","ˈ","œ","d","t"," ","ˈ","y","t","ː","a","r","ʃ","t"," ","u","ː","ɡ"," ","d","ˈ","e","ː","r","ɛ","t","ː","ə","r"," ","ˈ","u","ː","r","ɑ","n","ʃ","a",",","ɡ","ˈ","ʉ","l","t",",","ɡ","r","ˈ","œ","n","t",",","b","l","ˈ","ɔ","t","ː",",","ˈ","ɪ","n","n","i","ː","ɡ","ˌ","u","ː"," ","b","l","ˈ","o","ː","l","ɪ","l","l","ˌ","ɑ"," ","u","ː","ɡ"," ","f","ˈ","i","ː","u","ː","l","ˌ","ɛ","t","ː","."],"processed_text":"Lysbrytningen er forskjellig avhengig av bølgelengden slik at sollyset spaltes til et spektrum av rødt ytterst og deretter oransje, gult, grønt, blått, indigo (blålilla) og fiolett.","text":"Lysbrytningen er forskjellig avhengig av bølgelengden slik at sollyset spaltes til et spektrum av rødt ytterst og deretter oransje, gult, grønt, blått, indigo (blålilla) og fiolett."} +{"phoneme_ids":[1,0,18,0,122,0,26,0,3,0,19,0,120,0,99,0,24,0,31,0,32,0,59,0,26,0,26,0,121,0,74,0,3,0,30,0,120,0,61,0,44,0,26,0,15,0,99,0,122,0,14,0,3,0,20,0,14,0,30,0,3,0,18,0,122,0,26,0,3,0,32,0,120,0,37,0,122,0,17,0,18,0,122,0,24,0,121,0,74,0,3,0,20,0,120,0,33,0,122,0,34,0,59,0,17,0,30,0,121,0,61,0,44,0,26,0,15,0,99,0,122,0,14,0,3,0,28,0,30,0,120,0,21,0,122,0,25,0,14,0,30,0,15,0,121,0,99,0,122,0,14,0,3,0,120,0,74,0,26,0,26,0,14,0,30,0,96,0,32,0,3,0,33,0,122,0,66,0,3,0,18,0,122,0,26,0,3,0,31,0,34,0,120,0,14,0,23,0,18,0,122,0,30,0,14,0,3,0,30,0,120,0,61,0,44,0,26,0,15,0,99,0,122,0,14,0,3,0,31,0,120,0,18,0,122,0,23,0,99,0,26,0,26,0,121,0,14,0,30,0,15,0,99,0,122,0,14,0,3,0,120,0,37,0,32,0,122,0,14,0,30,0,96,0,32,0,3,0,17,0,120,0,61,0,122,0,30,0,3,0,19,0,120,0,51,0,30,0,66,0,61,0,26,0,14,0,3,0,24,0,120,0,74,0,66,0,122,0,59,0,30,0,3,0,21,0,122,0,3,0,120,0,54,0,25,0,34,0,61,0,26,0,26,0,32,0,3,0,30,0,120,0,61,0,23,0,122,0,18,0,122,0,19,0,121,0,45,0,24,0,66,0,14,0,10,0,2],"phonemes":["e","ː","n"," ","f","ˈ","ʉ","l","s","t","ə","n","n","ˌ","ɪ"," ","r","ˈ","ɛ","ŋ","n","b","ʉ","ː","a"," ","h","a","r"," ","e","ː","n"," ","t","ˈ","y","ː","d","e","ː","l","ˌ","ɪ"," ","h","ˈ","u","ː","v","ə","d","r","ˌ","ɛ","ŋ","n","b","ʉ","ː","a"," ","p","r","ˈ","i","ː","m","a","r","b","ˌ","ʉ","ː","a"," ","ˈ","ɪ","n","n","a","r","ʃ","t"," ","u","ː","ɡ"," ","e","ː","n"," ","s","v","ˈ","a","k","e","ː","r","a"," ","r","ˈ","ɛ","ŋ","n","b","ʉ","ː","a"," ","s","ˈ","e","ː","k","ʉ","n","n","ˌ","a","r","b","ʉ","ː","a"," ","ˈ","y","t","ː","a","r","ʃ","t"," ","d","ˈ","ɛ","ː","r"," ","f","ˈ","ɑ","r","ɡ","ɛ","n","a"," ","l","ˈ","ɪ","ɡ","ː","ə","r"," ","i","ː"," ","ˈ","ɔ","m","v","ɛ","n","n","t"," ","r","ˈ","ɛ","k","ː","e","ː","f","ˌ","œ","l","ɡ","a","."],"processed_text":"En fullstendig regnbue har en tydelig hovedregnbue (primærbue) innerst og en svakere regnbue (sekundærbue) ytterst der fargene ligger i omvendt rekkefølge.","text":"En fullstendig regnbue har en tydelig hovedregnbue (primærbue) innerst og en svakere regnbue (sekundærbue) ytterst der fargene ligger i omvendt rekkefølge."} +{"phoneme_ids":[1,0,34,0,27,0,122,0,30,0,3,0,31,0,120,0,14,0,122,0,30,0,14,0,3,0,31,0,120,0,99,0,122,0,24,0,99,0,122,0,3,0,19,0,30,0,51,0,3,0,15,0,120,0,14,0,17,0,18,0,122,0,121,0,42,0,37,0,51,0,3,0,31,0,28,0,120,0,74,0,24,0,32,0,14,0,3,0,22,0,120,0,33,0,122,0,3,0,34,0,20,0,120,0,74,0,31,0,32,0,3,0,33,0,122,0,66,0,3,0,23,0,35,0,120,0,74,0,23,0,23,0,31,0,32,0,59,0,28,0,3,0,21,0,122,0,3,0,25,0,21,0,122,0,26,0,3,0,32,0,120,0,14,0,23,0,31,0,21,0,122,0,10,0,2],"phonemes":["v","o","ː","r"," ","s","ˈ","a","ː","r","a"," ","s","ˈ","ʉ","ː","l","ʉ","ː"," ","f","r","ɑ"," ","b","ˈ","a","d","e","ː","ˌ","ø","y","ɑ"," ","s","p","ˈ","ɪ","l","t","a"," ","j","ˈ","u","ː"," ","v","h","ˈ","ɪ","s","t"," ","u","ː","ɡ"," ","k","w","ˈ","ɪ","k","k","s","t","ə","p"," ","i","ː"," ","m","i","ː","n"," ","t","ˈ","a","k","s","i","ː","."],"processed_text":"Vår sære Zulu fra badeøya spilte jo whist og quickstep i min taxi.","text":"Vår sære Zulu fra badeøya spilte jo whist og quickstep i min taxi."} +{"phoneme_ids":[1,0,20,0,120,0,45,0,34,0,17,0,74,0,44,0,59,0,26,0,31,0,3,0,36,0,120,0,14,0,122,0,30,0,14,0,3,0,31,0,23,0,35,0,120,0,14,0,34,0,3,0,19,0,120,0,27,0,122,0,30,0,3,0,24,0,120,0,74,0,32,0,122,0,3,0,28,0,120,0,74,0,38,0,51,0,3,0,21,0,122,0,3,0,25,0,120,0,18,0,122,0,23,0,31,0,21,0,122,0,23,0,121,0,33,0,122,0,3,0,15,0,120,0,37,0,122,0,10,0,2],"phonemes":["h","ˈ","œ","v","d","ɪ","ŋ","ə","n","s"," ","x","ˈ","a","ː","r","a"," ","s","k","w","ˈ","a","v"," ","f","ˈ","o","ː","r"," ","l","ˈ","ɪ","t","ː"," ","p","ˈ","ɪ","z","ɑ"," ","i","ː"," ","m","ˈ","e","ː","k","s","i","ː","k","ˌ","u","ː"," ","b","ˈ","y","ː","."],"processed_text":"Høvdingens kjære squaw får litt pizza i Mexico by.","text":"Høvdingens kjære squaw får litt pizza i Mexico by."} diff --git a/etc/test_sentences/test_nl.jsonl b/etc/test_sentences/test_nl.jsonl new file mode 100644 index 0000000..91a6f42 --- /dev/null +++ b/etc/test_sentences/test_nl.jsonl @@ -0,0 +1,6 @@ +{"phoneme_ids":[1,0,59,0,26,0,3,0,30,0,121,0,18,0,122,0,68,0,59,0,26,0,15,0,120,0,27,0,122,0,36,0,3,0,74,0,31,0,3,0,59,0,26,0,3,0,68,0,120,0,61,0,23,0,24,0,42,0,122,0,30,0,17,0,59,0,3,0,31,0,121,0,74,0,30,0,23,0,61,0,24,0,15,0,120,0,27,0,122,0,36,0,3,0,17,0,21,0,3,0,14,0,122,0,26,0,3,0,17,0,59,0,3,0,20,0,120,0,18,0,122,0,25,0,59,0,24,0,3,0,101,0,121,0,14,0,122,0,30,0,68,0,59,0,26,0,120,0,27,0,122,0,25,0,59,0,26,0,3,0,23,0,51,0,26,0,3,0,101,0,121,0,54,0,30,0,17,0,59,0,26,0,3,0,51,0,24,0,31,0,3,0,17,0,59,0,8,0,24,0,120,0,14,0,122,0,36,0,31,0,32,0,14,0,122,0,26,0,17,0,59,0,8,0,38,0,120,0,54,0,26,0,3,0,32,0,120,0,18,0,122,0,68,0,59,0,26,0,3,0,59,0,26,0,3,0,26,0,120,0,18,0,122,0,34,0,59,0,24,0,3,0,34,0,51,0,26,0,3,0,101,0,120,0,14,0,122,0,32,0,59,0,30,0,17,0,30,0,121,0,85,0,28,0,61,0,24,0,32,0,119,0,59,0,31,0,3,0,14,0,122,0,26,0,3,0,31,0,36,0,120,0,61,0,74,0,26,0,32,0,3,0,61,0,26,0,3,0,17,0,59,0,3,0,38,0,120,0,54,0,26,0,3,0,38,0,74,0,36,0,3,0,120,0,51,0,36,0,32,0,59,0,30,0,3,0,17,0,59,0,3,0,101,0,120,0,14,0,122,0,30,0,26,0,18,0,122,0,25,0,59,0,30,0,3,0,15,0,59,0,34,0,120,0,74,0,26,0,32,0,10,0,2],"phonemes":["ə","n"," ","r","ˌ","e","ː","ɣ","ə","n","b","ˈ","o","ː","x"," ","ɪ","s"," ","ə","n"," ","ɣ","ˈ","ɛ","k","l","ø","ː","r","d","ə"," ","s","ˌ","ɪ","r","k","ɛ","l","b","ˈ","o","ː","x"," ","d","i"," ","a","ː","n"," ","d","ə"," ","h","ˈ","e","ː","m","ə","l"," ","ʋ","ˌ","a","ː","r","ɣ","ə","n","ˈ","o","ː","m","ə","n"," ","k","ɑ","n"," ","ʋ","ˌ","ɔ","r","d","ə","n"," ","ɑ","l","s"," ","d","ə",",","l","ˈ","a","ː","x","s","t","a","ː","n","d","ə",",","z","ˈ","ɔ","n"," ","t","ˈ","e","ː","ɣ","ə","n"," ","ə","n"," ","n","ˈ","e","ː","v","ə","l"," ","v","ɑ","n"," ","ʋ","ˈ","a","ː","t","ə","r","d","r","ˌ","ɵ","p","ɛ","l","t","ʲ","ə","s"," ","a","ː","n"," ","s","x","ˈ","ɛ","ɪ","n","t"," ","ɛ","n"," ","d","ə"," ","z","ˈ","ɔ","n"," ","z","ɪ","x"," ","ˈ","ɑ","x","t","ə","r"," ","d","ə"," ","ʋ","ˈ","a","ː","r","n","e","ː","m","ə","r"," ","b","ə","v","ˈ","ɪ","n","t","."],"processed_text":"Een regenboog is een gekleurde cirkelboog die aan de hemel waargenomen kan worden als de, laagstaande, zon tegen een nevel van waterdruppeltjes aan schijnt en de zon zich achter de waarnemer bevindt.","text":"Een regenboog is een gekleurde cirkelboog die aan de hemel waargenomen kan worden als de, laagstaande, zon tegen een nevel van waterdruppeltjes aan schijnt en de zon zich achter de waarnemer bevindt."} +{"phoneme_ids":[1,0,20,0,59,0,32,0,3,0,74,0,31,0,3,0,59,0,26,0,3,0,120,0,54,0,28,0,32,0,21,0,31,0,3,0,120,0,61,0,19,0,61,0,23,0,32,0,3,0,17,0,51,0,32,0,3,0,101,0,54,0,30,0,32,0,3,0,34,0,59,0,30,0,120,0,54,0,122,0,30,0,38,0,14,0,122,0,23,0,32,0,3,0,17,0,27,0,122,0,30,0,3,0,17,0,59,0,3,0,15,0,30,0,120,0,18,0,122,0,23,0,74,0,44,0,3,0,61,0,26,0,3,0,101,0,120,0,74,0,122,0,30,0,31,0,28,0,121,0,21,0,68,0,59,0,24,0,121,0,74,0,44,0,3,0,34,0,51,0,26,0,3,0,24,0,120,0,74,0,36,0,32,0,3,0,74,0,26,0,3,0,17,0,59,0,3,0,101,0,120,0,14,0,122,0,32,0,59,0,30,0,17,0,30,0,121,0,85,0,28,0,59,0,24,0,31,0,10,0,2],"phonemes":["h","ə","t"," ","ɪ","s"," ","ə","n"," ","ˈ","ɔ","p","t","i","s"," ","ˈ","ɛ","f","ɛ","k","t"," ","d","ɑ","t"," ","ʋ","ɔ","r","t"," ","v","ə","r","ˈ","ɔ","ː","r","z","a","ː","k","t"," ","d","o","ː","r"," ","d","ə"," ","b","r","ˈ","e","ː","k","ɪ","ŋ"," ","ɛ","n"," ","ʋ","ˈ","ɪ","ː","r","s","p","ˌ","i","ɣ","ə","l","ˌ","ɪ","ŋ"," ","v","ɑ","n"," ","l","ˈ","ɪ","x","t"," ","ɪ","n"," ","d","ə"," ","ʋ","ˈ","a","ː","t","ə","r","d","r","ˌ","ɵ","p","ə","l","s","."],"processed_text":"Het is een optisch effect dat wordt veroorzaakt door de breking en weerspiegeling van licht in de waterdruppels.","text":"Het is een optisch effect dat wordt veroorzaakt door de breking en weerspiegeling van licht in de waterdruppels."} +{"phoneme_ids":[1,0,20,0,59,0,32,0,3,0,25,0,120,0,74,0,17,0,61,0,24,0,28,0,121,0,85,0,26,0,32,0,3,0,34,0,51,0,26,0,3,0,17,0,59,0,3,0,15,0,120,0,27,0,122,0,36,0,3,0,31,0,32,0,120,0,14,0,122,0,32,0,3,0,68,0,59,0,38,0,120,0,21,0,26,0,3,0,34,0,51,0,26,0,120,0,45,0,37,0,3,0,32,0,59,0,3,0,101,0,120,0,14,0,122,0,30,0,26,0,18,0,122,0,25,0,59,0,30,0,3,0,24,0,120,0,61,0,74,0,26,0,30,0,61,0,36,0,3,0,32,0,120,0,18,0,122,0,68,0,59,0,26,0,121,0,27,0,122,0,34,0,59,0,30,0,3,0,17,0,59,0,3,0,38,0,120,0,54,0,26,0,8,0,61,0,26,0,3,0,15,0,59,0,34,0,120,0,74,0,26,0,32,0,3,0,38,0,74,0,36,0,3,0,17,0,85,0,31,0,3,0,120,0,51,0,24,0,32,0,61,0,74,0,32,0,3,0,120,0,54,0,26,0,17,0,59,0,30,0,3,0,17,0,59,0,3,0,20,0,121,0,27,0,122,0,30,0,21,0,38,0,120,0,54,0,26,0,10,0,2],"phonemes":["h","ə","t"," ","m","ˈ","ɪ","d","ɛ","l","p","ˌ","ɵ","n","t"," ","v","ɑ","n"," ","d","ə"," ","b","ˈ","o","ː","x"," ","s","t","ˈ","a","ː","t"," ","ɣ","ə","z","ˈ","i","n"," ","v","ɑ","n","ˈ","œ","y"," ","t","ə"," ","ʋ","ˈ","a","ː","r","n","e","ː","m","ə","r"," ","l","ˈ","ɛ","ɪ","n","r","ɛ","x"," ","t","ˈ","e","ː","ɣ","ə","n","ˌ","o","ː","v","ə","r"," ","d","ə"," ","z","ˈ","ɔ","n",",","ɛ","n"," ","b","ə","v","ˈ","ɪ","n","t"," ","z","ɪ","x"," ","d","ɵ","s"," ","ˈ","ɑ","l","t","ɛ","ɪ","t"," ","ˈ","ɔ","n","d","ə","r"," ","d","ə"," ","h","ˌ","o","ː","r","i","z","ˈ","ɔ","n","."],"processed_text":"Het middelpunt van de boog staat gezien vanuit de waarnemer lijnrecht tegenover de zon, en bevindt zich dus altijd onder de horizon.","text":"Het middelpunt van de boog staat gezien vanuit de waarnemer lijnrecht tegenover de zon, en bevindt zich dus altijd onder de horizon."} +{"phoneme_ids":[1,0,101,0,120,0,14,0,122,0,30,0,26,0,18,0,122,0,25,0,59,0,30,0,3,0,61,0,26,0,3,0,15,0,120,0,27,0,122,0,36,0,3,0,34,0,120,0,54,0,30,0,25,0,59,0,26,0,3,0,31,0,120,0,14,0,122,0,25,0,59,0,26,0,3,0,59,0,26,0,3,0,17,0,61,0,44,0,23,0,15,0,120,0,18,0,122,0,24,0,17,0,59,0,68,0,59,0,3,0,23,0,120,0,18,0,122,0,68,0,59,0,24,0,3,0,25,0,61,0,3,0,32,0,59,0,3,0,101,0,120,0,14,0,122,0,30,0,26,0,18,0,122,0,25,0,59,0,30,0,3,0,54,0,28,0,3,0,17,0,59,0,3,0,28,0,120,0,85,0,26,0,32,0,3,0,34,0,51,0,26,0,3,0,17,0,59,0,3,0,23,0,120,0,18,0,122,0,68,0,59,0,24,0,3,0,61,0,26,0,3,0,17,0,59,0,3,0,30,0,121,0,18,0,122,0,68,0,59,0,26,0,15,0,120,0,27,0,122,0,36,0,3,0,24,0,120,0,51,0,44,0,31,0,3,0,17,0,59,0,3,0,15,0,120,0,27,0,122,0,68,0,30,0,51,0,26,0,32,0,3,0,34,0,51,0,26,0,3,0,20,0,59,0,32,0,3,0,68,0,30,0,120,0,54,0,26,0,17,0,34,0,24,0,51,0,23,0,3,0,34,0,51,0,26,0,3,0,17,0,59,0,3,0,23,0,120,0,18,0,122,0,68,0,59,0,24,0,10,0,2],"phonemes":["ʋ","ˈ","a","ː","r","n","e","ː","m","ə","r"," ","ɛ","n"," ","b","ˈ","o","ː","x"," ","v","ˈ","ɔ","r","m","ə","n"," ","s","ˈ","a","ː","m","ə","n"," ","ə","n"," ","d","ɛ","ŋ","k","b","ˈ","e","ː","l","d","ə","ɣ","ə"," ","k","ˈ","e","ː","ɣ","ə","l"," ","m","ɛ"," ","t","ə"," ","ʋ","ˈ","a","ː","r","n","e","ː","m","ə","r"," ","ɔ","p"," ","d","ə"," ","p","ˈ","ɵ","n","t"," ","v","ɑ","n"," ","d","ə"," ","k","ˈ","e","ː","ɣ","ə","l"," ","ɛ","n"," ","d","ə"," ","r","ˌ","e","ː","ɣ","ə","n","b","ˈ","o","ː","x"," ","l","ˈ","ɑ","ŋ","s"," ","d","ə"," ","b","ˈ","o","ː","ɣ","r","ɑ","n","t"," ","v","ɑ","n"," ","h","ə","t"," ","ɣ","r","ˈ","ɔ","n","d","v","l","ɑ","k"," ","v","ɑ","n"," ","d","ə"," ","k","ˈ","e","ː","ɣ","ə","l","."],"processed_text":"Waarnemer en boog vormen samen een denkbeeldige kegel met de waarnemer op de punt van de kegel en de regenboog langs de boogrand van het grondvlak van de kegel.","text":"Waarnemer en boog vormen samen een denkbeeldige kegel met de waarnemer op de punt van de kegel en de regenboog langs de boogrand van het grondvlak van de kegel."} +{"phoneme_ids":[1,0,17,0,59,0,3,0,15,0,120,0,27,0,122,0,36,0,3,0,20,0,18,0,122,0,19,0,32,0,3,0,15,0,120,0,74,0,26,0,59,0,26,0,3,0,17,0,59,0,3,0,23,0,120,0,18,0,122,0,68,0,59,0,24,0,3,0,59,0,26,0,3,0,20,0,120,0,51,0,24,0,34,0,59,0,3,0,32,0,54,0,28,0,20,0,120,0,33,0,23,0,3,0,34,0,51,0,26,0,3,0,121,0,54,0,26,0,68,0,59,0,34,0,120,0,74,0,122,0,30,0,3,0,32,0,101,0,120,0,18,0,122,0,61,0,26,0,19,0,121,0,74,0,122,0,30,0,32,0,59,0,36,0,3,0,68,0,30,0,120,0,14,0,122,0,17,0,59,0,26,0,12,0,17,0,59,0,3,0,15,0,30,0,120,0,18,0,122,0,32,0,59,0,3,0,34,0,51,0,26,0,3,0,17,0,59,0,3,0,23,0,24,0,120,0,42,0,122,0,30,0,59,0,26,0,15,0,121,0,51,0,26,0,32,0,3,0,34,0,51,0,26,0,3,0,30,0,120,0,27,0,122,0,17,0,3,0,32,0,54,0,32,0,3,0,34,0,121,0,21,0,27,0,122,0,24,0,120,0,61,0,32,0,3,0,74,0,3,0,31,0,120,0,74,0,30,0,23,0,14,0,122,0,3,0,32,0,101,0,120,0,18,0,122,0,3,0,68,0,30,0,120,0,14,0,122,0,17,0,59,0,26,0,10,0,2],"phonemes":["d","ə"," ","b","ˈ","o","ː","x"," ","h","e","ː","f","t"," ","b","ˈ","ɪ","n","ə","n"," ","d","ə"," ","k","ˈ","e","ː","ɣ","ə","l"," ","ə","n"," ","h","ˈ","ɑ","l","v","ə"," ","t","ɔ","p","h","ˈ","u","k"," ","v","ɑ","n"," ","ˌ","ɔ","n","ɣ","ə","v","ˈ","ɪ","ː","r"," ","t","ʋ","ˈ","e","ː","ɛ","n","f","ˌ","ɪ","ː","r","t","ə","x"," ","ɣ","r","ˈ","a","ː","d","ə","n",";","d","ə"," ","b","r","ˈ","e","ː","t","ə"," ","v","ɑ","n"," ","d","ə"," ","k","l","ˈ","ø","ː","r","ə","n","b","ˌ","ɑ","n","t"," ","v","ɑ","n"," ","r","ˈ","o","ː","d"," ","t","ɔ","t"," ","v","ˌ","i","o","ː","l","ˈ","ɛ","t"," ","ɪ"," ","s","ˈ","ɪ","r","k","a","ː"," ","t","ʋ","ˈ","e","ː"," ","ɣ","r","ˈ","a","ː","d","ə","n","."],"processed_text":"De boog heeft binnen de kegel een halve tophoek van ongeveer 42 graden; de breedte van de kleurenband van rood tot violet is circa 2 graden.","text":"De boog heeft binnen de kegel een halve tophoek van ongeveer 42 graden; de breedte van de kleurenband van rood tot violet is circa 2 graden."} +{"phoneme_ids":[1,0,28,0,120,0,14,0,122,0,31,0,3,0,101,0,120,0,61,0,74,0,38,0,59,0,3,0,24,0,120,0,74,0,26,0,23,0,31,0,3,0,15,0,59,0,38,0,120,0,51,0,36,0,3,0,34,0,30,0,120,0,27,0,122,0,25,0,3,0,20,0,59,0,32,0,3,0,19,0,120,0,74,0,23,0,31,0,59,0,3,0,120,0,14,0,122,0,23,0,34,0,14,0,122,0,17,0,121,0,85,0,23,0,32,0,10,0,2],"phonemes":["p","ˈ","a","ː","s"," ","ʋ","ˈ","ɛ","ɪ","z","ə"," ","l","ˈ","ɪ","n","k","s"," ","b","ə","z","ˈ","ɑ","x"," ","v","r","ˈ","o","ː","m"," ","h","ə","t"," ","f","ˈ","ɪ","k","s","ə"," ","ˈ","a","ː","k","v","a","ː","d","ˌ","ɵ","k","t","."],"processed_text":"Pa’s wijze lynx bezag vroom het fikse aquaduct.","text":"Pa’s wijze lynx bezag vroom het fikse aquaduct."} diff --git a/etc/test_sentences/test_ru.jsonl b/etc/test_sentences/test_ru.jsonl index 4ec4674..a9d47e3 100644 --- a/etc/test_sentences/test_ru.jsonl +++ b/etc/test_sentences/test_ru.jsonl @@ -1,6 +1,6 @@ -{"text": "Ра́дуга, атмосферное, оптическое и метеорологическое явление, наблюдаемое при освещении ярким источником света множества водяных капель.", "phonemes": ["r", "a", "d", "ˈ", "u", "ɡ", "a", ",", " ", "a", "t", "m", "ʌ", "s", "f", "ʲ", "ˈ", "e", "r", "n", "ʌ", "j", "ɪ", ",", " ", "ʌ", "p", "t", "ʲ", "ˈ", "i", "t", "ʃ", "ʲ", "i", "s", "k", "ʌ", "j", "ɪ", " ", "ˈ", "i", " ", "m", "ʲ", "i", "t", "ʲ", "i", "ʌ", "r", "ʌ", "ɭ", "ʌ", "ɡ", "ʲ", "ˈ", "i", "t", "ʃ", "ʲ", "i", "s", "k", "ʌ", "j", "ɪ", " ", "j", "a", "v", "ɭ", "ʲ", "ˈ", "e", "n", "ʲ", "i", "j", "ɪ", ",", " ", "n", "ʌ", "b", "ɭ", "ʲ", "u", "\"", "d", "ˈ", "ɑ", "j", "i", "m", "ʌ", "j", "ɪ", " ", "p", "r", "ʲ", "ˈ", "i", " ", "ʌ", "s", "v", "ʲ", "i", "ɕ", "ˈ", "e", "n", "ʲ", "i", "ɪ", " ", "ˈ", "j", "a", "r", "k", "ʲ", "i", "m", " ", "ɪ", "s", "t", "ˈ", "o", "t", "ʃ", "ʲ", "n", "ʲ", "i", "k", "ʌ", "m", " ", "s", "v", "ʲ", "ˈ", "e", "t", "a", " ", "m", "n", "ˈ", "o", "ʒ", "y", "s", "t", "v", "a", " ", "v", "ʌ", "d", "ʲ", "a", "n", "ˈ", "y", "x", " ", "k", "ˈ", "ɑ", "p", "ʲ", "i", "ɭ", "."], "phoneme_ids": [1, 0, 30, 0, 14, 0, 17, 0, 120, 0, 33, 0, 66, 0, 14, 0, 8, 0, 3, 0, 14, 0, 32, 0, 25, 0, 102, 0, 31, 0, 19, 0, 119, 0, 120, 0, 18, 0, 30, 0, 26, 0, 102, 0, 22, 0, 74, 0, 8, 0, 3, 0, 102, 0, 28, 0, 32, 0, 119, 0, 120, 0, 21, 0, 32, 0, 96, 0, 119, 0, 21, 0, 31, 0, 23, 0, 102, 0, 22, 0, 74, 0, 3, 0, 120, 0, 21, 0, 3, 0, 25, 0, 119, 0, 21, 0, 32, 0, 119, 0, 21, 0, 102, 0, 30, 0, 102, 0, 77, 0, 102, 0, 66, 0, 119, 0, 120, 0, 21, 0, 32, 0, 96, 0, 119, 0, 21, 0, 31, 0, 23, 0, 102, 0, 22, 0, 74, 0, 3, 0, 22, 0, 14, 0, 34, 0, 77, 0, 119, 0, 120, 0, 18, 0, 26, 0, 119, 0, 21, 0, 22, 0, 74, 0, 8, 0, 3, 0, 26, 0, 102, 0, 15, 0, 77, 0, 119, 0, 33, 0, 150, 0, 17, 0, 120, 0, 51, 0, 22, 0, 21, 0, 25, 0, 102, 0, 22, 0, 74, 0, 3, 0, 28, 0, 30, 0, 119, 0, 120, 0, 21, 0, 3, 0, 102, 0, 31, 0, 34, 0, 119, 0, 21, 0, 55, 0, 120, 0, 18, 0, 26, 0, 119, 0, 21, 0, 74, 0, 3, 0, 120, 0, 22, 0, 14, 0, 30, 0, 23, 0, 119, 0, 21, 0, 25, 0, 3, 0, 74, 0, 31, 0, 32, 0, 120, 0, 27, 0, 32, 0, 96, 0, 119, 0, 26, 0, 119, 0, 21, 0, 23, 0, 102, 0, 25, 0, 3, 0, 31, 0, 34, 0, 119, 0, 120, 0, 18, 0, 32, 0, 14, 0, 3, 0, 25, 0, 26, 0, 120, 0, 27, 0, 108, 0, 37, 0, 31, 0, 32, 0, 34, 0, 14, 0, 3, 0, 34, 0, 102, 0, 17, 0, 119, 0, 14, 0, 26, 0, 120, 0, 37, 0, 36, 0, 3, 0, 23, 0, 120, 0, 51, 0, 28, 0, 119, 0, 21, 0, 77, 0, 10, 0, 2]} -{"text": "Радуга выглядит как разноцветная дуга или окружность, составленная из цветов спектра видимого излучения.", "phonemes": ["r", "ˈ", "ɑ", "d", "u", "ɡ", "a", " ", "v", "ˈ", "y", "ɡ", "ɭ", "ʲ", "ʌ", "d", "ʲ", "i", "t", " ", "k", "ˈ", "ɑ", "k", " ", "r", "ʌ", "z", "n", "ʌ", "t", "s", "v", "ʲ", "ˈ", "e", "t", "n", "ʌ", "j", "a", " ", "d", "u", "ɡ", "ˈ", "ɑ", " ", "ˈ", "i", "ɭ", "ʲ", "ɪ", " ", "ʌ", "k", "r", "ˈ", "u", "ʒ", "n", "ʌ", "s", "t", "ʲ", ",", " ", "s", "ʌ", "s", "t", "ˈ", "ɑ", "v", "ɭ", "ʲ", "i", "n", "n", "ʌ", "j", "a", " ", "ˈ", "i", "s", " ", "t", "s", "v", "ʲ", "i", "t", "ˈ", "o", "f", " ", "s", "p", "ʲ", "ˈ", "e", "k", "t", "r", "a", " ", "v", "ʲ", "ˈ", "i", "d", "ʲ", "i", "m", "ʌ", "v", "ʌ", " ", "ɪ", "z", "ɭ", "u", "t", "ʃ", "ʲ", "ˈ", "e", "n", "ʲ", "i", "j", "a", "."], "phoneme_ids": [1, 0, 30, 0, 120, 0, 51, 0, 17, 0, 33, 0, 66, 0, 14, 0, 3, 0, 34, 0, 120, 0, 37, 0, 66, 0, 77, 0, 119, 0, 102, 0, 17, 0, 119, 0, 21, 0, 32, 0, 3, 0, 23, 0, 120, 0, 51, 0, 23, 0, 3, 0, 30, 0, 102, 0, 38, 0, 26, 0, 102, 0, 32, 0, 31, 0, 34, 0, 119, 0, 120, 0, 18, 0, 32, 0, 26, 0, 102, 0, 22, 0, 14, 0, 3, 0, 17, 0, 33, 0, 66, 0, 120, 0, 51, 0, 3, 0, 120, 0, 21, 0, 77, 0, 119, 0, 74, 0, 3, 0, 102, 0, 23, 0, 30, 0, 120, 0, 33, 0, 108, 0, 26, 0, 102, 0, 31, 0, 32, 0, 119, 0, 8, 0, 3, 0, 31, 0, 102, 0, 31, 0, 32, 0, 120, 0, 51, 0, 34, 0, 77, 0, 119, 0, 21, 0, 26, 0, 26, 0, 102, 0, 22, 0, 14, 0, 3, 0, 120, 0, 21, 0, 31, 0, 3, 0, 32, 0, 31, 0, 34, 0, 119, 0, 21, 0, 32, 0, 120, 0, 27, 0, 19, 0, 3, 0, 31, 0, 28, 0, 119, 0, 120, 0, 18, 0, 23, 0, 32, 0, 30, 0, 14, 0, 3, 0, 34, 0, 119, 0, 120, 0, 21, 0, 17, 0, 119, 0, 21, 0, 25, 0, 102, 0, 34, 0, 102, 0, 3, 0, 74, 0, 38, 0, 77, 0, 33, 0, 32, 0, 96, 0, 119, 0, 120, 0, 18, 0, 26, 0, 119, 0, 21, 0, 22, 0, 14, 0, 10, 0, 2]} -{"text": "Это те семь цветов, которые принято выделять в радуге в русской культуре, но следует иметь в виду, что на самом деле спектр непрерывен, и его цвета плавно переходят друг в друга через множество промежуточных оттенков.", "phonemes": ["ˈ", "ɛ", "t", "ʌ", " ", "t", "ʲ", "ˈ", "e", " ", "s", "ʲ", "ˈ", "e", "m", "ʲ", " ", "t", "s", "v", "ʲ", "i", "t", "ˈ", "o", "f", ",", " ", "k", "ʌ", "t", "ˈ", "o", "r", "y", "j", "ɪ", " ", "p", "r", "ʲ", "ˈ", "i", "n", "ʲ", "ʌ", "t", "ʌ", " ", "v", "y", "d", "ʲ", "i", "ɭ", "ʲ", "ˈ", "ɑ", "t", "ʲ", " ", "v", " ", "r", "ˈ", "ɑ", "d", "u", "ɡ", "ʲ", "i", " ", "v", " ", "r", "ˈ", "u", "s", "s", "k", "ʌ", "j", " ", "k", "u", "ɭ", "t", "ˈ", "u", "r", "ʲ", "i", ",", " ", "n", "o", " ", "s", "ɭ", "ʲ", "ˈ", "e", "d", "u", "j", "i", "t", " ", "ɪ", "m", "ʲ", "ˈ", "e", "t", "ʲ", " ", "v", " ", "v", "ʲ", "ˈ", "i", "d", "u", ",", " ", "ʃ", "t", "o", " ", "n", "ə", " ", "s", "ˈ", "ɑ", "m", "ʌ", "m", " ", "d", "ʲ", "ˈ", "e", "ɭ", "ʲ", "i", " ", "s", "p", "ʲ", "ˈ", "e", "k", "t", "r", " ", "n", "ʲ", "i", "p", "r", "ʲ", "i", "r", "ˈ", "y", "v", "ʲ", "i", "n", ",", " ", "ˈ", "i", " ", "j", "ɪ", "v", "ˈ", "o", " ", "t", "s", "v", "ʲ", "ˈ", "e", "t", "a", " ", "p", "ɭ", "ˈ", "ɑ", "v", "n", "ʌ", " ", "p", "ʲ", "i", "r", "ʲ", "i", "x", "ˈ", "o", "d", "ʲ", "ʌ", "t", " ", "d", "r", "ˈ", "u", "k", " ", "v", " ", "d", "r", "ˈ", "u", "ɡ", "a", " ", "t", "ʃ", "ʲ", "ˈ", "e", "r", "ʲ", "i", "s", " ", "m", "n", "ˈ", "o", "ʒ", "y", "s", "t", "v", "ʌ", " ", "p", "r", "ʌ", "m", "ʲ", "i", "ʒ", "ˈ", "u", "t", "ʌ", "t", "ʃ", "ʲ", "n", "y", "x", " ", "ʌ", "t", "ʲ", "t", "ʲ", "ˈ", "e", "n", "k", "ʌ", "f", "."], "phoneme_ids": [1, 0, 120, 0, 61, 0, 32, 0, 102, 0, 3, 0, 32, 0, 119, 0, 120, 0, 18, 0, 3, 0, 31, 0, 119, 0, 120, 0, 18, 0, 25, 0, 119, 0, 3, 0, 32, 0, 31, 0, 34, 0, 119, 0, 21, 0, 32, 0, 120, 0, 27, 0, 19, 0, 8, 0, 3, 0, 23, 0, 102, 0, 32, 0, 120, 0, 27, 0, 30, 0, 37, 0, 22, 0, 74, 0, 3, 0, 28, 0, 30, 0, 119, 0, 120, 0, 21, 0, 26, 0, 119, 0, 102, 0, 32, 0, 102, 0, 3, 0, 34, 0, 37, 0, 17, 0, 119, 0, 21, 0, 77, 0, 119, 0, 120, 0, 51, 0, 32, 0, 119, 0, 3, 0, 34, 0, 3, 0, 30, 0, 120, 0, 51, 0, 17, 0, 33, 0, 66, 0, 119, 0, 21, 0, 3, 0, 34, 0, 3, 0, 30, 0, 120, 0, 33, 0, 31, 0, 31, 0, 23, 0, 102, 0, 22, 0, 3, 0, 23, 0, 33, 0, 77, 0, 32, 0, 120, 0, 33, 0, 30, 0, 119, 0, 21, 0, 8, 0, 3, 0, 26, 0, 27, 0, 3, 0, 31, 0, 77, 0, 119, 0, 120, 0, 18, 0, 17, 0, 33, 0, 22, 0, 21, 0, 32, 0, 3, 0, 74, 0, 25, 0, 119, 0, 120, 0, 18, 0, 32, 0, 119, 0, 3, 0, 34, 0, 3, 0, 34, 0, 119, 0, 120, 0, 21, 0, 17, 0, 33, 0, 8, 0, 3, 0, 96, 0, 32, 0, 27, 0, 3, 0, 26, 0, 59, 0, 3, 0, 31, 0, 120, 0, 51, 0, 25, 0, 102, 0, 25, 0, 3, 0, 17, 0, 119, 0, 120, 0, 18, 0, 77, 0, 119, 0, 21, 0, 3, 0, 31, 0, 28, 0, 119, 0, 120, 0, 18, 0, 23, 0, 32, 0, 30, 0, 3, 0, 26, 0, 119, 0, 21, 0, 28, 0, 30, 0, 119, 0, 21, 0, 30, 0, 120, 0, 37, 0, 34, 0, 119, 0, 21, 0, 26, 0, 8, 0, 3, 0, 120, 0, 21, 0, 3, 0, 22, 0, 74, 0, 34, 0, 120, 0, 27, 0, 3, 0, 32, 0, 31, 0, 34, 0, 119, 0, 120, 0, 18, 0, 32, 0, 14, 0, 3, 0, 28, 0, 77, 0, 120, 0, 51, 0, 34, 0, 26, 0, 102, 0, 3, 0, 28, 0, 119, 0, 21, 0, 30, 0, 119, 0, 21, 0, 36, 0, 120, 0, 27, 0, 17, 0, 119, 0, 102, 0, 32, 0, 3, 0, 17, 0, 30, 0, 120, 0, 33, 0, 23, 0, 3, 0, 34, 0, 3, 0, 17, 0, 30, 0, 120, 0, 33, 0, 66, 0, 14, 0, 3, 0, 32, 0, 96, 0, 119, 0, 120, 0, 18, 0, 30, 0, 119, 0, 21, 0, 31, 0, 3, 0, 25, 0, 26, 0, 120, 0, 27, 0, 108, 0, 37, 0, 31, 0, 32, 0, 34, 0, 102, 0, 3, 0, 28, 0, 30, 0, 102, 0, 25, 0, 119, 0, 21, 0, 108, 0, 120, 0, 33, 0, 32, 0, 102, 0, 32, 0, 96, 0, 119, 0, 26, 0, 37, 0, 36, 0, 3, 0, 102, 0, 32, 0, 119, 0, 32, 0, 119, 0, 120, 0, 18, 0, 26, 0, 23, 0, 102, 0, 19, 0, 10, 0, 2]} -{"text": "Широкая электрификация южных губерний даст мощный толчок подъёму сельского хозяйства.", "phonemes": ["ʃ", "y", "r", "ˈ", "o", "k", "ʌ", "j", "a", " ", "ɛ", "ɭ", "ʲ", "i", "k", "t", "r", "ʲ", "i", "f", "ʲ", "i", "k", "ˈ", "ɑ", "t", "s", "y", "j", "a", " ", "ˈ", "j", "u", "ʒ", "n", "y", "x", " ", "ɡ", "u", "b", "ʲ", "ˈ", "e", "r", "n", "ʲ", "i", "j", " ", "d", "ˈ", "ɑ", "s", "t", " ", "m", "ˈ", "o", "ɕ", "n", "y", "j", " ", "t", "ʌ", "ɭ", "t", "ʃ", "ʲ", "ˈ", "o", "k", " ", "p", "ʌ", "d", "j", "ˈ", "ɵ", "m", "u", " ", "s", "ʲ", "ˈ", "e", "ɭ", "s", "k", "ʌ", "v", "ʌ", " ", "x", "ʌ", "ʑ", "ˈ", "ɑ", "j", "s", "t", "v", "a", "."], "phoneme_ids": [1, 0, 96, 0, 37, 0, 30, 0, 120, 0, 27, 0, 23, 0, 102, 0, 22, 0, 14, 0, 3, 0, 61, 0, 77, 0, 119, 0, 21, 0, 23, 0, 32, 0, 30, 0, 119, 0, 21, 0, 19, 0, 119, 0, 21, 0, 23, 0, 120, 0, 51, 0, 32, 0, 31, 0, 37, 0, 22, 0, 14, 0, 3, 0, 120, 0, 22, 0, 33, 0, 108, 0, 26, 0, 37, 0, 36, 0, 3, 0, 66, 0, 33, 0, 15, 0, 119, 0, 120, 0, 18, 0, 30, 0, 26, 0, 119, 0, 21, 0, 22, 0, 3, 0, 17, 0, 120, 0, 51, 0, 31, 0, 32, 0, 3, 0, 25, 0, 120, 0, 27, 0, 55, 0, 26, 0, 37, 0, 22, 0, 3, 0, 32, 0, 102, 0, 77, 0, 32, 0, 96, 0, 119, 0, 120, 0, 27, 0, 23, 0, 3, 0, 28, 0, 102, 0, 17, 0, 22, 0, 120, 0, 85, 0, 25, 0, 33, 0, 3, 0, 31, 0, 119, 0, 120, 0, 18, 0, 77, 0, 31, 0, 23, 0, 102, 0, 34, 0, 102, 0, 3, 0, 36, 0, 102, 0, 107, 0, 120, 0, 51, 0, 22, 0, 31, 0, 32, 0, 34, 0, 14, 0, 10, 0, 2]} -{"text": "Разъяренный чтец эгоистично бьёт пятью жердями шустрого фехтовальщика.", "phonemes": ["r", "ʌ", "z", "j", "j", "a", "r", "ʲ", "ˈ", "e", "n", "n", "y", "j", " ", "t", "ʃ", "ʲ", "t", "ʲ", "ˈ", "e", "t", "s", " ", "ɛ", "ɡ", "ʌ", "i", "s", "ʲ", "t", "ʲ", "ˈ", "i", "t", "ʃ", "ʲ", "n", "ʌ", " ", "b", "j", "ˈ", "ɵ", "t", " ", "p", "ʲ", "ˈ", "ɑ", "t", "ʲ", "j", "j", "u", " ", "ʒ", "y", "r", "d", "ʲ", "ˈ", "ɑ", "m", "ʲ", "ɪ", " ", "ʃ", "ˈ", "u", "s", "t", "r", "ʌ", "v", "ʌ", " ", "f", "ʲ", "i", "x", "t", "ʌ", "v", "ˈ", "ɑ", "ɭ", "ɕ", "i", "k", "a", "."], "phoneme_ids": [1, 0, 30, 0, 102, 0, 38, 0, 22, 0, 22, 0, 14, 0, 30, 0, 119, 0, 120, 0, 18, 0, 26, 0, 26, 0, 37, 0, 22, 0, 3, 0, 32, 0, 96, 0, 119, 0, 32, 0, 119, 0, 120, 0, 18, 0, 32, 0, 31, 0, 3, 0, 61, 0, 66, 0, 102, 0, 21, 0, 31, 0, 119, 0, 32, 0, 119, 0, 120, 0, 21, 0, 32, 0, 96, 0, 119, 0, 26, 0, 102, 0, 3, 0, 15, 0, 22, 0, 120, 0, 85, 0, 32, 0, 3, 0, 28, 0, 119, 0, 120, 0, 51, 0, 32, 0, 119, 0, 22, 0, 22, 0, 33, 0, 3, 0, 108, 0, 37, 0, 30, 0, 17, 0, 119, 0, 120, 0, 51, 0, 25, 0, 119, 0, 74, 0, 3, 0, 96, 0, 120, 0, 33, 0, 31, 0, 32, 0, 30, 0, 102, 0, 34, 0, 102, 0, 3, 0, 19, 0, 119, 0, 21, 0, 36, 0, 32, 0, 102, 0, 34, 0, 120, 0, 51, 0, 77, 0, 55, 0, 21, 0, 23, 0, 14, 0, 10, 0, 2]} -{"text": "В чащах юга жил бы цитрус? Да, но фальшивый экземпляр!", "phonemes": ["f", " ", "t", "ʃ", "ʲ", "ˈ", "ɑ", "ɕ", "ʌ", "x", " ", "ˈ", "j", "u", "ɡ", "a", " ", "ʒ", "ˈ", "y", "ɭ", " ", "b", "ˈ", "y", " ", "t", "s", "ˈ", "y", "t", "r", "u", "s", "?", " ", "d", "ˈ", "ɑ", ",", " ", "n", "o", " ", "f", "a", "ɭ", "ʃ", "ˈ", "y", "v", "y", "j", " ", "ɛ", "ɡ", "ʑ", "i", "m", "p", "ɭ", "ʲ", "ˈ", "ɑ", "r", "!"], "phoneme_ids": [1, 0, 19, 0, 3, 0, 32, 0, 96, 0, 119, 0, 120, 0, 51, 0, 55, 0, 102, 0, 36, 0, 3, 0, 120, 0, 22, 0, 33, 0, 66, 0, 14, 0, 3, 0, 108, 0, 120, 0, 37, 0, 77, 0, 3, 0, 15, 0, 120, 0, 37, 0, 3, 0, 32, 0, 31, 0, 120, 0, 37, 0, 32, 0, 30, 0, 33, 0, 31, 0, 13, 0, 3, 0, 17, 0, 120, 0, 51, 0, 8, 0, 3, 0, 26, 0, 27, 0, 3, 0, 19, 0, 14, 0, 77, 0, 96, 0, 120, 0, 37, 0, 34, 0, 37, 0, 22, 0, 3, 0, 61, 0, 66, 0, 107, 0, 21, 0, 25, 0, 28, 0, 77, 0, 119, 0, 120, 0, 51, 0, 30, 0, 4, 0, 2]} +{"phoneme_ids":[1,0,30,0,120,0,51,0,17,0,33,0,66,0,14,0,8,0,14,0,32,0,25,0,102,0,31,0,19,0,119,0,120,0,18,0,30,0,26,0,102,0,22,0,74,0,8,0,102,0,28,0,32,0,119,0,120,0,21,0,32,0,96,0,119,0,21,0,31,0,23,0,102,0,22,0,74,0,3,0,74,0,3,0,25,0,119,0,21,0,32,0,119,0,21,0,102,0,30,0,102,0,77,0,102,0,66,0,119,0,120,0,21,0,32,0,96,0,119,0,21,0,31,0,23,0,102,0,22,0,74,0,3,0,22,0,14,0,34,0,77,0,119,0,120,0,18,0,26,0,119,0,21,0,22,0,74,0,8,0,26,0,102,0,15,0,77,0,119,0,33,0,150,0,17,0,120,0,51,0,22,0,21,0,25,0,102,0,22,0,74,0,3,0,28,0,30,0,119,0,74,0,3,0,102,0,31,0,34,0,119,0,21,0,55,0,120,0,18,0,26,0,119,0,21,0,74,0,3,0,120,0,22,0,14,0,30,0,23,0,119,0,21,0,25,0,3,0,74,0,31,0,32,0,120,0,27,0,32,0,96,0,119,0,26,0,119,0,21,0,23,0,102,0,25,0,3,0,31,0,34,0,119,0,120,0,18,0,32,0,14,0,3,0,25,0,26,0,120,0,27,0,108,0,37,0,31,0,32,0,34,0,14,0,3,0,34,0,102,0,17,0,119,0,14,0,26,0,120,0,37,0,36,0,3,0,23,0,120,0,51,0,28,0,119,0,21,0,77,0,10,0,2],"phonemes":["r","ˈ","ɑ","d","u","ɡ","a",",","a","t","m","ʌ","s","f","ʲ","ˈ","e","r","n","ʌ","j","ɪ",",","ʌ","p","t","ʲ","ˈ","i","t","ʃ","ʲ","i","s","k","ʌ","j","ɪ"," ","ɪ"," ","m","ʲ","i","t","ʲ","i","ʌ","r","ʌ","ɭ","ʌ","ɡ","ʲ","ˈ","i","t","ʃ","ʲ","i","s","k","ʌ","j","ɪ"," ","j","a","v","ɭ","ʲ","ˈ","e","n","ʲ","i","j","ɪ",",","n","ʌ","b","ɭ","ʲ","u","\"","d","ˈ","ɑ","j","i","m","ʌ","j","ɪ"," ","p","r","ʲ","ɪ"," ","ʌ","s","v","ʲ","i","ɕ","ˈ","e","n","ʲ","i","ɪ"," ","ˈ","j","a","r","k","ʲ","i","m"," ","ɪ","s","t","ˈ","o","t","ʃ","ʲ","n","ʲ","i","k","ʌ","m"," ","s","v","ʲ","ˈ","e","t","a"," ","m","n","ˈ","o","ʒ","y","s","t","v","a"," ","v","ʌ","d","ʲ","a","n","ˈ","y","x"," ","k","ˈ","ɑ","p","ʲ","i","ɭ","."],"processed_text":"Радуга, атмосферное, оптическое и метеорологическое явление, наблюдаемое при освещении ярким источником света множества водяных капель.","text":"Радуга, атмосферное, оптическое и метеорологическое явление, наблюдаемое при освещении ярким источником света множества водяных капель."} +{"phoneme_ids":[1,0,30,0,120,0,51,0,17,0,33,0,66,0,14,0,3,0,34,0,120,0,37,0,66,0,77,0,119,0,102,0,17,0,119,0,21,0,32,0,3,0,23,0,120,0,51,0,23,0,3,0,30,0,102,0,38,0,26,0,102,0,32,0,31,0,34,0,119,0,120,0,18,0,32,0,26,0,102,0,22,0,14,0,3,0,17,0,33,0,66,0,120,0,51,0,3,0,121,0,74,0,77,0,119,0,74,0,3,0,102,0,23,0,30,0,120,0,33,0,108,0,26,0,102,0,31,0,32,0,119,0,8,0,31,0,102,0,31,0,32,0,120,0,51,0,34,0,77,0,119,0,21,0,26,0,26,0,102,0,22,0,14,0,3,0,74,0,31,0,3,0,32,0,31,0,34,0,119,0,21,0,32,0,120,0,27,0,19,0,3,0,31,0,28,0,119,0,120,0,18,0,23,0,32,0,30,0,14,0,3,0,34,0,119,0,120,0,21,0,17,0,119,0,21,0,25,0,102,0,34,0,102,0,3,0,74,0,38,0,77,0,33,0,32,0,96,0,119,0,120,0,18,0,26,0,119,0,21,0,22,0,14,0,10,0,2],"phonemes":["r","ˈ","ɑ","d","u","ɡ","a"," ","v","ˈ","y","ɡ","ɭ","ʲ","ʌ","d","ʲ","i","t"," ","k","ˈ","ɑ","k"," ","r","ʌ","z","n","ʌ","t","s","v","ʲ","ˈ","e","t","n","ʌ","j","a"," ","d","u","ɡ","ˈ","ɑ"," ","ˌ","ɪ","ɭ","ʲ","ɪ"," ","ʌ","k","r","ˈ","u","ʒ","n","ʌ","s","t","ʲ",",","s","ʌ","s","t","ˈ","ɑ","v","ɭ","ʲ","i","n","n","ʌ","j","a"," ","ɪ","s"," ","t","s","v","ʲ","i","t","ˈ","o","f"," ","s","p","ʲ","ˈ","e","k","t","r","a"," ","v","ʲ","ˈ","i","d","ʲ","i","m","ʌ","v","ʌ"," ","ɪ","z","ɭ","u","t","ʃ","ʲ","ˈ","e","n","ʲ","i","j","a","."],"processed_text":"Радуга выглядит как разноцветная дуга или окружность, составленная из цветов спектра видимого излучения.","text":"Радуга выглядит как разноцветная дуга или окружность, составленная из цветов спектра видимого излучения."} +{"phoneme_ids":[1,0,120,0,61,0,32,0,102,0,3,0,32,0,119,0,120,0,18,0,3,0,31,0,119,0,120,0,18,0,25,0,119,0,3,0,32,0,31,0,34,0,119,0,21,0,32,0,120,0,27,0,19,0,8,0,23,0,102,0,32,0,120,0,27,0,30,0,37,0,22,0,74,0,3,0,28,0,30,0,119,0,120,0,21,0,26,0,119,0,102,0,32,0,102,0,3,0,34,0,37,0,17,0,119,0,21,0,77,0,119,0,120,0,51,0,32,0,119,0,3,0,34,0,3,0,30,0,120,0,51,0,17,0,33,0,66,0,119,0,21,0,3,0,34,0,3,0,30,0,120,0,33,0,31,0,31,0,23,0,102,0,22,0,3,0,23,0,33,0,77,0,32,0,120,0,33,0,30,0,119,0,21,0,8,0,26,0,27,0,3,0,31,0,77,0,119,0,120,0,18,0,17,0,33,0,22,0,21,0,32,0,3,0,74,0,25,0,119,0,120,0,18,0,32,0,119,0,3,0,34,0,34,0,119,0,21,0,17,0,120,0,33,0,8,0,96,0,32,0,27,0,3,0,26,0,59,0,3,0,31,0,120,0,51,0,25,0,102,0,25,0,3,0,17,0,119,0,120,0,18,0,77,0,119,0,21,0,3,0,31,0,28,0,119,0,120,0,18,0,23,0,32,0,30,0,3,0,26,0,119,0,21,0,28,0,30,0,119,0,21,0,30,0,120,0,37,0,34,0,119,0,21,0,26,0,8,0,74,0,3,0,22,0,74,0,34,0,120,0,27,0,3,0,32,0,31,0,34,0,119,0,120,0,18,0,32,0,14,0,3,0,28,0,77,0,120,0,51,0,34,0,26,0,102,0,3,0,28,0,119,0,21,0,30,0,119,0,21,0,36,0,120,0,27,0,17,0,119,0,102,0,32,0,3,0,17,0,30,0,120,0,33,0,23,0,3,0,34,0,3,0,17,0,30,0,120,0,33,0,66,0,14,0,3,0,32,0,96,0,119,0,120,0,18,0,30,0,119,0,21,0,31,0,3,0,25,0,26,0,120,0,27,0,108,0,37,0,31,0,32,0,34,0,102,0,3,0,28,0,30,0,102,0,25,0,119,0,21,0,108,0,120,0,33,0,32,0,102,0,32,0,96,0,119,0,26,0,37,0,36,0,3,0,102,0,32,0,119,0,32,0,119,0,120,0,18,0,26,0,23,0,102,0,19,0,10,0,2],"phonemes":["ˈ","ɛ","t","ʌ"," ","t","ʲ","ˈ","e"," ","s","ʲ","ˈ","e","m","ʲ"," ","t","s","v","ʲ","i","t","ˈ","o","f",",","k","ʌ","t","ˈ","o","r","y","j","ɪ"," ","p","r","ʲ","ˈ","i","n","ʲ","ʌ","t","ʌ"," ","v","y","d","ʲ","i","ɭ","ʲ","ˈ","ɑ","t","ʲ"," ","v"," ","r","ˈ","ɑ","d","u","ɡ","ʲ","i"," ","v"," ","r","ˈ","u","s","s","k","ʌ","j"," ","k","u","ɭ","t","ˈ","u","r","ʲ","i",",","n","o"," ","s","ɭ","ʲ","ˈ","e","d","u","j","i","t"," ","ɪ","m","ʲ","ˈ","e","t","ʲ"," ","v","v","ʲ","i","d","ˈ","u",",","ʃ","t","o"," ","n","ə"," ","s","ˈ","ɑ","m","ʌ","m"," ","d","ʲ","ˈ","e","ɭ","ʲ","i"," ","s","p","ʲ","ˈ","e","k","t","r"," ","n","ʲ","i","p","r","ʲ","i","r","ˈ","y","v","ʲ","i","n",",","ɪ"," ","j","ɪ","v","ˈ","o"," ","t","s","v","ʲ","ˈ","e","t","a"," ","p","ɭ","ˈ","ɑ","v","n","ʌ"," ","p","ʲ","i","r","ʲ","i","x","ˈ","o","d","ʲ","ʌ","t"," ","d","r","ˈ","u","k"," ","v"," ","d","r","ˈ","u","ɡ","a"," ","t","ʃ","ʲ","ˈ","e","r","ʲ","i","s"," ","m","n","ˈ","o","ʒ","y","s","t","v","ʌ"," ","p","r","ʌ","m","ʲ","i","ʒ","ˈ","u","t","ʌ","t","ʃ","ʲ","n","y","x"," ","ʌ","t","ʲ","t","ʲ","ˈ","e","n","k","ʌ","f","."],"processed_text":"Это те семь цветов, которые принято выделять в радуге в русской культуре, но следует иметь в виду, что на самом деле спектр непрерывен, и его цвета плавно переходят друг в друга через множество промежуточных оттенков.","text":"Это те семь цветов, которые принято выделять в радуге в русской культуре, но следует иметь в виду, что на самом деле спектр непрерывен, и его цвета плавно переходят друг в друга через множество промежуточных оттенков."} +{"phoneme_ids":[1,0,96,0,37,0,30,0,120,0,27,0,23,0,102,0,22,0,14,0,3,0,61,0,77,0,119,0,21,0,23,0,32,0,30,0,119,0,21,0,19,0,119,0,21,0,23,0,120,0,51,0,32,0,31,0,37,0,22,0,14,0,3,0,120,0,22,0,33,0,108,0,26,0,37,0,36,0,3,0,66,0,33,0,15,0,119,0,120,0,18,0,30,0,26,0,119,0,21,0,22,0,3,0,17,0,120,0,51,0,31,0,32,0,3,0,25,0,120,0,27,0,55,0,26,0,37,0,22,0,3,0,32,0,102,0,77,0,32,0,96,0,119,0,120,0,27,0,23,0,3,0,28,0,102,0,17,0,22,0,120,0,85,0,25,0,33,0,3,0,31,0,119,0,120,0,18,0,77,0,31,0,23,0,102,0,34,0,102,0,3,0,36,0,102,0,107,0,120,0,51,0,22,0,31,0,32,0,34,0,14,0,10,0,2],"phonemes":["ʃ","y","r","ˈ","o","k","ʌ","j","a"," ","ɛ","ɭ","ʲ","i","k","t","r","ʲ","i","f","ʲ","i","k","ˈ","ɑ","t","s","y","j","a"," ","ˈ","j","u","ʒ","n","y","x"," ","ɡ","u","b","ʲ","ˈ","e","r","n","ʲ","i","j"," ","d","ˈ","ɑ","s","t"," ","m","ˈ","o","ɕ","n","y","j"," ","t","ʌ","ɭ","t","ʃ","ʲ","ˈ","o","k"," ","p","ʌ","d","j","ˈ","ɵ","m","u"," ","s","ʲ","ˈ","e","ɭ","s","k","ʌ","v","ʌ"," ","x","ʌ","ʑ","ˈ","ɑ","j","s","t","v","a","."],"processed_text":"Широкая электрификация южных губерний даст мощный толчок подъёму сельского хозяйства.","text":"Широкая электрификация южных губерний даст мощный толчок подъёму сельского хозяйства."} +{"phoneme_ids":[1,0,30,0,102,0,38,0,22,0,22,0,14,0,30,0,119,0,120,0,18,0,26,0,26,0,37,0,22,0,3,0,32,0,96,0,119,0,32,0,119,0,120,0,18,0,32,0,31,0,3,0,61,0,66,0,102,0,21,0,31,0,119,0,32,0,119,0,120,0,21,0,32,0,96,0,119,0,26,0,102,0,3,0,15,0,22,0,120,0,85,0,32,0,3,0,28,0,119,0,14,0,32,0,119,0,22,0,120,0,22,0,33,0,3,0,108,0,37,0,30,0,17,0,119,0,120,0,51,0,25,0,119,0,74,0,3,0,96,0,120,0,33,0,31,0,32,0,30,0,102,0,34,0,102,0,3,0,19,0,119,0,21,0,36,0,32,0,102,0,34,0,120,0,51,0,77,0,55,0,21,0,23,0,14,0,10,0,2],"phonemes":["r","ʌ","z","j","j","a","r","ʲ","ˈ","e","n","n","y","j"," ","t","ʃ","ʲ","t","ʲ","ˈ","e","t","s"," ","ɛ","ɡ","ʌ","i","s","ʲ","t","ʲ","ˈ","i","t","ʃ","ʲ","n","ʌ"," ","b","j","ˈ","ɵ","t"," ","p","ʲ","a","t","ʲ","j","ˈ","j","u"," ","ʒ","y","r","d","ʲ","ˈ","ɑ","m","ʲ","ɪ"," ","ʃ","ˈ","u","s","t","r","ʌ","v","ʌ"," ","f","ʲ","i","x","t","ʌ","v","ˈ","ɑ","ɭ","ɕ","i","k","a","."],"processed_text":"Разъяренный чтец эгоистично бьёт пятью жердями шустрого фехтовальщика.","text":"Разъяренный чтец эгоистично бьёт пятью жердями шустрого фехтовальщика."} +{"phoneme_ids":[1,0,19,0,3,0,32,0,96,0,119,0,120,0,51,0,55,0,102,0,36,0,3,0,120,0,22,0,33,0,66,0,14,0,3,0,108,0,120,0,37,0,77,0,3,0,15,0,37,0,3,0,32,0,31,0,120,0,37,0,32,0,30,0,33,0,31,0,13,0,2,1,0,17,0,120,0,51,0,8,0,26,0,27,0,3,0,19,0,14,0,77,0,96,0,120,0,37,0,34,0,37,0,22,0,3,0,61,0,66,0,107,0,21,0,25,0,28,0,77,0,119,0,120,0,51,0,30,0,4,0,2],"phonemes":["f"," ","t","ʃ","ʲ","ˈ","ɑ","ɕ","ʌ","x"," ","ˈ","j","u","ɡ","a"," ","ʒ","ˈ","y","ɭ"," ","b","y"," ","t","s","ˈ","y","t","r","u","s","?","d","ˈ","ɑ",",","n","o"," ","f","a","ɭ","ʃ","ˈ","y","v","y","j"," ","ɛ","ɡ","ʑ","i","m","p","ɭ","ʲ","ˈ","ɑ","r","!"],"processed_text":"В чащах юга жил бы цитрус? Да, но фальшивый экземпляр!","text":"В чащах юга жил бы цитрус? Да, но фальшивый экземпляр!"} diff --git a/src/cpp/main.cpp b/src/cpp/main.cpp index b3fe24e..c7446b7 100644 --- a/src/cpp/main.cpp +++ b/src/cpp/main.cpp @@ -329,6 +329,9 @@ void printUsage(char *argv[]) { << endl; cerr << " --espeak_data DIR path to espeak-ng data directory" << endl; + cerr << " --tashkeel_model FILE path to libtashkeel onnx model " + "(arabic)" + << endl; cerr << " --debug print DEBUG messages to the console" << endl; cerr << endl;