diff --git "a/eval-results/phonemes_1760931179_WavLM.json" "b/eval-results/phonemes_1760931179_WavLM.json" new file mode 100644--- /dev/null +++ "b/eval-results/phonemes_1760931179_WavLM.json" @@ -0,0 +1,6502 @@ +[ + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.7676210403442383, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɛ ɹ ɑ ɹ p i p ə l h u t ɹ æ v ə l l ɔ ŋ d ɪ s t ə n s ə z t ə ə ʃ ʊ ɹ majk ə n t ɪ n j u d ɛ ɡ z ɪ s t ə n s", + "ref_phonemes": "ðɛr ɑr pipʌl hu trævʌl lɔŋ dɪstʌnsʌz tu ʌʃʊr maɪ kʌntɪnjud ɛɡzɪstʌns ", + "duration": 0.30870747566223145, + "PER": 22.807017543859647, + "score": { + "S": 13, + "D": 0, + "I": 0, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.23907136917114258, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.24864411354064941, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "t ɹ ɪ m ɛ k s ɛ s k ə lejf ɹ ʌ mɹ̩awn d l ɪ p ʌ v mowl d æ n d s ɛ t ə sajd wajl ə s ɪ m b l ɪ ŋ l ɛ d", + "ref_phonemes": "trɪm ɛksɛs kleɪ frʌm ɝaʊnd lɪp ʌv moʊld ʌnd sɛt ʌsaɪd waɪl ʌsɛmbʌlɪŋ lɪd ", + "duration": 0.395296573638916, + "PER": 27.11864406779661, + "score": { + "S": 13, + "D": 1, + "I": 2, + "N": 59 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.26347899436950684, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ð əajd i v ə s ɛ n w ə l t ɛ ŋ k w ɪ lajn it͡ʃ haws ɪ z dajn ɪn ɪ t s ɛ l f ə n ɑ v ə l t i", + "ref_phonemes": "ðʌ aɪdiʌ ʌv ʌ sɛntrʌl tæŋk wɪð laɪnz tu itʃ haʊs ɪz nɑt ɪn ɪtsɛlf ʌ nɑvʌlti ", + "duration": 0.2761378288269043, + "PER": 37.28813559322034, + "score": { + "S": 15, + "D": 6, + "I": 1, + "N": 59 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ f j u j u s p ɑ ɹ k ɪ ŋ ə t ɛ n d ə n t s k æ n ðejb i ɹ i p lejs t bajɔ t ə m æ t ɪ k p ɑ ɹ k ɪ ŋ ɡejt s", + "ref_phonemes": "ɪf ju juz pɑrkɪŋ ʌtɛndʌnts kæn ðeɪ bi ripleɪst baɪ ɔtʌmætɪk pɑrkɪŋ ɡeɪts ", + "duration": 0.3360767364501953, + "PER": 18.333333333333332, + "score": { + "S": 11, + "D": 0, + "I": 0, + "N": 60 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɛ ɹ ɑ ɹ ɹ ɪ z ʌ l t sajs t ʌ d i ʌ v l ɪ dɹ̩ t͡ʃɹ̩ t͡ʃɹ̩ɔ ɹ i d f ɹ ʌ m ð ə t ɪ ɹ ə n i ʌ v ð ə k ə n t ɛ m ɛ ɹ i", + "ref_phonemes": "ðɛr rɪzʌlts ʌ stʌdi ʌv lɪtɝʌtʃɝ frid frʌm ðʌ tɪrʌni ʌv ðʌ kʌntɛmpɝɛri ", + "duration": 0.31690073013305664, + "PER": 47.368421052631575, + "score": { + "S": 15, + "D": 2, + "I": 10, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə θ ɪ k ɛ l m f ɔ ɹ ə s t w ɑ z n ɪ ɹ l iowvɹ̩w ɛ l m d bajd ʌt͡ʃɛ l m d ɪ z i z", + "ref_phonemes": "ðʌ θɪk ɛlm fɔrʌst wɑz nɪrli oʊvɝwɛlmd baɪ dʌtʃ ɛlm dɪziz ", + "duration": 0.3514721393585205, + "PER": 19.565217391304348, + "score": { + "S": 7, + "D": 0, + "I": 2, + "N": 46 + } + }, + { + "model": "WavLM", + "phonemes": "b ʌ t t ə k ə n t ɪ n j u t ə d ɪ v ɔ ɹ s ə d v æ n s t s t u d ə n t s f ɹ ʌ m ɹ i æ l ə t i ɪ z ɪ n ɪ k s k j u z ə b ə l", + "ref_phonemes": "bʌt tu kʌntɪnju tu dɪvɔrs ʌdvænst studʌnts frʌm riælʌti ɪz ɪnɪkskjuzʌbʌl ", + "duration": 0.3164839744567871, + "PER": 17.741935483870968, + "score": { + "S": 11, + "D": 0, + "I": 0, + "N": 62 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.21106934547424316, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2427692413330078, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.29290175437927246, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "h ɪ z fejl jɹ̩t əowp ə n ð ə s t ɔ ɹ bajejt k ɑ s t h ɪ m h ɪ zd͡ʒɑ b", + "ref_phonemes": "hɪz feɪljɝ tu oʊpʌn ðʌ stɔr baɪ eɪt kɑst hɪm hɪz dʒɑb ", + "duration": 0.2788529396057129, + "PER": 26.190476190476193, + "score": { + "S": 9, + "D": 0, + "I": 2, + "N": 42 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.23898911476135254, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2802753448486328, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "k m ə n h i w ɪ s pɹ̩d f ɔ ɹ l ɛ v ə l z ə bawt θ ɹ i f i t dawn sowd ɑ n t f ɔ l", + "ref_phonemes": "kʌmɑn hi wɪspɝd fɔr lɛvʌlz ʌbaʊt θri fit daʊn soʊ doʊnt fɔl ", + "duration": 0.31653666496276855, + "PER": 27.083333333333332, + "score": { + "S": 10, + "D": 2, + "I": 1, + "N": 48 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.3020026683807373, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "h ɪ z k æ p t ə n w ɑ z θ ɪ n æ n d h æ ɡɹ̩d æ n d h ɪ z b j u t ə f ə l b u t s wɹ̩w ɔ ɹ n n nʃ æ b i", + "ref_phonemes": "hɪz kæptʌn wɑz θɪn ʌnd hæɡɝd ʌnd hɪz bjutʌfʌl buts wɝ wɔrn ʌnd ʃæbi ", + "duration": 0.35302281379699707, + "PER": 22.22222222222222, + "score": { + "S": 9, + "D": 1, + "I": 2, + "N": 54 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2581608295440674, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ f n ɛ əsejd ɹ i p lejs bowθ h æ v s ɑə n ɡ ɹ i l s ɪ k ʌ t s æ n ə l ɑ t ɛ k s t ə tajm", + "ref_phonemes": "ɪf nɛsʌsɛri tu ripleɪs boʊθ hævz ɑn ɡrɪl sɪr kʌts ʌnd ʌlɑt ɛkstrʌ taɪm ", + "duration": 0.3364701271057129, + "PER": 36.84210526315789, + "score": { + "S": 14, + "D": 6, + "I": 1, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "majd ɪ zajɹ̩z ɑ ɹ s ɪ m p ə l ɡ ɪ v m i w ʌ n ɪ n f ɔ ɹ m ə t ɪ v p æ ɹ ə ɡ ɹ æ f ɑ n ð ə s ʌ bd͡ʒɪ k t", + "ref_phonemes": "maɪ dɪzaɪɝz ɑr sɪmpʌl ɡɪv mi wʌn ɪnfɔrmʌtɪv pærʌɡræf ɑn ðʌ sʌbdʒɪkt ", + "duration": 0.28726720809936523, + "PER": 23.214285714285715, + "score": { + "S": 11, + "D": 0, + "I": 2, + "N": 56 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.25632667541503906, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.27121973037719727, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə s t ɹ ʌ kt͡ʃɹ̩z haws ɪ ŋ ð ə ə p ɑ ɹ t m ə n t s ɑ ɹ ʌ v mejs ə n i i ɪ n f ɹejm k ə n s t ɹ ʌ k ʃ ə n", + "ref_phonemes": "ðʌ strʌktʃɝz haʊzɪŋ ðʌ ʌpɑrtmʌnts ɑr ʌv meɪsʌnri ʌnd freɪm kʌnstrʌkʃʌn ", + "duration": 0.33422422409057617, + "PER": 36.666666666666664, + "score": { + "S": 19, + "D": 1, + "I": 2, + "N": 60 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2658257484436035, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.25932765007019043, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "d u j u l ʌ v t ə ɹ ʌ n ʌ p ə h ɛ m sowɑ n b ʌ t ə n z mejk n i t b ʌ t ə n howl z", + "ref_phonemes": "du ju lʌv tu rʌn ʌp ʌ hɛm soʊ ɑn bʌtʌnz meɪk nit bʌtʌnhoʊlz ", + "duration": 0.33860349655151367, + "PER": 17.391304347826086, + "score": { + "S": 8, + "D": 0, + "I": 0, + "N": 46 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.21791839599609375, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "h i ɪ z ə m æ n ʌ mejd͡ʒɹ̩k t æ ə n t bʌ t m æ n ʌ v s ɑ l ə t ɛ ɹ i ə n sɹ̩t ə n ɪ m p ɔ l s ə z", + "ref_phonemes": "hi ɪz ʌ mæn ʌv meɪdʒɝ tælʌnt bʌt ʌ mæn ʌv sɑlʌtɛri ʌnsɝtʌn ɪmpʌlsɪz ", + "duration": 0.3020315170288086, + "PER": 33.33333333333333, + "score": { + "S": 11, + "D": 3, + "I": 4, + "N": 54 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.19781994819641113, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.22919940948486328, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.321089506149292, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "æ n ɑ t t ə l i æ najawt ə m z n æ l ɛ d ʌ s s i w ɛ ð ɪ s pawɹ̩awkp ʌ m z f ɹ ʌ m", + "ref_phonemes": "æn ɑktɪljʌn ætʌmz naʊ lɛt ʌs si wɛr ðɪs paʊɝ kʌmz frʌm ", + "duration": 0.2782766819000244, + "PER": 46.51162790697674, + "score": { + "S": 11, + "D": 2, + "I": 7, + "N": 43 + } + }, + { + "model": "WavLM", + "phonemes": "ə d i tejl l d s t ʌ d i ʌ v ð ɪ s l æ dɹ̩f ə n ɑ m ə n ɑ n æn w ɑ z n ɑ t ə t ɛ m p t ɪ d ɪ n ð ɪ s p pejpɹ̩", + "ref_phonemes": "ʌ dɪteɪld stʌdi ʌv ðɪs lætɝ fʌnɑmʌnɑn wɑz nɑt ʌtɛmptʌd ɪn ðɪs peɪpɝ ", + "duration": 0.3078286647796631, + "PER": 30.909090909090907, + "score": { + "S": 11, + "D": 0, + "I": 6, + "N": 55 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɛ ɹ ɪ z l ɪ t ə l dawt ð æ t ð ə s t u d ə n t s b ɛ n ə f ɪ t f ɹ ʌ m vowkejʃ ə n ə l ɛd͡ʒə kejʃ ə n", + "ref_phonemes": "ðɛr ɪz lɪtʌl daʊt ðæt ðʌ studʌnts bɛnʌfɪt frʌm voʊkeɪʃʌnʌl ɛdʒʌkeɪʃʌn ", + "duration": 0.33649778366088867, + "PER": 25.423728813559322, + "score": { + "S": 14, + "D": 0, + "I": 1, + "N": 59 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.24863839149475098, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ə kɹ̩ɹ ɪd͡ʒd k ɹ ʌ nt͡ʃt bajɪ s d ɪ m lajt s f ɪ l tɹ̩ ɪ ŋ θ ɹ u ð ə ɡ l u m", + "ref_phonemes": "ʌ kærɪdʒ krʌntʃt baɪ ɪts dɪm laɪts fɪltɝɪŋ θru ðʌ ɡlum ", + "duration": 0.2714357376098633, + "PER": 34.090909090909086, + "score": { + "S": 9, + "D": 1, + "I": 5, + "N": 44 + } + }, + { + "model": "WavLM", + "phonemes": "nowp ɹajs ɪ z t u hajw ɛ n t ɹ u l ʌ v ɪ z æ t s tejk", + "ref_phonemes": "noʊ praɪs ɪz tu haɪ wɛn tru lʌv ɪz æt steɪk ", + "duration": 0.25475358963012695, + "PER": 18.181818181818183, + "score": { + "S": 6, + "D": 0, + "I": 0, + "N": 33 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.25559520721435547, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.23946857452392578, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "pejpɹ̩wejt mejb i pɹ̩s ə n ə lajz d ɑ n b æ k wajl k lejɪ z l ɛ ðɹ̩h ɑ ɹ d", + "ref_phonemes": "peɪpɝweɪt meɪ bi pɝsʌnʌlaɪzd ɑn bæk waɪl kleɪ ɪz lɛðɝ hɑrd ", + "duration": 0.32948994636535645, + "PER": 31.25, + "score": { + "S": 12, + "D": 0, + "I": 3, + "N": 48 + } + }, + { + "model": "WavLM", + "phonemes": "hawɛ vɹ̩ð ə l ɪ tɹ̩vɹ̩i mejn d ɑ ɡ m ɛ n t ə d bajs ɛ v ɹ ə l dowz ə n l ʌ ɹ u m s ʌ pɹ̩z", + "ref_phonemes": "haʊɛvɝ ðʌ lɪtɝ rɪmeɪnd ɑɡmɛntʌd baɪ sɛvrʌl dʌzʌn lʌntʃrum sʌpɝz ", + "duration": 0.3341076374053955, + "PER": 44.44444444444444, + "score": { + "S": 15, + "D": 3, + "I": 6, + "N": 54 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.267993688583374, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "æ l ɹ ə s i v d əd͡ʒojn t ə pojn t m ə n t ɪ n ð ə bajɑ l əd͡ʒi æ n d ð ə ɛ nd͡ʒə n ɪ ɹ ɪ ŋ d ɪ p ɑ ɹ t m ə n t s", + "ref_phonemes": "æl rʌsivd ʌ dʒɔɪnt ʌpɔɪntmʌnt ɪn ðʌ baɪɑlʌdʒi ʌnd ðʌ ɛndʒʌnɪrɪŋ dɪpɑrtmʌnts ", + "duration": 0.3672051429748535, + "PER": 32.8125, + "score": { + "S": 18, + "D": 0, + "I": 3, + "N": 64 + } + }, + { + "model": "WavLM", + "phonemes": "w i k ə n ɡ ɹ ɛd͡ʒə lejt ð ə ɪ n tajɹ̩m ɛ m bɹ̩ʃ ɪ p ɑ n ɪ t s ɹ ɛ kɹ̩d ʌ v ɡ ʊ d l ɛd͡ʒə s lejʃ ə n", + "ref_phonemes": "wi kʌŋrætʃʌleɪt ðʌ ɪntaɪɝ mɛmbɝʃɪp ɑn ɪts rɛkɝd ʌv ɡʊd lɛdʒʌsleɪʃʌn ", + "duration": 0.34999942779541016, + "PER": 40.35087719298245, + "score": { + "S": 17, + "D": 0, + "I": 6, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.27208518981933594, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ t w ʊ d b i w ɛ l t ə ʃowwð ə p ɑ p j ə l ə s haww i d i l w ɪ ð ə l d ʌ l tɹ̩z", + "ref_phonemes": "ɪt wʊd bi wɛl tu ʃoʊ ðʌ pɑpjʌlʌs haʊ wi dil wɪð ʌdʌltɝɝz ", + "duration": 0.2910006046295166, + "PER": 25.0, + "score": { + "S": 9, + "D": 0, + "I": 2, + "N": 44 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə t u θ f ɛ ɹ i f ɹ̩ ɡ ɑ t t ə k ʌ m w ɛ n ɹ ɑ ɹd͡ʒz z t u θ f ɛ lawt", + "ref_phonemes": "ðʌ tuθ fɛri fɝɡɑt tu kʌm wɛn rɑdʒɝz tuθ fɛl aʊt ", + "duration": 0.27805233001708984, + "PER": 27.027027027027028, + "score": { + "S": 7, + "D": 0, + "I": 3, + "N": 37 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə hajə s t ɹejt ə d n ɑ n s u pɹ̩vajzɹ̩i ɛ nd͡ʒə n ɪ ɹ ɪ ŋ tajt ə l ɪ z ɹ i sɹ̩t͡ʃɛ nd͡ʒə n ɪ ɹ", + "ref_phonemes": "ðʌ haɪʌst reɪtʌd nɑn supɝvaɪzɝi ɛndʒʌnɪrɪŋ taɪtʌl ɪz risɝtʃ ɛndʒʌnɪr ", + "duration": 0.31966328620910645, + "PER": 38.983050847457626, + "score": { + "S": 17, + "D": 0, + "I": 6, + "N": 59 + } + }, + { + "model": "WavLM", + "phonemes": "mejb i ɪ t s tejk ɪ ŋ l ɔ ŋ ɡɹ̩t ə ɡ ɛ t θ ɪ ŋ z s k w ɛ ɹ d ə wejð æ n ð ə b æ ŋ kɹ̩z ɪ k s p ɛ k t ə d", + "ref_phonemes": "meɪbi ɪts teɪkɪŋ lɔŋɡɝ tu ɡɛt θɪŋz skwɛrd ʌweɪ ðæn ðʌ bæŋkɝz ɪkspɛktʌd ", + "duration": 0.3713505268096924, + "PER": 20.689655172413794, + "score": { + "S": 10, + "D": 0, + "I": 2, + "N": 58 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə h ɔ n t ə d haws w ɑ z ə h ɪ t d u t əawt s t æ n d ɪ ŋ ɑ d iowv ɪ ʒ ə w ə l ɪ f ɛ k t s", + "ref_phonemes": "ðʌ hɔntʌd haʊs wɑz ʌ hɪt du tu aʊtstændɪŋ ɑdioʊ vɪʒʌwʌl ɪfɛkts ", + "duration": 0.33238935470581055, + "PER": 17.647058823529413, + "score": { + "S": 9, + "D": 0, + "I": 0, + "N": 51 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2077500820159912, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə b ɪ ɡ d ɔ ɡ l ʌ v d t ət͡ʃu ɑ n ð əowl d ɹ æ ɡ d ɑ l", + "ref_phonemes": "ðʌ bɪɡ dɔɡ lʌvd tu tʃu ɑn ðʌ oʊld ræɡ dɑl ", + "duration": 0.2202455997467041, + "PER": 19.35483870967742, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 31 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.31469106674194336, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə l ɔ ɹ powʃ ə n p ɹ ɹ̩ vajd z ə ɹejt ɪ ŋ æ t ɛ n i s tejt b ɪ t w i ŋ ɪ m f ə n s i æ n ə d ʌ h ʊ d", + "ref_phonemes": "ðʌ loʊɝ pɔrʃʌn prʌvaɪdz ʌ reɪtɪŋ æt ɛni steɪdʒ bɪtwin ɪnfʌnsi ʌnd ʌdʌlθhʊd ", + "duration": 0.40774035453796387, + "PER": 40.32258064516129, + "score": { + "S": 19, + "D": 5, + "I": 1, + "N": 62 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2584800720214844, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "h i ɔ l sowɹ i majn d ə d h ɪ m s ɛ l f ð æ t h i h æ d æ n ə n j u ʒ ə l n ʌ m bɹ̩ʌ v p ɑ s ə b ɪ l ə t i z", + "ref_phonemes": "hi ɔlsoʊ rimaɪndʌd hɪmsɛlf ðæt hi hæd æn ʌnjuʒʌwʌl nʌmbɝ ʌv pɑsʌbɪlʌtiz ", + "duration": 0.3168179988861084, + "PER": 20.0, + "score": { + "S": 9, + "D": 2, + "I": 1, + "N": 60 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.20502138137817383, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.25573062896728516, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ɹ ɪt͡ʃl ʊ k t f ɔ ɹ s p ɑ t ə d haji n ə z æ n dd͡ʒæ ɡ w ɑ ɹ z ɑ n ð ə s ə f ɑ ɹ i", + "ref_phonemes": "rɪtʃ lʊkt fɔr spɑtʌd haɪinʌz ʌnd dʒæɡwɑrz ɑn ðʌ sʌfɑri ", + "duration": 0.27758097648620605, + "PER": 26.666666666666668, + "score": { + "S": 10, + "D": 0, + "I": 2, + "N": 45 + } + }, + { + "model": "WavLM", + "phonemes": "ajt ʊ k hɹ̩wɹ̩d f ɔ ɹ ɪ t b ʌ t ɪ z ʃ i ɹ ɪ l i ɡowɪ ŋ w ɪ ð j u", + "ref_phonemes": "aɪ tʊk hɝ wɝd fɔr ɪt bʌt ɪz ʃi rɪli ɡoʊɪŋ wɪð ju ", + "duration": 0.22235393524169922, + "PER": 22.22222222222222, + "score": { + "S": 6, + "D": 0, + "I": 2, + "N": 36 + } + }, + { + "model": "WavLM", + "phonemes": "ajt ʊ k hɹ̩wɹ̩d f ɔ ɹ ɪ t b ʌ t ɪ z ʃ i ɹ ɪ l i ɡowɪ ŋ w ɪ ð j u", + "ref_phonemes": "aɪ tʊk hɝ wɝd fɔr ɪt bʌt ɪz ʃi rɪli ɡoʊɪŋ wɪð ju ", + "duration": 0.24224209785461426, + "PER": 22.22222222222222, + "score": { + "S": 6, + "D": 0, + "I": 2, + "N": 36 + } + }, + { + "model": "WavLM", + "phonemes": "ɹ æ l f p ɹ i p ɛ ɹ d ɹ ɛ d s n æ pɹ̩w ɪ ð f ɹ ɛ ʃ l ɛ m ə n s ɔ s f ɔ ɹ d ɪ nɹ̩", + "ref_phonemes": "rælf pripɛrd rɛd snæpɝ wɪð frɛʃ lɛmʌn sɔs fɔr dɪnɝ ", + "duration": 0.28021836280822754, + "PER": 26.82926829268293, + "score": { + "S": 9, + "D": 0, + "I": 2, + "N": 41 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.26004934310913086, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "powl t i ɪ z ʌ l t s ʌ v i ɹejd iejʃ ə n t ɛ s t w ɪ ð ə pow t i i h æ vb ɪ n k wajt s ə k s ɛ s f ə l", + "ref_phonemes": "poʊltri rɪzʌlts ʌv ɪreɪdieɪʃʌn tɛsts wɪð poʊltri hæv bɪn kwaɪt sʌksɛsfʌl ", + "duration": 0.3404362201690674, + "PER": 25.806451612903224, + "score": { + "S": 11, + "D": 4, + "I": 1, + "N": 62 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.27492523193359375, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2312765121459961, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "d ɪ s ɛ m bɹ̩n nd͡ʒæ n j u ɛ ɹ i ɑɹ̩ ɹ najs m ʌ n θ s t ə s p ɛ n d ɪ n majæ m i", + "ref_phonemes": "dɪsɛmbɝ ʌnd dʒænjuɛri ɑr naɪs mʌnθs tu spɛnd ɪn maɪæmi ", + "duration": 0.2511005401611328, + "PER": 24.444444444444443, + "score": { + "S": 8, + "D": 0, + "I": 3, + "N": 45 + } + }, + { + "model": "WavLM", + "phonemes": "j u t u wɹ̩s s t u b ə d͡ʒ æ k æ s ə n t ɪ j u pojz ə n m i", + "ref_phonemes": "ju tu wɝ ʌ stupʌd dʒækæs ʌntɪl ju pɔɪzʌnd mi ", + "duration": 0.2597544193267822, + "PER": 34.285714285714285, + "score": { + "S": 9, + "D": 2, + "I": 1, + "N": 35 + } + }, + { + "model": "WavLM", + "phonemes": "m ɛ n i w ɛ l θ i tajk u n z s p lɹ̩d͡ʒd æ n d b ɑ t bowθ ə j ɑ t æ n d ə s k u nɹ̩", + "ref_phonemes": "mɛni wɛlθi taɪkunz splɝdʒd ʌnd bɑt boʊθ ʌ jɑt ʌnd ʌ skunɝ ", + "duration": 0.41628575325012207, + "PER": 23.91304347826087, + "score": { + "S": 8, + "D": 0, + "I": 3, + "N": 46 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.3869636058807373, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.30303263664245605, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ f k ɛ ɹ l k ʌ m z t ə m ɑ ɹowh h æ vhɹ̩ɹɹ̩ɹejnd͡ʒ f ɔ ɹ ə m i t ɪ ŋ ɪ t t u", + "ref_phonemes": "ɪf kærʌl kʌmz tʌmɑroʊ hæv hɝ ɝeɪndʒ fɔr ʌ mitɪŋ æt tu ", + "duration": 0.2974681854248047, + "PER": 42.857142857142854, + "score": { + "S": 11, + "D": 1, + "I": 6, + "N": 42 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.34694576263427734, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.3885922431945801, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.3741879463195801, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ f p i p ə l wɹ̩m ɔ ɹd͡ʒɛ nɹ̩ə s ð ɛ ɹ b b i nown n i d f ɔ ɹ w ɛ l f ɛ ɹ", + "ref_phonemes": "ɪf pipʌl wɝ mɔr dʒɛnɝʌs ðɛr wʊd bi noʊ nid fɔr wɛlfɛr ", + "duration": 0.33899760246276855, + "PER": 38.095238095238095, + "score": { + "S": 10, + "D": 2, + "I": 4, + "N": 42 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.3293449878692627, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.42726874351501465, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "æ n ə d ʌ l t mejl b æ b u n z t i θ ɑ ɹ n ɑ t s u t ə b ə l f ɔ ɹ i t ɪ ŋ ʃ ɛ l f ɪ ʃ", + "ref_phonemes": "æn ʌdʌlt meɪl bæbunz tiθ ɑr nɑt sutʌbʌl fɔr itɪŋ ʃɛlfɪʃ ", + "duration": 0.5163755416870117, + "PER": 13.333333333333334, + "score": { + "S": 6, + "D": 0, + "I": 0, + "N": 45 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i s ɛ d ʃ ɑ ɹ k s h æ v nowb own z æ n d ʃ ɹ ɪ m p s w æ m b æ k wɹ̩d", + "ref_phonemes": "ʃi sɛd ʃɑrks hæv noʊ boʊnz ʌnd ʃrɪmp swæm bækwɝd ", + "duration": 0.5094194412231445, + "PER": 17.94871794871795, + "score": { + "S": 6, + "D": 0, + "I": 1, + "N": 39 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.3949165344238281, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.35875558853149414, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.40939974784851074, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ə s ɛ k ə n t t w ɪt͡ʃt h ɪ z ʃɹ̩t s l i v æ n dh i f ɛ l t t ə b ɹ i v bɹ̩n ɑ n h ɪ z ʌ bpɹ̩ɑ ɑ ɹ m", + "ref_phonemes": "ʌ sɛkʌnd twɪtʃt hɪz ʃɝtsliv ʌnd hi fɛlt ʌ brif bɝn ɑn hɪz ʌpɝ ɑrm ", + "duration": 0.6499893665313721, + "PER": 35.294117647058826, + "score": { + "S": 11, + "D": 0, + "I": 7, + "N": 51 + } + }, + { + "model": "WavLM", + "phonemes": "k ɔ ɹ i æ n t ɹ ɪ ʃ lejd t æ ɡ w ɪ ð b it͡ʃ b ɔ l z f ɔ ɹajawɹ̩z", + "ref_phonemes": "kɔri ʌnd trɪʃ pleɪd tæɡ wɪð bitʃ bɔlz fɔr aʊɝz ", + "duration": 0.4642961025238037, + "PER": 35.13513513513514, + "score": { + "S": 7, + "D": 2, + "I": 4, + "N": 37 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.37650442123413086, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.35536980628967285, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "d ɪ s ɛ m bɹ̩ɪ nd͡ʒæ n j u w ɛ ɹ i ɹ najs m ʌ n θ s t ə s p ɛ n d ɪ n majæ m i", + "ref_phonemes": "dɪsɛmbɝ ʌnd dʒænjuɛri ɑr naɪs mʌnθs tu spɛnd ɪn maɪæmi ", + "duration": 0.4925537109375, + "PER": 24.444444444444443, + "score": { + "S": 8, + "D": 1, + "I": 2, + "N": 45 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.4487802982330322, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "s ɛ d j u w ɔ ɹ j ɹ̩s ɹ ɛ l fawt ɪ n k l i ɪ ŋ ɔ l ð i z ɛ m p t i ɹ u m z", + "ref_phonemes": "sɛd ju wɔr jɝsɛlf aʊt klinɪŋ ɔl ðiz ɛmpti rumz ", + "duration": 0.3630070686340332, + "PER": 24.324324324324326, + "score": { + "S": 4, + "D": 1, + "I": 4, + "N": 37 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə dajə ɡ nows ə s w ɑ z d ɪ s kɹ̩əd͡ʒɪ ŋ hawɛ vɹ̩h i w ɑ z n ɑ towvɹ̩l i wɹ̩i d", + "ref_phonemes": "ðʌ daɪʌɡnoʊsʌs wɑz dɪskɝʌdʒɪŋ haʊɛvɝ hi wɑz nɑt oʊvɝli wɝid ", + "duration": 0.4380757808685303, + "PER": 34.0, + "score": { + "S": 12, + "D": 0, + "I": 5, + "N": 50 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə t ɑ ɹ ɡ ə t ɑ ɹ t k w ɪ k t l i æ n b ɹ i f l i t ɛ l j u w ɪt͡ʃð æ t ə t ɪ v z d u w ʌ t", + "ref_phonemes": "ðʌ tɑrɡʌt tʃɑrt kwɪkli ʌnd brifli tɛlz ju wɪtʃ ædʌtɪvz du wʌt ", + "duration": 0.44401097297668457, + "PER": 30.0, + "score": { + "S": 8, + "D": 4, + "I": 3, + "N": 50 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.413409948348999, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.44327354431152344, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "h i ɡejv v ə ʃ ɔ ɹ t h ɑ ɹ d l æ f æ n d l ʊ k t æ t hɹ̩n nowɪ ŋ l i", + "ref_phonemes": "hi ɡeɪv ʌ ʃɔrt hɑrd læf ʌnd lʊkt æt hɝ noʊɪŋli ", + "duration": 0.391984224319458, + "PER": 27.77777777777778, + "score": { + "S": 7, + "D": 0, + "I": 3, + "N": 36 + } + }, + { + "model": "WavLM", + "phonemes": "ɡ ɹ ɛ ɡɹ̩i æ n d t ɑ mt͡ʃowz t ə w ɑt͡ʃk ɑ ɹ t u n z ɪ n ð ə æ f tɹ̩n u n", + "ref_phonemes": "ɡrɛɡɝi ʌnd tɑm tʃoʊz tu wɑtʃ kɑrtunz ɪn ðʌ æftɝnun ", + "duration": 0.34044718742370605, + "PER": 29.268292682926827, + "score": { + "S": 8, + "D": 0, + "I": 4, + "N": 41 + } + }, + { + "model": "WavLM", + "phonemes": "k ɔ ɹ i ə n t ɹ ɪ ʃ p lejd t æ ɡ w ɪ ð b it͡ʃb ɔɑ l s f ɔ ɹawɹ̩z", + "ref_phonemes": "kɔri ʌnd trɪʃ pleɪd tæɡ wɪð bitʃ bɔlz fɔr aʊɝz ", + "duration": 0.46051716804504395, + "PER": 32.432432432432435, + "score": { + "S": 8, + "D": 1, + "I": 3, + "N": 37 + } + }, + { + "model": "WavLM", + "phonemes": "ajnow i æ t b ɪ ɡ ð ə j l ə d ʌ t ɔ ɪ b æ ɡ m k ajm n d taw t", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ pændʌz praʊd ", + "duration": 0.8025057315826416, + "PER": 79.24528301886792, + "score": { + "S": 20, + "D": 20, + "I": 2, + "N": 53 + } + }, + { + "model": "WavLM", + "phonemes": "ə lawʌ majf m i æ n n m i m j u ɛ dajw ɑ n t t ə mbejk k lajf h æ vb ə towɔ l", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.8194689750671387, + "PER": 66.0377358490566, + "score": { + "S": 21, + "D": 9, + "I": 5, + "N": 53 + } + }, + { + "model": "WavLM", + "phonemes": "w i ʃ ʊ ɹd ɹ ɪ z p ɛ k t æ n l ʌ v ɔ l m ɛ m bɹ̩z z ʌ v ð ə f æ m ə l i", + "ref_phonemes": "wi ʃʊr rɪspɛkt ʌnd lʌv ɔl mɛmbɝz ʌv ðʌ fæmʌli ", + "duration": 0.36646294593811035, + "PER": 30.555555555555557, + "score": { + "S": 7, + "D": 1, + "I": 3, + "N": 36 + } + }, + { + "model": "WavLM", + "phonemes": "ajɹ ɪ l n tajm æ v dajm b ə w ɪ l i d ow ajn lejæ ŋ b ɪ ɡ ɪ", + "ref_phonemes": "aɪ doʊnt hæv taɪm tu ɡoʊ wɪð ðʌ aɪm pleɪɪŋ krɪkʌt ", + "duration": 0.394118070602417, + "PER": 74.35897435897436, + "score": { + "S": 23, + "D": 4, + "I": 2, + "N": 39 + } + }, + { + "model": "WavLM", + "phonemes": "ajl aj ow majf aj æ m i aj ajæ n d ɪ ɪ n ðow owʌ v v j i ut͡ʃæ ajn ɔ n j u l mejb majmv f æ m ə i ow ow", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.641082763671875, + "PER": 79.24528301886792, + "score": { + "S": 22, + "D": 3, + "I": 17, + "N": 53 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ v ɛ n ɪ najn n ejt ɪ n s ɛ ə n n n əɪ iɪ n ɪ f i n f ɔ ɹ ɪ n sajʌ t ɪ n v aj l ɛ v æ d æ nɹ̩najn n ɪ s ɛ ə s ɪ n z fajn ɔ ɹ θ i t͡ʃ l bajʌ", + "ref_phonemes": "twɛnti naɪntin eɪtin sɛvʌntin sɪkstin fɪftin fɔrtin θɝtin wʌn ɪlɛvʌn tɛn naɪn eɪt sɛvʌn sɪks faɪv fɔr θri tu wʌn ", + "duration": 0.8542327880859375, + "PER": 62.365591397849464, + "score": { + "S": 32, + "D": 18, + "I": 8, + "N": 93 + } + }, + { + "model": "WavLM", + "phonemes": "nej ɛ t iɛ z æ s ɡ ɛ ɪ ŋ æ z t mʌ ð ə d ɪ t s ɔ l w z s w i lajk ʊ h", + "ref_phonemes": "neɪtʃɝ ɪz dʒʌst ɡɛtɪŋ æz aʊɝ mʌðɝ ɪts ɔlweɪz swit laɪk hɝ ", + "duration": 0.3707752227783203, + "PER": 45.65217391304348, + "score": { + "S": 7, + "D": 11, + "I": 3, + "N": 46 + } + }, + { + "model": "WavLM", + "phonemes": "d d ɑ ɡ i b ɔ n majtk ɡlaj bajk s ə saj n s ʌ ɔ n d ɪæ k ajs d ɛ m l ɪ ɹ æ s ə b", + "ref_phonemes": "dɑk sid boʊnz mɪk laɪts baɪks ɛlsʌ wɑnt ʌ bʊk ædʌm pleɪz bæskʌtbɔl ", + "duration": 0.6522798538208008, + "PER": 72.22222222222221, + "score": { + "S": 15, + "D": 15, + "I": 9, + "N": 54 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ n ð iə ɪ ŋ d ʌ d m ɛ n t ɪ s nowh h i i z nowl i tejk s ɛ ʃ ɑ vw ɔɑ k ɪ ŋ ð i ow ɪ ow ɹ m ɛ n iejt s ɛ", + "ref_phonemes": "ɪn ðʌ wɪntɝ wɛn ɪt snoʊ hi sloʊli teɪks ʌ ʃɔrt wɔk ɪn ðʌ oʊpʌn ɛr itʃ deɪ ", + "duration": 0.45820069313049316, + "PER": 62.5, + "score": { + "S": 26, + "D": 2, + "I": 7, + "N": 56 + } + }, + { + "model": "WavLM", + "phonemes": "d u d æ n t v ɛ d dajə n i f ɔ m ə n v ɔ s s ʊ l dejl i", + "ref_phonemes": "ðʌ studʌnt wɛr ðʌ junʌfɔrm ʌnd ɡoʊz θru skul daɪʌli ", + "duration": 0.4857807159423828, + "PER": 61.904761904761905, + "score": { + "S": 15, + "D": 11, + "I": 0, + "N": 42 + } + }, + { + "model": "WavLM", + "phonemes": "w i ʃ ʊ d l ɛ s f ɛ k d æ m lawɹ̩æ m ɛ m v ʌ s ʌ v ð ə f æ m i l i", + "ref_phonemes": "wi ʃʊd rɪspɛkt ʌnd ʌlaʊ aʊɝ mɛmbɝz ʌv ðʌ fæmʌli ", + "duration": 0.4355905055999756, + "PER": 44.73684210526316, + "score": { + "S": 15, + "D": 2, + "I": 0, + "N": 38 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə nejs ɛ d i v ɛ d i æ k æ k ɑ n f u l ɔ majfv k ɡ ɪ ŋ k ʌ lɹ̩", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlɝ ", + "duration": 0.4749624729156494, + "PER": 62.5, + "score": { + "S": 17, + "D": 12, + "I": 1, + "N": 48 + } + }, + { + "model": "WavLM", + "phonemes": "j u ɪ s u nowɔ ow ɔ æ b ɔ k mejd ɡ dajn n f ɔ ð d v h i iɪ z n i ə d ɛ nejajd ɪ d i z w l b ɪ ðɡ ə l ɔ ŋ b ɪ ɹ", + "ref_phonemes": "juv mɪst tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛl hi ɪz nɪrli naɪntɪfri jɪrz oʊld wɪð ʌ lɔŋ bɪrd ", + "duration": 0.6093778610229492, + "PER": 66.19718309859155, + "score": { + "S": 24, + "D": 15, + "I": 8, + "N": 71 + } + }, + { + "model": "WavLM", + "phonemes": "ðejɪ ɪ ʃ iu ʊ l ɛ z v ɛ d l ʌ aj ɔ l m ɛ m bɹ̩ z ʌ v ð ə f æ m ə i", + "ref_phonemes": "wi ʃʊd rɪspɛkt ʌnd lʌv ɔl mɛmbɝz ʌv ðʌ fæmʌli ", + "duration": 0.38248133659362793, + "PER": 58.333333333333336, + "score": { + "S": 16, + "D": 2, + "I": 3, + "N": 36 + } + }, + { + "model": "WavLM", + "phonemes": "w b nejd nawajt æ n dawajsw ʊ dej s t ɪ ʃ ʊ æ b ʌ ə dawt ə ʌ", + "ref_phonemes": "oʊ maɪ ɡɑd ʌnd aɪ wʊd laɪk tu fɝst steɪʃʌn bʌt raɪt ɪt æt ðʌ fɝst steɪʃʌn ", + "duration": 0.5269742012023926, + "PER": 78.94736842105263, + "score": { + "S": 28, + "D": 17, + "I": 0, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "b ɑ i d b ɑ n z majk lajk bajk ə s ʌ v w ɑ n tej ə ə l æ d ə m lejb baj ʌ s ə t b ɑ", + "ref_phonemes": "dɔɡ it boʊnz laɪk baɪk ɛlsʌ wɑnt ʌ bʊk ædʌm pleɪ bæskʌtbɔl ", + "duration": 0.5830471515655518, + "PER": 63.829787234042556, + "score": { + "S": 17, + "D": 5, + "I": 8, + "N": 47 + } + }, + { + "model": "WavLM", + "phonemes": "ə n dɹ̩ najt ɪ najdn nejt d iejt najn ɪ s æ v ə n n najt ɪ z ɪ s najt i majdej najdt i v ɔ ɹ t najt i d d ej najt ŋ ə d u ɹ najn d i i n majd i ej d ɪ najn ejt i ej ə ej ɪ s ɛ v ə iɪ z ɪ k s ɛ ɪ vajdej i ɔ ɹ kt ð ejt d ɔ ɹ mejtd ʌ n t", + "ref_phonemes": "wʌn hʌndrʌd naɪntaɪnti naɪntaɪt naɪntɪvsɪn naɪntɪkis naɪntɪfaɪtɝ naɪntwɪfɝ naɪntɪfri niɪntutioʊ naɪnʃeɪn naɪnti eɪtinaɪn aɪtit eɪtɪɡstʌn aɪtiksɪs eɪtaɪvɪf eɪtifʊr eɪtritɛr eɪtitwɑtoʊ eɪtiʌn eɪti ", + "duration": 1.202256679534912, + "PER": 69.36416184971098, + "score": { + "S": 78, + "D": 32, + "I": 10, + "N": 173 + } + }, + { + "model": "WavLM", + "phonemes": "w i d ə s m æ n d ʌ tow m ə æ n i z ejk ej æ n faj ð æɪ n æ i l s m ɛ b ʌ t m æ n d i m ə ej i ʊ d", + "ref_phonemes": "ðʌ oʊldʌst mɛmbɝ ʌv maɪ fæmʌli ɪz maɪ frɛnd kæðɝ ʌnd ðʌ jʌŋɡʌst mɛmbɝ ʌv maɪ fæmʌli ɪz maɪ beɪbi bjurt ", + "duration": 0.6516366004943848, + "PER": 74.39024390243902, + "score": { + "S": 33, + "D": 28, + "I": 0, + "N": 82 + } + }, + { + "model": "WavLM", + "phonemes": "ð j u v i ʃ j ʊ ɹ mn ɔɑɔ ə h ə majn ɡaw n n aj d ə v i ɪ zs n ɪ n n ɪ f w ɔʌ ɹ i æ k k h ɪ ɪ l ɪ awæ s ɪ z h ɪ ð ɛ v ə i d ʌ ɛ ɪ n s ɛz ɪ ɪ ŋ aw æ n ɔ ə ðaw k f ɹ ɔ ɹ j u i aw v d ə ə b ʌ awə n m ɪ ɪ ŋ h ɛ l ɔ ɔ ŋn b ɪ dɹ ɪ ŋ d u h ɪ z ʃ n ɡ ɪ m ɪ ŋ ɡ ɔ h u u ə s h ɪi ŋ æ ɹn ʌ n n f i l ɪ ŋ ɑ s ʌ m ɔ ʌ p ɛ k b n h ɪ i h ɪ z w ajl i ɪ z d ʌ ɛ i ɹ ajæ k daj n ə s z b ɪ", + "ref_phonemes": "ju wɪʃ tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛl hi ɪz nɪrli naɪntɪfri jɪrz oʊld jɛt hi stɪl θɪŋks hi hæz sɪftɪd æz ɛvɝ hi drɛsʌz hɪmsɛlf ɪn æn oʊld blæk rɑk kɔrt juʒʌwʌli sɛvrʌl bʌtʌnz mɪsɪŋ ʌ lɔŋ ɡreɪt klɪŋz tu hɪz tʃɪn ɡɪvɪŋ ðoʊz hu ʌbzɝv hɪm hir prʌnaʊns ðʌ filɪŋ ʌv ðʌ ʌtmoʊst rɪspɛkt ", + "duration": 2.5314571857452393, + "PER": 77.33333333333333, + "score": { + "S": 103, + "D": 48, + "I": 23, + "N": 225 + } + }, + { + "model": "WavLM", + "phonemes": "m d͡ʒ d i z i z ɛ dɹ̩ z vawt t majt ð æ t ɔ iɪ ɔ l wejs ʃ ʃ t ə s p i lajk", + "ref_phonemes": "neɪtʃɝ ɪz æz kɛr æz aʊɝ mʌðɝ ɪt ɔlweɪz fɪts laɪk hɝ ", + "duration": 0.4421703815460205, + "PER": 85.0, + "score": { + "S": 18, + "D": 5, + "I": 11, + "N": 40 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɛ n i ɡ ɪ v zs ʌ s u k s v ɛd͡ʒt ə b ə l z æ n d ɡ v ɛ n tə i t", + "ref_phonemes": "boʊθ jɔr ɡɪvz ʌs fruts vɛdʒtʌbʌlz ʌnd ɡreɪnz tu it ", + "duration": 0.2660713195800781, + "PER": 48.78048780487805, + "score": { + "S": 11, + "D": 7, + "I": 2, + "N": 41 + } + }, + { + "model": "WavLM", + "phonemes": "m ɔ ɹ m ʌ n d ɹd taj l dajw ʊ dajd f ʌ p b ʌ ʃ t ɛ ə n ə t i b ʌ t ɪ vejl t d dʌ majk i l i n ʌ p ʌ s t k ɛ t", + "ref_phonemes": "mɑm ʌnd dæd ʌnd aɪ wʊd æd ðʌ bʌs steɪʃʌnɝ liv ɪt tu hɝ ʌntɪl ðʌ bʌs keɪm ", + "duration": 0.4169883728027344, + "PER": 76.36363636363637, + "score": { + "S": 24, + "D": 5, + "I": 13, + "N": 55 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ w ɪ d u l z majfk p lejæ s bajk s æ z w ɔ ɹn z ə b ʊ l k ajk æ m p æ z b ʌ s t ə d b ɑ ɹ", + "ref_phonemes": "dɑɡz it boʊlz maɪk laɪks baɪks æz ʌ wʌns ʌ bʊk ædʌm pleɪz bæskʌtbɔl ", + "duration": 0.48065853118896484, + "PER": 61.111111111111114, + "score": { + "S": 22, + "D": 6, + "I": 5, + "N": 54 + } + }, + { + "model": "WavLM", + "phonemes": "j u v ɪ ʃ ɛ n nowh ɔ l ə mawt mejd ɹawn d f ɔ ðowb b ɛ i z m i ɪ ɹ l i najt ə ɪ ɹæ l ʌ v ð ə l ɔ ŋ ɪ ɹ", + "ref_phonemes": "ju wɪʃ tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛr hi ɪz nɪrli naɪntɪfri jɪrz oʊld wɪð ʌ lɔŋ brɛθ ", + "duration": 0.40931105613708496, + "PER": 60.86956521739131, + "score": { + "S": 28, + "D": 11, + "I": 3, + "N": 69 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə nej ɹ̩ ɪ z v ejɛ i ə t ɹ æ k t ɪ æ n d f u l ʌ v majf ɛ vɹ̩ ə ɡ ɹ i n k ʌ lɹ̩", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlɝ ", + "duration": 0.4253683090209961, + "PER": 45.83333333333333, + "score": { + "S": 15, + "D": 4, + "I": 3, + "N": 48 + } + }, + { + "model": "WavLM", + "phonemes": "b ɔm mejn n d d æ k æ tɹejajvɹ̩ v ɹ̩d d ɛ t ð ə b ʌ ʃ t ejʃ ʃ ə n æ t i ʌ t wejk ɪ ŋ ə n t ɪ ð ə b ʌ s k ɪ ŋ", + "ref_phonemes": "mɑm ʌnd dæd ɝaɪvd æt ðʌ bʌs steɪʃʌn ɝli bʌt weɪtɪŋ ʌntɪl ðʌ bʌs keɪm ", + "duration": 0.5759949684143066, + "PER": 66.66666666666666, + "score": { + "S": 18, + "D": 4, + "I": 14, + "N": 54 + } + }, + { + "model": "WavLM", + "phonemes": "ajej d ɑ n ɑ t ʃhawæ ɹajm t ə ɡ owɔ i j u sajb lejm ə ɡ ɛ t", + "ref_phonemes": "aɪ du nɑt hæv taɪm tu ɡoʊ wɪð ju aɪ pleɪ ɪn krɪkʌt ", + "duration": 0.4702260494232178, + "PER": 65.78947368421053, + "score": { + "S": 14, + "D": 5, + "I": 6, + "N": 38 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ ð ʌ v ɛɪ n ʌ t i v v ɛ n h ɪ t s nowɔ h i s lowl i tdejk s ɪ ʃ ɑ k w ɔ k æɪ n d ðaw k n i it͡ʃ d d", + "ref_phonemes": "ɪn ðʌ wɪntɝ wɛn ɪt snoʊ hi sloʊli teɪks ʌ ʃɔrt wɔk ɪn ðʌ oʊpʌn ɛriʌ itʃ deɪ ", + "duration": 0.4842832088470459, + "PER": 51.724137931034484, + "score": { + "S": 13, + "D": 8, + "I": 9, + "N": 58 + } + }, + { + "model": "WavLM", + "phonemes": "ð ʌt͡ʃ ʃ u ɹ d ə n s w ɪ ð ə j u n ə ɑ m æ n d ʌ s tɹ̩ə s ɔ ɹ dejt i", + "ref_phonemes": "ðʌ studʌnts wɝ ðʌ junʌfɔrm ʌnd bɝst ðʌ skoʊld ɛriʌ ", + "duration": 0.2902028560638428, + "PER": 65.85365853658537, + "score": { + "S": 15, + "D": 7, + "I": 5, + "N": 41 + } + }, + { + "model": "WavLM", + "phonemes": "d ɔ ɡ z lajt d ɔ s i b ʊ ŋ s majt lajt s bajd s æ n d s ʌ m w ʌ n s ə b ʊ k ɑ d ɛ m lejs b ʌ z ə ə", + "ref_phonemes": "dɑɡz it boʊts maɪk laɪks baɪks ɛlsʌ wɑnts ʌ bʊk ædʌm pleɪz bæskʌtbɔl ", + "duration": 0.5105717182159424, + "PER": 62.5, + "score": { + "S": 20, + "D": 7, + "I": 8, + "N": 56 + } + }, + { + "model": "WavLM", + "phonemes": "w i ʌ ɪ n n ʌ t h i s n ow s i s owln i tejk s ɛ ʃ ɔ ɹ w ɔ k i nowə l ə vej nej t", + "ref_phonemes": "ɪn ðʌ wɪntɝ wɛn mɪkst noʊz hi sloʊli teɪks ʌ ʃɔrt wɔk ɪn ðʌ oʊpʌn ɛr itʃ deɪ ", + "duration": 0.35035085678100586, + "PER": 64.40677966101694, + "score": { + "S": 25, + "D": 12, + "I": 1, + "N": 59 + } + }, + { + "model": "WavLM", + "phonemes": "n i i sɡ i i z æd ajd ajɑ ɹ ɔ w d majə ə h i ɔ ɹ h i k æ k h", + "ref_phonemes": "neɪtʃɝ ɪz jɛs kæriɪŋ æz aʊɝ mʌðɝ it ðʌ hɑrvʌst wi teɪk hɝ ", + "duration": 0.5871403217315674, + "PER": 84.44444444444444, + "score": { + "S": 28, + "D": 10, + "I": 0, + "N": 45 + } + }, + { + "model": "WavLM", + "phonemes": "nejt h ɪ d ɪ z b ɛ ɪ ŋ æ ʌ v ɹ̩ m ʌ ðɹ̩ ɪ t ɔ l l wejz w i k l ɛ k", + "ref_phonemes": "neɪtʃɝ ɪz kɛrɪŋ æz aʊɝ mʌðɝ ɪt ɔlweɪz wik laɪk hɝ ", + "duration": 0.28220129013061523, + "PER": 46.15384615384615, + "score": { + "S": 11, + "D": 4, + "I": 3, + "N": 39 + } + }, + { + "model": "WavLM", + "phonemes": "əaj l majf æ m ə l i æ n ɪ n ð ə f j ud͡ʒʌ n sajw w ɑ n t b u mejb majf æ m l i ɡ ɹawowtb", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.4017832279205322, + "PER": 54.71698113207547, + "score": { + "S": 17, + "D": 4, + "I": 8, + "N": 53 + } + }, + { + "model": "WavLM", + "phonemes": "j j u ɪ s t ə nowɔh ə bawt majɡ awnɑ f ɔ ɛ v s ʃ i z n i ə d i n najn i k ɹ i i æ ɹ s ɔ d ɪ t ə l ɔ ŋ ɪ ɹ", + "ref_phonemes": "ju wɪʃ tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛr hi ɪz nɪrli naɪntɪfri jɪrz oʊld wɪð ʌ lɔŋ bɪrd ", + "duration": 0.5518200397491455, + "PER": 60.86956521739131, + "score": { + "S": 30, + "D": 10, + "I": 2, + "N": 69 + } + }, + { + "model": "WavLM", + "phonemes": "ajd ɑ n t hawæm tajɪ n t ə w ɪ l i j u aj m z p lejɪ ŋ ɪ k ɪ t", + "ref_phonemes": "aɪ doʊnt hæv taɪm tu ɡoʊ wɪð ju aɪ æm pleɪɪŋ krɪkʌt ", + "duration": 0.392162561416626, + "PER": 52.5, + "score": { + "S": 9, + "D": 7, + "I": 5, + "N": 40 + } + }, + { + "model": "WavLM", + "phonemes": "j u v ɪ ʃ d u n ɑ ɔ l ə bow t majɡ ɹawn n d v ʌ tð æ ɹt v hð ə z ð ə ɛæ b ɛ nej ɡ d ɪ d ð i ɛ s ʊ ɹ ɪ ð ɛ ɹ l ɔ m b ɑ ɹ d", + "ref_phonemes": "ju wɪʃ tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛl hi ɪz nɪr baɪ naɪntɪfri jɪrz oʊld wɪð ʌ lɔŋ vɝtwoʊ ", + "duration": 0.4680922031402588, + "PER": 69.44444444444444, + "score": { + "S": 36, + "D": 9, + "I": 5, + "N": 72 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ ɪ s u n ɔ l i w ɑ ɹ w majd æ f ɔ ɹ ð əʌ v ɛ l i h z nowhow n ɪ ɹ i i najdt t i θ ɹ i j ɪ s w ɔ ɹ æ d b ɪ f j ə l ɑ ɹ ɪ ɹ", + "ref_phonemes": "ju just tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛl hi ɪz nɪrli naɪntɪfri jɪrz oʊld wɪð ʌ lɔŋ bɪrd ", + "duration": 0.6214485168457031, + "PER": 75.71428571428571, + "score": { + "S": 33, + "D": 11, + "I": 9, + "N": 70 + } + }, + { + "model": "WavLM", + "phonemes": "h ʌ n dej najejdt ɪ najæ n naj n d iejt n tæ n d ɪ s ɹ n tæ s ə k s mnajt ɪ fajn najt n d dt ɪ f ɹ naj æ n d s ɹ ɪ n æ i t n d w ʌ n najt t i t ɪ n æ n iejt iɪ s ɛ v ə ej d t i s ə k sejd i ɪ s ə k s ejd ɪ fajd d ɪ f ɔ ɹd d ɪ iɪ ə t i t n i d", + "ref_phonemes": "wʌn hʌndrʌd naɪntaɪnti naɪntaɪt naɪntɪvsɪn naɪntɪkis naɪntɪfaɪtɝ naɪntwɪfɝ naɪntɪfri niɪntutioʊ naɪnʃeɪn naɪnti eɪtinaɪn eɪtɪɡstʌn aɪtiksɪs eɪti aɪtiksɪs eɪtaɪvɪf eɪtifʊr eɪtritɛr eɪtitwɑtoʊ eɪtiʌn eɪti ", + "duration": 0.9346067905426025, + "PER": 69.44444444444444, + "score": { + "S": 63, + "D": 48, + "I": 14, + "N": 180 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ n n ʌ ə n dð l w ɛ n ɪə s n ə l z h ɪ s lown i sejf ʃ ʃ ɑ ktk ɪ n ð ə owp p ɛ n ɪ ɹ i ej", + "ref_phonemes": "ɪn ðʌ wɪntɝ wɛn ɪt snoʊz hi sloʊli teɪks ʌ ʃɔrt wɔk ɪn ðʌ oʊpʌn ɛr itʃ deɪ ", + "duration": 0.47679996490478516, + "PER": 54.385964912280706, + "score": { + "S": 22, + "D": 7, + "I": 2, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "j j u w ɪ ʃ d u now ɔ l ɛ v majkɡk awn d f ɔ ɹ ð ð ɹ wv ɛ l z m ɪ j æ d ɪ d d ɪ ɹ s ɔ ɹl v ɪ l ɔ ɛ ɹ", + "ref_phonemes": "ju wɪʃ tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛl hi ɪz mɪrli naɪntɪfri jɪrz oʊld wɪð ʌ lɔŋ bɪrd ", + "duration": 0.5756106376647949, + "PER": 66.66666666666666, + "score": { + "S": 21, + "D": 19, + "I": 6, + "N": 69 + } + }, + { + "model": "WavLM", + "phonemes": "d d æ ʃ m ɛ m b ʌ t ʌ v ð ə sf æ m ə l i ɪ z majɡ ɹ æ f ɑ ð ə æ n d ʌ ŋ ɪ ʃ m ɛ m b ʌ t vf ajf f æ m l i ɪ z majɡ ɪ v i b ð", + "ref_phonemes": "ðʌ oʊldʌst mɛmbɝ ʌv ðʌ fæmʌli ɪz maɪ ɡrændfɑðɝ ʌnd ðʌ jʌŋɡʌst mɛmbɝ ʌv maɪ fæmʌli ɪz maɪ beɪbi brʌðɝ ", + "duration": 0.5663242340087891, + "PER": 48.148148148148145, + "score": { + "S": 17, + "D": 18, + "I": 4, + "N": 81 + } + }, + { + "model": "WavLM", + "phonemes": "d ɔ ɡ z t t bw ɔ n s majtk lajk s baj s æ sowɑ n s ə b əʊ k æ t æ m l ɪ z b ʌ s k ə b ə ɹ", + "ref_phonemes": "dɑɡz it boʊnz maɪk laɪks baɪts ɛlsʌ wɑnts ʌ bʊk ʌnd aɪm pleɪst ɪn bæskʌtbɔl ", + "duration": 0.39778685569763184, + "PER": 52.459016393442624, + "score": { + "S": 19, + "D": 11, + "I": 2, + "N": 61 + } + }, + { + "model": "WavLM", + "phonemes": "ajow majf æ m ə ɹ ɪi ɑ n i d ə f j ut͡ʃɹ̩ aj ɑ n t ɪ l mejk majf æ m ə ɪ ɹowl", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.43369221687316895, + "PER": 58.490566037735846, + "score": { + "S": 20, + "D": 7, + "I": 4, + "N": 53 + } + }, + { + "model": "WavLM", + "phonemes": "ð j i ʃ t u n owɑ aw ə ə majk ɡə n æ n ʌə b ʌz i h i i i z i æ n æ n ə i i ʌ hoj ə æ h ɪ d l ɪ ŋn z s h ə ɪ i ajz ɛæ v h ɪ d z ɛ s hɪ m s ʌz ɪ ŋn i æ n ɔ d t f ɹ ɔ ɔ ɹ j w ʌ ɪ s ɛ v td bajʌ t æ ɪ ɪ ŋ ə ɔ ɔ ŋ b ɪ ɪ ŋ z t ə ɪ sz ʃ ɪ ŋn j ɪ v ɪ ŋ ð l ə z h ɪ m i ɛ ʌ n ɑ ŋ ɹ̩ f i l ɪ ŋ m ɔs d ʌ b ɛ ə b æ h ɪ b ɪ h ɪ zs ɪ z d ʌz b i d͡ʒ ɛ ɹnawajæ kɹ̩ d ɹ b ɪ ɪ ɛ ə ɛ", + "ref_phonemes": "ju wɪʃ tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛl hi ɪz nɪrli naɪntɪfri jɪrz oʊld jɛt hi stɪl θɪŋks æz kwɪkli æz ɛvɝ hi drɛsʌz hɪmsɛlf ɪn æn oʊld lædprɑp pɔrt juʒʌwʌli sɛvrʌl bʌtʌnz mɪsɪŋ ʌlɔŋ bridz lɪŋks tu hɪz tʃɪn ɡɪvɪŋ ðoʊz hu ʌbzɝv hɪm ʌ prʌnaʊnst filɪŋ ʌv ", + "duration": 3.091754674911499, + "PER": 83.74384236453201, + "score": { + "S": 78, + "D": 47, + "I": 45, + "N": 203 + } + }, + { + "model": "WavLM", + "phonemes": "nej æ i s ɡej ɪ ɪ ŋ ə ðowð m ʌ ð æɛ d ɪ t s ɔ ɔ w d s w i lajk k ʊ d", + "ref_phonemes": "neɪtʃɝ ɪz skeɪtɪŋ æz aʊɝ mʌðɝ ɪts ɔlweɪz swit laɪk hɝ ", + "duration": 0.4073517322540283, + "PER": 60.46511627906976, + "score": { + "S": 15, + "D": 7, + "I": 4, + "N": 43 + } + }, + { + "model": "WavLM", + "phonemes": "h n ɹej i najt d i najn najt i ej nd i s ɛ v ə n najnd i s ɪ k s n t i fajf najn i ɔ ɹ n i æ n i d u majn i ʌ majn i ejt i najn ejt i ej tej ejt i s ɛ v ə ejt i s ɪ k s ejt i faj t i f ɔ ɹ ejt i ɪ kejt i d ɔ ej t ej w ʌ n ejt s", + "ref_phonemes": "wʌn hʌndrʌd naɪntaɪnti naɪntaɪt naɪntɪvsɪn naɪntɪkis naɪntɪfaɪtɝ naɪntwɪfɝ naɪntɪfri niɪntutioʊ naɪnʃeɪn naɪnti eɪtinaɪn aɪtit eɪtɪɡstʌn aɪtiksɪs eɪtaɪvɪf eɪtifʊr eɪtritɛr eɪtitwɑtoʊ eɪtiʌn eɪti ", + "duration": 1.035064935684204, + "PER": 63.58381502890174, + "score": { + "S": 63, + "D": 39, + "I": 8, + "N": 173 + } + }, + { + "model": "WavLM", + "phonemes": "n æd͡ʒaj i ɪ z æ s ɡ ɛ d ɪ ŋ ə æ s ɹ̩ m ɑ i t t ɔ ɹl ɛ s s i t lajk ʌ t", + "ref_phonemes": "neɪtʃɝ ɪz jɛs kɛrɪŋ æz aʊɝ mʌðɝ ɪt ɔlweɪz swit laɪk hɝ ", + "duration": 0.5525984764099121, + "PER": 67.44186046511628, + "score": { + "S": 19, + "D": 6, + "I": 4, + "N": 43 + } + }, + { + "model": "WavLM", + "phonemes": "d ɔɑ ɡ t h i i b ɔ ɹ n ə mɹejk æ t mejk lejk s bejk i i ʌ s ɔ ɹ z ə b ʊ k ʊ æ ɹ d ɑ ŋn z k z b ɑ s k ə b ə l", + "ref_phonemes": "dɑrkbit boʊn mɪk laɪts baɪkɝ ɛlsʌ wɑnts bʊk jæ ðæts pleɪst bæskʌtbɔl ", + "duration": 0.5028743743896484, + "PER": 80.7017543859649, + "score": { + "S": 31, + "D": 5, + "I": 10, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "mejtk ɪ ɪ z ejd ɪ ŋ æ z s ʌɹ̩ vɹ̩ ɹ̩ m ʌ ðɹ̩ t ɔ l vejz b i k lajk h", + "ref_phonemes": "neɪtʃɝ ɪz kɛrɪŋ æz aʊɝ mʌðɝ ɪt ɔlweɪz swit laɪk hɝ ", + "duration": 0.4122006893157959, + "PER": 62.5, + "score": { + "S": 17, + "D": 2, + "I": 6, + "N": 40 + } + }, + { + "model": "WavLM", + "phonemes": "ajd l m ajf aj m m i mejæ ɹ ɪ ɪ n d j u f j u ld͡ʒajs ɔ ɹ n t u l m ejk æ m i ɹawt", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.5023007392883301, + "PER": 73.58490566037736, + "score": { + "S": 19, + "D": 11, + "I": 9, + "N": 53 + } + }, + { + "model": "WavLM", + "phonemes": "ajd d ow ɑ n t h æ v t ɹajm t ə ɡowð ɪ t j u z ʌ v θ æ k ə k ɛɪ t", + "ref_phonemes": "aɪ doʊnt hæv taɪm tu ɡoʊ wɪð ju aɪm pleɪɪŋ krɪkʌt ", + "duration": 0.303286075592041, + "PER": 56.41025641025641, + "score": { + "S": 13, + "D": 5, + "I": 4, + "N": 39 + } + }, + { + "model": "WavLM", + "phonemes": "b nej z v ɛ ɛ d i ð æ k ajk n d f ʊ l ɔ l majf ɛ v ɹ̩ ɹ ɪ n k ə l ə", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlaʊr ", + "duration": 0.40375375747680664, + "PER": 62.0, + "score": { + "S": 17, + "D": 13, + "I": 1, + "N": 50 + } + }, + { + "model": "WavLM", + "phonemes": "ajd u n ɑ t hawmʌ tejm d u wowəow i ð uajʌ m ɪ ŋ ɪ ɛ", + "ref_phonemes": "aɪ du nɑt hæv taɪm tu ɡoʊ wɪð ju aɪ æm pleɪɪŋ krɪkʌt ", + "duration": 0.35584378242492676, + "PER": 62.5, + "score": { + "S": 12, + "D": 9, + "I": 4, + "N": 40 + } + }, + { + "model": "WavLM", + "phonemes": "ɹejk æ j u z æ z f ɹ u s m ʌd͡ʒ d ʌ b ə l z æ n d d ɹ ɛ nt͡ʃɪ d u i t", + "ref_phonemes": "meɪk ʌ jus æz fruts vɛdʒtʌbʌlz ʌnd ɡreɪnz tu it ", + "duration": 0.3576474189758301, + "PER": 55.26315789473685, + "score": { + "S": 13, + "D": 3, + "I": 5, + "N": 38 + } + }, + { + "model": "WavLM", + "phonemes": "mejd æ j u ʌ s w u l θ s v ɪ ɛ vɹ̩ə s æ n d ɹ̩æ n s tə i", + "ref_phonemes": "leɪtɝ ɡɪvz ʌs fud wɪð teɪbʌlz ʌnd dreɪnz tu it ", + "duration": 0.28408193588256836, + "PER": 75.67567567567568, + "score": { + "S": 24, + "D": 4, + "I": 0, + "N": 37 + } + }, + { + "model": "WavLM", + "phonemes": "ðowb ɛ t m ɑ m ʌ t v ð ə v æ m m i z majɡ æ n f ɑ ð ə æ n d daj ʃ t m ɑ m tɹ̩ə l bð ʌ majɡ i i z majɡ d b i æ ðɹ̩", + "ref_phonemes": "ðʌ oʊldʌst mɛmbɝ ʌv ðʌ fæmʌli ɪz maɪ ɡrændfɑðɝ ʌnd ðʌ jʌŋɡʌst mɛmbɝ ʌv maɪ fæmʌli ɪz maɪ vɛri brʌðɝ ", + "duration": 0.6942565441131592, + "PER": 61.25000000000001, + "score": { + "S": 34, + "D": 14, + "I": 1, + "N": 80 + } + }, + { + "model": "WavLM", + "phonemes": "h n m ɛ nejd i najn nejdtd d iej ej najd ɪ s ə nejt i s ɪ k n ɪd i fajt ejd i f ɔ ɹ nejt i θ nejt i t u ɹ nejd i ʌ n nejd i ejiejt i nejn dejdt iejæ ejt ɪ s ɛ v n dej t i s ɪ k s ejt k i fajd ɪ f ɔ ɹ ej i θsɹ ɪ iejt i t u t i ʌ nejt i", + "ref_phonemes": "wʌn hʌndrʌd naɪntaɪnti naɪntaɪt naɪntɪvsɪn naɪntɪkis naɪntɪfaɪtɝ naɪntwɪfɝ naɪntɪfri niɪntutioʊ naɪnʃeɪn naɪnti eɪtinaɪn aɪtit eɪtɪɡstʌn aɪtiksɪs eɪtaɪvɪf eɪtifʊr eɪtritɛr eɪtitwɑtoʊ eɪtiʌn eɪti ", + "duration": 0.9913361072540283, + "PER": 69.36416184971098, + "score": { + "S": 86, + "D": 27, + "I": 7, + "N": 173 + } + }, + { + "model": "WavLM", + "phonemes": "w i ʃ ʊə d d ɪ k s p ɛ k ɛ n d l ə l l ɔ n m ɛ m bɹ̩əs s ɔ f ʌ f ð ə f æ m i i", + "ref_phonemes": "wi ʃʊd ɪkspɛkt ʌnd ʌlaʊ ɔl mɛmbɝz ʌv ðʌ fæmʌli ", + "duration": 0.4124128818511963, + "PER": 54.054054054054056, + "score": { + "S": 9, + "D": 3, + "I": 8, + "N": 37 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ n ð ə v ɪ ŋ dowʌ v æ n d ɪ k s now ɪ s lowl i ɪ k s i ʃ ɑ ɹ k v ɔ l k ɪ n ɛ l p æ n ɛ ɹ it͡ʃjv i dej", + "ref_phonemes": "ɪn ðʌ wɪndoʊ wɛn ɪts noʊz hi sloʊli teɪks ʌ ʃɔrt wɔk ɪn ðʌ oʊpʌn ɛr itʃ deɪ ", + "duration": 0.3879508972167969, + "PER": 56.896551724137936, + "score": { + "S": 18, + "D": 7, + "I": 8, + "N": 58 + } + }, + { + "model": "WavLM", + "phonemes": "mejtej ə ɪ z æ s kejt ɪ ŋ ɡ ʌ v d m ʌ dðɹ̩d i z i t ɑ ɛ s i k l ɛ k", + "ref_phonemes": "neɪtʃɝ ɪz æz kɛrɪŋ æz aʊɝ mʌðɝ ɪz ɪts ɔlweɪz swit laɪk ", + "duration": 0.34732484817504883, + "PER": 72.09302325581395, + "score": { + "S": 18, + "D": 8, + "I": 5, + "N": 43 + } + }, + { + "model": "WavLM", + "phonemes": "ð ʌ n i i ð ɪ s w ɪ i ə ɹajd ə ʌ ʌ n dɹ̩ ʊ l i m ɔ f majndt ɪ fvawæ vɹ̩ ə ɪ ŋ ə l", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlɝ ", + "duration": 0.48615312576293945, + "PER": 81.25, + "score": { + "S": 28, + "D": 5, + "I": 6, + "N": 48 + } + }, + { + "model": "WavLM", + "phonemes": "m ɑ ɹ m n dajdɹ̩ æ ɛ dʌ ð ə b ʌ s tejʃ ə n əl i w ʌ t ɹejktt͡ʃ daw n ɪ n ð ə b ʌ s k ej", + "ref_phonemes": "mɑm ʌnd dæd ɝaɪvd æt ðʌ bʌs steɪʃʌn ɝli bʌt weɪtʌd ʌntɪl ðʌ bʌs keɪm ", + "duration": 0.4270615577697754, + "PER": 53.70370370370371, + "score": { + "S": 19, + "D": 5, + "I": 5, + "N": 54 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə ɑ ɹ ʃ i d b n n z majk lejæ bejs z æ n sowɑ n ʃ i b u t bsajt ə m p l ɪ s b ʌ s ə d b ɑ k", + "ref_phonemes": "ðʌ ɔfʃid boʊnz mɪk laɪks baɪts ɛlsʌ wɑnts ʌ bʊk ædʌm pleɪz bæskʌtbɔl ", + "duration": 0.38758277893066406, + "PER": 64.28571428571429, + "score": { + "S": 27, + "D": 5, + "I": 4, + "N": 56 + } + }, + { + "model": "WavLM", + "phonemes": "ɔ ɑ ɹn i i najn i ej t ɪ n s æ ɪ n z ɪ ʃ d ɪ n ɪ f ɪ f ɔ ɹ d ɪ daj ʌ d ɪ n l ow n æ v ə n d æ n najn t s æ v vajəm ɔ ɹ d ʊu ɹ laj ʌ", + "ref_phonemes": "twɛnti naɪntin eɪtin sɛvʌntin fɪftin fɪftin fɔrtin θɝtin twɛlv ɪlɛvʌn tɛn naɪn eɪt sɛvʌn sɪks faɪv fɔr θri tu wʌn ", + "duration": 0.8868029117584229, + "PER": 69.14893617021278, + "score": { + "S": 42, + "D": 21, + "I": 2, + "N": 94 + } + }, + { + "model": "WavLM", + "phonemes": "ð i i ʊ d ɡ ɛ θ æ k ajm nawɹ̩ ɔ m ə m ɹ̩zʃ ʌ m", + "ref_phonemes": "wi ʃʊd rɪspɛkt ʌnd naʊ aɪ rɪmɛmbɝ soʊ mʌtʃ taɪm ", + "duration": 0.3870868682861328, + "PER": 73.68421052631578, + "score": { + "S": 18, + "D": 10, + "I": 0, + "N": 38 + } + }, + { + "model": "WavLM", + "phonemes": "i z j ʊ ɹ æ z pejk æ law ɔ l m ɛ m bɹ̩z ʌ v ð ə f æ m l i i", + "ref_phonemes": "wi ʃʊd rɪspɛkt ʌnd ʌlaʊ ɔl mɛmbɝz ʌv ðʌ fæmʌli ", + "duration": 0.3552117347717285, + "PER": 54.054054054054056, + "score": { + "S": 9, + "D": 7, + "I": 4, + "N": 37 + } + }, + { + "model": "WavLM", + "phonemes": "d ɔɑ s i i d b ow z m ɪ d l ajk bajæ s ə zs ɔ n zs ɛ b ʊ l k ə d ɑ ə m b ejk b ʌ s k ə t b ɑ", + "ref_phonemes": "dɑɡz it boʊnz mɪlk laɪks baɪts ɛls wʌns ʌ bʊk ʌnd ʌ pleɪs bæskʌt boʊnz ", + "duration": 0.6740868091583252, + "PER": 58.92857142857143, + "score": { + "S": 21, + "D": 8, + "I": 4, + "N": 56 + } + }, + { + "model": "WavLM", + "phonemes": "ɹ i s k u d ɛ n s v ɛ d i ɛ n ə f ɑ ɹ m m æ n d ɡowz t ə s k l ej", + "ref_phonemes": "ðʌ studʌnts wɛr ðʌ junʌfɔrm ʌnd ɡoʊz tu skul deɪli ", + "duration": 0.3390967845916748, + "PER": 56.09756097560976, + "score": { + "S": 15, + "D": 7, + "I": 1, + "N": 41 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə nej ɑ ʌ d ɪ z ð ɛ i ʌ ɹ æ k t ɪ v æ n d f ʊ l ʌ v majf ɪ vɹ̩ ə n k ɪ ŋ k ʌ lɹ̩", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlɝ ", + "duration": 0.33075952529907227, + "PER": 43.75, + "score": { + "S": 17, + "D": 3, + "I": 1, + "N": 48 + } + }, + { + "model": "WavLM", + "phonemes": "ajd u n k ɹaj u n ɑ t k t kawæ ɹajɪ n u ɡ ɑ i k j uaj m lejɪm d ə kejt", + "ref_phonemes": "aɪ du nɑt hæv taɪm tu ɡoʊ wɪð ju aɪ æm pleɪɪŋ krɪkʌt ", + "duration": 0.44565320014953613, + "PER": 80.0, + "score": { + "S": 13, + "D": 7, + "I": 12, + "N": 40 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɛ nej t͡ʃ d it͡ʃ v əɛ i æ k æ k u ʌ n u l ɑ f majb ə ə ɪ n k ʌ lɹ̩", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlɝ ", + "duration": 0.32349324226379395, + "PER": 68.75, + "score": { + "S": 16, + "D": 12, + "I": 5, + "N": 48 + } + }, + { + "model": "WavLM", + "phonemes": "ajd n hawmɪ d u d ɑ n hawɛ æm u ɡow ɪ ŋ j u ajə m p lejɪ ŋ ɡæ n ɡ ɛ t", + "ref_phonemes": "aɪ dɪdʌnt hæv taɪm tu ɡoʊ wɪð ju aɪ æm pleɪɪŋ krɪkʌt ", + "duration": 0.34804415702819824, + "PER": 63.41463414634146, + "score": { + "S": 15, + "D": 4, + "I": 7, + "N": 41 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ n ð ə v ɪ n d ʌ d ɹ̩ n iə s nows s i s ɹowl i dejæ i ʃ ʃ ɑ ɹ k w ɔ k ɪ n ð ʌ v ə l ejæ nejt z", + "ref_phonemes": "ɪn ðʌ wɪntɝ wɛn ɪt snoʊz ɪt sloʊli teɪks ʌ ʃɔrt wɔk ɪn ðʌ oʊpʌn ɛr itʃ deɪ ", + "duration": 0.4472849369049072, + "PER": 63.1578947368421, + "score": { + "S": 29, + "D": 4, + "I": 3, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "ɑ d ɑ n t h n ɹajm ɹ̩w ɪ l ɪ j u æ m p l æ ŋ k ə", + "ref_phonemes": "aɪ doʊnt hæv taɪm tu ɡoʊ wɪð ju aɪ æm pleɪɪŋ krɪkʌt ", + "duration": 0.2732377052307129, + "PER": 62.5, + "score": { + "S": 12, + "D": 13, + "I": 0, + "N": 40 + } + }, + { + "model": "WavLM", + "phonemes": "j iu w ɪ ʃ t u nowm ɔ l ə bowɑ majk ð æ n f ɔ dowð b ɛæ l ɪ z ð ɪ ɹ i najtn i ð ɹ i j ɪ ɹ s fowɔ l ð ɛə l ɔ ŋ b i ɑ ɹ", + "ref_phonemes": "ju wɪʃ tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛl hi ɪz nɪrli naɪntɪfri jɪrz oʊld wɪð ʌ lɔŋ bɪrd ", + "duration": 0.5228080749511719, + "PER": 59.42028985507246, + "score": { + "S": 26, + "D": 7, + "I": 8, + "N": 69 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə s t u d ə n s ɛ d d u n f ɔ m æ n d owɑ s tɹ̩ə s k u ɡɹejt", + "ref_phonemes": "ðʌ studʌnts wɛr ðʌ junʌfɔrm ʌnd ɡoʊz tu skul deɪ ", + "duration": 0.3008744716644287, + "PER": 56.41025641025641, + "score": { + "S": 11, + "D": 7, + "I": 4, + "N": 39 + } + }, + { + "model": "WavLM", + "phonemes": "ə n d itd d najn d ɪ najn nej æ d i owə nejn i s ʌ nd æɪ s ɪ k s n næ n ɪ fajn n ejd d ɪ f n d ɪ ɹ ɪ nejd n d i d ɹ nejd d w ʌ n ejd d i iej d ɪ nejt n it iej d s ɛ ə ɹ d s ɪ k ejt ɪ fajnd d ɪ f ɔ ow ə d sɹ i d d u ejt ɪ vaj n d", + "ref_phonemes": "wʌn hʌndrʌd naɪntaɪnti naɪntaɪt naɪntɪvsɪn naɪntɪvsɪn naɪntɪfaɪtɝ naɪntwɪfɝ naɪntɪfri niɪntutioʊ naɪnʃeɪn naɪnti eɪtinaɪn aɪtit eɪtɪɡstʌn aɪtiksɪs eɪtaɪvɪf eɪtifʊr eɪtritɛr eɪtitwɑtoʊ eɪtiʌn eɪti ", + "duration": 0.8680956363677979, + "PER": 72.98850574712644, + "score": { + "S": 85, + "D": 38, + "I": 4, + "N": 174 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə nej i z b ɪ æ æ k b i n ɔ f mejt f ɛ vɹ̩dv b i ɪ ŋ ɡ ʌ", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlɝ ", + "duration": 0.42542386054992676, + "PER": 77.08333333333334, + "score": { + "S": 21, + "D": 15, + "I": 1, + "N": 48 + } + }, + { + "model": "WavLM", + "phonemes": "h n nejɛ i nejd i najn nejt iejt najt i sz ɛ v ə n najt i s ɪ k s najejt faj najt f ɔ ɹ ow nejt i ej d najejtd i d u ɹ nejt i v ʌ n nejt t i t i najd t t iejt ejt i z ɛ l ə n t i z ɪ k s sejt t i fajd ej t i f ɔ ɹ ɪ i t i d u l ejd i n d i", + "ref_phonemes": "wʌn hʌndrʌd naɪntaɪnti naɪntaɪt naɪntɪvsɪn naɪntɪkis naɪntɪfaɪtɝ naɪntwɪfɝ naɪntɪfri niɪntutioʊ naɪnʃeɪn naɪntaɪnti aɪtit eɪtɪɡstʌn aɪtiksɪs eɪtaɪvɪf eɪtifʊr eɪtritɛr eɪtitwɑtoʊ eɪtiʌn eɪti ", + "duration": 1.0899105072021484, + "PER": 71.59763313609467, + "score": { + "S": 71, + "D": 33, + "I": 17, + "N": 169 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ k i bw ɑ n szs s s mejk lejk s bejk i ʃ s vawajɑ n t ə b ʊ s ɑ d ʌ m dejk b ʌ s k ə t b ɔɑ ɹ", + "ref_phonemes": "dɑrk ʃit bɑndz meɪk laɪk baɪks ɪsisɛlʌ ɔr væŋk ʌ bʊk ædʌm pleɪz bæskʌtbɔl ", + "duration": 0.6476852893829346, + "PER": 63.33333333333333, + "score": { + "S": 25, + "D": 7, + "I": 6, + "N": 60 + } + }, + { + "model": "WavLM", + "phonemes": "ajl ʌ l majfə f æ m ə l i æ n d d d ʌ v j ut͡ʃ majw ɔ ɹ v ɪ l m mejæ majf æ m l i k ʌɹaw", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.45063090324401855, + "PER": 54.71698113207547, + "score": { + "S": 21, + "D": 3, + "I": 5, + "N": 53 + } + }, + { + "model": "WavLM", + "phonemes": "n i ɪ d i s ɛ d ɪ ŋ æ ɔ t m ə i ɔ v ə s l i k l k h", + "ref_phonemes": "mitʃɛru skwɛrɪŋ æz aʊɝ mʌðɝ ɪts ɔlweɪz swit laɪk hɝ ", + "duration": 0.28409361839294434, + "PER": 69.04761904761905, + "score": { + "S": 13, + "D": 16, + "I": 0, + "N": 42 + } + }, + { + "model": "WavLM", + "phonemes": "d n æ ʃ ɪ ɪ z v ɛ i æ k ɹ æ k t u ə n d f u l ʌ f majf ɛ ɹ ɡ ɹ i n k ʌ l", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlɝ ", + "duration": 0.3346078395843506, + "PER": 50.0, + "score": { + "S": 14, + "D": 10, + "I": 0, + "N": 48 + } + }, + { + "model": "WavLM", + "phonemes": "n u v i ʃ u n nowm ɔ ə ɔ ɹ majɡ ɹ n d ɑ ð ə v ɛ l ɪ najn ə d wɹ̩ ɹl ɛ i t ɪ ŋ æ s v iɪ f t z t ɪ ð ʌ s ɛ s ɪ n s ɛ ɪ ŋn ɛ ɔ ɹ ɹ ɹ ɑ p æ k ɹ ɑ ɔ ɹ ʊ i z w oj i s towɔ z bʌ tawə n m ɪ z s ɪ ŋ ɛ l ɔ ŋ b ɑ i ɪ ŋ z u h ɪ z t ɪ ŋ ɡ ɪ v ɪ ŋ ɡ ɪ v ɪ ŋ dðowɔ z ʊ ə i ŋm ɪ m i n ɹ ʌ n ɔ m d ɔ ɪ ŋ ʌ ð ʌ ɹ m ɔ ʃ t s p ɛ v ɛ n n n ə h i z i h i z w ɔ i z d ʃ ɛ bajd t ɹ æ k ʃ ə n dɹ̩ w ɔ tow z ɛ bajk t", + "ref_phonemes": "ju wɪʃ tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ waɪl hi ɪz nɪrli naɪntɪfri jɪrz oʊld ðæt hi stɪl θɪŋks æz fɪfti æz ɛvɝ hi dæsʌz hɪmsɛlf ɪn ʌ oʊld blæk rɑk ɡɑt ɡʊd vɪʒwʌli hi sɑroʊz bʌtʌnz mɪsɪŋ ʌ lɔŋbrɛd θɪŋz tu hɪz tʃɪn ɡɪvɪŋ ðoʊz hu ʌbzɝv hɪm hɪm hɪm hi meɪ prʌnaʊns jɔr filɪŋ ʌv ðʌ ", + "duration": 3.1034789085388184, + "PER": 83.79629629629629, + "score": { + "S": 87, + "D": 48, + "I": 46, + "N": 216 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɛ t ʌ s u d æ n s v ɛ vajæə u n əi f ɔ m æ ŋ i w ɑ s t u s ɹɹ̩ dejl i", + "ref_phonemes": "ðʌ studʌnts wɝ ðʌ junʌfɔrm ʌnd ɡoʊz tu skul deɪli ", + "duration": 0.4150547981262207, + "PER": 62.5, + "score": { + "S": 16, + "D": 4, + "I": 5, + "N": 40 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ n ð ə v ɪ n d ɛ v ə n əd͡ʒ n ows i s owl i pdejt p s ɛ ʃ ɑ k w ɔ k ɪ n ð əowl pejɛ n n ejt d", + "ref_phonemes": "ɪn ðʌ wɪntɝ wɛn ɪt snoʊ ʃi sloʊli teɪks ʌ ʃɔrt wɔk ɪn ðʌ oʊpʌn ɛr itʃ deɪ ", + "duration": 0.3846127986907959, + "PER": 62.5, + "score": { + "S": 24, + "D": 5, + "I": 6, + "N": 56 + } + }, + { + "model": "WavLM", + "phonemes": "ə lawt͡ʃ l majf æ m ə n i d æ n d ɪ n ð ə t iʌ t ajw ɑ n t b u mejk majf æ m l i awt", + "ref_phonemes": "ʌlaʊ maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.3682541847229004, + "PER": 50.0, + "score": { + "S": 16, + "D": 5, + "I": 5, + "N": 52 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɔ ɹ ɛ ʃ m ə m m ʌ t ə l ə f æ ə l i i z mejk d æ f ɔ ɹ ð ə æ n d ð ɡ ɪ ʃ m əɛ m ʌ t ə majejk f æ m ə l i ɡ i i z majɡ b æ v i ʌ ð", + "ref_phonemes": "ðʌ oʊldʌst mɛmbɝ ʌv ðʌ fæmʌli ɪz maɪ ɡrændfɑðɝ ʌnd ðʌ ɪŋɡlɪʃ mɛmbɝ ʌv maɪ fæmʌli ɪz maɪ beɪbi brʌðɝ ", + "duration": 0.6738722324371338, + "PER": 66.25, + "score": { + "S": 31, + "D": 15, + "I": 7, + "N": 80 + } + }, + { + "model": "WavLM", + "phonemes": "ð ʌ n i ɪ s ə h i z v ɛ i æ k t æ k t ɑ n æ n f u l l ɔ f ajn f ɛ v ɹ ɛ d k ɹ ɪ ŋ ə", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlaʊr ", + "duration": 0.5561819076538086, + "PER": 66.0, + "score": { + "S": 22, + "D": 9, + "I": 2, + "N": 50 + } + }, + { + "model": "WavLM", + "phonemes": "ð s t ɹ u d æ n ɹ ɛ daji f ɔ m æ n d ɡ ow ɑ s t ɪ s ʊ l dejt i", + "ref_phonemes": "ðʌ studʌnt wɪð ðʌ junʌfɔrm ʌnd ɡoʊz tu skul daɪʌlɪŋ ", + "duration": 0.35492420196533203, + "PER": 61.904761904761905, + "score": { + "S": 15, + "D": 9, + "I": 2, + "N": 42 + } + }, + { + "model": "WavLM", + "phonemes": "b ajs s i t eji i ejə s ɪ w ʊ l i æ n d v s ə h s m ɑ t ʌ v ɹ̩ ə ə s ɛ ɪ n ð ə v ɪ ŋn t sz s i v ɪ n dt əz v ɛ n ð s now ɔ ɔ t t ajs ɹl vɹ̩ n d h i s loj i tejsk s ɛ s ɔ w ɑ l n ð tow p æ n d ð ow ow n d d͡ʒə d w ɔ n i hawɹ̩k ɔ f t n ʌ ɪ h ɪ mn ə w w ɔ m ɔ ɹ taw æ n d ə s m k l ʌ t i ɑ n sɹ̩ z s b ʌ nɹ̩ɑ nɹ̩ i s aj æ n ð ə lajk s i b ɔ ɹ t t ɹ̩ n ɪ n ɪ l æ ŋ ɡv", + "ref_phonemes": "twaɪs itʃ deɪ hi pleɪz skɪfli ʌnd wɪð dʒʌst ʌpɑn ʌ smɔl ɔrɡʌn ɪksɛpt ɪn ðʌ wɪntɝ wɪntɝ wɛn ðʌ snoʊ ɔr aɪs prɪvɛnts hi sloʊli teɪks ʌ ʃɔrt wɔk ɪn ðʌ oʊpʌn ɪn ðʌ oʊpʌn ɛr itʃ deɪ wʌt wi hæv ɔfʌn ɝdʒ hɪm tu wɔk mɔr ʌnd smoʊk lɛs bʌt hi ɔl ", + "duration": 2.5446369647979736, + "PER": 86.81318681318682, + "score": { + "S": 68, + "D": 32, + "I": 58, + "N": 182 + } + }, + { + "model": "WavLM", + "phonemes": "ð æ ʃ m ɛ m æ tow ʌ ð ʌ v m i mejɡ æ d ɔ l ðow æ ŋ d dð æ ŋ ɡ s ʃ m ʌ m bɹ̩ʌ t ə majɡ v æ n i m ʌb b b i b t ð ow", + "ref_phonemes": "ðʌ oʊldʌst mɛmbɝ ʌv ðʌ fæmʌli ɪz maɪ ɡrændfɑðɝ ʌnd ðʌ jʌŋɡʌst mɛmbɝ ʌv maɪ fæmʌli ɪz maɪ beɪbi brʌðɝ ", + "duration": 0.5820846557617188, + "PER": 69.1358024691358, + "score": { + "S": 28, + "D": 22, + "I": 6, + "N": 81 + } + }, + { + "model": "WavLM", + "phonemes": "b i t ə l mej k lejk bejk z æ z ɛ l ɔ ŋ t ə ɪ ajz ð ɛ m ɪ z b ʌ s k d b", + "ref_phonemes": "dɑɡz it boʊnz meɪk lɛɡz baɪt ɛlsʌ wɑnts ʌ bʊk ʌðɝ pleɪs bæskʌtbɔl ", + "duration": 0.3970198631286621, + "PER": 73.58490566037736, + "score": { + "S": 27, + "D": 12, + "I": 0, + "N": 53 + } + }, + { + "model": "WavLM", + "phonemes": "k n d ɑ d ɪi ðdawæ z æ d ɪ ɪ ŋ d æ z j ɔ ɹ vðɹ̩ vɹ̩ m ɑʌ ðɹ̩ə v i ə æ ɹ̩v ɹ ɛ z s i d k k ɑ", + "ref_phonemes": "neɪtʃɝ ɪz æz kɛrɪŋ æz aʊɝ mʌðɝ ɪt ɔlweɪz swit laɪk hɝ ", + "duration": 0.72188401222229, + "PER": 100.0, + "score": { + "S": 30, + "D": 0, + "I": 12, + "N": 42 + } + }, + { + "model": "WavLM", + "phonemes": "n i i z æ z d ɪ d ɪ ŋ əaj æ v tə æ v t ə m ʌ ð ɪ i z ɑ s i mejkæ", + "ref_phonemes": "neɪtʃɝ ɪz æz kɛrɪŋ æz aʊɝ mʌðɝ ɪt ɪz ɔlweɪz swit laɪk hɝ ", + "duration": 0.5158836841583252, + "PER": 75.0, + "score": { + "S": 23, + "D": 9, + "I": 1, + "N": 44 + } + }, + { + "model": "WavLM", + "phonemes": "ajnow ʌ f æ m m n ð i ɪ ɪ ɪ n i d ʌ f j ɪ l æ d aj ɑɔ ŋ b ɪ l m æ u majt f æ m ə l ɪ k ɑ ə", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.5010967254638672, + "PER": 74.50980392156863, + "score": { + "S": 25, + "D": 7, + "I": 6, + "N": 51 + } + }, + { + "model": "WavLM", + "phonemes": "mej d d i z i n ɛɑ d i z i æ k ɛ ɪ ŋ ə ɔ v m ɑ ð ɛ t ɪ t ɔ l l ejz ʊ ʃ i lajk", + "ref_phonemes": "neɪtʃɝ ɪz æz kɛrɪŋ æz aʊɝ mʌðɝ ɪt ɔlweɪz swit laɪk hɝ ", + "duration": 0.6617977619171143, + "PER": 73.80952380952381, + "score": { + "S": 16, + "D": 7, + "I": 8, + "N": 42 + } + }, + { + "model": "WavLM", + "phonemes": "d d ɔ l s i b n n s majk k lejæ s bajk s æ z sow ɑ n zs ɛə b ʊ l k æ n d æ m l i z b ʌ s k ə d b ɔ ɹ", + "ref_phonemes": "dɔɡ sid boʊnz maɪklaɪk spaɪks ɛlsʌ wɑnts ʌ bʊk ʌnd ʌ pleɪs bæskʌt boʊnz ", + "duration": 0.5789206027984619, + "PER": 56.896551724137936, + "score": { + "S": 24, + "D": 5, + "I": 4, + "N": 58 + } + }, + { + "model": "WavLM", + "phonemes": "ajl ʌ v majmf f æ m l i k æ n d ɪ n ə u ʊ d b ʌ t iajwej ɑ n t b u mejk majf f æ m l i awt", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.3607306480407715, + "PER": 50.943396226415096, + "score": { + "S": 15, + "D": 5, + "I": 7, + "N": 53 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.376847505569458, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2792940139770508, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "k ɑ f i ɪ z ɡ ɹown ɑ n s t i pd͡ʒʌ ŋ ɡ ə l lajk s lowp s ɪ n t ɛ m p ɹ ə t zown z", + "ref_phonemes": "kɑfi ɪz ɡroʊn ɑn stip dʒʌŋɡlʌkaɪ sloʊps ɪn tɛmprʌt zoʊnz ", + "duration": 0.293654203414917, + "PER": 25.53191489361702, + "score": { + "S": 8, + "D": 1, + "I": 3, + "N": 47 + } + }, + { + "model": "WavLM", + "phonemes": "t ɹ æ f ɪ k f ɹ i k w ə n t l i h æ z fejl d t ə m ɛ ʒɹ̩ʌ p t ə ɛ nd͡ʒə n ɪ ɹ z ɹowz i ɛ s t ə m ə t s", + "ref_phonemes": "træfɪk frikwʌntli hæz feɪld tu mɛʒɝ ʌp tu ɛndʒʌnɪrz ' roʊzi ɛstʌmʌts ", + "duration": 0.3267984390258789, + "PER": 28.07017543859649, + "score": { + "S": 13, + "D": 1, + "I": 2, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "m ɛ n i w ɛ l θ i tajk u n z s p lɹ̩d͡ʒd æ n d b ɑ t bowθ ə j ɑ t æ n d ə s k u nɹ̩", + "ref_phonemes": "mɛni wɛlθi taɪkunz splɝdʒd ʌnd bɑt boʊθ ʌ jɑt ʌnd ʌ skunɝ ", + "duration": 0.28540706634521484, + "PER": 23.91304347826087, + "score": { + "S": 8, + "D": 0, + "I": 3, + "N": 46 + } + }, + { + "model": "WavLM", + "phonemes": "h i p ɪ k t ʌ p najn p ɛ ɹ z ʌ v s ɑ k s f ɔ ɹ it͡ʃb ɹ ʌ ðɹ̩", + "ref_phonemes": "hi pɪkt ʌp naɪn pɛrz ʌv sɑks fɔr itʃ brʌðɝ ", + "duration": 0.2618722915649414, + "PER": 21.21212121212121, + "score": { + "S": 5, + "D": 0, + "I": 2, + "N": 33 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.3360610008239746, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ n ð ə lajt ə d ɪ n t ɪ ɹ iɹ̩h i s ɔ ʌ ðɹ̩m ɛ n æ n d w ɪ m ə n s t ɹ ʌ ɡ ə l ɪ ŋ ɪ n t u ð ɛ ɹ ɹ æ p s", + "ref_phonemes": "ɪn ðʌ laɪtʌd ɪntɪriɝ hi sɔ ʌðɝ mɛn ʌnd wɪmʌn strʌɡʌlɪŋ ɪntu ðɛr ræps ", + "duration": 0.35367774963378906, + "PER": 25.454545454545453, + "score": { + "S": 12, + "D": 0, + "I": 2, + "N": 55 + } + }, + { + "model": "WavLM", + "phonemes": "f u l z h i bejd w ʌ t d u j u θ ɪ ŋ k j u ɑ ɹ d u ɪ ŋ", + "ref_phonemes": "fulz hi beɪd wʌt du ju θɪŋk ju ɑr duɪŋ ", + "duration": 0.29234862327575684, + "PER": 6.896551724137931, + "score": { + "S": 2, + "D": 0, + "I": 0, + "N": 29 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə p ɹ ɛ s k u lɹ̩k ʊ d n t vɹ̩b ə lajz hɹ̩f i l ɪ ŋ z ə bawt ð ə ɪ mɹ̩d͡ʒə n s i k ə n d ɪ ʃ ə n z", + "ref_phonemes": "ðʌ priskulɝ kʊdʌnt vɝbʌlaɪz hɝ filɪŋz ʌbaʊt ðʌ ɪmɝdʒʌnsi kʌndɪʃʌnz ", + "duration": 0.3090527057647705, + "PER": 36.84210526315789, + "score": { + "S": 15, + "D": 1, + "I": 5, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "h i w ɪ l sejð æ tawɹ̩k ʌ n t ɹ i ɪ z i v ə n nawə howm əd͡ʒi n i ə s k ə m j u n ə t i", + "ref_phonemes": "hi wɪl seɪ ðæt aʊɝ kʌntri ɪz ivɪn naʊ ʌ hoʊmʌdʒiniʌs kʌmjunʌti ", + "duration": 0.23786139488220215, + "PER": 27.450980392156865, + "score": { + "S": 12, + "D": 0, + "I": 2, + "N": 51 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.27683424949645996, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2647666931152344, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ɛ v ə d ə n s ð æ t ʌ ðɹ̩s ɔ ɹ s ə z ʌ v f ə n æ n s ɪ ŋ ɑ ɹ ʌ n ə vejl ə b ə l m ʌ s t b i p ɹ ə vajd ə d", + "ref_phonemes": "ɛvʌdʌns ðæt ʌðɝ sɔrsʌz ʌv fʌnænsɪŋ ɑr ʌnʌveɪlʌbʌl mʌst bi prʌvaɪdʌd ", + "duration": 0.34983372688293457, + "PER": 28.07017543859649, + "score": { + "S": 15, + "D": 0, + "I": 1, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i ɔ l wejzd͡ʒowk s ə bawt t u m ʌt͡ʃɡ ɑ ɹ l ɪ k ɪ n h ɪ z f u d", + "ref_phonemes": "ʃi ɔlweɪz dʒoʊks ʌbaʊt tu mʌtʃ ɡɑrlɪk ɪn hɪz fud ", + "duration": 0.2806410789489746, + "PER": 17.94871794871795, + "score": { + "S": 5, + "D": 0, + "I": 2, + "N": 39 + } + }, + { + "model": "WavLM", + "phonemes": "ðejp lejd k ɹ æ k ð ə w ɪ p ə f j u m ɪ n ə t s w ɪ θawt m ɪ s h æ p", + "ref_phonemes": "ðeɪ pleɪd kræk ðʌ wɪp ʌ fju mɪnʌts wɪθaʊt mɪʃhæp ", + "duration": 0.25751614570617676, + "PER": 20.51282051282051, + "score": { + "S": 8, + "D": 0, + "I": 0, + "N": 39 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.27626514434814453, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.31798219680786133, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə dajə ɡ nows ə s w ɑ z d ɪ s kɹ̩əd͡ʒɪ ŋ hawɛ vɹ̩h i w ɑ z n ɑ towvɹ̩l i wɹ̩i d", + "ref_phonemes": "ðʌ daɪʌɡnoʊsʌs wɑz dɪskɝʌdʒɪŋ haʊɛvɝ hi wɑz nɑt oʊvɝli wɝid ", + "duration": 0.251662015914917, + "PER": 34.0, + "score": { + "S": 12, + "D": 0, + "I": 5, + "N": 50 + } + }, + { + "model": "WavLM", + "phonemes": "ʌ ðɹ̩m ɔ ɹ f ə l ɑd͡ʒ�� k ə l f ɪ z ɪ k ə l æ n d ɑ p t ɪ k ə l p ɹ ɑ pɹ̩t i v æ l j u z ɑ ɹ ɔ l sowɡ ɪ v ə n", + "ref_phonemes": "ʌðɝ mɔrfʌlɑdʒɪkʌl fɪzɪkʌl ʌnd ɑptɪkʌl prɑpɝti væljuz ɑr ɔlsoʊ ɡɪvʌn ", + "duration": 0.5547962188720703, + "PER": 25.862068965517242, + "score": { + "S": 12, + "D": 0, + "I": 3, + "N": 58 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.31241631507873535, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2459087371826172, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "b ʌ t ð ɪ s ɛ s ə t ɛ ɹ ɪ k d ɑ k t ɹ ə n w ɑ z l ɔ s t ɪ n ð ə ʃ ʌ f ə l t ə ə k wajɹ̩s p ɛ ʃ ə l pawɹ̩z", + "ref_phonemes": "bʌt ðɪs ɛsʌtɛrɪk dɑktrʌn wɑz lɔst ɪn ðʌ ʃʌfʌl tu ʌkwaɪɝ spɛʃʌl paʊɝz ", + "duration": 0.3260006904602051, + "PER": 26.785714285714285, + "score": { + "S": 13, + "D": 0, + "I": 2, + "N": 56 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.30620646476745605, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.3105604648590088, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.3216874599456787, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.24373769760131836, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2570812702178955, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "h i ɹ ɪ l i k ɹ u s ə fajd h ɪ m h i nejl d ɪ t f ɔ ɹ ə j ɑ ɹ d l ɔ s", + "ref_phonemes": "hi rɪli krusʌfaɪd hɪm hi neɪld ɪt fɔr ʌ jɑrd lɔs ", + "duration": 0.33651137351989746, + "PER": 21.052631578947366, + "score": { + "S": 8, + "D": 0, + "I": 0, + "N": 38 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɛ ɹ w ɑ z əd͡ʒajɡ æ n t ɪ k w ɑ s p n ɛ k s t t əɹ̩v ɪ ŋ ɡ z b ɪ ɡ t ɑ p h æ t", + "ref_phonemes": "ðɛr wɑz ʌ dʒaɪɡæntɪk wɑsp nɛkst tu ɝvɪŋz bɪɡ tɑp hæt ", + "duration": 0.33803558349609375, + "PER": 19.047619047619047, + "score": { + "S": 5, + "D": 0, + "I": 3, + "N": 42 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.25723862648010254, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "m ɑ ɹ k ə t s ʃ ʊ d b ɪ k ʌ m m ɔ ɹ k ə m p ɛ t ə t ɪ v æ z k ə n s u mɹ̩z b ɪ k ʌ m m ɔ ɹ s ə l ɛ k t ɪ v", + "ref_phonemes": "mɑrkʌts ʃʊd bɪkʌm mɔr kʌmpɛtʌtɪv æz kʌnsumɝz bɪkʌm mɔr sʌlɛktɪv ", + "duration": 0.2858893871307373, + "PER": 18.51851851851852, + "score": { + "S": 9, + "D": 0, + "I": 1, + "N": 54 + } + }, + { + "model": "WavLM", + "phonemes": "ɹ̩ɪd͡ʒə n ə l z ɑ ɹ n ɑ t n ɛ s ə s ɛ ɹ ə l i ɡ ʊ d æ n d æ d æ p tejʃ ə n z ɑ ɹ n ɑ t n ɛ s ə s ɛ ɹ ə l i b æ d", + "ref_phonemes": "ɝɪdʒʌnʌlz ɑr nɑt nɛsʌsɛrʌli ɡʊd ʌnd ædæpteɪʃʌnz ɑr nɑt nɛsʌsɛrʌli bæd ", + "duration": 0.3555145263671875, + "PER": 27.11864406779661, + "score": { + "S": 14, + "D": 0, + "I": 2, + "N": 59 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2883741855621338, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "w ɪ ð ɪ n ə s ɪ s t ə m hawɛ vɹ̩ð ə ɔ t ɑ n ə m i ʌ v it͡ʃm ɛ m bɹ̩lajb ɹ ɛ ɹ i ɪ z p ɹ ə zɹ̩v d", + "ref_phonemes": "wɪðɪn ʌ sɪstʌm haʊɛvɝ ðʌ ɔtɑnʌmi ʌv itʃ mɛmbɝ laɪbrɛri ɪz prʌzɝvd ", + "duration": 0.3663361072540283, + "PER": 31.48148148148148, + "score": { + "S": 13, + "D": 0, + "I": 4, + "N": 54 + } + }, + { + "model": "WavLM", + "phonemes": "t ə p ɹ i p ɛ ɹ m ʌ s tɹ̩d k ɹ i m b l ɛ n d m ʌ s tɹ̩d w ɪ ð ɪ n ʌ f w ɔ tɹ̩t ə mejk ə θ ɪ n pejs t", + "ref_phonemes": "tu pripɛr mʌstɝd krim blɛnd mʌstɝd wɪð ɪnʌf wɔtɝ tu meɪk ʌ θɪn peɪst ", + "duration": 0.32247400283813477, + "PER": 25.454545454545453, + "score": { + "S": 11, + "D": 0, + "I": 3, + "N": 55 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.23595738410949707, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2491612434387207, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "h ɪ z fejl jɹ̩t əowp ə n ð ə s t ɔ ɹ bajejt k ɑ s t h ɪ m h ɪ zd͡ʒɑ b", + "ref_phonemes": "hɪz feɪljɝ tu oʊpʌn ðʌ stɔr baɪ eɪt kɑst hɪm hɪz dʒɑb ", + "duration": 0.2431049346923828, + "PER": 26.190476190476193, + "score": { + "S": 9, + "D": 0, + "I": 2, + "N": 42 + } + }, + { + "model": "WavLM", + "phonemes": "h i k æ n f ɔ ɹ ɪ ɡ z æ m p ə l p ɹ ɛ z ə n t s ə ɡ n ɪ f ɪ k ə n t j u n ə vɹ̩s ə t i wajd ɪ ʃ u z t ə ð ə s ɛ n ə t", + "ref_phonemes": "hi kæn fɔr ɪɡzæmpʌl prɛzʌnt sʌɡnɪfɪkʌnt junʌvɝstʌfaɪtɝ ɪʃuz tu ðʌ sɛnʌt ", + "duration": 0.3670675754547119, + "PER": 29.508196721311474, + "score": { + "S": 15, + "D": 1, + "I": 2, + "N": 61 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.27671003341674805, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2705497741699219, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə ɡ ɹawn d h ɑ ɡ k l ɪ ɹ l i s ɔ h ɪ z ʃ æ dowb ʌ t s tejdawtown l i ə mowm ə n t", + "ref_phonemes": "ðʌ ɡraʊnðhɑɡ klɪrli sɔ hɪz ʃædoʊ bʌt steɪd aʊt oʊnli ʌ moʊmʌnt ", + "duration": 0.2898874282836914, + "PER": 23.52941176470588, + "score": { + "S": 12, + "D": 0, + "I": 0, + "N": 51 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2704038619995117, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.25534558296203613, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɛ ɹ ʃ ʊ d b i nowɹ i z ə n t ə m ɪ s ɪ n tɹ̩p ɹ ə t ɔ ɹ ɪ ɡ n ɔ ɹ ð ə ɪ n t ɛ n t ʌ v ð ɪ s l ɛ tɹ̩", + "ref_phonemes": "ðɛr ʃʊd bi noʊ rizʌn tu mɪsɪntɝprʌt ɔr ɪɡnɔr ðʌ ɪntɛnt ʌv ðɪs lɛtɝ ", + "duration": 0.3510599136352539, + "PER": 26.41509433962264, + "score": { + "S": 12, + "D": 0, + "I": 2, + "N": 53 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.24529814720153809, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə d ɛ d s p ɪ ɹ ə t s ɑ k j ə pajd ə p ɹ ɑ m ə n ə n t p lejs ɪ n ɛ vɹ̩i howp æ n d ɪ n ɛ vɹ̩i f ɪ ɹ", + "ref_phonemes": "ðʌ dɛd spɪrʌts ɑkjʌpaɪd ʌ prɑmʌnʌnt pleɪs ɪn ɛvɝi hoʊp ʌnd ɪn ɛvɝi fɪr ", + "duration": 0.3263838291168213, + "PER": 29.82456140350877, + "score": { + "S": 15, + "D": 0, + "I": 2, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə θ ɪ k ɛ l m f ɔ ɹ ə s t w ɑ z n ɪ ɹ l iowvɹ̩w ɛ l m d bajd ʌt͡ʃɛ l m d ɪ z i z", + "ref_phonemes": "ðʌ θɪk ɛlm fɔrʌst wɑz nɪrli oʊvɝwɛlmd baɪ dʌtʃ ɛlm dɪziz ", + "duration": 0.36417198181152344, + "PER": 19.565217391304348, + "score": { + "S": 7, + "D": 0, + "I": 2, + "N": 46 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.25135135650634766, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.28206729888916016, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.29996275901794434, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.26892566680908203, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɪ s p ɹ ɑ s ɛ s ɪ z ə s p ɛ ʃ ə l i d ɪ f ə k ə l t ɛ n szd͡ʒajɹ̩ ɹowd ɹ ɪ f t ɪ ŋ ɪ z t ɪ f ə k l i ɹ æ n d ə m", + "ref_phonemes": "ðɪs prɑsɛs ɪz ʌspɛʃli dɪfʌkʌlt sɪns dʒaɪroʊ drɪftɪŋ ɪz tɪpɪkli rændʌm ", + "duration": 0.3674941062927246, + "PER": 32.20338983050847, + "score": { + "S": 13, + "D": 1, + "I": 5, + "N": 59 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.30811023712158203, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə w ɔ tɹ̩k ə n tejn d t u m ʌt͡ʃk l ɔ ɹ i n æ n d s t ʌ ŋ h ɪ zajz", + "ref_phonemes": "ðʌ wɔtɝ kʌnteɪnd tu mʌtʃ klɔrin ʌnd stʌŋ hɪz aɪz ", + "duration": 0.22925186157226562, + "PER": 23.076923076923077, + "score": { + "S": 7, + "D": 0, + "I": 2, + "N": 39 + } + }, + { + "model": "WavLM", + "phonemes": "wajd ɑ n t ðejt ɛ l m i ð ɛ m s ɛ l v z ɪ f ɪ t b ɑ ðɹ̩z ð ɛ m", + "ref_phonemes": "waɪ doʊnt ðeɪ tɛl mi ðɛmsɛlvz ɪf ɪt bɑðɝz ðɛm ", + "duration": 0.2567930221557617, + "PER": 16.666666666666664, + "score": { + "S": 4, + "D": 1, + "I": 1, + "N": 36 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.12937140464782715, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "s l ɹ i d ɛ p ə z ɪ ʃ ə n ɪ z ɪ v æ l j uejt ə d bajw ɑ ʃ ɪ n k l i n s w ɑt͡ʃə z w ɪ ð ə dɹ̩tɹ i w ə n z", + "ref_phonemes": "sɔɪl ridɛpʌzɪʃʌn ɪz ɪvæljueɪtʌd baɪ wɑʃɪŋ klin swɑtʃʌz wɪð ðʌ dɝti wʌnz ", + "duration": 0.3995089530944824, + "PER": 28.333333333333332, + "score": { + "S": 11, + "D": 3, + "I": 3, + "N": 60 + } + }, + { + "model": "WavLM", + "phonemes": "s m æ ʃ lajt b ʌ l b z æ n d ð ɛ ɹ k æ ʃ v æ l j u w ɪ l d ɪ m ɪ n ɪ ʃ t ə n ʌ θ ɪ ŋ", + "ref_phonemes": "smæʃ laɪtbʌlbz ʌnd ðɛr kæʃ vælju wɪl dɪmɪnɪʃ tu nʌθɪŋ ", + "duration": 0.19797563552856445, + "PER": 9.090909090909092, + "score": { + "S": 4, + "D": 0, + "I": 0, + "N": 44 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.24034333229064941, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɛ ɹ ɪ z l ɪ t ə l dawt ð æ t ð ə s t u d ə n t s b ɛ n ə f ɪ t f ɹ ʌ m vowkejʃ ə n ə l ɛd͡ʒə kejʃ ə n", + "ref_phonemes": "ðɛr ɪz lɪtʌl daʊt ðæt ðʌ studʌnts bɛnʌfɪt frʌm voʊkeɪʃʌnʌl ɛdʒʌkeɪʃʌn ", + "duration": 0.3554553985595703, + "PER": 25.423728813559322, + "score": { + "S": 14, + "D": 0, + "I": 1, + "N": 59 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.28074097633361816, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.26569437980651855, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə s ɪ ɡɹ̩ɛ t s ɪ n ð ə k lejæ ʃ t ɹejowvɹ̩f lowd ɑ n t u ð əowk tejb ə l", + "ref_phonemes": "ðʌ sɪɡɝɛts ɪn ðʌ kleɪ æʃtreɪ oʊvɝfloʊd ɑntu ðʌ oʊk teɪbʌl ", + "duration": 0.3515200614929199, + "PER": 31.914893617021278, + "score": { + "S": 13, + "D": 0, + "I": 2, + "N": 47 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.26127123832702637, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.25437378883361816, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2972838878631592, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.3520088195800781, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2755086421966553, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "s ʌ m ə b zɹ̩vɹ̩z s p ɛ k j ə lejt ə d ð æ t ð ɪ s majt b i h ɪ z ɹ i v ɛ nd͡ʒɑ n h ɪ z howm tawn", + "ref_phonemes": "sʌm ʌbzɝvɝz spɛkjʌleɪtʌd ðæt ðɪs maɪt bi hɪz rivɛndʒ ɑn hɪz hoʊm taʊn ", + "duration": 0.36054039001464844, + "PER": 22.807017543859647, + "score": { + "S": 10, + "D": 0, + "I": 3, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2756614685058594, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.25409626960754395, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2854745388031006, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2344825267791748, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "w ɪ ð ð ə s p ɹ ɪ ŋ ɹejn z ð ə f lowɹowz ɹ æ p ə d l i d u t ə ɪ n f ɪ l t ɹejʃ ə n ɪ nowp ə n s uɹ̩z", + "ref_phonemes": "wɪð ðʌ sprɪŋ reɪnz ðʌ floʊ roʊz ræpʌdli du tu ɪnfɪltreɪʃʌn ɪn oʊpʌn suɝz ", + "duration": 0.3461167812347412, + "PER": 30.508474576271187, + "score": { + "S": 17, + "D": 0, + "I": 1, + "N": 59 + } + }, + { + "model": "WavLM", + "phonemes": "bajð ð ə l ʊ k ʌ v ɪ m h i w ɑ z n t ð æ t f ɑ ɹ ɡ ɔ n", + "ref_phonemes": "baɪ ðʌ lʊk ʌv hɪm hi wɑzʌnt ðæt fɑr ɡɔn ", + "duration": 0.22136592864990234, + "PER": 20.0, + "score": { + "S": 3, + "D": 2, + "I": 1, + "N": 30 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.27400875091552734, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.295926570892334, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "h i s l ɪ p tawt sajd h ʌ ɡ ɪ ŋ ð ə w ɔ l z ʌ v b ɪ l d ɪ ŋ z æ n d d ɑd͡ʒɪ ŋ ɪ n t u d ɔ ɹ wejz", + "ref_phonemes": "hi slɪpt aʊtsaɪd hʌɡɪŋ ðʌ wɔlz ʌv bɪldɪŋz ʌnd dɑdʒɪŋ ɪntu dɔrweɪz ", + "duration": 0.38202524185180664, + "PER": 12.962962962962962, + "score": { + "S": 6, + "D": 0, + "I": 1, + "N": 54 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2906956672668457, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "k wajt ɔ f ə n h ʌ n i b i z f ɔ ɹ m ə m əd͡ʒɔ ɹ ə t i ɑ n ð ə w ɪ lowk æ t k ə n z", + "ref_phonemes": "kwaɪt ɔfʌn hʌnibiz fɔrm ʌ mʌdʒɔrʌti ɑn ðʌ wɪloʊ kætkʌnz ", + "duration": 0.2944216728210449, + "PER": 23.91304347826087, + "score": { + "S": 10, + "D": 0, + "I": 1, + "N": 46 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ f j u j u s p ɑ ɹ k ɪ ŋ ə t ɛ n d ə n t s k æ n ðejb i ɹ i p lejs t bajɔ t ə m æ t ɪ k p ɑ ɹ k ɪ ŋ ɡejt s", + "ref_phonemes": "ɪf ju juz pɑrkɪŋ ʌtɛndʌnts kæn ðeɪ bi ripleɪst baɪ ɔtʌmætɪk pɑrkɪŋ ɡeɪts ", + "duration": 0.3678114414215088, + "PER": 18.333333333333332, + "score": { + "S": 11, + "D": 0, + "I": 0, + "N": 60 + } + }, + { + "model": "WavLM", + "phonemes": "k æ n j ɔ ɹ ɪ n ʃ ʊ ɹ ə n s k ʌ m p ə n iejd j u ɪ n ɹ ə d u s ɪ ŋ ə d m ɪ n ə s t ɹejt ɪ v k ɑ s t s", + "ref_phonemes": "kæn jɔr ɪnʃʊrʌns kʌmpʌni eɪd ju ɪn rʌdusɪŋ ʌdmɪnʌstreɪtɪv kɑsts ", + "duration": 0.32718420028686523, + "PER": 20.37037037037037, + "score": { + "S": 11, + "D": 0, + "I": 0, + "N": 54 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.288224458694458, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2349257469177246, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "w i k ə n ɡ ɹ ɛd͡ʒə lejt ð ə ɪ n tajɹ̩m ɛ m bɹ̩ʃ ɪ p ɑ n ɪ t s ɹ ɛ kɹ̩d ʌ v ɡ ʊ d l ɛd͡ʒə s lejʃ ə n", + "ref_phonemes": "wi kʌŋrætʃʌleɪt ðʌ ɪntaɪɝ mɛmbɝʃɪp ɑn ɪts rɛkɝd ʌv ɡʊd lɛdʒʌsleɪʃʌn ", + "duration": 0.32645201683044434, + "PER": 40.35087719298245, + "score": { + "S": 17, + "D": 0, + "I": 6, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.26435303688049316, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i h æ d j ɔ ɹ d ɑ ɹ k s u t ɪ n ɡ ɹ i s i w ɑ ʃ w ɔ tɹ̩ɔ l j ɪ ɹ", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2715134620666504, + "PER": 17.647058823529413, + "score": { + "S": 5, + "D": 0, + "I": 1, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "æ t nowt m w ɛ ɹ l ld͡ʒi fawn d ɪ n ð ə m ɪ k s t l ɪ k kɹ̩", + "ref_phonemes": "æt noʊ taɪm wɝ ældʒi faʊnd ɪn ðʌ mɪkst lɪkɝ ", + "duration": 0.28638720512390137, + "PER": 35.294117647058826, + "score": { + "S": 6, + "D": 2, + "I": 4, + "N": 34 + } + }, + { + "model": "WavLM", + "phonemes": "æ z ə p ɹ i k ɔ ʃ ə n ð əawt l ɔ z b ɑ t ɡ ʌ n pawdɹ̩f ɔ ɹ ð ɛ ɹ s t ɹ ɔ ŋ howl d", + "ref_phonemes": "æz ʌ prikɔʃʌn ðʌ aʊtlɔz bɑt ɡʌnpaʊdɝ fɔr ðɛr strɔŋhoʊld ", + "duration": 0.34174609184265137, + "PER": 26.08695652173913, + "score": { + "S": 11, + "D": 0, + "I": 1, + "N": 46 + } + }, + { + "model": "WavLM", + "phonemes": "ə vawdejθ i ə s t s ɔ ɹ f ɹ i θ ɪ ŋ kɹ̩z ɑ ɹ sowɹ ɛ ɹ æ z t ə b i ə k j ʊ ɹ i ɑ s ə t i", + "ref_phonemes": "ʌvaʊd eɪθiʌsts ɔr friθɪŋkɝz ɑr soʊ rɛr æz tu bi ʌ kjʊriɑsʌti ", + "duration": 0.38064026832580566, + "PER": 32.6530612244898, + "score": { + "S": 15, + "D": 0, + "I": 1, + "N": 49 + } + }, + { + "model": "WavLM", + "phonemes": "lajk ɪ n ʌ f w ɛ l ɔ l b i ʌ p ɑ n t ɑ p bajs ʌ n dawn", + "ref_phonemes": "laɪk ɪnʌf wil ɔl bi ʌp ɑn tɑp baɪ sʌndaʊn ", + "duration": 0.18879365921020508, + "PER": 12.5, + "score": { + "S": 4, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2720632553100586, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "m ɛ n i w ɛ l θ i tajk u n z s p lɹ̩d͡ʒd æ n d b ɑ t bowθ ə j ɑ t æ n d ə s k u nɹ̩", + "ref_phonemes": "mɛni wɛlθi taɪkunz splɝdʒd ʌnd bɑt boʊθ ʌ jɑt ʌnd ʌ skunɝ ", + "duration": 0.34828710556030273, + "PER": 23.91304347826087, + "score": { + "S": 8, + "D": 0, + "I": 3, + "N": 46 + } + }, + { + "model": "WavLM", + "phonemes": "s m æ ʃ lajt b ʌ l b z æ n d ð ɛ ɹ k æ ʃ v æ l j u w ɪ l d ɪ m ɪ n ɪ ʃ t ə n ʌ θ ɪ ŋ", + "ref_phonemes": "smæʃ laɪtbʌlbz ʌnd ðɛr kæʃ vælju wɪl dɪmɪnɪʃ tu nʌθɪŋ ", + "duration": 0.3290541172027588, + "PER": 9.090909090909092, + "score": { + "S": 4, + "D": 0, + "I": 0, + "N": 44 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ n ð ə l ɔ ŋ ɹ ʌ n ɪ t pejz t ə bajk w ɑ l ə t i k lowð ɪ ŋ", + "ref_phonemes": "ɪn ðʌ lɔŋ rʌn ɪt peɪz tu baɪ kwɑlʌti kloʊðɪŋ ", + "duration": 0.3233919143676758, + "PER": 20.0, + "score": { + "S": 7, + "D": 0, + "I": 0, + "N": 35 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2833373546600342, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə p ɹ ɛ s k u l lɹ̩k ʊ d n d vɹ̩b ə lajz hɹ̩f ɪ l ɪ n z ə bawt ð ɛ ɹ mɹ̩d͡ʒə n s i k ə n d ɪ ʃ ə n z", + "ref_phonemes": "ðʌ priskulɝ kʊdʌnt vɝbʌlaɪz hɝ filɪŋz ʌbaʊt ðʌ ɪmɝdʒʌnsi kʌndɪʃʌnz ", + "duration": 0.3878297805786133, + "PER": 45.614035087719294, + "score": { + "S": 19, + "D": 1, + "I": 6, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "d ɑ n t æ s k m i t ə k æ ɹ i æ nojl i ɹ æ ɡ lajk ð æ t", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.22567224502563477, + "PER": 25.0, + "score": { + "S": 7, + "D": 1, + "I": 0, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə ɪ ŋ ɡ l ɪ ʃ fowət ə d t ə ð ə f ɹ̩ nt͡ʃb æ s k ə t s ə f lawɹ̩z ʌ v w ɪt͡ʃs ʃ h æ d mejd ə p l æ n t ə p ə l ɹ ə v ɪ ʒ ə n t ə ɡ ɹ i ð ə ə ɹ̩ajv ə l ʌ v ð ə j ʌ ŋ p ɹ ɪ n zs ɛ s ð ə f ɹ ɛ nt͡ʃb ɪ n ɹ tɹ̩n ɪ n vajt ə d ð ə ɪ ŋ ɡ l ɪ ʃ t ə ə s ʌ pɹ̩h ɪt͡ʃ t͡ʃ w ɑ z t ə b i ɡ ɪ v ə n ə n ɛ k s dej", + "ref_phonemes": "ðʌ ɪŋɡlɪʃ fɔrwɝdɪd tu ðʌ frɛntʃ bæskʌts ʌv flaʊɝz ʌv wɪtʃ ðeɪ hæd meɪd ʌ plɛntʌfʌl prʌvɪʒʌn tu ɡrit ðʌ ɝaɪvʌl ʌv ðʌ jʌŋ prɪnsɛs ðʌ frɛntʃ ɪn rɪtɝn ɪnvaɪtʌd ðʌ ɪŋɡlɪʃ tu ʌ sʌpɝ wɪtʃ wɑz tu bi ɡɪvʌn ðʌ nɛkst deɪ ", + "duration": 1.1118543148040771, + "PER": 41.31736526946108, + "score": { + "S": 47, + "D": 8, + "I": 14, + "N": 167 + } + }, + { + "model": "WavLM", + "phonemes": "k ə n ɡ ɹ æ d͡ʒ ə lejʃ ə n z wɹ̩ p ʊ ɹ d ɪ n ə p ɑ n ð ə p ɹ ɪ n s ʌ s ɛ vɹ̩i w ɛ ɹ ʊ ɹ ɪ ŋ hɹ̩d͡ʒɪ d͡ʒɹ̩ i", + "ref_phonemes": "kʌŋrætʃʌleɪʃʌnz wɝ pɔrd ɪn ʌpɑn ðʌ prɪnsɛs ɛvriwɛr dʊrɪŋ hɝ dʒɝni ", + "duration": 0.36662721633911133, + "PER": 58.18181818181818, + "score": { + "S": 21, + "D": 1, + "I": 10, + "N": 55 + } + }, + { + "model": "WavLM", + "phonemes": "f ɹ ʌ m ð ə ɹ ə s ɛ k t pej hɹ̩ɔɑ n ɔ l sajn z ʃ i s i mŋ z lajk ə k w i n æ n d ɹ ʌ m d ð æ d dɹ̩ɹejtʃ ə n d w ɪ ðθ w t͡ʃ ʃ i w ɑ s t ɹ i t ə d bajk t ʃ i ɔ ɹ s ɹ i ʃ i ə p iɪ ɹ d n d ɑ dd͡ʒɪ k ʌ v wɹ̩ʃ ʃ ɪ p ə k w i m m ʌ ðɹ̩d v ð ə f ɹ ɛ n ə mows s t ə f k ə n ə t ɹ s s ɛ p ʃ ə n f ɹ æ n s ɑ z hɹ̩nmnejt ʌ v k ʌn t ɹ i n ʃ h æ s ɛ fɹ̩ɔɹ̩t t u m ʌt͡ʃ d h æ p p ɪi n ə s ɪ n ɪ ŋ l æ d f ɔ ɪ ŋ l ə n t ə h æ v mejd hɹ̩ɹf f ɹ̩ə ɡ ɛ t f ɹ æ n z", + "ref_phonemes": "frʌm ðʌ rɪspɛkt peɪd hɝ ɑn ɔl saɪdz ʃi simd laɪk ʌ kwin ʌnd frʌm ðʌ ædɝeɪʃʌn wɪð wɪtʃ ʃi wɑz tritʌd baɪ tu ɔr θri ʃi ʌpɪrd æn ʌbdʒɛkt ʌv wɝʃʌp ðʌ kwin mʌðɝ ɡeɪv ðʌ frɛntʃ ðʌ moʊst ʌfɛkʃʌnʌt rɪsɛpʃʌn fræns wɑz hɝ neɪtɪv kʌntri ʌnd ʃi hæd sʌfɝd tu mʌtʃ ʌnhæpinɪs ɪn ɪŋɡlʌnd fɔr ɪŋɡlʌnd tu hæv meɪd hɝ fɝɡɛt fræns ", + "duration": 1.9053208827972412, + "PER": 49.797570850202426, + "score": { + "S": 64, + "D": 25, + "I": 34, + "N": 247 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ i t ɔ t hɹ̩d ɔ tɹ̩ð ð ɛ n bajk hɹ̩ɔɹow own ə f ɛ k ʃ ə n f ɔ ɹ ɪ ð æ t l ʌ v ɹ̩k k ʌ n t ɹ i w ɛ ɹ ðejə æ d bowθ b ɪ n h ə s ɪ t ə b l i ɹ ə s i d æ n d w ɛ ɹ ə b ɹ ɪ l l i ə n t f j kt͡ʃɹ̩əow p ə n f ɔ ɹ ð ɛ m", + "ref_phonemes": "ʃi tɔt hɝ dɔtɝ ðɛn baɪ hɝ oʊn ʌfɛkʃʌn fɔr ɪt ðæt lʌv fɔr ʌ kʌntri wɛr ðeɪ hæd boʊθ bɪn hɑspʌtʌbli rʌsivd ʌnd wɛr ʌ brɪljʌnt fjutʃɝ oʊpʌnd bɪfɔr ðɛm ", + "duration": 0.7435600757598877, + "PER": 44.44444444444444, + "score": { + "S": 32, + "D": 7, + "I": 13, + "N": 117 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə kawn t æ d ð ə ɹown h ɪ m s ɛ l fv b æ k ɑ n h ɪ z s i t l i n ɪ ŋ h ɪ ʃ dɹ̩z ə ɡ ɛ n s t ð ə p ɑ ɹ t ɪ ʃ ə n ʌ v ð ə t ɛ n n d ɹ i mejn ð ʌ s h ɪ z z fejs t b ɛ ɹ i d n h ɪ z h æ n d z w ɪ ð h i v ɪ ŋ ʃ ɛ s t æ n d ɹ ʌ s l ə s l ɪ m z", + "ref_phonemes": "ðʌ kaʊnt hæd θroʊn hɪmsɛlf bæk ɑn hɪz sit linɪŋ hɪz ʃoʊldɝz ʌɡɛnst ðʌ pɑrtɪʃʌn ʌv ðʌ tɛnt ʌnd rɪmeɪnd ðʌs hɪz feɪs bɛrid ɪn hɪz hændz wɪð hivɪŋ tʃɛst ʌnd rɛstlʌs lɪmz ", + "duration": 0.9364705085754395, + "PER": 26.865671641791046, + "score": { + "S": 22, + "D": 10, + "I": 4, + "N": 134 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɪ s h æ z ɪ n d i d b ɪ n ə hɹ̩ɹ s ɪ ŋ d ejk ə n t ɪ n j ud ð ə j ʌ ŋ m æ n h ɪ zajz f ɪ k s t ə p ɑ n h ɪ z f ɹ ɛ n d", + "ref_phonemes": "ðɪs hæz ɪndid bɪn ʌ hɝæsɪŋ deɪ kʌntɪnjud ðʌ jʌŋ mæn hɪz aɪz fɪkst ʌpɑn hɪz frɛnd ", + "duration": 0.4499223232269287, + "PER": 15.625, + "score": { + "S": 9, + "D": 0, + "I": 1, + "N": 64 + } + }, + { + "model": "WavLM", + "phonemes": "k æ n j ɔ ɪ m æd͡ʒə n mwajb ʌ k ɪ ŋ h æ m h æ z b ɪ n sowv vajə l ə n t s ə s p ɛ k t", + "ref_phonemes": "kæn ju ɪmædʒʌn waɪ bʌkɪŋhæm hæz bɪn soʊ vaɪʌlʌnt aɪ sʌspɛkt ", + "duration": 0.37209153175354004, + "PER": 26.53061224489796, + "score": { + "S": 8, + "D": 2, + "I": 3, + "N": 49 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ t ɪ z j u h ɹ m ə s tejk ə n d ɹawæ h æ v ɹ ɛ d h ɪ z d ɪ s t ɹ ɛ s ɪ n h ɪ zajz ɪ n h ɪ z ɛ vɹ̩ɪæ d͡ʒʌɛ s tɹ̩æ n æ k ʃ ə n ð ə howl d dej", + "ref_phonemes": "ɪt ɪz ju hu ɑr mɪsteɪkʌn rɑul aɪ hæv rɛd hɪz dɪstrɛs ɪn hɪz aɪz ɪn hɪz ɛvɝi dʒɛstʃɝ ʌnd ækʃʌn ðʌ hoʊl deɪ ", + "duration": 0.5227541923522949, + "PER": 36.58536585365854, + "score": { + "S": 21, + "D": 4, + "I": 5, + "N": 82 + } + }, + { + "model": "WavLM", + "phonemes": "ajɪ m k ə m v ɪ n s t ʌ v w ʌ tajs s ɛ d ð ə kawn t", + "ref_phonemes": "aɪ æm kʌnvɪnst ʌv wʌt aɪ seɪ sɛd ðʌ kaʊnt ", + "duration": 0.27578186988830566, + "PER": 28.125, + "score": { + "S": 5, + "D": 3, + "I": 1, + "N": 32 + } + }, + { + "model": "WavLM", + "phonemes": "b ʌ t æ n t ɪ n j u d ɹawt n ɑ t ɪ n t ɹ ʌ p t ə d bajð ɪ s m u m ə n t ʌ v h ɪ z f ɹ ɛ n d æɛ v ə b i p ɹejz ð ə f ɹ ɪ nt͡ʃh u ɑ ɹ p ɹ̩n ə naws s t ə b i θ ɔ t l ə s æ n ɪ n d ɪ s k ɹ i t ɛ k l ə s i v ə n ɑ ɹ kejp ə ə lʌ v b ɹ ɪ ŋ ɪ ŋ ʌ k ɑ m æ n d saw nd͡ʒʌd͡ʒh m ə n t t ə b ɛ ɹ mn m æ tɹ̩z ʌ v s ʌt͡ʃɪ h d n ɔ ɹ t ə n s", + "ref_phonemes": "bʌt kʌntɪnjud rɑul nɑt ɪntɝʌptɪd baɪ ðɪs muvmʌnt ʌv hɪz frɛnd hɛvʌn bi preɪzd ðʌ frɛntʃ hu ɑr prʌnaʊnst tu bi θɔtlʌs ʌnd ɪndɪskrit rɛklʌs ivɪn ɑr keɪpʌbʌl ʌv brɪŋɪŋ ʌ kɑm ʌnd saʊnd dʒʌdʒmʌnt tu bɛr ɑn mætɝz ʌv sʌtʃ haɪ ɪmpɔrtʌns ", + "duration": 1.1299736499786377, + "PER": 33.87096774193548, + "score": { + "S": 46, + "D": 10, + "I": 7, + "N": 186 + } + }, + { + "model": "WavLM", + "phonemes": "ð s t ɪ z ð æ t ð ə ɑ nɹ̩ʌ v θ ɹ i ɪ z sejv ɑ ɹ k ʌ n t ɹ i ɑ ɹ m æ s tɹ̩z æ n dawɹ̩ɹ own", + "ref_phonemes": "ðʌs ɪt ɪz ðæt ðʌ ɑnɝ ʌv θri ɪz seɪvd aʊɝ kʌntriz aʊɝ mæstɝz ʌnd aʊɝ oʊn ", + "duration": 0.4467191696166992, + "PER": 43.63636363636363, + "score": { + "S": 14, + "D": 6, + "I": 4, + "N": 55 + } + }, + { + "model": "WavLM", + "phonemes": "j ɛ s i ɹ i powz m ɛ n i θ ɪ ŋ z h æ v æd͡ʒə tejt ə d m i dejə bowθ θ ɪ n majn d æ n d b ɑ t i w ɛ n j u ɹ ɪ tɹ̩n t ə m ɑ ɹow ʃ ɑ n nowl ɔ ŋ ɡɹ̩aws bm i ð ə sej m æ n", + "ref_phonemes": "jɛs aɪ nid ripoʊz mɛni θɪŋz hæv ædʒʌteɪtʌd mi tu deɪ boʊθ ɪn maɪnd ʌnd bɑdi wɛn ju rɪtɝn tu mɑroʊ aɪ ʃæl noʊ lɔŋɡɝ bi ðʌ seɪm mæn ", + "duration": 0.7205471992492676, + "PER": 38.613861386138616, + "score": { + "S": 21, + "D": 9, + "I": 9, + "N": 101 + } + }, + { + "model": "WavLM", + "phonemes": "b ʌ t ɪ n ð ɪ s f ɹ ɛ n d l i p ɹ ɛ ʃɹ̩ɹ ɹaw k ʊ d ɪ t ɛ k ð ə nɹ̩v ə s æ æd͡ʒə tejʃ ə n ʌ v ə ɡ ɹejt n tɹ̩n ə l k ɑ n f l ɪ k t", + "ref_phonemes": "bʌt ɪn ðɪs frɛndli prɛʃɝ rɑul kʊd dɪtɛkt ðʌ nɝvʌs ædʒʌteɪʃʌn ʌv ʌ ɡreɪt ɪntɝnʌl kɑnflɪkt ", + "duration": 0.459522008895874, + "PER": 35.61643835616438, + "score": { + "S": 18, + "D": 3, + "I": 5, + "N": 73 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə najt w ɑ z k l ɪ ɹ s t ɑ ɹ l ə t æ n d d s p l ɛ n d ə d ð ə t ɛ m p ə t ɛ p æ s t ə wejæʌ n d ð ə s w i ɪ n l u ə s ə z ʌ v ð ə i v n ɪ ŋ h ænpd wɹ̩s t ɔ ɹ d lajf p i s æ n s əɪ k j ʊ ɹ ə t i ɛ vɹ̩i ɛ ɹ", + "ref_phonemes": "ðʌ naɪt wɑz klɪr stɑrlɪt ʌnd splɛndʌd ðʌ tɛmpʌst hæd pæst ʌweɪ ʌnd ðʌ swit ɪnfluʌnsɪz ʌv ðʌ ivnɪŋ hæd rɪstɔrd laɪf pis ʌnd sɪkjʊrʌti ɛvriwɛr ", + "duration": 0.7206153869628906, + "PER": 34.78260869565217, + "score": { + "S": 25, + "D": 8, + "I": 7, + "N": 115 + } + }, + { + "model": "WavLM", + "phonemes": "ə p ɑ n ð ə l ɑ ɹd͡ʒs s k w ɛ ɹ n f ɹ ʌn t ʌ v ð ə h owt th ɛ ð ə ʃ æ dowz ʌ v ð ə t ɛ n z ɪ n t ə sɛ k t ə d bajð ə ɡowl d ə n m u m b i ə m z f ɔ ɹ m d æ z ɪ t wɹ̩ h j mows ʌ v uʃd͡ʒɛ k æ n d j ɛ lowv f l æ ɡ s town z", + "ref_phonemes": "ʌpɑn ðʌ lɑrdʒ skwɛr ɪn frʌnt ʌv ðʌ hoʊtɛl ðʌ ʃædoʊz ʌv ðʌ tɛnts ɪntɝsɛktɪd baɪ ðʌ ɡoʊldʌn munbimz fɔrmd æz ɪt wɝ ʌ hjudʒ moʊzeɪɪk ʌv dʒɛt ʌnd jɛloʊ flæɡstoʊnz ", + "duration": 0.8381941318511963, + "PER": 35.9375, + "score": { + "S": 33, + "D": 7, + "I": 6, + "N": 128 + } + }, + { + "model": "WavLM", + "phonemes": "bajl ə l ɔ n w ɑt͡ʃf ɔ ɹ s ʌ m tajm ə k ɑ n d ʌ k t ʌ p ð ə t l ʌ vɹ̩z l ɪ s ə n t ə ð ə lawd æ n ə n s ɪ v ə l s l ʌ m bɹ̩z ʌ v m æ n ɪə kh æɪ m u s n ɔ ɹ d æ z ɪ n p ɪ ɹ l i æ z ðowh i w ɑ z w ɛ ɹ ɪ ŋ h ɪ z b l u ɪ n ɡowl d ɪ n s t ɛ d ʌ v ɪ z vajə ə t s u t", + "ref_phonemes": "bræɡʌloʊn wɑtʃt fɔr sʌm taɪm ðʌ kɑndʌkt ʌv ðʌ tu lʌvɝz lɪsʌnd tu ðʌ laʊd ʌnd ʌnsɪvʌl slʌmbɝz ʌv mænɪkæmp hu snɔrd æz ɪmpɪriʌsli æz ðoʊ hi wɑz wɛrɪŋ hɪz blu ʌnd ɡoʊld ɪnstɛd ʌv hɪz vaɪʌlɪt sut ", + "duration": 1.1246318817138672, + "PER": 31.818181818181817, + "score": { + "S": 29, + "D": 14, + "I": 6, + "N": 154 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɹ w sɹ̩ n t l i nown ɪ ɹ ð ə s ə l u ʃ ə n ʌ v ð ɛ ɹ p ɹ ɑ b l ə m", + "ref_phonemes": "ðeɪ wɝ sɝtʌnli noʊ nɪrɝ ðʌ sʌluʃʌn ʌv ðɛr prɑblʌm ", + "duration": 0.2813563346862793, + "PER": 40.0, + "score": { + "S": 11, + "D": 4, + "I": 1, + "N": 40 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə p ʊ ɹ ɪ t ə l θ ɪ ŋ z k ɹajt ɪ n ð i ə θ ɪ ŋ k ʌ v ð ɛ m h æ v ɪ ŋ b ɪ n tɹ̩n t ə ð ə w ɔ ɔ l ð i z j ɪ ɹ z", + "ref_phonemes": "ðʌ pʊr lɪtʌl θɪŋz kraɪd sɪnθiʌ θɪŋk ʌv ðɛm hævɪŋ bɪn tɝnd tu ðʌ wɔl ɔl ðiz jɪrz ", + "duration": 0.4079165458679199, + "PER": 27.419354838709676, + "score": { + "S": 12, + "D": 4, + "I": 1, + "N": 62 + } + }, + { + "model": "WavLM", + "phonemes": "naww ʌ t ɪ z ð ə s ɛ n s ʌ v ɪ t t u ɪ n ə s ə n bejb i z lajk ð æ t", + "ref_phonemes": "naʊ wʌt wɑz ðʌ sɛns ʌv ɪt tu ɪnʌsʌnt beɪbiz laɪk ðæt ", + "duration": 0.23385953903198242, + "PER": 21.951219512195124, + "score": { + "S": 7, + "D": 2, + "I": 0, + "N": 41 + } + }, + { + "model": "WavLM", + "phonemes": "b ʌ t d͡ʒojs h æ d n ɑ t b ɪ n l ɪ s ə n ɪ ɔ l æ t w ʌ n z ʃ i p ʊ t taw hɹ̩k æ n d ɔ ɑ n ð ə tejsb b ə l ɪ n fejs t ɹ̩k ə m k p æ n j ə", + "ref_phonemes": "bʌt dʒɔɪs hæd nɑt bɪn lɪsʌnɪŋ ɔl æt wʌns ʃi pʊt daʊn hɝ kændʌl ɑn ðʌ teɪbʌl ʌnd feɪst hɝ kʌmpænjʌn ", + "duration": 0.4502134323120117, + "PER": 34.61538461538461, + "score": { + "S": 17, + "D": 5, + "I": 5, + "N": 78 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə t w ɪ n b ɹ ʌ ðɹ̩t d ɪ d s ʌ m θ ɪ ŋ ʃ i d ɪ n t lajk æ n d ʃ i tɹ̩n dh ɪ z p ɪ k kt͡ʃɹ̩t ə ð ə w ɔ l", + "ref_phonemes": "ðʌ twɪn brʌðɝ dɪd sʌmθɪŋ ʃi dɪdʌnt laɪk ʌnd ʃi tɝnd hɪz pɪktʃɝ tu ðʌ wɔl ", + "duration": 0.38143062591552734, + "PER": 29.82456140350877, + "score": { + "S": 9, + "D": 2, + "I": 6, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "hɹ̩h h æ p ə n t ə b i ɑ n ð ə sejm f ɹm t u b ʌ t ʃ i ɛ v ə d ɛə t l i dɪ ŋ k ɛ ɹ ə bawt ɪ t", + "ref_phonemes": "hɝz hæpʌnd tu bi ɪn ðʌ seɪm freɪm tu bʌt ʃi ɛvʌdʌntli dɪdʌnt kɛr ʌbaʊt ðæt ", + "duration": 0.3484354019165039, + "PER": 40.67796610169492, + "score": { + "S": 16, + "D": 7, + "I": 1, + "N": 59 + } + }, + { + "model": "WavLM", + "phonemes": "ajθ ɔ t w i wɹ̩s t ʌ m p t ə ɡ ɛ n wɛ n ajə fɹ̩s ɔ ð æ t b ɪ k ʃɹ̩b b ʌ t ɪ t s m ɪ n ʌ v s ʌ m j u s æ f tɹ̩ɔ ɔ l", + "ref_phonemes": "aɪ θɔt wi wɝ stʌmpt ʌɡɛn wɛn aɪ fɝst sɔ ðæt pɪktʃɝ bʌt ɪts bɪn ʌv sʌm jus æftɝ ɔl ", + "duration": 0.4332695007324219, + "PER": 29.03225806451613, + "score": { + "S": 10, + "D": 2, + "I": 6, + "N": 62 + } + }, + { + "model": "WavLM", + "phonemes": "d u u s ə powz ð ə m ɪn nt͡ʃɹ̩w ɑ z ə k ɑ m p i ʌ v ð ə sejm θ ɪ ŋ", + "ref_phonemes": "du ju sʌpoʊz ðʌ mɪniʌtʃʊr wɑz ʌ kɑpi ʌv ðʌ seɪm θɪŋ ", + "duration": 0.28787827491760254, + "PER": 32.5, + "score": { + "S": 9, + "D": 2, + "I": 2, + "N": 40 + } + }, + { + "model": "WavLM", + "phonemes": "mej w w ɹ m i t ɛ ɹ ə b l i æ m ə sajd z ə d lajk t ə s i w ʌ t ð ɪ s ʌ v l i f ɹ n kt͡ʃɹ̩l l ʊ sajk w ɪ θawt s ʌt͡ʃ ə k w ɑ t ə d i z ʌ v d ʌ s t ɔ lowvɹ̩ɪ t k ʊ d z s k i m s ɪ n", + "ref_phonemes": "ðeɪ wɝi mi tɛrʌbli ʌnd bɪsaɪdz aɪd laɪk tu si wʌt ðɪs lʌvli fɝnɪtʃɝ lʊks laɪk wɪθaʊt sʌtʃ kwɑntʌtiz ʌv dʌst ɔl oʊvɝ ɪt ɡʊd skim sɪn ", + "duration": 0.6430149078369141, + "PER": 35.23809523809524, + "score": { + "S": 23, + "D": 7, + "I": 7, + "N": 105 + } + }, + { + "model": "WavLM", + "phonemes": "w ɛ l k ʌ m ɪ n h ɪ ɹ ð ɪ s æ f tɹ̩n u n w ɪ ðowsowl d k lowz ɑ n ɪ n d h æ v ɹ̩ɹ ɛ j ə lɹ̩h aws k l i n ɪ ŋ", + "ref_phonemes": "wil kʌm ɪn hir ðɪs æftɝnun wɪð oʊld kloʊðz ɑn ʌnd hæv ʌ rɛɡjʌlɝ haʊs klinɪŋ ", + "duration": 0.37203526496887207, + "PER": 33.33333333333333, + "score": { + "S": 12, + "D": 2, + "I": 6, + "N": 60 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ k æ n t hɹ̩d ɛ n i θ ɪ ŋ ə m ʃ ʊ ɹ f ɔ ɹ w i w ɑ n t d ɪ s tɹ̩b θ ɪ ŋ z æ t ɔ l", + "ref_phonemes": "ɪt kænt hɝt ɛniθɪŋ aɪm ʃʊr fɔr wi woʊnt dɪstɝb θɪŋz æt ɔl ", + "duration": 0.34667420387268066, + "PER": 26.666666666666668, + "score": { + "S": 7, + "D": 3, + "I": 2, + "N": 45 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɪ s θ ɔ t hawɛ vɹ̩d d ɪ d n ɑ t ɛ n tɹ̩ð ə h ɛ d d z ʌ v ð ə ɪ n θð u z i æ s t ɪ k p ɛ ɹ", + "ref_phonemes": "ðɪs θɔt haʊɛvɝ dɪd nɑt ɛntɝ ðʌ hɛdz ʌv ðʌ ɪnθuziæstɪk pɛr ", + "duration": 0.3508870601654053, + "PER": 23.91304347826087, + "score": { + "S": 6, + "D": 0, + "I": 5, + "N": 46 + } + }, + { + "model": "WavLM", + "phonemes": "s ʌ ɡ ə l ɪ ŋ ð haws k l i ɪ ŋ p ɛ ɹ f ə n l i ə ɪ n t ð ə s ɛ lɹ̩w ɛɪ n dowt n ə b zɹ̩v d ð æ t ɔ f tɹ̩ nŋn u n p ɹ u v d nowh i z i t æ s k f ɔ ɹ s ɪ n ð ə h æ d æ d ə d ə w ɪ s p ɹ u æ n d d ʌ s p æ n t ə ð əawt f ɪ t", + "ref_phonemes": "smʌɡlɪŋ ðʌ haʊs klinɪŋ pɛrʌfʌneɪljʌ ɪntu ðʌ sɛlɝ wɪndoʊ ʌnʌbʌstɝvd ðæt æftɝnun pruvd noʊ izi tæsk fɔr sɪnθiʌ hæd ædʌd ʌ wɪsk brum ʌnd dʌst pæn tu ðʌ aʊtfɪt ", + "duration": 0.8441774845123291, + "PER": 37.00787401574803, + "score": { + "S": 28, + "D": 12, + "I": 7, + "N": 127 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə l ʊ p p ɹ u v d t u m ʌt͡ʃf f ɔ ɹ ɪ m æɛ n i kejm s p ɔ ɹ t ɪ ŋ æ f tɹ̩ ɪ æ s ɪ s k ə l i æ z ə j ʌ ŋ k æ n t ə n ʌt͡ʃf ʃ ɪ s ɪ n ð æ z d ɪ lajt w ɛ n ʃ i k ɑ sajt ʌ vh ɪ m", + "ref_phonemes": "ðʌ lʊr pruvd tu mʌtʃ fɔr hɪm ʌnd hi keɪm spɔrtɪŋ æftɝ ɪt æz frɪskʌli æz ʌ jʌŋ kɪtʌn mʌtʃ tu sɪnθiʌz dɪlaɪt wɛn ʃi kɑt saɪt ʌv hɪm ", + "duration": 0.6223185062408447, + "PER": 34.65346534653465, + "score": { + "S": 19, + "D": 9, + "I": 7, + "N": 101 + } + }, + { + "model": "WavLM", + "phonemes": "owl ɛ t ɪ m k ʌ m ə l ɔ ŋ ʃ iɹ̩d͡ʒd ajt u l ʌ p t ə s i h ɪ m ə bawt ð æ t owl l d haws", + "ref_phonemes": "oʊ lɛt hɪm kʌm ʌlɔŋ ʃi ɝdʒd aɪ du lʌv tu si hɪm ʌbaʊt ðæt oʊld haʊs ", + "duration": 0.4089372158050537, + "PER": 29.411764705882355, + "score": { + "S": 11, + "D": 1, + "I": 3, + "N": 51 + } + }, + { + "model": "WavLM", + "phonemes": "j j ɛ t l ɪ t ə l æ z ɪ t w ɑ z ɪ t h æ d ɔ ɹl ɹ ɛ d i mejd ʌ v v æ s d ɪ fɹ̩ə n s ɪ n ð ə æ s p ɛ k t ʌ v ð ə ɹ u m", + "ref_phonemes": "jɛt lɪtʌl æz ɪt wɑz ɪt hæd ɔlrɛdi meɪd ʌ væst dɪfɝʌns ɪn ðʌ æspɛkt ʌv ðʌ rum ", + "duration": 0.44442129135131836, + "PER": 22.033898305084744, + "score": { + "S": 8, + "D": 1, + "I": 4, + "N": 59 + } + }, + { + "model": "WavLM", + "phonemes": "sɹ̩f ɹ̩ ə s d ʌ s æ t l i s h æ d b ɪ n d ɹ̩m u d æ n d ð ə fajn owl d fɹ̩ n t͡ʃɹ̩kɡ ejv ə h ɪ n t ʌ v ɪ t s ɹ i l ɛ l ə ɡ ɛ n t s æ n d p ɑ l ɪ ʃ", + "ref_phonemes": "sɝfʌs dʌst æt list hæd bɪn rimuvd ʌnd ðʌ faɪn oʊld fɝnɪtʃɝ ɡeɪv ʌ hɪnt ʌv ɪts ril ɛlʌɡʌns ʌnd pɑlɪʃ ", + "duration": 0.5309398174285889, + "PER": 36.708860759493675, + "score": { + "S": 16, + "D": 4, + "I": 9, + "N": 79 + } + }, + { + "model": "WavLM", + "phonemes": "æ n dmajp ɑ k ə t m ʌ n d i ɡ ɪ z ɡ ɛ t ɪ ŋ lowʌ ɡ ɛ n æ n d j u h æ v ɪ ɛ n i l ɛ f t æ z j u ʒ ə w ə l", + "ref_phonemes": "ʌnd maɪ pɑkʌt mʌni ɪz ɡɛtɪŋ loʊ ʌɡɛn ʌnd ju hævʌnt ɛni lɛft æz juʒʌwʌl ", + "duration": 0.34665441513061523, + "PER": 21.428571428571427, + "score": { + "S": 8, + "D": 2, + "I": 2, + "N": 56 + } + }, + { + "model": "WavLM", + "phonemes": "ðejs lm u m ə nejʃ ə n bajk æ n d ə lajt ɪ z ð ə p ɹ ɪ t i ə s t ɪ n ð ə wɹ̩l d", + "ref_phonemes": "ðeɪ seɪ ɪlumʌneɪʃʌn baɪ kændʌl laɪt ɪz ðʌ prɪtiʌst ɪn ðʌ wɝld ", + "duration": 0.3289954662322998, + "PER": 36.0, + "score": { + "S": 14, + "D": 3, + "I": 1, + "N": 50 + } + }, + { + "model": "WavLM", + "phonemes": "wajɪ t k ə lajæ θ æ s j u ʒ ə w ə l ðejə bowθ k ɹajd p ɪ ɹ ɪ ŋ ɪ n", + "ref_phonemes": "waɪ ɪts ɡʌlaɪʌθ æz juʒʌwʌl ðeɪ boʊθ kraɪd pirɪŋ ɪn ", + "duration": 0.32218480110168457, + "PER": 39.02439024390244, + "score": { + "S": 14, + "D": 1, + "I": 1, + "N": 41 + } + }, + { + "model": "WavLM", + "phonemes": "f ɡ ɛ t ɪ ŋ ɔ l ð ɛ ɹ w ɪ ɹ i n ə s ə s i z ɛ k æ n d ə z n d s t ʊ ɹ i θɹ u ð ə haws fajn d ɪ ŋ ɑ n ə kejʃ ə n ə l pejpɹ̩ t ʌ k t ə wejæɪ n d s ʌ mn ɔ k ɔ ɹ nɹ̩", + "ref_phonemes": "fɝɡɛtɪŋ ɔl ðɛr wɪrinʌs ðeɪ sizd ðɛr kændʌlz ʌnd skɝid θru ðʌ haʊs faɪndɪŋ æn ʌkeɪʒʌnʌl peɪpɝ tʌkt ʌweɪ ɪn sʌm ɑd kɔrnɝ ", + "duration": 0.6297638416290283, + "PER": 40.625, + "score": { + "S": 25, + "D": 9, + "I": 5, + "N": 96 + } + }, + { + "model": "WavLM", + "phonemes": "w ɛ l m k ə m f ɪ n s ð æ t ð ə p ɔ ɹ t ə d ʌ p paws m ɪ s t ɹ i haw æ p b ɪ n n ɑ tɹ̩l iɪ ɹð æ n t p l s ɪ k s t i n θ t t i n s ɪ k s t i w ʌ n æ n d p ɹ ɑb ə b l i n ɑ t m ʌt͡ʃ lej ejtɹ̩", + "ref_phonemes": "wɛl aɪm kʌnvɪnst ðæt ðʌ bɔrdʌd ʌp haʊs mɪstɝi hæpʌnd nɑt ɝliɝ ðæn eɪprʌl sɪkstinθ eɪtin sɪksti wʌn ʌnd prɑbʌbli nɑt mʌtʃ leɪtɝ ", + "duration": 0.6966216564178467, + "PER": 36.53846153846153, + "score": { + "S": 21, + "D": 8, + "I": 9, + "N": 104 + } + }, + { + "model": "WavLM", + "phonemes": "nowwl w z wɹ̩s powk ə ŋn æ ŋ ɡ w ɑd͡ʒw w ɑ z ʌ tɹ̩d sejv ðawt ʌ v w ɪ ŋ æn h ɪ s s ɪ ŋ æ n d ð æ t s ʌ m haww ɑ z ɪ n d ɪs t ɪ ŋ t z ɪ f ɪ t ɪ ɡ z ɪ s t ɪ td ɪ n f æ n s i æ n d n ɑɔ t ɪ n d ɹ i æ l ə t i", + "ref_phonemes": "noʊ wɝdz wɝ spoʊkʌn noʊ læŋɡwʌdʒ wɑz ʌtɝd seɪv ðæt ʌv weɪlɪŋ ʌnd hɪsɪŋ ʌnd ðæt sʌmhaʊ wɑz ɪndɪstɪŋkt æz ɪf ɪt ɪɡzɪstʌd ɪn fænsi ʌnd nɑt ɪn riælʌti ", + "duration": 0.9916045665740967, + "PER": 30.508474576271187, + "score": { + "S": 18, + "D": 9, + "I": 9, + "N": 118 + } + }, + { + "model": "WavLM", + "phonemes": "bajh hɹ̩d ə nojs b ɪ hajn d aj tɹ̩d d æn d s ɔ l k æ ɹ̩ ɪ z b l æ kajz ʃajn m i m wajɔ l ɪ n h ɪ z h æ n d h hi h ɛ d ə ɡ l i m ɪ ŋ najf i l ɪ f t ə d ɪ aj ə b ʌ v h ɪ z h ɛ d ə ɪ f t h ə s t ɹajk ə h æ d ð ə s t ɹejɪ ŋ ʌ v t h ɛ n m æ n æ n dajz hɹ̩l d h ɪ m f ɹ ʌ m i", + "ref_phonemes": "aɪ hɝd ʌ nɔɪz bɪhaɪnd aɪ tɝnd ʌnd sɔ kæfɝ hɪz blæk aɪz ʃaɪnɪŋ waɪl ɪn hɪz hænd hi hɛld ʌ ɡlimɪŋ naɪf hi lɪftʌd ɪt ʌbʌv hɪz hɛd æz ɪf tu straɪk bʌt aɪ hæd ðʌ strɛŋkθ ʌv tɛn mɛn ʌnd aɪ hɝld hɪm frʌm mi ", + "duration": 1.3235931396484375, + "PER": 39.869281045751634, + "score": { + "S": 39, + "D": 9, + "I": 13, + "N": 153 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə s t ɔ ɹ i ʌ v ɪ t s i v ə l ɪ n f l u ə n s kejm æ k t ə m i æ n ɪ n majb ɪ w ɪ l dɹ̩dt k ə n d ɪ ʃ ə n w ʌ n dɹ̩d w ɛ ðɹ̩ð ð ɛ ɹ w ɑ z n ɑ t s ʌ m t ɹ u θ ɪ n wajbð h æ d b ɪ n s ɛ d", + "ref_phonemes": "ðʌ stɔri ʌv ɪts ivʌl ɪnfluʌns keɪm bæk tu mi ʌnd ɪn maɪ bɪwɪldɝd kʌndɪʃʌn aɪ wʌndɝd wɛðɝ ðɛr wɑz nɑt sʌm truθ ɪn wʌt hæd bɪn sɛd ", + "duration": 0.6587836742401123, + "PER": 27.722772277227726, + "score": { + "S": 17, + "D": 4, + "I": 7, + "N": 101 + } + }, + { + "model": "WavLM", + "phonemes": "w ʌ t ð ɛ n ə h j u m ə n h æ n d l ɑ ɹ ɹd͡ʒæ n d ʃejp l i ə p ɪ d ɪ s t ɪ ŋ l i ɑ n ð ə sɹ̩f ə s ʌ v ð ə p ɑ n d", + "ref_phonemes": "wʌt ðɛn ʌ hjumʌn hænd lɑrdʒ ʌnd ʃeɪpli ʌpɪrd dɪstɪŋktli ɑn ðʌ sɝfʌs ʌv ðʌ pɑnd ", + "duration": 0.49889254570007324, + "PER": 26.984126984126984, + "score": { + "S": 10, + "D": 4, + "I": 3, + "N": 63 + } + }, + { + "model": "WavLM", + "phonemes": "n ʌ θ ɪ ŋ m ɔ ɹ n ɑ t i v ə n ð ə ɹ ɪt͡ʃ s t u w ɪt͡ʃɪ t majt b i ə t æ t͡ʃɪ t", + "ref_phonemes": "nʌθɪŋ mɔr nɑt ivɪn ðʌ rɪst tu wɪtʃ ɪt maɪt bi ʌtætʃt ", + "duration": 0.32053065299987793, + "PER": 31.70731707317073, + "score": { + "S": 6, + "D": 1, + "I": 6, + "N": 41 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ t d ɪ t n ɑ t b ɛ k ə n ɔ ɹ ɪ n d i d m u v æ t ɔ l ɪ t w ɑ z æ z s t ɪ l æ z ð ə h æ n d ʌ v d ɛ θ", + "ref_phonemes": "ɪt dɪd nɑt bɛkʌn ɔr ɪndid muv æt ɔl ɪt wɑz æz stɪl æz ðʌ hænd ʌv dɛθ ", + "duration": 0.4396700859069824, + "PER": 7.8431372549019605, + "score": { + "S": 4, + "D": 0, + "I": 0, + "N": 51 + } + }, + { + "model": "WavLM", + "phonemes": "ajə w k t ə k ɑ n nt͡ʃ ə s n ə s fajt ɪ ɪ ŋ æ t fɹ̩s t ɪ t s i ŋ d æ z ɪ fajw ɑ z fajt ɪ ŋ w ɪ ð ə fejæ n t ə m b ʌ t ɡ ɹɹ̩ ɪ nd͡ʒi l i majə pown ɪ t b ɪ kejm m ɔ ɹ ɹ i l t ə m i t w ɑ z k æ fɹ̩", + "ref_phonemes": "aɪ ʌwoʊk tu kɑnʃʌsnʌs faɪtɪŋ æt fɝst ɪt simd æz ɪf aɪ wɑz faɪtɪŋ wɪð ʌ fæntʌm bʌt ɡrædʒuʌli maɪ ʌpoʊnʌnt bɪkeɪm mɔr ril tu mi ɪt wɑz kæfɝ ", + "duration": 0.7734153270721436, + "PER": 37.61467889908257, + "score": { + "S": 24, + "D": 5, + "I": 12, + "N": 109 + } + }, + { + "model": "WavLM", + "phonemes": "bajh æ d s k ɛ ɹ s l i nown w ɛ najh æ d b ɪ n s ɪ ŋ ɔ ɹ d u ɪ ŋ ʌ p t ə ð ɪ s tajm b ʌ z h i s powk ajl ʊ d æ t majh h æ n d", + "ref_phonemes": "aɪ hæd skɛrsli noʊn wʌt aɪ hæd bɪn seɪɪŋ ɔr duɪŋ ʌp tu ðɪs taɪm bʌt æz hi spoʊk aɪ lʊkt æt maɪ hænd ", + "duration": 0.4765167236328125, + "PER": 26.31578947368421, + "score": { + "S": 13, + "D": 5, + "I": 2, + "N": 76 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ n ð ə lajt ʌ ð ə m u n aj ajs ɔ n najf ɹ æ w ɪ ð b l ʌ d æ n d majh æ n d t u w ɑ z ɔ l sowd ɪ s k ʌ lɹ̩d", + "ref_phonemes": "ɪn ðʌ laɪt ʌv ðʌ mun aɪ sɔ ʌ naɪf rɛd wɪð blʌd ʌnd maɪ hænd tu wɑz ɔlsoʊ dɪskʌlɔrd ", + "duration": 0.5107150077819824, + "PER": 26.984126984126984, + "score": { + "S": 13, + "D": 2, + "I": 2, + "N": 63 + } + }, + { + "model": "WavLM", + "phonemes": "w lt͡ʃɛ ɹ p ɪ k t ʌ p s ʌ m θ ɪ ŋ fɹ ʌm ð ə ɡ ɹawn d æ n d l ʊ k t æ t ɪ t", + "ref_phonemes": "voʊltɛr pɪkt ʌp sʌmθɪŋ frʌm ðʌ ɡraʊnd ʌnd lʊkt æt ɪt ", + "duration": 0.2813985347747803, + "PER": 26.190476190476193, + "score": { + "S": 7, + "D": 2, + "I": 2, + "N": 42 + } + }, + { + "model": "WavLM", + "phonemes": "ajsej j u d j u noww ʌ t ð ɪ s m i n z æ n d j u m ʌ s t t ɛ l ʌ s", + "ref_phonemes": "aɪ seɪ ju du noʊ wʌt ðɪs minz ʌnd ju mʌst tɛl ʌs ", + "duration": 0.35033178329467773, + "PER": 13.88888888888889, + "score": { + "S": 4, + "D": 0, + "I": 1, + "N": 36 + } + }, + { + "model": "WavLM", + "phonemes": "ajh æ d ə ɡ ɛ n b ɪ n æ k t ɪ ŋ ʌ n dɹ̩ð ə ɪ n f l u ə n s ʌ v ð ɪ s m æ n z pawɹ̩ awhɹ̩", + "ref_phonemes": "aɪ hæd ʌɡɛn bɪn æktɪŋ ʌndɝ ðʌ ɪnfluʌns ʌv ðɪs mænz paʊɝ ", + "duration": 0.3282325267791748, + "PER": 31.818181818181817, + "score": { + "S": 7, + "D": 0, + "I": 7, + "N": 44 + } + }, + { + "model": "WavLM", + "phonemes": "pɹ̩t͡ʃt æ n s t u k æ fɹ̩z d ɛ θ majt sɹ̩v v h ɪ m ɪ n ɡ ʊ d s t ɛ d", + "ref_phonemes": "pɝtʃæns tu kæfɝz dɛθ maɪt sɝv hɪm ɪn ɡʊd stɛd ", + "duration": 0.34392333030700684, + "PER": 27.77777777777778, + "score": { + "S": 4, + "D": 0, + "I": 6, + "N": 36 + } + }, + { + "model": "WavLM", + "phonemes": "majt t ʌ ŋ ɹ i f j u z tə ɑ ɹ t ɪ k j ə lejt majp pawɹ̩ʌ v s p it͡ʃ l æ f t ə m i", + "ref_phonemes": "maɪ tʌŋ rʌfjuzd tu ɑrtɪkjʌlʌt maɪ paʊɝ ʌv spitʃ lɛft mi ", + "duration": 0.35213351249694824, + "PER": 40.0, + "score": { + "S": 11, + "D": 1, + "I": 6, + "N": 45 + } + }, + { + "model": "WavLM", + "phonemes": "n ɑ t w ɪ s t æ n d ɪ ŋ ð ə hajɹ ɛ z ə l u ʃ ə n ʌ v h ɑ k wh i f ʊ l i k ɑ m pɹɹ̩h ɛ n d ə d ɔ l ð ə d ɪ f ə k ə l t i z ɪ n d nd͡ʒɹ̩h i w ɑ z ə bawt t ə ɛ n kɹ̩ɪ kaj", + "ref_phonemes": "nɑtwɪθstændɪŋ ðʌ haɪ rɛzʌluʃʌn ʌv hɔkaɪ hi fʊli kɑmprɪhɛndɪd ɔl ðʌ dɪfʌkʌltiz ʌnd deɪndʒɝ hi wɑz ʌbaʊt tu ɪnkɝ ", + "duration": 0.5741944313049316, + "PER": 35.869565217391305, + "score": { + "S": 20, + "D": 5, + "I": 8, + "N": 92 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ n h ɪ z ɹ ɪə tɹ̩n t ə ð ə k æ m p h ɪ z ə k j u t n p ɹ æ k t ə s t ɪ n t ɪə l ɛ k s wɹ̩ ɪ n t ɛ n t ə l i ɪ n ɡejd͡ʒd d ɪ nd d ɪ vajz ɪ ŋ m i n z t ə kawn tɹ̩æ k t ə w ɑt͡ʃk f ə l n ə s æ n s ə s p ɪ ʃ ə n ɑ n ð ə p ɑ ɹ t ʌ v h ɪ z æ n ə m i z æ t h i n u wɹ̩ n nowd ɪ ɡ ɹ i ɪ n f ɪ ɹ iɹ̩t ə h ɪ zown", + "ref_phonemes": "ɪn hɪz rɪtɝn tu ðʌ kæmp hɪz ʌkjut ʌnd præktʌst ɪntʌlɛkts wɝ ɪntɛntli ɛŋeɪdʒd ɪn dɪvaɪzɪŋ minz tu kaʊntɝækt ʌ wɑtʃfʌlnʌnz ʌnd sʌspɪʃʌn ɑn ðʌ pɑrt ʌv hɪz ɛnʌmiz ðæt hi nu wɝ ɪn noʊ dɪɡri ɪnfɪriɝ tu hɪz oʊn ", + "duration": 1.1538910865783691, + "PER": 32.926829268292686, + "score": { + "S": 35, + "D": 6, + "I": 13, + "N": 164 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ n ʌ ðɹ̩wɹ̩z d zs aj l h i h æ d ɪ m p l ɪ s ə td fejθ ɪ n ð ə ə b ɪ l ə t i ʌ v bejl ɑ nm z æ s t ə s p i k i w ɑ s ʌ mw ʌ t s k ɛ p t ə k ə l ɑ n ð ə s ʌ b bd͡ʒə t ʌ v ə b ɛ ɹ s ɪ ŋ ɪ ŋ n d ð i æ i h æ d b ɪ n ɪ ʃ ʊ ɹ d v ð ə l æ tɹ̩ɑ n ð ə t ɛ s t ə mown i vh ɪ zown ɪ k s k w əɪ z ə t ɔ ɹ ɡ ə n z", + "ref_phonemes": "ɪn ʌðɝ wɝdz waɪl hi hæd ɪmplɪsʌt feɪθ ɪn ðʌ ʌbɪlʌti ʌv bælʌmz æs tu spik hi wɑz sʌmwʌt skɛptʌkʌl ɑn ðʌ sʌbdʒɪkt ʌv ʌ bɛrz sɪŋɪŋ ʌnd jɛt hi hæd bɪn ʌʃʊrd ʌv ðʌ lætɝ ɑn ðʌ tɛstʌmoʊni ʌv hɪz oʊn ɛkskwʌzʌt ɔrɡʌnz ", + "duration": 1.0794808864593506, + "PER": 31.515151515151512, + "score": { + "S": 34, + "D": 8, + "I": 10, + "N": 165 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɛ ɹ w ɑ z s ʌ m θ ɪ ŋ ɪ n h ɪ z ɛ ɹ n d m æ nɹ̩ð æ t b ɪ t ɹejd t ə ð ə s kawt ð ə ʌ tɹ̩k ə n f j u ʒ ə n ʌ ð ə s tejt ʌ vh ɪ z majn d", + "ref_phonemes": "ðɛr wɑz sʌmθɪŋ ɪn hɪz ɛr ʌnd mænɝ ðæt bɪtreɪd tu ðʌ skaʊt ðʌ ʌtɝ kʌnfjuʒʌn ʌv ðʌ steɪt ʌv hɪz maɪnd ", + "duration": 0.4444913864135742, + "PER": 24.358974358974358, + "score": { + "S": 15, + "D": 2, + "I": 2, + "N": 78 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə ɪ nd͡ʒi n i ə s h ɔ kajht u ɹ i k ɔ l d ð ə hejs s t i m æ nɹ̩ɪ n w ɪt͡ʃð ə ʌ ðɹ̩h æ d ə b æ n d ə n h ɪ zs pows t æ t ð ə b ɛ d sajt ʌ v ð ə s ə k w ʊ m n ɑ z n ɑ t w ɪ θawt h ɪ s ə s p ɪ ʃ ə n z k ə n sɹ̩n ɪ ŋ ð ə sow ʌ bd͡ʒɪ k t ʌ v sowm ʌt͡ʃð s ɑ l ə m d ɪ l ɪ bɹ̩ejʃ ə n", + "ref_phonemes": "ðʌ ɪndʒinjʌs hɔkaɪ hu rɪkɔld ðʌ heɪsti mænɝ ɪn wɪtʃ ðʌ ʌðɝ hæd ʌbændʌnd hɪz poʊst æt ðʌ bɛdsaɪd ʌv ðʌ sɪk wʊmʌn wɑz nɑt wɪθaʊt hɪz sʌspɪʃʌnz kʌnsɝnɪŋ ðʌ sʌbdʒɪkt ʌv soʊ mʌtʃ sɑlʌm dɪlɪbɝeɪʃʌn ", + "duration": 0.7790179252624512, + "PER": 30.76923076923077, + "score": { + "S": 30, + "D": 4, + "I": 14, + "N": 156 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə b ɛ ɹ ʃ ʊ k h ɪ z ʃ æ ɡ i sajd z æ n d ð ɛ n ə w ɛ l nown vojs ɹ ɪ p lajd", + "ref_phonemes": "ðʌ bɛr ʃʊk hɪz ʃæɡi saɪdz ʌnd ðɛn ʌ wɛl noʊn vɔɪs rɪplaɪd ", + "duration": 0.31214070320129395, + "PER": 22.22222222222222, + "score": { + "S": 10, + "D": 0, + "I": 0, + "N": 45 + } + }, + { + "model": "WavLM", + "phonemes": "k æ n ð i z θ ɪ ŋ z b i ɹ i tɹ̩n dejv ə d b ɹ i ð ɪ ŋ m ɔ ɹ f ɹ i l i æ z ð ə t ɹ u θ b ɪ ɡ æ n t ə d ɑɔ n ə p ɑ n h ɪ m", + "ref_phonemes": "kæn ðiz θɪŋz bi rɪtɝnd deɪvɪd briðɪŋ mɔr frili æz ðʌ truθ bɪɡæn tu dɔn ʌpɑn hɪm ", + "duration": 0.3912985324859619, + "PER": 23.809523809523807, + "score": { + "S": 12, + "D": 1, + "I": 2, + "N": 63 + } + }, + { + "model": "WavLM", + "phonemes": "k ʌ m k ʌ m ɹɹ̩i tɹ̩n d h ɑ kajʌ n kejs ɪ ŋ h ɪ z ɑ ə s t kawn t ə n ə n s ə b ɛ tɹ̩t ə ə ʃ ʊ ɹ ð ə wejt vɹ̩ɪ n k ɑ n f ə d ə n s ʌ v h ɪ z k ə m p æ n j ə n u mejs s i ə s k ɪ n w ɪt͡ʃ f ɪ t b i n ɑ t æ z wajt z w ʌn ʌ v ð əd͡ʒɛ n t ə w ʌ n s æ z nowhʌ t ɪ n nd͡ʒ vɹ ɛ t ə ɪ t ð æ t ə w ɪ n z ʌ v ð ə h ɛ v æ n ɪ n ð ə s ʌ n h æ v n ɑ t b ə s towd awʌ l ɛ t ə s t ə b ɪ z n ə s", + "ref_phonemes": "kʌm kʌm rɪtɝnd hɔkaɪ ʌnkeɪsɪŋ hɪz ɑnʌst kaʊntʌnʌns ðʌ bɛtɝ tu ʌʃʊr ðʌ weɪvɝɪŋ kɑnfʌdʌns ʌv hɪz kʌmpænjʌn ju meɪ si ʌ skɪn wɪtʃ ɪf ɪt bi nɑt æz waɪt æz wʌn ʌv ðʌ dʒɛntʌl wʌnz hæz noʊ tɪndʒ ʌv rɛd tu ɪt ðæt ðʌ wɪndz ʌv ðʌ hɛvʌn ʌnd ðʌ sʌn hæv nɑt bɪstoʊd naʊ lɛt ʌs tu bɪznʌs ", + "duration": 1.5098304748535156, + "PER": 32.71028037383177, + "score": { + "S": 43, + "D": 13, + "I": 14, + "N": 214 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə j ʌ ŋ m æ n ɪ z ɪ n b ɑ n d əd͡ʒ n m ʌt͡ʃæ ajf ɪ ɹ h ɪ z d ɛ θ z d ɪ k ɹ i d", + "ref_phonemes": "ðʌ jʌŋ mæn ɪz ɪn bɑndɪdʒ ʌnd mʌtʃ aɪ fɪr hɪz dɛθ ɪz dɪkrid ", + "duration": 0.3160858154296875, + "PER": 24.444444444444443, + "score": { + "S": 5, + "D": 3, + "I": 3, + "N": 45 + } + }, + { + "model": "WavLM", + "phonemes": "aj ɹejt l i m ɔ ɹ n æ t w ʌ n soww ɛ l d ɪ s powz d ʃ ʊ d dajɪ n h ɪ z ɪ ɡ nɹ̩ɪ ə n s æ n dajf v s ɔ t ə ɡ ʊ d l i h ɪ m k æ n j u ðl i d m i t ə h ɪ m", + "ref_phonemes": "aɪ ɡreɪtli mɔrn ðæt wʌn soʊ wɛl dɪspoʊzd ʃʊd daɪ ɪn hɪz ɪɡnɝʌns ʌnd aɪ hæv sɔt ʌ ɡʊdli hɪm kæn ju lɛd mi tu hɪm ", + "duration": 0.594186544418335, + "PER": 24.418604651162788, + "score": { + "S": 15, + "D": 3, + "I": 3, + "N": 86 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə t æ s k w ɪ l n ɑ t b i d ɪ f ə k ə l t ɹ ɪ tɹ̩n n dejt ə h ɛ z ə tejt ɪ ŋ ow ɹejt l i f ɪ ɹ i ɔ p p ɹ ɛ z ə n s w ʊ d ɹ æ ðɹ̩ɪ ɪ n k ɹ i s ð æ n m ɪ t ə ɡejt h ɪ z ʌ n h æ p i f ɔ ɹ ɹt͡ʃə n z", + "ref_phonemes": "ðʌ tæsk wɪl nɑt bi dɪfʌkʌlt rɪtɝnd deɪvɪd hɛzʌteɪtɪŋ ðoʊ aɪ ɡreɪtli fɪr jɔr prɛzʌns wʊd ræðɝ ɪnkris ðæn mɪtʌɡeɪt hɪz ʌnhæpi fɔrtʃʌnz ", + "duration": 0.7237012386322021, + "PER": 32.72727272727273, + "score": { + "S": 26, + "D": 5, + "I": 5, + "N": 110 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə l ɑd͡ʒ n w t͡ʃɪ ɪ ŋ k ə s w ɑ z k ə n fajn d w ɑ z ɪ n ð v ɛ ɹ i s ɛ n tɹ̩ʌ v ð ə v �� l əd͡ʒ nd ɪ n ə s ɪt͡ʃuejʃ ə n pɹ̩h æ p s m ɔ ɹ d ɪ f ə k ə l ð æ n ɛ n i ʌ ðɹ̩t ə ə p ɹowt͡ʃj ɪ ɔ ɹ l i v w ɪ θawt ɑ b zɹ̩vejʃ ə n", + "ref_phonemes": "ðʌ lɑdʒ ɪn wɪtʃ ʌŋkʌz wɑz kʌnfaɪnd wɑz ɪn ðʌ vɛri sɛntɝ ʌv ðʌ vɪlʌdʒ ʌnd ɪn ʌ sɪtʃueɪʃʌn pɝhæps mɔr dɪfʌkʌlt ðæn ɛni ʌðɝ tu ʌproʊtʃ ɔr liv wɪθaʊt ɑbzɝveɪʃʌn ", + "duration": 0.7009220123291016, + "PER": 34.92063492063492, + "score": { + "S": 27, + "D": 5, + "I": 12, + "N": 126 + } + }, + { + "model": "WavLM", + "phonemes": "f ɔ ɹ fajv v ð ə l æ tɹ̩ɔ n l i l ɪ ŋ ɡɹ̩d ə bawt ð ə d ɔ ɹ v ð ə p ɹ ɪ z ə n t ʌ v ʌ ŋ k ə s w ɛ ɹ i b ʌ t k lows ə b zɹ̩vɹ̩z ʌ v ð ə m æ nɹ̩ v ð ɛ ɹ k æ p t ɪ v", + "ref_phonemes": "fɔr ɔr faɪv ʌv ðʌ lætɝ oʊnli lɪŋɡɝd ʌbaʊt ðʌ dɔr ʌv ðʌ prɪzʌn ʌv ʌŋkʌz wɛri bʌt kloʊs ʌbzɝvɝz ʌv ðʌ mænɝ ʌv ðɛr kæptɪv ", + "duration": 0.5421297550201416, + "PER": 35.483870967741936, + "score": { + "S": 25, + "D": 4, + "I": 4, + "N": 93 + } + }, + { + "model": "WavLM", + "phonemes": "ə ɪ l ɪ vɹ̩d ɪ n ə s t ɹ ɔ ŋ town ʌ v ə s ɛ n t nawʌ ð ə ɡ ɹ æ t ə f ə kejʃ ə n ð ə s æ v əd͡ʒf w ʊ d ɹɹ̩s s s i v æ w ɪ t s ɪ ŋ s ʌt͡ʃə n d ɪ k s ə b ɪ ə n ʌ v w i k n ə s æ n æ n ɛ n ə m i sowml ɔ ŋ h i d ə d æ n d sowm ʌt͡ʃk ɪ ɹ d", + "ref_phonemes": "dɪlɪvɝd ɪn ʌ strɔŋ toʊn ʌv ʌsɛnt ʌnaʊnst ðʌ ɡrætʌfʌkeɪʃʌn ðʌ sævʌdʒ wʊd rʌsiv ɪn wɪtnʌsɪŋ sʌtʃ æn ɛksʌbɪʃʌn ʌv wiknʌs ɪn æn ɛnʌmi soʊ lɔŋ heɪtʌd ʌnd soʊ mʌtʃ fɪrd ", + "duration": 0.7385311126708984, + "PER": 39.39393939393939, + "score": { + "S": 34, + "D": 8, + "I": 10, + "N": 132 + } + }, + { + "model": "WavLM", + "phonemes": "ðejd ɹ u b æ k ə l ɪ t ə l f ɹ ʌ m ð ə ɛ n t ɹ̩ɹə n s æ n d mowsʃ ə n t ə ð ə s ə powz ɪ d k ɑ n nd͡ʒɹ̩t ə ɛ n t ɹ̩ ɹ̩", + "ref_phonemes": "ðeɪ dru bæk ʌ lɪtʌl frʌm ðʌ ɛntrʌns ʌnd moʊʃʌnd tu ðʌ sʌpoʊzd kɑndʒɝɝ tu ɛntɝ ", + "duration": 0.35993003845214844, + "PER": 46.774193548387096, + "score": { + "S": 19, + "D": 1, + "I": 9, + "N": 62 + } + }, + { + "model": "WavLM", + "phonemes": "b ʌ t ð ə b ɛ ɹ n s t ɛ d ʌ vowbowb bejɪ ŋ mejn tejn d ð ə s i d ɪ h æ d tejk əɪ n æ n d ɡ ɹawɑ d", + "ref_phonemes": "bʌt ðʌ bɛr ɪnstɛd ʌv oʊbeɪɪŋ meɪnteɪnd ðʌ sit ɪt hæd teɪkʌn ʌnd ɡraʊld ", + "duration": 0.3658008575439453, + "PER": 36.84210526315789, + "score": { + "S": 14, + "D": 2, + "I": 5, + "N": 57 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə k ʌ n ɪ ŋ m æ n ɪ z ə f ɹejd æ h ɪ z b ɹ ɛ θ w ɪ l b lowʌ p ɑ n h z b ɹ ʌ ðɹ̩z æ n tejk ə weji ɛ ɹ kɹ̩d͡ʒɪəd͡ʒd t u k ə n t ɪ n j u dejv v ə d m p ɹ u v ɪ ŋ ð ə h ɪ n th i ɹ ɪ s i d m ʌ s t t æ n d fɹ̩ðɹ̩ɔ f", + "ref_phonemes": "ðʌ kʌnɪŋ mæn ɪz ʌfreɪd ðæt hɪz brɛθ wɪl bloʊ ʌpɑn hɪz brʌðɝz ʌnd teɪk ʌweɪ ðɛr kɝʌdʒ tu kʌntɪnjud deɪvɪd ɪmpruvɪŋ ðʌ hɪnt hi rʌsivd ðeɪ mʌst stænd fɝðɝ ɔf ", + "duration": 0.6833853721618652, + "PER": 37.903225806451616, + "score": { + "S": 25, + "D": 11, + "I": 11, + "N": 124 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɛ n ɪ z ɪ f s æ t ə s fajd ʌ v ð ɛ ɹ sejf t i ð ə s kawt l ɛ f th ɪ z p ə z ɪ ʃ ə n æ n d s lowl i ɛ n tɹ̩d ð ə p lejs", + "ref_phonemes": "ðɛn æz ɪf sætʌsfaɪd ʌv ðɛr seɪfti ðʌ skaʊt lɛft hɪz pʌzɪʃʌn ʌnd sloʊli ɛntɝd ðʌ pleɪs ", + "duration": 0.43636631965637207, + "PER": 21.73913043478261, + "score": { + "S": 14, + "D": 0, + "I": 1, + "N": 69 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ t w ɑ z sajl ə n t n d ɡ l u m i b i ɪ ŋ t ɛ n æ n t ɪ d sowl i bajð ə k æ p t ɪ v n d lajt ə d bajð ə dajɪ ŋ ɛ m bɹ̩z ʌ v ə fajɹ̩w æ ɪ æ d b ɪ n j u z d f ɔ ɹ ð ə pɹ̩p ə s ʌ v k ʊ kɹ̩i", + "ref_phonemes": "ɪt wɑz saɪlʌnt ʌnd ɡlumi biɪŋ tɛnʌntɪd soʊlli baɪ ðʌ kæptɪv ʌnd laɪtʌd baɪ ðʌ daɪɪŋ ɛmbɝz ʌv ʌ faɪɝ wɪtʃ hæd bɪn juzd fɔr ðʌ pɝpʌst ʌv kʊkɝi ", + "duration": 0.6995851993560791, + "PER": 28.57142857142857, + "score": { + "S": 20, + "D": 7, + "I": 5, + "N": 112 + } + }, + { + "model": "WavLM", + "phonemes": "ə ŋ k ə s ɑ k j ə pajd ə d ɪ s t ə n k ɔ ɹ nɹ̩ɪ n ɹ i k lajn ɪ ŋ æ t ə t u d b i ɪ ŋ ɹ d͡ʒ d͡ʒ d l i bawn d bowθ h æ n d z æ n d f i t bajs t ɹ ɔ ŋ æ n d pejn f ə l w ɪ θ s", + "ref_phonemes": "ʌŋkʌz ɑkjʌpaɪd ʌ dɪstʌnt kɔrnɝ ɪn ʌ rɪklaɪnɪŋ ætʌtud biɪŋ rɪdʒɪdli baʊnd boʊθ hændz ʌnd fit baɪ strɔŋ ʌnd peɪnfʌl wɪðz ", + "duration": 0.6401748657226562, + "PER": 32.6530612244898, + "score": { + "S": 25, + "D": 3, + "I": 4, + "N": 98 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə s kawt u æ d l ɛ f t dejv t æ t ð ə d ɔ ɹ t ə æ sɹ̩tejn ðejw wɹ̩n n ɑ t ə b zɹ̩v d θ ɔ t ə dt p ɹ u d ə n t t ə p ɹ ə zɹ̩v h ɪ z d ɪ s kɡajz æə n d t ɪ l ə ʃ ʊ ɹ d ʌ v ð ɛ ɹ p ɹajv ə s i", + "ref_phonemes": "ðʌ skaʊt hu hæd lɛft deɪvɪd æt ðʌ dɔr tu æsɝteɪn ðeɪ wɝ nɑt ʌbzɝvd θɔt ɪt prudʌnt tu prʌzɝv hɪz dɪsɡaɪz ʌntɪl ʌʃʊrd ʌv ðɛr praɪvʌsi ", + "duration": 0.6588010787963867, + "PER": 39.04761904761905, + "score": { + "S": 28, + "D": 3, + "I": 10, + "N": 105 + } + }, + { + "model": "WavLM", + "phonemes": "w ʌ t͡ʃt ʃ æ l w i d u w ɪ t ð ə m ɪ ŋ ɡowz æ ð ə d ɔ ɹ ðejk k awn t s ɪ k s æ n ð ɪ s ɪ ŋ ɡɹ̩æɹ̩ æ z ɡ ʊ d æ z n ʌ θ ɪ ŋ", + "ref_phonemes": "wʌt ʃæl wi du wɪð ðʌ mɪŋɡoʊz æt ðʌ dɔr ðeɪ kaʊnt sɪks ʌnd ðɪs sɪŋɝ ɪz æz ɡʊd æz nʌθɪŋ ", + "duration": 0.4378678798675537, + "PER": 32.30769230769231, + "score": { + "S": 11, + "D": 3, + "I": 7, + "N": 65 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə d ɛ l ə w ɛ ɹ z ɑ ɹt͡ʃɪ l dɹ ən ʌ v ð ə t ɔ ɹ t ə s ɪ n ð əawt s t ɹ ɪ p ð d ɪ ɹ", + "ref_phonemes": "ðʌ dɛlʌwɛrz ɑr tʃɪldrʌn ʌv ðʌ tɔrtʌs ʌnd ðeɪ aʊtstrɪp ðʌ dɪr ", + "duration": 0.27994799613952637, + "PER": 36.734693877551024, + "score": { + "S": 14, + "D": 3, + "I": 1, + "N": 49 + } + }, + { + "model": "WavLM", + "phonemes": "h ŋ k ə s h u ʊ æ d ɔ l ɹ ɛ d i ə p ɹowt͡ʃt ð ə d ɔ ɹ n d ɹ ɛ d ɪ ŋ ə s t ə l i d ð ə wejɪ ɹ i kojl d m p lejsd͡ʒ t ɪ m s ɛ l f w ʌ n s m ɔ ɹɪ n ð ə b ɑ t m ʌ v ð ə l ɑ d͡ʒ", + "ref_phonemes": "ʌŋkʌz hu hæd ɔlrɛdi ʌproʊtʃt ðʌ dɔr ɪn rɛdinʌs tu lɛd ðʌ weɪ naʊ rikɔɪld ʌnd pleɪst hɪmsɛlf wʌns mɔr ɪn ðʌ bɑtʌm ʌv ðʌ lɑdʒ ", + "duration": 0.5629482269287109, + "PER": 40.816326530612244, + "score": { + "S": 25, + "D": 8, + "I": 7, + "N": 98 + } + }, + { + "model": "WavLM", + "phonemes": "b ʌ t h ɑ kajh u wh ɑ z t u m ʌt͡ʃk k j ə pajd w ɪ ð zown θ ɔ t s t ə nowt ð ə m u v m ə n t ə n t ɪ n j u d s p i k ɪ ŋ m ɔ ɹ t ə ɪ m s ɛ l f ð æ n t ə ɪ z k ə m p æ n j ə n", + "ref_phonemes": "bʌt hɔkaɪ hu wɑz tu mʌtʃ ɑkjʌpaɪd wɪð hɪz oʊn θɔts tu noʊt ðʌ muvmʌnt kʌntɪnjud spikɪŋ mɔr tu hɪmsɛlf ðæn tu hɪz kʌmpænjʌn ", + "duration": 0.555736780166626, + "PER": 23.232323232323232, + "score": { + "S": 16, + "D": 5, + "I": 2, + "N": 99 + } + }, + { + "model": "WavLM", + "phonemes": "soww ŋ k ə s j u d b ɛ tɹ̩tejk ð ə l i d wajl w ɪ l p ʊ t ɑ n ð ə s k ɪ n ə ɡ ɛ n ɪ n t ɹ ʌ s t t ə k ʌ n ɪ ŋ f ɔ ɹ w ɑ n t ʌ v s p i d", + "ref_phonemes": "soʊ ʌŋkʌz ju hæd bɛtɝ teɪk ðʌ lɛd waɪl aɪ wɪl pʊt ɑn ðʌ skɪn ʌɡɛn ʌnd trʌst tu kʌnɪŋ fɔr wɑnt ʌv spid ", + "duration": 0.4274144172668457, + "PER": 26.923076923076923, + "score": { + "S": 15, + "D": 5, + "I": 1, + "N": 78 + } + }, + { + "model": "WavLM", + "phonemes": "w ɛ l ʌ t k æ n t b i d ʌ n bajm n kɹ̩d͡ʒɪ n d w ɔ ɹ m ʌ s t b i d ʌ n bajs sɹ̩k ə m v ɛ n ʃ ə n", + "ref_phonemes": "wɛl wʌt kænt bi dʌn baɪ meɪn kɝʌdʒ ɪn wɔr mʌst bi dʌn baɪ sɝkʌmvɛntʃʌn ", + "duration": 0.4013700485229492, + "PER": 28.57142857142857, + "score": { + "S": 8, + "D": 4, + "I": 4, + "N": 56 + } + }, + { + "model": "WavLM", + "phonemes": "ə s u n æ z ð i z d ɪ s p ə z ɪ ʃ ə n z wɹ̩mejd ð ə s kawt t tɹ̩n t ə dejv næ n d ɡejv h ɪ m ɪ s p ɑ ɹ t ɪ ŋ ɪ n s t ɹ ʌ k ʃ ə n z", + "ref_phonemes": "æz sun æz ðiz dɪspʌzɪʃʌnz wɝ meɪd ðʌ skaʊt tɝnd tu deɪvɪd ʌnd ɡeɪv hɪm hɪz pɑrtɪŋ ɪnstrʌkʃʌnz ", + "duration": 0.36983513832092285, + "PER": 31.57894736842105, + "score": { + "S": 17, + "D": 4, + "I": 3, + "N": 76 + } + }, + { + "model": "WavLM", + "phonemes": "m u s ɑ ɹ p i s f ə l æ n majt ɛ m pɹ̩ajh ʌ m b l i t ɹ ʌ s t ɪ z ɡ ɹejt l i ɡ ɪ v ə n t ə mɹ̩s i ɪ n d l ʌ v ɹ ɪ tɹ̩n n dejv ə ə l ɪ t ə l n n ʌ th owl l d ə t sowej dɹ̩ æɹ ɛ k æ n d ə t æ k ɑ n h ɪ z m æ n h ʊ d ʌ t ð ɛ ɹ ɑ ɹ n ʌ n h u k æ n sejðv æ tajəv ɛ vɹ̩fɔɹ̩ɡ ɑ t ɪ n majf ɪ n ð ə l ɔ ɹ d i v ə n ɪ n ð ə ɡ ɹejt ə s t t ɹejt s", + "ref_phonemes": "maɪ pɝsuts ɑr pisfʌl ʌnd maɪ tɛmpɝ aɪ hʌmbli trʌst ɪz ɡreɪtli ɡɪvʌn tu mɝsi ʌnd lʌv rɪtɝnd deɪvɪd ʌ lɪtʌl nɛtʌld æt soʊ dɝɛkt æn ʌtæk ɑn hɪz mænhʊd bʌt ðɛr ɑr nʌn hu kæn seɪ ðæt aɪ hæv ɛvɝ fɝɡɑtʌn maɪ feɪθ ɪn ðʌ lɔrd ivɪn ɪn ðʌ ɡreɪtʌst streɪts ", + "duration": 1.3749122619628906, + "PER": 39.37823834196891, + "score": { + "S": 44, + "D": 15, + "I": 17, + "N": 193 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ ɪ f j ɹ n ɑ t ð ɛ n n ɑ k t ɑ n ð ə h ɛ d j ɔ ɹ b i ɪ ŋ ɪ n n ɑ n k ɪ m p ɑ s əɹ̩ w ɪ l p ɹ ə t ɛ k t j u n d j l ð ɛ n h æ v ə ɡ ʊ d ɹ i z ə n t ə ɪ s p ɛ k t ə dajɪ n j ɔ ɹ b ɛ d", + "ref_phonemes": "ɪf ju ɑr nɑt ðɛn nɑkt ɑn ðʌ hɛd jɔr biɪŋ ʌ nɑn kʌmpɑsɝ wɪl prʌtɛkt ju ʌnd jul ðɛn hæv ʌ ɡʊd rizʌn tu ɪkspɛkt tu daɪ ɪn jɔr bɛd ", + "duration": 0.594611644744873, + "PER": 26.041666666666668, + "score": { + "S": 15, + "D": 6, + "I": 4, + "N": 96 + } + }, + { + "model": "WavLM", + "phonemes": "sowd͡ʒ jt͡ʃu z f jɹ̩s ɛ l f t ə mejk ə ɹ ʌ ʃ ɔ ɹ t ɛ ɹ i h ɪ ɹ", + "ref_phonemes": "soʊ tʃuz fɔr jɝsɛlf tu meɪk ʌ rʌʃ ɔr tɛri hir ", + "duration": 0.3292689323425293, + "PER": 51.42857142857142, + "score": { + "S": 12, + "D": 1, + "I": 5, + "N": 35 + } + }, + { + "model": "WavLM", + "phonemes": "b ɹ v l i ɪ nd͡ʒɛ nɹ̩ə s l i h æ z h i b æ t ə d ɪ nd majd ɪ h æ f æ n d ð ɪ s æ n d m ɔ ɹ ɪ lajd ɛ ɹ n h ɪ z sɹ̩v ə s", + "ref_phonemes": "breɪvli ʌnd dʒɛnɝʌsli hæz hi bætʌld ɪn maɪ bɪhæf ʌnd ðɪs ʌnd mɔr wɪl aɪ dɛr ɪn hɪz sɝvʌs ", + "duration": 0.4369354248046875, + "PER": 32.857142857142854, + "score": { + "S": 15, + "D": 5, + "I": 3, + "N": 70 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ i p sajn ənt z l ɔ ŋ æ z mejb i n ɪ w ʊ t b i wajz w ɛ n j u d u s i k ə b ɹejkt k t s ʌ d ə n l i æ n w ʌ n ʌv j ɔ ɹ ʃawn h ɪ ŋ z w ɪ ə w ɪ l sɹ̩v t ə ɹ i m ʌ ð ə ɪ n d i ə n z ð æ t j u wɑɹn ɑ t ɔ l t ə ɡ ɛ ðɹ̩æ z ɹ ɪ s p ɑ n z ə b ə l æ z m ɛ n ʃ ʊ d b i", + "ref_phonemes": "kip saɪlʌnt æz lɔŋ æz meɪ bi ʌnd ɪt wʊd bi waɪz wɛn ju du spik tu breɪk aʊt sʌdʌnli ɪn wʌn ʌv jɔr ʃaʊtɪŋz wɪtʃ wɪl sɝv tu rimaɪnd ðʌ ɪndiʌnz ðæt ju ɑr nɑt ɔltʌɡɛðɝ æz rispɑnsʌbʌl æz mɛn ʃʊd bi ", + "duration": 0.7867321968078613, + "PER": 30.666666666666664, + "score": { + "S": 32, + "D": 10, + "I": 4, + "N": 150 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ f hawɛ vɹ̩ðejt ejk j ɔ ɹ s k æ l tp æ zajt ɹ ʌ s t ɪ n d b l i v ðejw ɪ l n ɑ t d ɪ p ɛ n d ɑ n ɪ d ʌ n ə s n najw ɪ l n ɑ t f ɔɹ̩ ɡ ɛ t ð ə d i d b ʌ t ɹ ɪ v ɛ nd͡ʒɪ t æ z b ɪ k ʌ m s t t ɹ u w ɔ ɹ j æɪ n d t ɹ ʌ s t i f ɹ ɛ n z", + "ref_phonemes": "ɪf haʊɛvɝ ðeɪ teɪk jɔr skælp æz aɪ trʌst ʌnd bɪliv ðeɪ wɪl nɑt dɪpɛnd ɑn ɪt ʌŋkʌz ʌnd aɪ wɪl nɑt fɝɡɛt ðʌ did bʌt rivɛndʒ ɪt æz bɪkʌmz tru wɔriɝz ʌnd trʌsti frɛndz ", + "duration": 0.812413215637207, + "PER": 29.457364341085274, + "score": { + "S": 27, + "D": 5, + "I": 6, + "N": 129 + } + }, + { + "model": "WavLM", + "phonemes": "how l d s ɛ dejv v ə d p ɹ ə s i v ɪ ŋ ð æ t w ɪ ð ð ɪ s ə ʃ ʊ ɹ ə n s ðejw w ɹə bawt t ə l i v h ɪ m n ə n wɹ̩ð ə ə n h ʌ m b ə f ɑ lowəw ɛ ɹ v w ʌ n h u t ɑ t n ɑ t ð ə d æ m n ə b ə l p ɹ ɪ n s ə p ə l ʌ v ɹ ɪ v ɛ ɪ", + "ref_phonemes": "hoʊld sɛd deɪvɪd pɝsivɪŋ ðæt wɪð ðɪs ʌʃʊrʌns ðeɪ wɝ ʌbaʊt tu liv hɪm aɪ æm æn ʌnwɝði ʌnd hʌmbʌl fɑloʊɝ ʌv wʌn hu tɔt nɑt ðʌ dæmnʌbʌl prɪnsʌpʌl ʌv rivɛndʒ ", + "duration": 0.7016916275024414, + "PER": 37.39837398373984, + "score": { + "S": 30, + "D": 10, + "I": 6, + "N": 123 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɛ n h i v ɪ ŋ ə h ɛ v i saj pɹ ɑ b ə b l i ɪ m ʌ ŋ ð ə l æ s t h i ɛ vɹ̩d ɹ u n pajn d ɪ ŋ f ɔ ɹ ən d ɪ ʃ ə n h i æ d sowl ɔ ŋ ə b æ n d ə n d i æ d ə d t ɪ z w ʌ tajw w ʊ d w ɪ ʃ t ə p ɹ æ k t ə s majk s ɛ l f æ z w ʌ n w ɪ θawt ə k ɹ ɔ s ə b l ʌ d ðowð d z z n ɑ t ɔ l wejz i i z i d d iow w ð ɪ n ɪ n d i ə n æ z j i w ʊ d w ɪ ð ə ɛ lowk ɹ ɪ st͡ʃə n", + "ref_phonemes": "ðɛn hivɪŋ ʌ hɛvi saɪ prɑbʌbli ʌmʌŋ ðʌ læst hi ɛvɝ dru ɪn paɪnɪŋ fɔr ʌ kʌndɪʃʌn hi hæd soʊ lɔŋ ʌbændʌnd hi ædʌd ɪt ɪz wʌt aɪ wʊd wɪʃ tu præktaɪz maɪsɛlf æz wʌn wɪθaʊt ʌ krɔs ʌv blʌd ðoʊ ɪt ɪz nɑt ɔlweɪz izi tu dil wɪð æn ɪndiʌn æz ju wʊd wɪð ʌ fɛloʊ krɪstʃʌn ", + "duration": 1.4238016605377197, + "PER": 28.499999999999996, + "score": { + "S": 41, + "D": 10, + "I": 6, + "N": 200 + } + }, + { + "model": "WavLM", + "phonemes": "æ ɑ d b l ɛ s j ɪ f ɹ ɛ n d aj j u b ɪ l i v j ɔ ɹ s ɛ n t ɪ z n ɑ t kɡ ɹejt t l i ɹ ɔ �� w ɛ n ð ə m æ tɹ̩ɪ z d u l i k ə n s ɪ dɹ̩d n k i p ɪ ŋ ə tɹ̩n ə t i b ɪ f ɔ ɹ ð əajz ðowʌ ow m ʌt͡ʃk ɪ p ɛ n d z ɑ n ð ə n æt͡ʃɹ̩ə l ɡ ɪ v s ɪ n ð ə f ɔ ɹ ʌ v t ɛ m tejʃ ə n", + "ref_phonemes": "ɡɑd blɛs ju frɛnd aɪ du bɪliv jɔr sɛnt ɪz nɑt ɡreɪtli rɔŋ wɛn ðʌ mætɝ ɪz duli kʌnsɪdɝd ʌnd kipɪŋ ɪtɝnʌti bɪfɔr ðʌ aɪz ðoʊ mʌtʃ dɪpɛndz ɑn ðʌ nætʃɝʌl ɡɪfts ʌnd ðʌ fɔrs ʌv tɛmteɪʃʌn ", + "duration": 0.8925340175628662, + "PER": 32.16783216783217, + "score": { + "S": 30, + "D": 5, + "I": 11, + "N": 143 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə d ɛ l ə w ɛ ɹ d ɔ ɡ h i s ɛ d l i n ɪ ŋ f ɔ ɹ wɹ̩d æ n p j ɪ ɹ ɪ ŋ θ ɹ u ð ə d ɪ m lajk t ə k æt͡ʃð ə ɪ k s p ɹ ɛ ʃ ə n ʌ v ð ə ʌ ðɹ̩z f it͡ʃɹ̩z zs i ə f ɹejd", + "ref_phonemes": "ðʌ dɛlʌwɛr dɔɡ hi sɛd linɪŋ fɔrwɝd ʌnd pirɪŋ θru ðʌ dɪm laɪt tu kætʃ ðʌ ɪksprɛʃʌn ʌv ðʌ ʌðɝz fitʃɝz ɪz hi ʌfreɪd ", + "duration": 0.5121281147003174, + "PER": 34.831460674157306, + "score": { + "S": 23, + "D": 2, + "I": 6, + "N": 89 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə mows i k ə n s t ɑ ɹ t ə d ɑ n h ɪ z f i t æ n d ʃ ʊ k h ɪ ʃ æ ɡ i k ʌ vɹ̩ɪ ŋ æ z ðowð ə æ n ə m ə h i kawn tɹ̩f ɪ t ə d w ɑ z ə bawt t ə mejkə k s ʌ m d ɛ s pɹ̩ə t ɛ fɹ̩t", + "ref_phonemes": "ðʌ moʊhikʌn stɑrtʌd ɑn hɪz fit ʌnd ʃʊk hɪz ʃæɡi kʌvɝɪŋ æz ðoʊ ðʌ ænʌmʌl hi kaʊntɝfɪtɪd wɑz ʌbaʊt tu meɪk sʌm dɛsprɪt ɛfɝt ", + "duration": 0.5610170364379883, + "PER": 30.612244897959183, + "score": { + "S": 22, + "D": 2, + "I": 6, + "N": 98 + } + }, + { + "model": "WavLM", + "phonemes": "h i h æ n nowə kejʒ ə n t ə d ɪ lejf ɔ ɹ ɛ t ð ə n n ɛ k s t ɪ n s t ə n t ə bɹ̩s t ʌ v k ɹajz z ɪ l d ð əawtɹ̩d͡ʒd ɹ̩æ ɛ ɹ n d ɹ n n ə l ɔ ŋ ð ə howl ɪ k s t ɛ n t u v ð ə ɪ l ə d͡ʒ", + "ref_phonemes": "hi hæd noʊ ʌkeɪʒʌn tu dɪleɪ fɔr æt ðʌ nɛkst ɪnstʌnt ʌ bɝst ʌv kraɪz fɪld ðʌ aʊtɝ ɛr ʌnd ræn ʌlɔŋ ðʌ hoʊl ɪkstɛnt ʌv ðʌ vɪlʌdʒ ", + "duration": 0.6240766048431396, + "PER": 41.83673469387755, + "score": { + "S": 30, + "D": 1, + "I": 10, + "N": 98 + } + }, + { + "model": "WavLM", + "phonemes": "ə ŋ k ə s k æ s t h z s k ɪ n æ n d s t ɛ p t f ɔ ɹ θ ɪ n h ɪ zown b j u t ə f ə l p ɹ ə p ɔ ɹ ʃ ə n z", + "ref_phonemes": "ʌŋkʌz kæst hɪz skɪn ʌnd stɛpt fɔrθ ɪn hɪz oʊn bjutʌfʌl prʌpɔrʃʌnz ", + "duration": 0.3375828266143799, + "PER": 24.074074074074073, + "score": { + "S": 12, + "D": 1, + "I": 0, + "N": 54 + } + }, + { + "model": "WavLM", + "phonemes": "s ɪ n s ð ə p ɪ ɹ i ə d ʌ vawɹ̩ tejl ð i æ k t ɪ v s p ɪ ɹ ə t ʌ v ð ə k ə n t ɹ i h æə sɹ̩awn d ə d ə d w ɪ ð ə b ɛ l t ʌ v ɹ t͡ʃʃ ɪ n θ ɹajv ɪ ŋ s ɛ t ə m ə n t z own n ʌ n b ʌ ð ə h ʌ n tɹ̩ ɔ ɹ ð ə s æ v ɪd͡ʒɪ ɪ z ɛ vɹ̩nown i v ə naw t ə p ɛ n ə t ɹejt ɪ t s wajl d ɹ i s ɛ s ə z", + "ref_phonemes": "sɪns ðʌ pɪriʌd ʌv aʊɝ teɪl ðʌ æktɪv spɪrʌt ʌv ðʌ kʌntri hæz sɝaʊndʌd ɪt wɪð ʌ bɛlt ʌv rɪtʃ ʌnd θraɪvɪŋ sɛtʌlmʌnts ðoʊ nʌn bʌt ðʌ hʌntɝ ɔr ðʌ sævʌdʒ ɪz ɛvɝ noʊn ivɪn naʊ tu pɛnʌtreɪt ɪts waɪld risɛsʌz ", + "duration": 1.095329761505127, + "PER": 36.477987421383645, + "score": { + "S": 43, + "D": 6, + "I": 9, + "N": 159 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə d j u z wɹ̩s s ʌ fɹ̩dt ə ɛ k s hejl n d ð ə s ʌ n h æ d d ɪə s pɹ̩s t ð ə m ɪ s t s æ n d w ɑ s ʃ ɛ d ɪ ə s s t ɹ ɔ ŋ ɪæ n d k l ɪ ɹ lajt ɪ n ð ə f ɔ ɹ ə s t w ɛ n ð ə t ɹ æ v lɹ̩z z ɹ ɪ z u m d ð ɛ ɹd͡ʒɹ̩n i", + "ref_phonemes": "ðʌ duz wɝ sʌfɝd tu ɛkʃheɪl ʌnd ðʌ sʌn hæd dɪspɝst ðʌ mɪsts ʌnd wɑz ʃɛdɪŋ ʌ strɔŋ ʌnd klɪr laɪt ɪn ðʌ fɔrʌst wɛn ðʌ trævʌlɝz rɪzumd ðɛr dʒɝni ", + "duration": 0.6915643215179443, + "PER": 35.13513513513514, + "score": { + "S": 26, + "D": 2, + "I": 11, + "N": 111 + } + }, + { + "model": "WavLM", + "phonemes": "æ f tɹ̩p ɹ ə s i d ɪ ŋ ə f j u majl z ð ə p ɹ ɑ ɡ ɹ ɛ s ʌ v h ɑ kajh u l ɛ d ð ə ə d v æ n s b ɪ kejm m m ɔ ɹ d ɪ l ɪ bɹ̩ə ə t æ n d w ɑt͡ʃf ə l", + "ref_phonemes": "æftɝ prʌsidɪŋ ʌ fju maɪlz ðʌ prɑɡrɛs ʌv hɔkaɪ hu lɛd ðʌ ʌdvæns bɪkeɪm mɔr dɪlɪbɝʌt ʌnd wɑtʃfʌl ", + "duration": 0.5240211486816406, + "PER": 29.87012987012987, + "score": { + "S": 18, + "D": 0, + "I": 5, + "N": 77 + } + }, + { + "model": "WavLM", + "phonemes": "æ i ɔ f ə n s t ɑ p t t ə ɪ ɡ z æ m ə nd ð ə t ɹ i z n �� ɹ ɪ i k ɹ ɔ s hvɹ ɪ v j ə l ə t w ɪ θawt ə t ɛ n t ɪ v l i k ə n s ɪ dɹ̩ɪ ŋ ð ə k w ɑ n t ə t i ð ə v ə l ɑ s əɪ t i n d ð ə k ʌ lɹ̩ʌ v t s w ɔ tɹ̩z", + "ref_phonemes": "hi ɔfʌn stɑpt tu ɪɡzæmɪn ðʌ triz nɔr dɪd hi krɔs ʌ rɪvjʌlt wɪθaʊt ʌtɛntɪvli kʌnsɪdɝɪŋ ðʌ kwɑntʌti ðʌ vʌlɑsʌti ʌnd ðʌ kʌlɝ ʌv ɪts wɔtɝz ", + "duration": 0.6534790992736816, + "PER": 32.11009174311927, + "score": { + "S": 23, + "D": 5, + "I": 7, + "N": 109 + } + }, + { + "model": "WavLM", + "phonemes": "d ɪ s t ɹ ʌ s t ɪ ŋ h ɪ zown vd͡ʒʌt͡ʃk m ə n t h ɪ z ə p i l z t ə ð ə ə p ɪ nŋ j ə nd əʌ ɪ ŋ ɡ ʌt͡ʃk w i k w ɹ̩f ɹ i k w ə n t æ n t ɹ̩n ə s t", + "ref_phonemes": "dɪstrʌstɪŋ hɪz oʊn dʒʌdʒmʌnt hɪz ʌpilz tu ðʌ ʌpɪnjʌn ʌv tʃɪŋdʌkaʊtʃ wɝ frikwʌnt ʌnd ɝnɪst ", + "duration": 0.5104143619537354, + "PER": 48.0, + "score": { + "S": 24, + "D": 2, + "I": 10, + "N": 75 + } + }, + { + "model": "WavLM", + "phonemes": "j ɛ t h ɪ ɹ ɹ w i ɪ ð ɪ n ə ʃ ɔ ɹ t ɹejnd͡ʒ ʌ v ð ə s ɡɹ̩ɹ u n z æ n d n ɑ t ə sajn ʌ v ə t ɹejl h æ v w i k ɹ ɔ s t", + "ref_phonemes": "jɛt hir ɑr wi wɪðɪn ʌ ʃɔrt reɪndʒ ʌv ðʌ skɛrʌnz ʌnd nɑt ʌ saɪn ʌv ʌ treɪl hæv wi krɔst ", + "duration": 0.43381237983703613, + "PER": 34.84848484848485, + "score": { + "S": 19, + "D": 2, + "I": 2, + "N": 66 + } + }, + { + "model": "WavLM", + "phonemes": "l ɛ t ʌ s ɹ i t ɹejs awɹ̩sɹ t ɛ p s n d ɪ ɡ z æ m ə n æ z w i ɡow w ɪ ð k i nɹ̩ajz", + "ref_phonemes": "lɛt ʌs ritreɪs aʊɝ stɛps ʌnd ɪɡzæmɪn æz wi ɡoʊ wɪð kinɝ aɪz ", + "duration": 0.35148119926452637, + "PER": 27.659574468085108, + "score": { + "S": 9, + "D": 1, + "I": 3, + "N": 47 + } + }, + { + "model": "WavLM", + "phonemes": "æ m v ɪ k j ə w t æmw ɹ̩æɹ ə p ɹowɡ ɹ æ m dd͡ʒɹ̩ɛ k tɹ̩ æ ð ə nawæ ə l ɪ n d t ə t u s ə n ɛ ɹ ə l ɑd͡ʒɪ k ə l ɪ sɔ ɹ dɹ̩z æ n d s t ɹowk æ n d p ɹowɡ ɹ æ m dɹ̩ɛ tɹ̩ əowvɹs s i z", + "ref_phonemes": "aɪm vɪki wɪtmɔr aɪm ʌ proʊɡræm dɝɛktɝ æt ðʌ næʃʌnʌl ɪnstʌtuts ʌv nʊrʌlɑdʒɪkʌl dɪsɔrdɝz ʌnd stroʊk ʌnd ʌ proʊɡræm dɝɛktɝ hu oʊvɝsiz ", + "duration": 0.7520585060119629, + "PER": 55.04587155963303, + "score": { + "S": 40, + "D": 9, + "I": 11, + "N": 109 + } + }, + { + "model": "WavLM", + "phonemes": "s m m i s i ə f s ɹ ə sɹ̩d͡ʒt͡ʃkd ɹ æ n z æ n d wɹ̩k s t ə ɡ ɛ ɹ̩ lows s l i ɪ taw ɑ k t ɔ ɹ ʃ ɛ s ə k ɔ ɹ nejt ə ɛ m i s i əɛ ɛ s ɹ æ n z æ n ajej k æɛ m i s i ə θ ʌ s wɹ̩k ə n ɡk ɹ u s m ʌ t͡ʃ p l ɛ ʒɹ̩ k ə w ɛ l p ə m i t ə ð ə f fɹ̩s s t ɪ n", + "ref_phonemes": "mɛksf risɝtʃ ɡrænts ʌnd wɝks tʌɡɛðɝ kloʊsli wɪð draɪv kɔrʌsɛts tu koʊɔrdʌneɪt ðʌ mɛksf trænznɪh mɛksf wɝkɪŋ ɡrup ɪts maɪ plɛʒɝ tu wɛlkʌm ju tu ðʌ fɝst ɪn ", + "duration": 0.96291184425354, + "PER": 77.77777777777779, + "score": { + "S": 48, + "D": 17, + "I": 33, + "N": 126 + } + }, + { + "model": "WavLM", + "phonemes": "s v l ə n p ɑ ɹ t s ɪɹ̩ɹ i z ʌ v w ɛ v ə naw ɑɹ̩zɹ s tɹ̩b i ɪ ŋ ɔ ɹ ɡ ə najz ɪ nɔ ɹɡ ɹ̩d͡ʒə d ɪ ɛ l ə ə i sɹ̩d͡ʒds ɹowd n awæ f ɔ ɹ ɛ m i s i ə θ ʌ s ə s ɛ v n w ɛ v ə nawɹ̩z w ɪ l tejk p lejs", + "ref_phonemes": "ʌ sɛvʌpɝtæp sɪriz ʌv wɛbnɝʌnz ðæt ɑr biɪŋ ɔrɡʌnaɪzd ɪn ɔrdɝ tu dɪvɛlʌp ʌ risɝtʃ roʊdmæp fɔr mɛksf ðʌ sɛvʌn wɛbnɝʌnz wɪl teɪk pleɪs ", + "duration": 0.7429728507995605, + "PER": 65.42056074766354, + "score": { + "S": 36, + "D": 11, + "I": 23, + "N": 107 + } + }, + { + "model": "WavLM", + "phonemes": "b t w i naww æ n d ə s ɛ m bɹ̩w æ n ð ə d ɪ l ɪ vɹ̩əb ə l f ɹ ʌ m ɔ l ʌ v ð ɪ s æ fɹ̩w ɪ l b i ɹ i k w ɔ ɹ t ə ð ə æ n ajɪ n deji æ n ejɪ i n d d i æ s ə vajz ɹ i k ɑ n s ə l æ t ɛ ɹm mejɪ t w ɛ n t i t w ɛ n t i fw ɔ ɹ m i t ɪ ŋ", + "ref_phonemes": "bɪtwin naʊ ʌnd dɪsɛmbɝ ʌnd ðʌ dɪlɪvɝʌbʌl frʌm ɔl ʌv ðɪs ɛfɝt wɪl bi ʌ ripɔrt tu ðʌ nændz ædvaɪzɝi kaʊnsʌl æt ðɛr meɪ twɛnti twɛntifʊr mitɪŋ ", + "duration": 0.8182055950164795, + "PER": 52.21238938053098, + "score": { + "S": 27, + "D": 8, + "I": 24, + "N": 113 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə ɡowl ʌ v ð ə ɹ i sɹ̩t͡ʃ t͡ʃɹowdl p ɹ ɑ s ɛ s ɪ z t əw ɪ s ɛ s kɹ̩ə ə n t æ n z ʌ fθ ɛ s ɹ ɪ sɹ̩d͡ʒɪ æ n dajd ɛ n t ə fajd v ɡ æ p ɛ ɹ i ə z ɹ ɑ pɹ̩tɪ u n t ə t i z t ə m u ð ə f i l t w ɔ ɹ ɹ ɛn d z lejʃ ə n ə l ɹ i sɹ̩t͡ʃd͡ʒɪ", + "ref_phonemes": "ðʌ ɡoʊl ʌv ðʌ risɝtʃ roʊdmæp prɑsɛs ɪz tu ʌsɛs kɝʌnt mɛksf risɝtʃ ʌnd aɪdɛntʌfaɪ ɡæp ɛriʌz ɔr ɑpɝtunʌtiz tu muv ðʌ fild tʌwɔrd trænsleɪʃʌnʌl risɝtʃ ", + "duration": 0.8343296051025391, + "PER": 62.295081967213115, + "score": { + "S": 44, + "D": 7, + "I": 25, + "N": 122 + } + }, + { + "model": "WavLM", + "phonemes": "t ɹ æ v zlejʃ ə n ə l s t ʌ d i z n ɪ n t ə k l ɪ nt ɪ k ə l ɹajb z t ə d ɪ v ɛ l ə t ɹ i k m ə n t s f ɔ ɹ ɛ m i s i ʌ v s ɛ s ə ɹ i sɹ̩t͡ʃk p ɹajɔ ɹ ə i zajd ɛ n ə fajd w ɪ l b i ɪ z t ə ɡajdə ɹ i sɹ̩t͡ʃp ə k ɹ ɔ s ə k ə mj u n ə t i", + "ref_phonemes": "trænsleɪʃʌnʌl stʌdiz ʌnd ɪntu klɪnʌkʌl traɪʌlz tu dɪvɛlʌp tritmʌnts fɔr mɛksf ðʌ risɝtʃ praɪɔrʌtiz aɪdɛntʌfaɪd wɪl bi juzd tu ɡaɪd risɝtʃ ʌkrɔs ðʌ kʌmjunʌti ", + "duration": 0.8058602809906006, + "PER": 48.1203007518797, + "score": { + "S": 42, + "D": 10, + "I": 12, + "N": 133 + } + }, + { + "model": "WavLM", + "phonemes": "n ɑ t d͡ʒ ʌ s t bajð ə n æ ʃ ə ə l ɪ n s t u sz ʌ v h ɛ l θ ə ɛ m i s i ɛ fs ɛʌ s ɹ i sɹ̩d͡ʒʃp m wɹ̩k ɪ ŋ ɡɹowp æ n j u l i z ə v ɛ m s m ɛd sajz", + "ref_phonemes": "nɑt dʒʌst baɪ ðʌ næʃʌnʌl ɪnstʌtuts ʌv hɛlθ ðʌ mɛksf risɝtʃ wɝkɪŋ ɡrup kæn ju pliz ʌdvæns maɪ slaɪdz ", + "duration": 0.6618461608886719, + "PER": 53.086419753086425, + "score": { + "S": 20, + "D": 9, + "I": 14, + "N": 81 + } + }, + { + "model": "WavLM", + "phonemes": "s d ɑ n s i h t ə d u ð æ t ɪ ŋ k iow æ æ najɪ n d i ə s æ n i zs ɪ f zs wɹ̩k ɪ ɡ ɹ u p ʌ v kawn n s ə l ɪ ɪ z k ə m powz d ʌ v dajʌd vɹ̩s tejk howl dɹ̩z", + "ref_phonemes": "aɪ doʊnt si haʊ tu du ðæt θæŋk ju ðʌ nændz mɛksf wɝkɪŋ ɡrup ʌv kaʊnsʌl ɪz kʌmpoʊzd ʌv daɪvɝs steɪkhoʊldɝz ", + "duration": 0.8541884422302246, + "PER": 55.294117647058826, + "score": { + "S": 25, + "D": 7, + "I": 15, + "N": 85 + } + }, + { + "model": "WavLM", + "phonemes": "ɹ i sɹ̩t͡ʃɪ t͡ʃɹ̩z æ n k l ɪ n ɪ ʃ ə n s n ɑ n p ɹ ɑ f ə t æ v b ə k ə s i ɔ ɹ ɡ ə n ə zejʃ ə n l i dɹ̩z n d ð ə b ɹ ɔ tɹ̩æ n i zs ʌ v ɛ s k ə m j u n ə t i ɪ n k l u d ɪ ŋ æ n ɪ v ɪ ə ə l z w ɪ ð l u d ɪ k s p ɪ ɹ i ə n z", + "ref_phonemes": "risɝtʃɝz ʌnd klɪnɪʃʌnz nɑnprɑfʌt ædvʌkʌsi ɔrɡʌnʌzeɪʃʌn lidɝz ʌnd ðʌ brɔdɝ mɛksf kʌmjunʌti ɪnkludɪŋ ɪndʌvɪdʒʌwʌlz wɪð laɪvd ɪkspɪriʌns ", + "duration": 0.6159515380859375, + "PER": 48.717948717948715, + "score": { + "S": 34, + "D": 9, + "I": 14, + "N": 117 + } + }, + { + "model": "WavLM", + "phonemes": "sowɪ n k l u t ɪ ŋ ɪ n d d͡ʒə l z u h æ v æ n i i ə s ɛ s ɪ n k æ ɹə ɡ vɹ̩ u zs ɪ t ð ə wk n ɡ ɹ u p ɪ n k l z fajv ɪ n d ɪ ɪd͡ʒ ə l z w l ɪ d ɪ k s p ɪ ɹ ə n z æɪ n m i ə n vajt ə n ə d ɪ ʃ ə n ə l t w ʌ n i s ɛ v n n d ɪ d͡ʒ wə l z u m t ə p ɑ t t ɪ s ə pejd ɪ n ð z ɛ ɹ i s wb ɛ vb ə nawɹ̩ɹk l æ n ɪ ŋɡ ɹ u p s", + "ref_phonemes": "ɪnkludɪŋ ɪndʌvɪdʒʌwʌlz hu hæv mɛksf ʌnd kɛrɡɪvɝz ðʌ wɝkɪŋ ɡrup ɪnkludz faɪv ɪndʌvɪdʒʌwʌlz wɪð laɪvd ɪkspɪriʌns ʌnd wiv ɪnvaɪtʌd æn ʌdɪʃʌnʌl twɛntisɛvʌn ɪndʌvɪdʒʌwʌlz tu pɑrtɪsʌpeɪt ɪn ðʌ vɛriʌs wɛbɪnɑr plænɪŋ ɡrups ", + "duration": 1.186357021331787, + "PER": 52.17391304347826, + "score": { + "S": 43, + "D": 31, + "I": 22, + "N": 184 + } + }, + { + "model": "WavLM", + "phonemes": "ð i z ɪ n d ɪ v ɪ w ə l s ɛ l f n ɑ m ə nejt ɪ t t͡ʃɹ̩ ə ɹ̩ ɹ ɔɑ ɛ s ð æ t w i ɪ n ʃ iejt ə d k ɹ̩l i ð ɪ ʃ i ɪ ɹ ɛ n d lejt t ə θ æ ŋ k ɔ l ʌ v ð ɛ m ɔ l ʌ v ð ə ɪ n ə v ɪ w ə l z ʌ v ð ə wɹ̩k ɪ ŋɡ ə ə v k ʌɑ s ə l", + "ref_phonemes": "ðiz ɪndʌvɪdʒʌwʌl ɑr sɛlfnʌmeɪʃʌnt θru ʌ prɑsɛs ðæt wi ɪnɪʃieɪtʌd ɝli ðɪs jɪr wid laɪk tu θæŋk ɔl ʌv ðɛm ɔl ʌv ðʌ ɪndʌvɪdʒʌwʌlz ʌv ðʌ wɝkɪŋ ɡrup ʌv kaʊnsʌl ", + "duration": 0.8410265445709229, + "PER": 45.6, + "score": { + "S": 35, + "D": 14, + "I": 8, + "N": 125 + } + }, + { + "model": "WavLM", + "phonemes": "æ z w ɛ l æ z ð ə ɪ n d ɪ v ɪd͡ʒ əwə l z w ɪ wə l d ɪ k s p ɪ ɹ i ʌ v sɹ̩p ɹ t ɪ s ə pejt ɪ ŋ n ð ə ɪ n ð ə d ɪ v ɛ l ə m ə n td ʌ v d ə ɹ i sɹ̩t͡ʃ lt͡ʃɹ̩owɛ maw owð ɪ s w ɛ b ɪ nɹ̩ z pejt ŋ ɹ i k ɔ ɹ ə t ɪə t ɪ n ð əɹ i k ɔ ɹ d ɪ ŋ n ɹ æ n s k w ʌ w ɪ l b i aw", + "ref_phonemes": "æz wɛl æz ðʌ ɪndʌvɪdʒʌwʌlz wɪð laɪvd ɪkspɪriʌns fɔr pɑrtɪsʌpeɪtɪŋ ɪn ðʌ dɪvɛlʌpmʌnt ʌv ðʌ risɝtʃ roʊdmæp ðɪs wɛbɪnɑr ɪz biɪŋ rʌkɔrdʌd ʌnd ðʌ rʌkɔrdɪŋ ʌnd trænskrɪpt wɪl bi ", + "duration": 0.789602518081665, + "PER": 53.14685314685315, + "score": { + "S": 43, + "D": 13, + "I": 20, + "N": 143 + } + }, + { + "model": "WavLM", + "phonemes": "w s td ɪ d f ɔ ɹ ð ə p ʌ b l ɪ k ə m ə ʌ l ɛ n dʌ t ɪ n æ n s t w ɛ n ð æ t ə zs æ t i ʌ n s əɹ i sɹ̩d͡ʒp ɹajɔ ə t i z awɹajd ʌ m s sajd ə k ɹ ɔ s ɔ l l ʌ z ð ə w ɛ b ə nɹ̩z z ð ð æ wɹ̩k ɪ ŋ ɡ ɹ u p ʌ v ʌn n s ə l ɪ l p ʊ t ð ɛ m ɔ l t ə ɡ ɛ bðɹ̩ɪ n t u", + "ref_phonemes": "poʊstɪd fɔr ðʌ pʌblɪk ʌnd aɪl sɛnd aʊt æn ʌnaʊnsmʌnt wɛn ðæt ɪz rɛdi wʌns ðʌ risɝtʃ praɪɔrʌtiz ɑr aɪdɛntʌfaɪd ʌkrɔs ɔl ʌv ðʌ wɛbnɝʌnz ðʌ wɝkɪŋ ɡrup ʌv kaʊnsʌl wɪl pʊt ðɛm ɔl tʌɡɛðɝ ɪntu ", + "duration": 1.1007053852081299, + "PER": 48.0, + "score": { + "S": 45, + "D": 17, + "I": 10, + "N": 150 + } + }, + { + "model": "WavLM", + "phonemes": "ɔ ɹ i fajn ə l ɹ i ɔ ɹ t f ɔ ɹ ð ə k æ v s ə l ɪ n mejh v ə n ɛ k t ɪ ɹ n ð ə m i n tajm f tɹ̩h i t͡ʃʌ ʌ v ð i z w ɛ b ə nawɹ̩z", + "ref_phonemes": "ʌ faɪnʌl ripɔrt fɔr ðʌ kaʊnsʌl ɪn meɪ ʌv nɛkst jɪr ɪn ðʌ mintaɪm æftɝ itʃ ʌv ðiz wɛbnɝʌnz ", + "duration": 0.6167058944702148, + "PER": 47.88732394366197, + "score": { + "S": 19, + "D": 6, + "I": 9, + "N": 71 + } + }, + { + "model": "WavLM", + "phonemes": "w i w ɪ l b i pows t ɪ ŋ ð ə ɹ i sɹ̩d͡ʒkp ɹajɔ ɹ ə t i z ɑ n ə ɹ awd sɹ̩t͡ʃk s ɪ ŋ l æ t f ɔ ɹ m k ɔ l tajd i ə s kejl æ t w i w ɪ l ɔ l sow s ɛ n dawt t ə æ nawn s m ə n ə vawt", + "ref_phonemes": "wi wɪl bi poʊstɪŋ ðʌ risɝtʃ praɪɔrʌtiz ɑn ʌ kraʊdsɔrɪŋ plætfɔrm kɔld aɪdisɑkʌl ðæt wi wɪl ɔlsoʊ sɛnd aʊt æn ʌnaʊnsmʌnt ʌbaʊt ", + "duration": 0.6023879051208496, + "PER": 42.71844660194174, + "score": { + "S": 29, + "D": 5, + "I": 10, + "N": 103 + } + }, + { + "model": "WavLM", + "phonemes": "ə ə ɪ n d ə vɪd͡ʒ əw ə l s f ɹ ʌ m ð ə nɹ̩v ə s ɪ s t ə m w ɛ v ə n ɹ̩ɑ ɹ p l æ n ɪ ŋ ɹ u p æ v əd͡ʒojn ŋ d ə s l ɔ ŋ w ɪ ð ə kowt͡ʃɑ ɛ ɹ z ʌ v ð ə wɹ̩k ɪ ŋ ɡ uɹ̩k ʌ v ɹ n n s ə l d ɑ ktɹ̩z z mɔ ɹ i ŋ h ɛ n s ə n æ n d s ɪ n d ɪ bejt m ə n t", + "ref_phonemes": "ðʌ ɪndʌvɪdʒʌwʌlz frʌm ðʌ nɝvʌs sɪstʌm wɛbɪnɑr plænɪŋ ɡrup hæv dʒɔɪnd ʌs ʌlɔŋ wɪð ðʌ koʊhɛrz ʌv ðʌ wɝkɪŋ ɡrup ʌv kaʊnsʌl dɑktɝz mɔrin hænsʌn ʌnd sɪndi beɪtmʌn ", + "duration": 0.7320685386657715, + "PER": 46.15384615384615, + "score": { + "S": 37, + "D": 7, + "I": 16, + "N": 130 + } + }, + { + "model": "WavLM", + "phonemes": "æ d laj t ə ɹ ɛ k ə ɡ najz ɔ l ʌ z b ɪə n ɛ m bɹ̩ z ʌ v ð ɪ s p l æ n t ɪ ŋ ɡ ɹ̩ p ə s ɪ f ɪ k l i id͡ʒ ɛ ɹ j ʌ m ɡ ɹ̩ p ɔ l ð ə wɹ̩k ð æ t j u d ʌ n t ə ɔ ɹ ə najz ð ɪ s fɹ̩s t w ɛ ə nɹ̩", + "ref_phonemes": "aɪd laɪk tu rɛkʌɡnaɪz ɔl ʌv ðʌ mɛmbɝz ʌv ðɪs plænɪŋ ɡrup spʌsɪfɪkli dʒɑrd jʌŋɡɝ fɔr ɔl ðʌ wɝk ðæt juv dʌn tu ɔrɡʌnaɪz ðɪs fɝst wɛbɪnɑr ", + "duration": 0.6259040832519531, + "PER": 42.592592592592595, + "score": { + "S": 30, + "D": 9, + "I": 7, + "N": 108 + } + }, + { + "model": "WavLM", + "phonemes": "æ ɔ l sowl lajk t ə θ æ ŋ k ð æ t æ n daji n d i i s t i m ɪ f æ k ʊ d æ v ə n ɛ k s ajdb l i z w i z wɹ̩k t b ɪ hajn d ð ə s i n z t ə ɡ ɛ t ɔ l ʌ", + "ref_phonemes": "aɪd ɔlsoʊ laɪk tu θæŋk ðʌ nɪndz tim ɪf aɪ kʊd hæv ðʌ nɛkst slaɪd pliz huz wɝkt bɪhaɪnd ðʌ sinz tu ɡɛt ɔl ʌv ", + "duration": 0.6542129516601562, + "PER": 42.168674698795186, + "score": { + "S": 17, + "D": 9, + "I": 9, + "N": 83 + } + }, + { + "model": "WavLM", + "phonemes": "ð z ɔ ɹ ɡ ə najz t æ n t ə wɹ̩k w ɪ ð ɔ l ʌ v ð i z wɹ̩k ɪ ŋ ɡ ɹ u p s z w ɛ l ʌæ zs ɹ̩ ɹ h ɑ l i ɹajd i æ n hɹ̩ t i ŋ ɛ t ɑ ɹ l ejɛ wɹ̩ ɹ ɹ vajd ɪ ŋ ð ə l əd͡ʒɪ s t ɪ k s ɪ n h ɪ k h ɛ l p t ʌ s", + "ref_phonemes": "ðɪs ɔrɡʌnaɪzd ʌnd tu wɝk wɪð ɔl ʌv ðiz wɝkɪŋ ɡrups æz wɛl æz aʊɝ hɑli raɪli ʌnd aʊɝ tim æt rlɑ hu ɑr prʌvaɪdɪŋ ðʌ lʌdʒɪstɪks ʌnd hæv hɛlpt ʌs ", + "duration": 0.6780431270599365, + "PER": 43.24324324324324, + "score": { + "S": 37, + "D": 5, + "I": 6, + "N": 111 + } + }, + { + "model": "WavLM", + "phonemes": "s ɪ ð ɔ l v ð ə j u ɔ ɹ ɡ ə ə z ejʃ ə n əʌ p t ə ð ɪ s pojn t ɛ vɹ i w ʌ n z w ɛ l k ə m æ z j u l ɪ s ə n t ə ð ə p ɹ z ɛ n tejʃ ə n z ə ɛ n tɹ̩i ɔ ɹ w ɛ st͡ʃə n z ɪ n t ə ð ə k j uə æ nejm", + "ref_phonemes": "wɪð ɔl ʌv ðʌ ɔrɡʌnʌzeɪʃʌn ʌp tu ðɪs pɔɪnt ɛvriwʌnz wɛlkʌm æz ju lɪsʌn tu ðʌ prɛzʌnteɪʃʌnz tu ɛntɝ jɔr kwɛstʃʌnz ɪntu ðʌ kɑ ", + "duration": 0.771047830581665, + "PER": 44.44444444444444, + "score": { + "S": 27, + "D": 5, + "I": 12, + "N": 99 + } + }, + { + "model": "WavLM", + "phonemes": "bajs ə l ɛ k t ɪ m ð ə k j u ɪ nejdb b ʌ t ə n æ t ð ə b ɑ t ə m ʌ v ð ə s k ɹ i m æ n d w i w ɪ l b i æ t t ejk ɪ ŋ ɪ k w ɛ st͡ʃə n sows v j u h æ v ə k w ɛ st͡ʃə n zs p ə s ɪ f ɪ k t ə ə s i k kɹ̩", + "ref_phonemes": "baɪ sʌlɛktɪŋ ðʌ kɑ bʌtʌn æt ðʌ bɑtʌm ʌv ðʌ skrin wi wɪl bi teɪkɪŋ ðoʊz kwɛstʃʌnz ɪf ju hæv ʌ kwɛstʃʌn spʌsɪfɪk tu ʌ spikɝ ", + "duration": 0.6703896522521973, + "PER": 46.875, + "score": { + "S": 22, + "D": 4, + "I": 19, + "N": 96 + } + }, + { + "model": "WavLM", + "phonemes": "p p l i z ɪ n d ə k ej æ t æ nd d w l b i tejk ɪ ŋ s ʌ m k w ɛ st͡ʃə n z ə s ɪ v ɪ t ə it͡ʃ i k ɹ̩ɹajt æ f tɹ̩ɪ it͡ʃ t͡ʃ ə v ð ɛ ɹ t t ɔɑ k s ɪ f ð ɛ ɹ s tajm æ n d ð ɛ n w ɪ l j u ə lajz ow z z w ɛ st͡ʃə n z æ z w ɛ l æ ð v ɛ ɹ i ʌ n d ə m", + "ref_phonemes": "pliz ɪndʌkeɪt ðæt ʌnd wil bi teɪkɪŋ sʌm kwɛstʃʌnz spʌsɪfɪk tu itʃ spikɝ raɪt æftɝ itʃ ʌv ðɛr tɔks ɪf ðɛrz taɪm ðɛn wil jutʌlaɪz ðoʊz kwɛstʃʌnz æz wɛl æt ðʌ vɛri ɛnd ʌv ", + "duration": 0.8933329582214355, + "PER": 41.7910447761194, + "score": { + "S": 27, + "D": 12, + "I": 17, + "N": 134 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə ɛ æ n ɹ̩ɑɹ̩wɹ ɔ ɹ ð ə ð ə l ɔ ŋ ɡɹ̩t d ɪ s ɹ̩l ɹ̩l ɔ ŋ d ɪ s k ʌ ʃ ə n ʊ ð ð æ t ɪ n t ɹ ə d ʌ ʃ ə najtə n lajk t ə t ejk ð ɪ s ɑ pɹ̩t i n ə t t u n ə t i t ə ɪ n ə d u s ð ət͡ʃɛ ɹ ow", + "ref_phonemes": "ðʌ wɛbɪnɑr fɔr aʊɝ lɔŋ dɪskʌʃʌn wɪð ðæt ɪntrʌdʌkʃʌn aɪd laɪk tu teɪk ðɪs ɑpɝtunʌti tu ɪntrʌdus ðʌ tʃɛr ʌv ", + "duration": 0.6802647113800049, + "PER": 70.93023255813954, + "score": { + "S": 26, + "D": 6, + "I": 29, + "N": 86 + } + }, + { + "model": "WavLM", + "phonemes": "æ ən ɹ̩ ə s ɪ s t ə w ʌ æ n awɹ̩ l æ n d ɪ ŋ ɡ ɹ u æ n d ð ə m ɑ dɹ̩ejɹ̩ v ɹ ə dejz w ɛ p æ n hɹ̩ d ɑ p t əd͡ʒ ɛ ɹ ə ʌ ŋ ɡ dd͡ʒɛ ɹ d ɪ z ð ɪ zð ə p ɹ ə ɛ sɹ̩ɪ n ʌ d ɪ p ɹ n ʌ sajk k ɑ l əd͡ʒi f θ ɪ ŋ j n ə ɡ ɹ̩ɹs s ə t ɪ v ɛ l ə v ɛ ə", + "ref_phonemes": "ðʌ nɝvʌs sɪstʌm wɛbɪnɑr plænɪŋ ɡrup ʌnd ðʌ mɑdɝeɪtɝ fɔr tʌdeɪz wɛbɪnɑr draɪv dʒɑrd jʌŋɡɝ dʒɑrd ɪz ʌ prʌfɛsɝ ɪn ðʌ dɪpɑrtmʌnt ʌv saɪkɑlʌdʒi æt ðʌ junʌvɝsʌti ʌv ælʌbæmʌ ", + "duration": 0.8610451221466064, + "PER": 65.94202898550725, + "score": { + "S": 57, + "D": 18, + "I": 16, + "N": 138 + } + }, + { + "model": "WavLM", + "phonemes": "bɹ̩ ə ɪ w ɪ ð s ɛ k ə n d ɛ ɹ i ə pojn t ə nt s ɪ n ɛæ m ə s t i z i ɑ l əd͡ʒi æ n d ɹ u m t l əd͡ʒ i ɛ z ɔ l sowð v ə dɹ̩ɛ k tɹ̩ʌ v ð ə n ɛ ɹ n əwə l l ʃ ə n d pejn æ n d ð t l æ b ɹ ət͡ʃw ɔ ɹ i n ə m ɛ m ɹ̩ ʌ v ð ə j uejv i pejn n k əɹ̩ l ɛ k t ɪ v", + "ref_phonemes": "bɝmɪŋhæm wɪð sɛkʌndɛri ʌpɔɪntmʌnts ɪn ænʌsθiziɑlʌdʒi ʌnd rumʌtɑlʌdʒi hiz ɔlsoʊ ðʌ dɝɛktɝ ʌv ðʌ nʊrʌfʌlænʃmʌnʌn peɪn ʌnd fʌtiɡ læbrʌtɔri ʌnd ʌ mɛmbɝ ʌv ðʌ juv peɪn kʌlɛktɪv ", + "duration": 0.8491082191467285, + "PER": 51.03448275862069, + "score": { + "S": 41, + "D": 16, + "I": 17, + "N": 145 + } + }, + { + "model": "WavLM", + "phonemes": "h i z kɹ̩ ə t l i f ʌ n d ə d bajej najejt m ð ə d ə p ɑ ɹ t ə n ʌ v d ɪ f ɛ n z ə s t ʌ d i n u t ɛ k n i k s ɔ ɹ dajæejə nows ɪ ŋ æ n t ɹ i t ɪ ŋ n ɹ̩æowʌ n f mejʃ ə n ɪ ð ð æ ə l t ɹ towvɹ̩d͡ʒs ud͡ʒɛ ɹ θ æ ŋ k j u", + "ref_phonemes": "hiz kɝʌntli fʌndʌd baɪ ni ʌnd ðʌ dɪpɑrtmʌnt ʌv dɪfɛns tu stʌdi nu tɛkniks fɔr daɪʌɡnoʊsɪŋ ʌnd tritɪŋ nʊrʌfʌlænʃmʌnʌn wɪð ðæt aɪl tɝn ɪt oʊvɝ tu ju dʒɑrd θæŋk ju ", + "duration": 0.7994182109832764, + "PER": 48.091603053435115, + "score": { + "S": 39, + "D": 13, + "I": 11, + "N": 131 + } + }, + { + "model": "WavLM", + "phonemes": "æ æ ŋ k s v ɪ ɡ ɪ n d əaj m ɡowɪ ŋ t ə ɹd͡ʒʌ s t ɡowɹ ɹajtd ɪ n ɪ n t ɹ ə d u s s ʌ m w ʌ n ɛ l s ə d ʌ sow m i d u ɪ ŋ ə mows t ʌ v t ə", + "ref_phonemes": "dʒɑrd jʌŋɡɝ θæŋks vɪki aɪ æm ɡoʊɪŋ tu dʒʌst ɡoʊ raɪt ɪn ʌnd ɪntrʌdus sʌmwʌn ɛls ðæts wʌt aɪm oʊnli duɪŋ moʊst ʌv tʌdeɪ ", + "duration": 0.5554192066192627, + "PER": 52.63157894736842, + "score": { + "S": 16, + "D": 25, + "I": 9, + "N": 95 + } + }, + { + "model": "WavLM", + "phonemes": "w ɛ v ɡ ɑ t ə l ɪ s t ʌ v s p i kɹ̩z ð æ t ɑ z ɹ ɪ l i ɹ̩ ɹ̩w w ɪ ʃ l ɪ s t w i ɡ ɑ tɹ̩ɪ n tajɹ̩w w ɪ ʃ l ɪ s t æ n soww wɹ̩v ɪ ɹ i ɡ ɹ v f ʊ l ð æ t ɛ vɹ̩ w ʌ n ə ɡ ɹ i t ə t ɔ k", + "ref_phonemes": "wiv ɡɑt ʌ lɪst ʌv spikɝz ðæt wɑz rɪli aʊɝ wɪʃ lɪst ʌnd wi ɡɑt aʊɝ ɪntaɪɝ wɪʃ lɪst soʊ wir vɛri ɡreɪtfʌl ðæt ɛvriwʌn ʌɡrid tu tɔk ", + "duration": 0.6501636505126953, + "PER": 39.603960396039604, + "score": { + "S": 24, + "D": 8, + "I": 8, + "N": 101 + } + }, + { + "model": "WavLM", + "phonemes": "ð i z ʌɹ ð ə p i p ə ð ə d t ɑ p ʌ v ð ɛ ɹ v i l d sowh ɪ z ɪ z ɡæ n b i ə ɡ ʊ d ə h æ f tdejk ə d ə ɡowh ɑ n æ n d ɔɑ n w ɪ ðd ð æ ɡ n ɑ l d͡ʒdə m ə n t s f ɔ ɹ it͡ʃs p i kɹ̩l", + "ref_phonemes": "ðiz ɑr ðʌ pipʌl æt ðʌ tɑp ʌv ðɛr fildz ðɪs ɪz ɡoʊɪŋ tu bi ʌ ɡʊd hæfdi aɪ kʊd ɡoʊ ɑn ʌnd ɑn wɪð æknɑlmʌdɪnts fɔr itʃ spikɝ ", + "duration": 0.6337282657623291, + "PER": 51.61290322580645, + "score": { + "S": 26, + "D": 7, + "I": 15, + "N": 93 + } + }, + { + "model": "WavLM", + "phonemes": "b ʌ ɛ vɹ̩i s ɛ k ə nd ɪ s ɪ l θ ɪ ŋ d z ɑ ɡɑ n ə t ɔ k ə bawt s ʌ m nd ʌ v f ɪ ɹ i bɡ ɹ i f l i ɪ n t ɹ ə d u s it͡ʃs s p it͡ʃ kɹ̩æ n d ɹ̩ɡ ə ə s t ɑ ɹ t w ɪ ð ɹ ɪ ʃ ə f ɪ ʃɹ̩æ d ʃ i z k n ə ɡ ɪ v ð ə fɹ̩s t t ɔ w ɪ ɪ z ð ə l ɪ v θ ɪ k s p ɪ ɹ i ə n s t ɔ k", + "ref_phonemes": "bʌt ɛvɝi sɛkʌnd ðɛrz ɔl θɪŋz wir ɡoʊɪŋ tu tɔk ʌbaʊt aɪm ɡoʊɪŋ tu vɛri brifli ɪntrʌdus itʃ spikɝ ʌnd wir ɡoʊɪŋ tu stɑrt wɪð trɪʃʌ fɪʃɝ ʌnd ʃiz ɡoʊɪŋ tu ɡɪv ðʌ fɝst tɔk wɪtʃ ɪz ðʌ laɪvd ɪkspɪriʌns tɔk ", + "duration": 1.1323294639587402, + "PER": 50.0, + "score": { + "S": 44, + "D": 25, + "I": 10, + "N": 158 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ m sajə t ə s t s w i w i k ɑ ɹ v ə p æ θ n d w i howp ð æ t ð æ t ɪ n s æ n ə p lejs s w ɛ ɹw i k æ n f ɛ k t ɪ v l i m i ð ə n i d z ʌə v pejʃ ə n t s æ n soww ɹ v ɛ ɹ i ɡ ɹejt f ə l f ɔ ɹ ð ə ɪ n d v ɪd͡ʒə w ə l z ð æ t k æ n", + "ref_phonemes": "saɪʌntɪsts wi kɑrv ʌ pæθ ʌnd wi hoʊp ðæt ðæt ɛndz ɪn ʌ pleɪs wɛr wi kæn ɪfɛktɪvli mit ðʌ nidz ʌv peɪʃʌnts ʌnd soʊ wir vɛri ɡreɪtfʌl fɔr ðʌ ɪndʌvɪdʒʌwʌlz ðæt kæn ", + "duration": 0.9142181873321533, + "PER": 32.03125, + "score": { + "S": 26, + "D": 8, + "I": 7, + "N": 128 + } + }, + { + "model": "WavLM", + "phonemes": "ɑ ɹ t ɪ k k j ə lejt ð ə ɪ k s p ɪ ɹ ə n s ʌ v ɛ m i s i ɪ f ɛ s æ z v ɛ ɹ i d ɪ f ə k ə ɔ l æ z ð æ t ɪ z s owt͡ʃɹ ɹ ɪ ʃ i h h æ z æ ŋ ɔ mows t θɹ̩d i j ɪ ɹ z ʌ v l ɪ v d ɪ k s p ɪ ɹ i ə n t s w ɪ ð ɛ m i s i ɪ f ɛ s", + "ref_phonemes": "ɑrtɪkjʌlʌt ðʌ ɪkspɪriʌns ʌv mɛksf æz vɛri dɪfʌkʌlt æz ðæt ɪz trɪʃʌ hæz aɪ θɪŋk ɔlmoʊst θɝdi jɪrz ʌv laɪvd ɪkspɪriʌns wɪð mɛksf ", + "duration": 0.8210926055908203, + "PER": 49.03846153846153, + "score": { + "S": 19, + "D": 10, + "I": 22, + "N": 104 + } + }, + { + "model": "WavLM", + "phonemes": "æ n d ð ɛ ɹ wɹ̩ɹ ɹ̩ l ɛn t l ɪə s ɛ fɹ̩t s ʌ v hɹ̩ɹ m ʌ ðɹ̩æ n d ð ə n u dd͡ʒɹ̩z z ɪ ɛ m i s i ə v ɛ s ə sows ejʃ ə n aj d d ɹu ð ɛæ fɹ̩t s ʃ i w ɑ z dajəæ ɡ nows t æ ð əejt ə d͡ʒʌ v t w ɛ l fw ɪ ð ɛ m i s i ə f ɛ s", + "ref_phonemes": "ʌnd ðɛr wɝ rɪlɛntlɪs ɛfɝts ʌv hɝ mʌðɝ ʌnd ðʌ nu dʒɝzi mɛksf ʌsoʊsieɪʃʌn θru ðɛr ɛfɝts ʃi wɑz daɪʌɡnoʊst æt ðʌ eɪdʒ ʌv twɛlv wɪð mɛksf ", + "duration": 0.781137228012085, + "PER": 57.943925233644855, + "score": { + "S": 30, + "D": 4, + "I": 28, + "N": 107 + } + }, + { + "model": "WavLM", + "phonemes": "æ n ʃ i m ʌt͡ʃk lejtdɹ̩ʌ k ə n t æɪ n j u s t ə m i ðowz vt͡ʃæ l əd͡ʒə n d͡ʒ ə z ə ʃ i z ə f m ʌ ðɹ̩ʌ t t͡ʃ ɪ l d ɹ ə n æ n d ð ə t ɹ ɛ ʒɹ̩ v", + "ref_phonemes": "ʌnd ʃi mʌtʃ leɪtɝ kʌntɪnjuz tu mit ðoʊz tʃælʌndʒɪz ʃiz ʌ waɪf mʌðɝ ʌv tu tʃɪldrʌn ʌnd ðʌ trɛʒɝɝ ʌv ", + "duration": 0.6063783168792725, + "PER": 53.16455696202531, + "score": { + "S": 20, + "D": 7, + "I": 15, + "N": 79 + } + }, + { + "model": "WavLM", + "phonemes": "ðə n u i ɔ ɹ k s ɪ t i bejs t ɛ p p ɹ p ɹajvɹ p ɹajv ə t ɛd͡ʒ k w ə t i fɹ̩m z ɔ l sowə ə ɡ ɪ f t ə k mj n ə k kejtɹ̩ə s ʌ m v ɛɹ i m ʌt͡ʃ ʊ k ɪ nŋ f ɔ ɹ ə d t ə h ɪ ɹ ɪ ŋ hɹ̩p ɹ ə s p ɛ k t ɪ v ɑ n ð ə f j ut͡ʃɹ̩ ɹ i sɹ̩t͡ʃɪ n m i s i ɛ f ɛ s", + "ref_phonemes": "ʌ nu jɔrk sɪti beɪst praɪvʌt ɛkwʌti fɝm ʌnd ʃiz ɔlsoʊ ʌ ɡɪftʌd kʌmjunʌkeɪtɝ aɪm vɛri mʌtʃ lʊkɪŋ fɔrwɝd tu hirɪŋ hɝ pɝspɛktɪv ɑn ðʌ fjutʃɝ risɝtʃ ɪn mɛksf ", + "duration": 0.8189132213592529, + "PER": 57.599999999999994, + "score": { + "S": 30, + "D": 11, + "I": 31, + "N": 125 + } + }, + { + "model": "WavLM", + "phonemes": "sowej ɪ l tɹ̩ n ɪ dtowvɹ̩t ə t ɹ ɪ ʃ ə f ɔ ɹ ð ə l v ɪ k s pɪ ɹ ə n s t ɑ ɹ ɪ m mejn æ n ɹ ɪ ə lɹ ɛ æ ɛ ɹ j ɪ ɹ ɡow", + "ref_phonemes": "aɪ wɪl tɝn ɪt oʊvɝ tu trɪʃʌ fɔr ðʌ laɪvd ɪkspɪriʌns tɔk trɪʃʌ fɪʃɝ θæŋk ju maɪ neɪm ɪz trɪʃʌ fɪʃɝ aɪm fɔrti jɪrz oʊld ", + "duration": 0.7379879951477051, + "PER": 69.89247311827957, + "score": { + "S": 30, + "D": 30, + "I": 5, + "N": 93 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ ɡ ʊ d m ɔ ɹn ɪ ŋ ɛ v ɹ iw ʌ n t s ʌ m ŋ w i k ɹ ɪ s t ə v ə kl ɪ z n", + "ref_phonemes": "noʊt ðʌ kæpʃʌnz ɑr aɪ dʒɛnɝeɪtʌd ʌnd meɪ kʌnteɪn ɛrɝz ɡʊd mɔrnɪŋ ɛvriwʌn ɪts ʌm aɪm krɪstʌfɝ klɛmʌnsʌn ", + "duration": 0.8297123908996582, + "PER": 69.41176470588235, + "score": { + "S": 11, + "D": 48, + "I": 0, + "N": 85 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə ɡ ɹ u b l i ð æ s ɛ n dð ə f ɹ̩ bejs ɪ m ɪ t ə b ɑ l iɡ ɹ i sɹ̩t͡ʃs s æ n d ɪ t s majɡej ɡ ɹejtk p lejɛ ʃt͡ʃɹ̩æ n d ɑ n n ʌ w ɛ nd͡ʒ d u s ð ə d ɛ k s s p i kɹ̩ m p ɹ ə f ɛ s dowɔ ɹ i s ɛ l s ə f ɹ ʌ m ɡ l ʌ m b j ɹ u nɹ̩ vɹ̩s ə t i sowl d", + "ref_phonemes": "ðʌ ɡrup lidɝ æt sɛntɝ fɔr beɪsɪk mɛtʌbɑlɪk risɝtʃ ʌnd ɪts maɪ ɡreɪt plɛʒɝ ʌnd hʌnɝ tu ɪntrʌdus ðʌ nɛkst spikɝ prʌfɛsɝ lɔri zɛltsɝ frʌm kʌlʌmbiʌ junʌvɝsʌti soʊ ", + "duration": 0.718489408493042, + "PER": 59.541984732824424, + "score": { + "S": 48, + "D": 8, + "I": 22, + "N": 131 + } + }, + { + "model": "WavLM", + "phonemes": "l ɔ ɹ i ɡ ɹ æd͡ʒuejt ə d f ɹ ʌ m ɹ ɪ n s ə n ju n vɹ̩s t i t ə t ə p i t͡ʃt s t i ɹ ɑ k ə f ɛ l i n ə vɹ̩s t i t ɪ d p ow s ɑ k əw ə l wɹ̩k æ k ejɪ ŋ z k ɑ l d ə t l ʌ m bowɹ̩ɛ n d æ n d ɹ ɹ̩s n t t ə u ə l ʌ m bejæ u n vɹ̩s i ə n i z", + "ref_phonemes": "lɔri ɡrædʒueɪtɪd frʌm prɪnstʌn junʌvɝsʌti ʌnd dɪd ʌ fɪdz æt rɑkʌfɛlɝ junʌvɝsʌti dɪd poʊstdɑktɝʌl wɝk æt kɪŋz kɑlɪdʒ lʌndʌn ʌnd rɪtɝnd tu kʌlʌmbiʌ junʌvɝsʌti ʌnd ʃiz ", + "duration": 0.8221659660339355, + "PER": 56.83453237410072, + "score": { + "S": 44, + "D": 19, + "I": 16, + "N": 139 + } + }, + { + "model": "WavLM", + "phonemes": "d n ɹ ə m ɛ n d z wɹ̩k f ɹ ʌ m ɛ n i ə z ɑ n p ɹ̩ ɹ fɹ̩ɹi ɹejɪ ŋ k ɔ s t h ɔ m ɛ k ə n d ɪ s ə m z p ə tejn ŋ t ɛ n ə d j h h ɪ s tejs s ə z t f i d ɪ ŋ b ɪ hejv i ɹ̩ ɹ æ n d ɛɪ ɹ i s ə n ð i lojw ɑ s ɔ l soww l ɹ ə mowtɹ̩ ə t ə f ʊ l", + "ref_phonemes": "dʌn trʌmɛndʌs wɝk fɔr mɛni jɪrz ɑn pɝɪfɝi breɪn krɔs tɔk mɛkʌnɪzʌmz pɝteɪnɪŋ tu ɛnɝdʒi hoʊmioʊsteɪsʌs fidɪŋ bɪheɪvjɝ ʌnd risʌntli lɔri wɑz ɔlsoʊ prʌmoʊtʌd tu fʊl ", + "duration": 0.9801616668701172, + "PER": 54.41176470588235, + "score": { + "S": 40, + "D": 18, + "I": 16, + "N": 136 + } + }, + { + "model": "WavLM", + "phonemes": "p ə f ɛ s s ə s ð ɪ s ɪ l bɪ t ʌ f æ n ɑ b dejt t ə ð ə ɪ n f ɹə d ʌ ʃ ə n m æ n dk ɹ ɡ ɹ æ sə lejʃ ə n s æ n d t ɹ̩ dejw i ɡ ɑ n ə h ɪ ɹ ə bawt s ʌ m ɪ nt ɹ ə s t ɪ ŋ wɹ̩k æ ndajl ʊ f ɔ ɹ h ɪ ŋ ə bawt ʌ s", + "ref_phonemes": "prʌfɛsɝ soʊ ðɪs lɪtʌl bɪt ʌv æn ʌpdeɪt tu ðʌ ɪntrʌdʌkʃʌn ʌnd kʌŋrætʃʌleɪʃʌnz ʌnd tʌdeɪ wir ɡoʊɪŋ tu hir ʌbaʊt sʌm ɪntrʌstɪŋ wɝk ʌnd aɪ lʊk fɔrwɝd tu hirɪŋ ʌbaʊt ", + "duration": 0.8223943710327148, + "PER": 48.854961832061065, + "score": { + "S": 40, + "D": 19, + "I": 5, + "N": 131 + } + }, + { + "model": "WavLM", + "phonemes": "b m ʌə θ ɛ t ə n i vɹ̩ə s ɪ t ə m ɹ ɛ ɡ jə lejʃ t ʌ v b dawn d ə pows t ɪ ʃ u f ʌ ŋ k ʃ ə n s ɔ ɹ ɹ ɛ s l ɔ ɹ i ð ə s tejt s ə j ʊ ɹ s s lajk t ə θ ɪ ŋ k ð ə ɔ ɹ ɡ ə najz sɹ̩z z f ɹ̩n d vajd ɪ ŋ n i d", + "ref_phonemes": "sɪmpʌθɛtɪk nɝvʌs sɪstʌm rɛɡjʌleɪʃʌn ʌv braʊn ædʌpoʊs tɪsju fʌŋkʃʌn soʊ pliz lɔri ðʌ steɪdʒ ɪz jʊrz soʊ aɪd laɪk tu θæŋk ðʌ ɔrɡʌnaɪzɝz fɔr ɪnvaɪtɪŋ mi ", + "duration": 0.6544408798217773, + "PER": 51.61290322580645, + "score": { + "S": 42, + "D": 15, + "I": 7, + "N": 124 + } + }, + { + "model": "WavLM", + "phonemes": "t ə dejɪ t s ɪ l i ə p l ɛ ʒɹ̩hɪ m sowm t ɹ l æ b zd͡ʒɛ dnɹ̩ə l i s t ʌ d i z nɹ̩ə l sɹ̩k ə t s sð æ t ɹejɛ j ə lejt d æ p ə t t ə n m ə t æ b ə l ɪ z ə m f ɔ ɹ ð ə l ɑ p ɑ ɹ t majd l æ b ɪ z ɹ̩ l i b ɪ n fowk ə s ɪ ɪ ŋ ɑ s ɛ n ʃ ə l z", + "ref_phonemes": "tʌdeɪ ɪts rɪli ʌ plɛʒɝ soʊ maɪ læb dʒɛnɝʌli stʌdiz nʊrʌl sɝkʌts ðæt rɛɡjʌleɪt æpʌtaɪt ʌnd mʌtæbʌlɪzʌm fɔr ðʌ lɑrdʒ pɑrt maɪ læb hæz rɪli bɪn foʊkʌsɪŋ ɑn sɛntrʌl ", + "duration": 0.8471066951751709, + "PER": 45.45454545454545, + "score": { + "S": 33, + "D": 11, + "I": 16, + "N": 132 + } + }, + { + "model": "WavLM", + "phonemes": "s ə s m b ʌ t ə dejæ m k æ n ɪi t ɔ ə bawt ʌə ə m p l i t l i n u ɛ ɹ i v ɹ i sɹ̩t͡ʃf ɹ̩ ɹ̩v f ɔ ɹ majl æ w s tɪ l d ɪ v ɛ l ə b ɪ ŋ ə l ɑ t ʌ v ð ə t w u l z m w t͡ʃf owk ə s ɪ z ɑ n ð ə p ɛ f ɹ sow n ʌ θ ɪ ŋ ɪ z", + "ref_phonemes": "sɝkʌts bʌt tʌdeɪ aɪm ɡoʊɪŋ tu tɔk ʌbaʊt ʌ kʌmplitli nu ɛriʌ ʌv risɝtʃ fɔr maɪ læb wir stɪl dɪvɛlʌpɪŋ ʌ lɑt ʌv ðʌ tulz wɪtʃ foʊkʌsɪz ɑn ðʌ pɝɪfɝi soʊ nʌθɪŋ ɪz ", + "duration": 0.8180773258209229, + "PER": 44.0, + "score": { + "S": 29, + "D": 15, + "I": 11, + "N": 125 + } + }, + { + "model": "WavLM", + "phonemes": "p l ɛ s ʃ ð ɛ n t ɔ k ɪ ŋ ə bawʌ t ə dejw m n d w ʌ tajw ɑ n t ə t ɔ k tj u b ɪ k ɔ z ɪ z z ə p ɹ ɪ t i dajɛ vɹ̩s ɑ i ə n s w ɹaj s u b ɹ ɪ k saj ə ə bawt dw ɑ n t ə t ɔ k t əu ə l ɪ t ə l b ɪ t ə bawt", + "ref_phonemes": "pʌblɪʃt ðæt aɪm tɔkɪŋ ʌbaʊt tʌdeɪ ʌnd wʌt aɪ wɑnt tu tɔk tu ju bɪkɔz ðɪs ɪz ʌ prɪti daɪvɝs ɑdiʌns wɪtʃ aɪm supɝ ɪksaɪtʌd ʌbaʊt aɪ wɑnt tu tɔk tu ju ʌ lɪtʌl bɪt ʌbaʊt ", + "duration": 0.7063789367675781, + "PER": 42.30769230769231, + "score": { + "S": 34, + "D": 18, + "I": 3, + "N": 130 + } + }, + { + "model": "WavLM", + "phonemes": "wajɪ t s p ow u ɪ n t ɹ ə s t ɪ ŋ æ n k l æ ɪ k l i ɹ ɛ l ə v ə n ə t ɛ n ʃ ə l i t ə s t ʌ d i s ɪ m p ə ɛæ d ə ɹ ɛ ɡ j ə l iʃ ʃ ə n ʌ v m ə t æ b ə l ɪ z ə m fowk ə s ɪ ŋ ɑ n ɹaw æ n æ d ə pows t ɪ ʃ u ɹ̩ɹ b æ t æ n ə m æ n iɔ ɔ l sowt͡ʃ t ɔ k t ə j u ə baw l", + "ref_phonemes": "waɪ ɪts boʊθ ɪntrʌstɪŋ ʌnd klɪnɪkʌli rɛlʌvʌnt pʌtɛnʃʌli tu stʌdi sɪmpʌθɛtɪk rɛɡjʌleɪʃʌn ʌv mʌtæbʌlɪzʌm foʊkʌsɪŋ ɑn braʊn ædʌpoʊs tɪsju ɔr bæt ʌnd aɪm ɡoʊɪŋ tu ɔlsoʊ tɔk tu ju ʌbaʊt ", + "duration": 0.9614987373352051, + "PER": 42.384105960264904, + "score": { + "S": 46, + "D": 13, + "I": 5, + "N": 151 + } + }, + { + "model": "WavLM", + "phonemes": "s ə ɹaj z æ n t ɹ ə b ə lejtʃ ə n z æ n d p ɹ ɑ ɡ ɹ ɛ s ɛæ t w ɛi v mejd ɪ n d ɪ v ɛ l ə p ɪ ŋ ð ə t u l z æ n d æ sej zð æ tɹ̩æ k ə ə l i n i d ə d t ə s t ʌ d i ð ɪ s s m ə p ɹowp ɹ i ə l i ow tdɑ n d n tej ɪ n ənd͡ʒ d u s ð ɪ s", + "ref_phonemes": "ðʌ traɪʌlz ʌnd trɪbjʌleɪʃʌnz ʌnd prɑɡrɛs ðæt wiv meɪd ɪn dɪvɛlʌpɪŋ ðʌ tulz ʌnd ʌseɪz ðæt ɑr æktʃʌwʌli nidʌd tu stʌdi ðɪs ʌproʊpriɪtli soʊ aɪ doʊnt nid tu ɪntrʌdus ðɪs ", + "duration": 0.8104333877563477, + "PER": 43.79562043795621, + "score": { + "S": 41, + "D": 13, + "I": 6, + "N": 137 + } + }, + { + "model": "WavLM", + "phonemes": "s ajt ɪ n ð ə s ɹ u m ʌ əd͡ʒʌ s t t ə sejv ð ə s ð ɪ ð s t ɑ ɹ ɪ ŋ pojn m æ n d w ʌ t t ɹ i k m i ə bawt t ð ə bɹawn t t ə p ʊɑ t ə ʃ u s ɪ s t ə m w ɑ z s s s ɛ t i ð æ t wɹ̩d ʌ n j u z i ŋ ʌ p t ɪ m əd͡ʒɪ ŋ w ɪ", + "ref_phonemes": "slaɪd ɪn ðɪs rum bʌt dʒʌst tu seɪ ðæt ðɪs ɪz ʌ stɑrtɪŋ pɔɪnt ʌnd wʌt ɪntriɡd mi ʌbaʊt ðʌ braʊn ædʌpoʊs tɪsju sɪstʌm wɑz stʌdiz ðæt wɝ dʌn juzɪŋ pɛt ɪmɪdʒɪŋ wɪð ʌ ", + "duration": 0.987990140914917, + "PER": 44.53125, + "score": { + "S": 35, + "D": 15, + "I": 7, + "N": 128 + } + }, + { + "model": "WavLM", + "phonemes": "w ej iowə l i b ə l ɡ l u k s st t ɹ i sɹ̩ɪ n nd͡ʒ ɛ k t d ɪ n t ə pejnɪ ʃ ə n z ʌ ɹ t w ɑ z nowt ə s ð æ k kowl d s t ɪ m j ə lejt s t ɪ m j ə lejt ə d ɹawd ə pows t u ʃ ɡ u k s z ə p t ejk ə n b ɹ æ n ɑ t pows t əɪ ʃ u ɪ n l i n æ n d ɪ v ɪd͡ʒə w ə l z æ n d", + "ref_phonemes": "reɪdioʊ leɪbʌl ɡlukoʊs treɪsɝ ɪndʒɛktʌd ɪntu peɪʃʌnts wʌt wɑz noʊtʌst ðæt koʊld stɪmjʌleɪt stɪmjʌleɪtʌd braʊn ædʌpoʊs tɪsju ɡlukoʊs ʌpteɪk ɪn braʊn ædʌpoʊs tɪsju ɪn lin ɪndʌvɪdʒʌwʌlz ʌnd ", + "duration": 0.8471603393554688, + "PER": 43.75, + "score": { + "S": 46, + "D": 16, + "I": 8, + "N": 160 + } + }, + { + "model": "WavLM", + "phonemes": "ð ɪ kowl t ɪ m j ə lejt ə ɡ l u sowkp ɡ l u ɑ zs ʌ p tejdk w ɑ z d ɪə k ɹ i s t ɪ n n p i p ə l w ɛɪ f θ m ɛ l əvejt ə d b i ə majæ nowb b i s ə t i æ nd s u v ə s tsajp ʌ v", + "ref_phonemes": "ðɪs koʊl stɪmjʌleɪtʌd ɡlukoʊs ɡlukoʊs ʌpteɪk wɑz dɪkrist ɪn pipʌl wɪð ɛlʌveɪtɪd bimi ʌnd oʊbisʌti ʌnd soʊ ðɪs taɪp ʌv ", + "duration": 0.7469496726989746, + "PER": 42.857142857142854, + "score": { + "S": 25, + "D": 6, + "I": 11, + "N": 98 + } + }, + { + "model": "WavLM", + "phonemes": "s ɹ̩ ɹ ʃ ʃ ə n ɹɪ l i s ɛ t ɔ f howl k ɑ t ə d͡ʒd d k ʌ t d͡ʒ ə ɪ n d ə ʃ t ɹ v p i p ə l h u l ʊ k ɪ ŋ t j u z ʌ b æ t æ k t ə vejtɹ̩z æ z ð ɛ ɹ ə p j u dðej æ n t iowp ɹ b i s ə d i t ɑ ɹ ɡ ə t s æ n d ð ə k ɪ n ɪ k ə", + "ref_phonemes": "ɑbzɝveɪʃʌn rɪli sɛt ɔf ʌ hoʊl kɑtʌdʒ kɑtʌdʒ ɪndʌstri ʌv pipʌl hu wɝ lʊkɪŋ tu juz bæt æktʌveɪtɝz æz θɛrʌpjutɪk ænti oʊbisʌti tɑrɡʌts ʌnd boʊθ ðʌ klɪnʌkʌl ", + "duration": 0.9423882961273193, + "PER": 45.23809523809524, + "score": { + "S": 32, + "D": 15, + "I": 10, + "N": 126 + } + }, + { + "model": "WavLM", + "phonemes": "d n d ʌ v ð ə bejs ʊ ɡ ɹ i sɹ̩t͡ʃɹs tejt ə sʊ d ʌ v ʃowd dowvɹ̩ɹ tajm ð æ t ð ɪ s f ɹ ɪ lejʃ ə n ʃ ɪ p ɪ z m ʌt͡ʃk ɔkɹ ə m p l ɛ k s æ n dsθ θ ɪ ŋ k ɪ l i ð ə b ɛ s t wejʌ v htajb lajt ɪ ŋ ð ə s ɪ z ʌ ɹ i s ə n s t ʌ d i ð æ t w ɑ z", + "ref_phonemes": "deɪtʌ ʌnd ðʌ beɪsɪk risɝtʃ deɪtʌ sɔrt ʌv ʃoʊd oʊvɝ taɪm ðæt ðɪs rileɪʃʌnʃɪp ɪz mʌtʃ mɔr kɑmplɛks ʌnd aɪ θɪŋk rɪli ðʌ bɛst weɪ ʌv haɪlaɪtɪŋ ðɪs ɪz ʌ risʌnt stʌdi ðæt wɑz ", + "duration": 0.7723493576049805, + "PER": 39.25925925925926, + "score": { + "S": 34, + "D": 7, + "I": 12, + "N": 135 + } + }, + { + "model": "WavLM", + "phonemes": "p b l ɪ ʃ t m l æ s ʌ k ʌ p l i ɪɹ̩z ə ɡowɑn awæ bajp h ɔ l kowə n d ɪ ɹ ɑ ə f ɛ ɹ̩æ æ n w ʌ t h i d ɪ d ɪ z ejd d ɪ d ə h j d͡ʒ ɹ ɛ ɹt ɹ ɛt͡ʃæ t͡ʃ ə s p ɛ k t ɪ v s t ʌ d i ʌ vowəowvɹ̩v f ɪ f t i faw z ɪ n p ɛ k s k æ n z f ɔ ɹ k æ n sɹ̩ pfɹ̩", + "ref_phonemes": "pʌblɪʃt læst ʌ kʌpʌl jɪrz ʌɡoʊ naʊ baɪ pɔl koʊʌn æt rɑkʌfɛlɝ ʌnd wʌt hi dɪd ɪz ðeɪ dɪd ʌ hjudʒ rɛnt rɛtrʌspɛktɪv stʌdi ʌv oʊvɝ fɪfti θaʊzʌnd pɛt skænz fɔr kænsɝ ", + "duration": 0.9594736099243164, + "PER": 47.286821705426355, + "score": { + "S": 30, + "D": 8, + "I": 23, + "N": 129 + } + }, + { + "model": "WavLM", + "phonemes": "b ə n s æ n d sowð i s pejʃ ə n z wɹ̩n n ɑ t k ɔ d æ k s powzs d ɪ s t ɪ s dd͡ʒ zs bejs s lajn ɹ æ n t t ə p t ʃ u æ k t ɪ v ə t i w ʌ t h i d ɪ d w ɑ z h i bejs ɪ k l i t ɹ æ t ə fajd ɔ l ʌ v ð ə pejs ʃ ə n s ɪ n t u b æ t", + "ref_phonemes": "peɪʃʌnts ʌnd soʊ ðiz peɪʃʌnts wɝ nɑt koʊld ɪkspoʊzd ðɪs ɪz dʒʌst beɪslaɪn braʊn ædʌpoʊs tɪsju æktɪvʌti ʌnd wʌt hi dɪd wɑz hi beɪsɪkli strætʌfaɪd ɔl ʌv ðʌ peɪʃʌnts ɪntu bæd ", + "duration": 0.8604328632354736, + "PER": 42.5531914893617, + "score": { + "S": 31, + "D": 21, + "I": 8, + "N": 141 + } + }, + { + "model": "WavLM", + "phonemes": "p ɑ z ə t ɪ v pɹ̩b b æ t n ɛ ɡ t ɪ v pejʃ ə n z æ n nð ɛ n æ n ə lajz t ə howl b ʌ n d ɪ fɹ̩ ə n t m ɛ t ə b ɑ l ɪ p ɹowɹ fajl z m w ʌ t h i fawn d z sow ə pej ʃ ə n z ð æ nt h æ ð i m p ɹ ɛ z ə n ʌ v æ k d ɪ v b æ", + "ref_phonemes": "pɑzʌtɪv ɔr bæd nɛɡʌtɪv peɪʃʌnts ʌnd ðɛn ænʌlaɪzd ʌ hoʊl bʌntʃ ʌv dɪfɝʌnt mɛtʌbɑlɪk proʊfaɪlz ʌnd wʌt hi faʊnd ɪz soʊ ðʌ peɪʃʌnts ðæt hæd ðʌ prɛzʌns ʌv æktɪv bæt ", + "duration": 1.0112450122833252, + "PER": 39.69465648854962, + "score": { + "S": 31, + "D": 15, + "I": 6, + "N": 131 + } + }, + { + "model": "WavLM", + "phonemes": "sow h ɪ ɹ ɪ n d b ɹawn s ow ðejh h æ d lowɹ̩d wɹ̩ɡ l u k w ɑ ɛ p bejs lajn nawʌ ð ɪ s ɪ f f ɛ k t ɑʌ ŋ ɡ lajs i m i ə ɑ z ɹ ɪ l i p ɹ ɪ t i m ɑ d ə s t b ʌ t w ɛ n", + "ref_phonemes": "ʃoʊn hir ɪn braʊn soʊ ðeɪ hæd loʊɝ ɡlukoʊs æt beɪslaɪn naʊ ðɪs ɪfɛkt ɑn ɡlaɪkeɪmiʌ wɑz rɪli prɪti mɑdʌst bʌt wɛn ", + "duration": 0.6490256786346436, + "PER": 42.857142857142854, + "score": { + "S": 25, + "D": 4, + "I": 10, + "N": 91 + } + }, + { + "model": "WavLM", + "phonemes": "h t ɹ æ t ə fajd aj i ə majl æ j u k æ n s i ɪ n ɪ n dɹ̩ɛ k ʃ ə n b ɪ t w i n ð ə æ t n d ð æ ɛ l ə vejt ə b i ə majn ɛ ɹ̩ɛ t m m æ t lowb b i ə majz j u", + "ref_phonemes": "hi strætʌfaɪd baɪ bimi naʊ ju kæn si æn ɪntɝækʃʌn bɪtwin ðʌ bæt ʌnd ðʌ ɛlʌveɪtɪd bimi wir æt æt loʊ bimi aɪz ju ", + "duration": 0.7664926052093506, + "PER": 47.72727272727273, + "score": { + "S": 25, + "D": 8, + "I": 9, + "N": 88 + } + }, + { + "model": "WavLM", + "phonemes": "ow l i s j u t ɑn t ɹ i l i s i ɛ n i ə f æ k t v ð ə b ɹawæ ntawt ə pows t ə ʃ t͡ʃə æ k t ɪ v ə t i b ʌ t æ ð ə hajj æ ə majz z nawj u s t ɑ ɹ t t ə s i p ɹɹ̩s p t p æ k t ɪ v ə ɛ k t m w ɛ ɹ ðowz m n d ə v d͡ʒ ə d͡ʒə ə l z h æ d lowɹ̩ ɡ lajs s i m i ə", + "ref_phonemes": "oʊnli si ju doʊnt rɪli si ɛni ɪfɛkt ʌv ðʌ braʊn ædʌpoʊs tɪsju æktɪvʌti bʌt æt ðʌ haɪ bimi naʊ ju wɪl stɑrt tu si ʌ prʌtɛktɪv ɪfɛkt wɛr ðoʊz ɪndʌvɪdʒʌwʌlz hæd loʊɝ ɡlaɪsɛmiʌ ", + "duration": 1.025355339050293, + "PER": 53.23741007194245, + "score": { + "S": 43, + "D": 11, + "I": 20, + "N": 139 + } + }, + { + "model": "WavLM", + "phonemes": "æ n ð ɪ s ɔ l sow t ɹ æ k t θ ɹ u d ə p ɹ æ v ə l ə n s ʌ v tajp t ə dajb b i d i z sowʌ ɔ l sows ə ɪ n d ə v ɪd͡ʒə w ə l z u k ʊ nd s i z s ʌ m m ɑ d ə s p ɹ ə t ɛ k ʃ ə n ʌ m ʌ v u k ɔ s ɪ n t ɑ lɹ̩æ n s ɪ n ð ə ɪ n ə", + "ref_phonemes": "ʌnd ðɪs ɔlsoʊ trækt θru ðʌ prɛvʌlʌns ʌv taɪp tu daɪʌbitiz soʊ ɔlsoʊ ðʌ ɪndʌvɪdʒʌwʌlz ju kʊd si sʌm mɑdʌst prʌtɛkʃʌn ʌv ɡlukoʊs ɪntɑlɝʌns ɪn ðʌ ɪn ðʌ ", + "duration": 0.7556242942810059, + "PER": 36.36363636363637, + "score": { + "S": 34, + "D": 5, + "I": 5, + "N": 121 + } + }, + { + "model": "WavLM", + "phonemes": "p ʃ ə n dz ð æ t h æ d b ɹawn ɑ p s t ə ʃ ə æ k t ɪ v ə t i b ʌ t j u ɹ ɪ l i s t ɑɹ k ə s i owə l ɑ ɹd͡ʒɹ̩ɪ f ɛ k sajz ɪn ð ə k ɑ n t ɛ k s t ʌ v ə b i ə majzn zowvɹ̩s s θ θɹ̩d ə t i æ n d sowðu ð ɪ s ɹejz ə z ð ə p ɑ s ə b ɪ l ə t i ð æ t mejlb i ɑ m æ k l ɪ ɹl l i", + "ref_phonemes": "peɪʃʌnts ðæt hæd braʊn ædʌpoʊs tɪsju æktɪvʌti bʌt ju rɪli stɑrt tu si ʌ lɑrdʒ ɪfɛkt saɪz ɪn ðʌ kɑntɛkst ʌv ʌ bimi ɪz oʊvɝ θɝdi ʌnd soʊ ðɪs reɪzʌz ðʌ pɑsʌbɪlʌti ðæt meɪbi klɪrli ", + "duration": 1.0600395202636719, + "PER": 45.774647887323944, + "score": { + "S": 34, + "D": 9, + "I": 22, + "N": 142 + } + }, + { + "model": "WavLM", + "phonemes": "b ɹaw t ɹawn dawt t ə ps t ə ʃ u æ k t ə vejdtɹ̩ ɑ ɹn n ɑ t s ə v ɪ ʃ ə n t t u p ɹ ɹ̩ v ɛ n t ow b i s ə t ɪ z j u k ʊ d s i ð ɛ ɹ p l ɛ n t i ʌ v p i ə l u h æ b i ə majnt z owvɹ̩θ θ θɹ̩d ə i ð æ t ɪ n f æ k t ɔ ɔ l sowh h æ d æ k t ɪ v b æ bʌ nt t m i", + "ref_phonemes": "braʊn braʊn ædʌpoʊs tɪsju æktʌveɪtɝz ɑr nɑt sʌfɪʃʌnt tu prɪvɛnt oʊbisʌti æz ju kæn si ðɛr ɑr plɛnti ʌv pipʌl hu hæd bimi oʊvɝ θɝdi ðæt ɪn fækt ɔlsoʊ hæv æktɪv fæt bʌt ɪt meɪ ", + "duration": 0.9497230052947998, + "PER": 47.482014388489205, + "score": { + "S": 36, + "D": 12, + "I": 18, + "N": 139 + } + }, + { + "model": "WavLM", + "phonemes": "b i ɹ i l i j u s f ə l z ɪ t t ɑ ɹ ɡ ə t ə ɪ m p ɹ u v m ə t æ b ə l ɪ z ə m ə m ɪ n ð ə k ɑ n t ɛ k s t ʌ v ɹ b i s ə t i æ n d sowɑ m ajʃ ʊ d dj u b ɪ f ɔ ɹ ð ə pk æ t tajp ə", + "ref_phonemes": "bi rɪli jusfʌl æz ʌ tɑrɡʌt tu ɪmpruv mʌtæbʌlɪzʌm ɪn ðʌ kɑntɛkst ʌv oʊbisʌti ʌnd soʊ aɪ ʃoʊd ju bɪfɔr ðʌ pɛt taɪp ", + "duration": 0.9674661159515381, + "PER": 36.666666666666664, + "score": { + "S": 21, + "D": 4, + "I": 8, + "N": 90 + } + }, + { + "model": "WavLM", + "phonemes": "ʌ v s ə p ɹowt͡ʃh t ə s t ʌ d i ʌ l k s ʌ p t tejk æ z s ɪ ɡ n ə l ʌ v æ k t vd b æ t ə n ʌ ðɹ̩wej ð æ æ m p iu p ə l h æ v s t ʌ d i d æ k t ə vejt ə d b æ tk ɪ n h j u m ə n z ɪ z kpajd dɹ̩ɛ k t θɹ̩m ɑ ɡ ɹ ə f i b ɪ k ɔ z w ɛ n b æ d", + "ref_phonemes": "ʌv ʌproʊtʃ tu stʌdi ɡlukoʊs ʌpteɪk æz ʌ sɪɡnʌl ʌv æktɪv bæt ʌnʌðɝ weɪ ðæt pipʌl hæv stʌdid æktʌveɪtʌd bæt ɪn hjumʌnz ɪz baɪ dɝɛkt θɝmʌɡrʌfi bɪkɔz wɛn bæd ", + "duration": 0.9733748435974121, + "PER": 32.800000000000004, + "score": { + "S": 23, + "D": 5, + "I": 13, + "N": 125 + } + }, + { + "model": "WavLM", + "phonemes": "æ k t ə vejt ə d ɪ dɹ̩ɔ ɔ l sowd ɹd͡ʒɛ nɹ̩ejt s h i æ n sowð ɪ z ɪ z ɔ l sowb ɪ n j u s t b ʌ t wajl m ð i z s t ʌ d i z h æ v b ɪ n ɹ ɪ l i ɪ n t ɹ ə s t ɪ æ n ə n t ɹ ɪi ɡ ɪ ŋ n j u m ə n d ɪ n ð æ n d ɪ f j u ɹ l i w ɑ nt ə", + "ref_phonemes": "ɪz æktʌveɪtʌd ɪt ɔlsoʊ dʒɛnɝeɪts hit ʌnd soʊ ðɪs ɪz ɔlsoʊ bɪn juzd bʌt waɪl ðiz stʌdiz hæv bɪn rɪli ɪntrʌstɪŋ ʌnd ɪntriɡɪŋ ɪn hjumʌnz ɪn ðʌ ɛnd ɪf ju rɪli wɑnt tu ", + "duration": 0.782343864440918, + "PER": 34.61538461538461, + "score": { + "S": 25, + "D": 11, + "I": 9, + "N": 130 + } + }, + { + "model": "WavLM", + "phonemes": "d͡ʒ s t ɹ w ʌ t s ɡowʌ ɪ ŋ ɑ n æ n ʌ t ɪ z ð ə ɹ ə lejʃ ə n ʃ ɪ p b ɪ t w i n m p i s ə t i æ d m ɛ d ə b ɑ l ə d ə s fowʌ ŋ ʃ ə n æ n d ɹawn d æ d ə pows t dt ə ʃ u j u ɹ i l i n i t i ɡ ɛ t t w ɔ ɹ m w ɛ ɹ m ɛ k ə n ɪ s t ɪ k m ɑ d ə l", + "ref_phonemes": "ʌndɝstænd wʌts ɡoʊɪŋ ɑn ʌnd wʌt ɪz ðʌ rileɪʃʌnʃɪp bɪtwin oʊbisʌti ʌnd mɛtʌbɑlɪk dɪsfʌŋkʃʌn ʌnd braʊn ædʌpoʊs tɪsju ju rɪli nid tu ɡɛt tu ʌ mɔr mɛkʌnɪstɪk mɑdʌl ", + "duration": 0.7935781478881836, + "PER": 41.66666666666667, + "score": { + "S": 37, + "D": 11, + "I": 7, + "N": 132 + } + }, + { + "model": "WavLM", + "phonemes": "w ɹ ɪ ð ə s t ə ɹowt ə n s æ n d sow ð ɪ s ɪ s bejs ɪ k l i ə s ʌ mɹ̩i ʌ v w ʌ t ɪ ɪ z nownm ə bawt ð ə sɹ̩k ɪ t s ɹ ɛ ɡ j ə lejt ɪ ŋ θɹ̩m ə l ɹ ɛ ɡ j ə lejʃ ə n æ n d ɛ n t æ d ə p ə t ɪ ʃj ə θɹ̩m əd͡ʒ n ə s əɪ s ɪ n ɹowd ɪ n", + "ref_phonemes": "wɪtʃ brɪŋz ʌs tu roʊdʌnts ʌnd soʊ ðɪs ɪz beɪsɪkli ʌ sʌmɝi ʌv wʌt ɪz noʊn ʌbaʊt ðʌ sɝkʌts rɛɡjʌleɪtɪŋ θɝmʌl rɛɡjʌleɪʃʌn ʌnd braʊn ædʌpoʊs tɪsju θɝmʌdʒʌnisʌz ɪn roʊdʌnts ", + "duration": 0.835320234298706, + "PER": 47.482014388489205, + "score": { + "S": 45, + "D": 13, + "I": 8, + "N": 139 + } + }, + { + "model": "WavLM", + "phonemes": "s i z ɑ ɹ p ɹɪ t i w ɛ l m æ p tdaw æ bm m ɛ n i ɪ fɹ ə n t l æ b m æ n sowɹ ʌ t h ɑ p ə n z ɪ z ʌ v θɹ̩ɹm ə s ɛ n sɹ̩ɹi nd fɹ̩mejʃ ə n sowb bowθ h i t æ n d w ɔ ɹ ɪ n d fɹ̩mejdʃ ə n ɪ z ɹ i lejd n t p ɹ ɑ s ɛ s t ɪ n ð i", + "ref_phonemes": "soʊ ðiz ɑr prɪti wɛl mæpt aʊt baɪ mɛni dɪfɝʌnt læbz ʌnd soʊ wʌt hæpʌnz ɪz θɝmʌl sɛnsɝi ɪnfɝmeɪʃʌn soʊ boʊθ hit ʌnd wɔrm ɪnfɝmeɪʃʌn ɪz rileɪd ʌnd prɑsɛst ɪn ðʌ ", + "duration": 1.1312975883483887, + "PER": 42.1875, + "score": { + "S": 29, + "D": 11, + "I": 14, + "N": 128 + } + }, + { + "model": "WavLM", + "phonemes": "saj l ə m ə s s ɪ s s ð i s ɪ ŋɡ n ə l ð ɛ n d ɡ ɛ ɹt ɹ i lejd d ɪ n t u ð ə aw ʌ m hajn p ɹejn æ n daw t θ ɹ u ð ə ə m ɪ n t u m ə iɹ̩ɹ l æ tɹ̩ow ə l k ɑ l ə m ə", + "ref_phonemes": "haɪpʌθɑlʌzʌm ðɪs ðiz sɪɡnʌlz ðɛn ɡɛt rileɪd ɪntu ðʌ hɪndbreɪn ʌnd aʊt θru ðʌ ɪntɝmidiɪt lætɝʌl kɑlʌm ", + "duration": 0.6689493656158447, + "PER": 59.523809523809526, + "score": { + "S": 25, + "D": 8, + "I": 17, + "N": 84 + } + }, + { + "model": "WavLM", + "phonemes": "ð ə s fajn ə l k ɔ ɹ d æ n ɪ n t u ð ɪ s ɪ m p ə θ ɛ t ə ɡ æ l æ n w ɪt͡ʃs fajn ə l i j u h æ v ð ə s s ɪ m p ə θ ɛ t ɪ k nɹ̩ɹ ɑ n z ð ɛ t ð ɛ n p ɹ əd͡ʒæ k t t ə b ɹawn n d ɑ t ə pows t ɪ ʃ u ɛ b ə v æ s m əd͡ʒɔ ɹ ə t i ʌ ɹ i sɹ̩t͡ʃ s ɛ n", + "ref_phonemes": "ʌv ðʌ spaɪnʌl kɔrd ʌnd ɪntu ðʌ sɪmpʌθɛtɪk ɡæŋɡlʌn wɪtʃ faɪnʌli ju hæv ðʌ sɪmpʌθɛtɪk nʊrɑnz ðæt ðɛn prɑdʒɛkt aʊt tu braʊn ædʌpoʊs tɪsju naʊ ðʌ væst mʌdʒɔrʌti ʌv risɝtʃ ðæts ", + "duration": 0.8274753093719482, + "PER": 44.680851063829785, + "score": { + "S": 38, + "D": 15, + "I": 10, + "N": 141 + } + }, + { + "model": "WavLM", + "phonemes": "b n d ʌ n ɪ n d θɹ̩mɹ̩iɹ ɡ j ə l ə t ɔ ɹ i sɹ̩k ə t h æ d z i ðɹ̩f f fowk ə s n ðə s sɹ̩k əɪ t s ɪ n ð ə b ɹ̩ɹejn n w ɪt͡ʃ æ v b ɪ n ɹ t nawɡð ð p ɑ p jə lejʃ ə n z ɪ n s ʌ m ɑ p j ə lejʃ ə n z ɹ ɛ ɡ j ə lejt ɪ ŋ ə m θɹ̩m ə l k ə n ɹowl ɹow", + "ref_phonemes": "bɪn dʌn ɪn θɝmoʊ rɛɡjʌlʌtɔri sɝkʌts hæz iðɝ foʊkʌst ɑn ðʌ sɝkʌts ɪn ðʌ breɪn wɪtʃ hæv bɪn rɪtʌn naʊ ðʌ pɑpjʌleɪʃʌnz ɪn sʌm pɑpjʌleɪʃʌnz rɛɡjʌleɪtɪŋ θɝmʌl kʌntroʊl ɑr ", + "duration": 0.8092470169067383, + "PER": 48.9051094890511, + "score": { + "S": 38, + "D": 10, + "I": 19, + "N": 137 + } + }, + { + "model": "WavLM", + "phonemes": "æ i l l i k k wojt ɪ z l i d ɹ̩ fajn d ɔ ɹ ðejə fowk ə s tawt ɪ n ð ə b ɹawn d æ d ə p t h ɪ ʃ u d i powə t s ɛ l f n d w ʌ t majn ɡ ɹ u p ɪ v z fowk ə s ɪ ŋ ɑ n ɪ z ɹ", + "ref_phonemes": "rɪli kwaɪt naɪsli dɪfaɪnd ɔr ðeɪ foʊkʌst aʊt ɪn ðʌ braʊn ædʌpoʊs tɪsju dipoʊ ɪtsɛlf ʌnd wʌt maɪ ɡrup ɪz foʊkʌsɪŋ ɑn ɪz ", + "duration": 0.6357197761535645, + "PER": 40.625, + "score": { + "S": 25, + "D": 6, + "I": 8, + "N": 96 + } + }, + { + "model": "WavLM", + "phonemes": "ɹ ðɹ̩s ə p ɹ əd͡ʒɛ k ʃ ə n f f ɹ ʌ m ð ɪ s ɪ b ɪ s æ t ɪ ɪ ŋ l i æ n awt t ə b ɹawn n d t pows t u ʃ u n d u ðɹ̩b ɪ n b ɪ k ɔ z ʌ v ð ɪ s l ɛ ŋ k b ɪ t w i n b i ə majə l ə vejt ə b i majn ajb b i d i z ɪ m p ɛ ɹ b ɹaw n ɑ p s t", + "ref_phonemes": "ræðɝ ðʌ prʌdʒɛkʃʌn frʌm ðʌ sɪmpʌθɛtɪk ɡæŋɡlʌn aʊt tu braʊn ædʌpoʊs tɪsju ʌnd soʊ ðɛr hæv bɪn bɪkɔz ʌv ðɪs lɪŋk bɪtwin bimi ɛlʌveɪtɪd bimi daɪʌbitiz ɪmpɛrd braʊn ædʌpoʊs ", + "duration": 0.9877290725708008, + "PER": 48.57142857142857, + "score": { + "S": 44, + "D": 17, + "I": 7, + "N": 140 + } + }, + { + "model": "WavLM", + "phonemes": "ʃ u f ʌ ŋ k ʃ ə n ɪ ŋ sow ɛ ɹ b ɪ n m ɛ n i ɡ ɹ u p s ð æ t h æ v j u d æ n ə m ə l majɑ d ə l z t ə t ɹajt dɹ̩s t æ n d ʌ t z d ð ə l ɪ ŋ ɡ b ɪ t w i n ɛ l ə vejt ə d b i ə majn æ n d m ɪ m p ɛ ɹ æ æ t ɪ m p ɛ ɹ d b b ɹ n", + "ref_phonemes": "tɪsju fʌŋkʃʌnɪŋ soʊ ðɛr hæv bɪn mɛni ɡrups ðæt hæv juzd ænʌmʌl mɑdʌlz tu traɪ tu ʌndɝstænd wʌt ɪz ðʌ lɪŋk bɪtwin ɛlʌveɪtɪd bimi ʌnd ɪmpɛrd æt ɪmpɛrd braʊn ", + "duration": 0.9650528430938721, + "PER": 36.507936507936506, + "score": { + "S": 26, + "D": 13, + "I": 7, + "N": 126 + } + }, + { + "model": "WavLM", + "phonemes": "d t ə ʃ ə v f ʌ ŋ k ʃ ə n æ n d b s s ɪ k ɹl i m d ɪ p ɛ n ɪ ŋ ɑ n w ɛ ɹ j u l ʌ k θ ɪɛ ɹv ɪ n m ɛ n i d ɪ fɹ̩ə n s ɛ l tajp s ɪ n m ɛ ɡ ə n ɪ z ə m z ɪ m p l ə kejt ə d æ n sow ð ə b ɹ awt aw t d ə p s t ɪ ʃ u ɪ z ə", + "ref_phonemes": "ædʌpoʊs tɪsju fʌŋkʃʌn ʌnd beɪsɪkli dɪpɛndɪŋ ɑn wɛr ju lʊk ðɛr hæv bɪn mɛni dɪfɝʌnt sɛl taɪps ʌnd mɛkʌnɪzʌmz ɪmplɪkeɪtɪd ʌnd soʊ ðʌ braʊn ædʌpoʊs tɪsju ɪz ʌ ", + "duration": 0.7037043571472168, + "PER": 42.1875, + "score": { + "S": 31, + "D": 17, + "I": 6, + "N": 128 + } + }, + { + "model": "WavLM", + "phonemes": "w ɛ l k ə m t ə ð ə j u ɹ̩ʌ l æ t æə s ɹ i ɪ s ʌ sajə n s sajn bejs s t ə ɹ ɹ s f ɔ ɹ ejs ʌi lajfk k s æ n d ɹ̩ɹ j u bɹ̩m ə n æ n d ɑ m ə p ɹ ə f ɛ sɹ̩ʌ nɹ̩æowə bajɑ ld͡ʒi", + "ref_phonemes": "wɛlkʌm tu ðʌ hubɝmʌn læb poʊdkæst wɛr wi dɪskʌs saɪʌns ʌnd saɪʌnsbeɪst tulz fɔr ɛvrideɪ laɪf aɪm ændru hubɝmʌn ʌnd aɪm ʌ prʌfɛsɝ ʌv nʊroʊbaɪɑlʌdʒi ", + "duration": 0.7734794616699219, + "PER": 59.83606557377049, + "score": { + "S": 41, + "D": 24, + "I": 8, + "N": 122 + } + }, + { + "model": "WavLM", + "phonemes": "t d p θ ə m ɑ l əd͡ʒi æ t s t æ m f ɹ̩d s k u lʌ v m ɛ d ə s ə n ə dejw i ɑ ɹ d ɪ s k ʌ s ɪ ŋ ð ə ɪ m j u n s ɪ s t ə m æ n d w i ɑ ɹ ɔ l sowd d ɪ s k ʌ s ɪ ŋ ð ə nɹ̩v ə s ɪ s t ə m", + "ref_phonemes": "ʌnd ɑpθʌmɑlʌdʒi æt stænfɝd skul ʌv mɛdʌsʌn tʌdeɪ wi ɑr dɪskʌsɪŋ ðʌ ɪmjun sɪstʌm ʌnd wi ɑr ɔlsoʊ dɪskʌsɪŋ ðʌ nɝvʌs sɪstʌm ", + "duration": 0.6238527297973633, + "PER": 27.27272727272727, + "score": { + "S": 19, + "D": 4, + "I": 4, + "N": 99 + } + }, + { + "model": "WavLM", + "phonemes": "w ɪ z ð ə b ɹejn n s pajn ə l k ɔ ɹ d æ n dð ə k ə n ɛ k ʃ ə n z ʌ v ð ə bɹejn æ n s bajn ə lk w ɹ d w ɪ ð ɔ l ð ə ɔ ɹ d ə n z ʌ v ð ə b ɑ d i ɛ ɑɹ ɔ l sow ɡɪ t ə d ɪ s k ʌ s hawn ə nɹ̩v ə s ɪ s t ə m k æ n b i", + "ref_phonemes": "wɪtʃ ɪz ðʌ breɪn spaɪnʌl kɔrd ʌnd ðʌ kʌnɛkʃʌnz ʌv ðʌ breɪn ʌnd spaɪnʌl kɔrd wɪð ɔl ðʌ ɔrɡʌnz ʌv ðʌ bɑdi wi ɑr ɔlsoʊ ɡoʊɪŋ tu dɪskʌs haʊ ðʌ nɝvʌs sɪstʌm kæn bi ", + "duration": 0.6508762836456299, + "PER": 36.0, + "score": { + "S": 34, + "D": 9, + "I": 2, + "N": 125 + } + }, + { + "model": "WavLM", + "phonemes": "j u z d t ə æ f t ə vejt ɪ n n k ə n t ɹowl ð ə ɪ m j u n s ɪ s t ə m bawt t ɛ n d t w ɛ n t j ɪ ɹ z ə ɡowð s ʌ m ɑ d i s ɛ d ð æ t ð ə majn k ʊ d k n t ɹowl ð", + "ref_phonemes": "juzd tu æktʌveɪt ʌnd kʌntroʊl ðʌ ɪmjun sɪstʌm naʊ ʌbaʊt tɛn twɛnti jɪrz ʌɡoʊ ɪf sʌmbɑdi sɛd ðæt ðʌ maɪnd kʊd kʌntroʊl ", + "duration": 0.594658613204956, + "PER": 32.29166666666667, + "score": { + "S": 20, + "D": 9, + "I": 2, + "N": 96 + } + }, + { + "model": "WavLM", + "phonemes": "ðə ɪ m j u n s ɪ s t ə m ɪ t ɹ ɑ b l i ɡ ɛ t l æ f dawt ʌ mows t æ k ə d ɛ m ɪ k ɑ m f ɹ̩ə n s ɪ s æ n sɹ̩ t ə l i ð ə wɹ̩k w ɛ n b i p ʌ b l ɪ ʃ ɪ n k w ɑ l ə t i id͡ʒɹ̩n ə l z b ʌ t nawb dejz ð ɛ ɹ ɑ ɹ dowz ɪ n z", + "ref_phonemes": "ðʌ ɪmjun sɪstʌm ðeɪd prɑbʌbli ɡɛt læft aʊt ʌv moʊst ækʌdɛmɪk kɑnfɝʌnsʌz ʌnd sɝtʌnli ðʌ wɝk wʊdʌnt bi pʌblɪʃt ɪn kwɑlʌti dʒɝnʌlz bʌt naʊʌdeɪz ðɛr ɑr dʌzʌnz ", + "duration": 0.6998803615570068, + "PER": 38.28125, + "score": { + "S": 29, + "D": 13, + "I": 7, + "N": 128 + } + }, + { + "model": "WavLM", + "phonemes": "n ɑ t h ʌ n dɹ̩ɹ əɪ d z ʌ v k w ɑ l ə t i p ʊ ɹvɹ̩v j u d s t ʌ d i z ɑ n hawɪ ð ə majn d æ n d hawæ ɹ ð ə nɹ̩v ə s ɪ s t ə m æ n k ə n t ɹowl æ k t ə vejʃ ə n ʌ v ð ə ɪ m u n s ɪ s t ə m", + "ref_phonemes": "ɪf nɑt hʌndrʌdz ʌv kwɑlʌti pɪrʌvɝid stʌdiz ɑn haʊ ðʌ maɪnd ʌnd haʊ ðʌ nɝvʌs sɪstʌm kæn kʌntroʊl æktʌveɪʃʌn ʌv ðʌ ɪmjun sɪstʌm ", + "duration": 0.7067463397979736, + "PER": 37.86407766990291, + "score": { + "S": 25, + "D": 5, + "I": 9, + "N": 103 + } + }, + { + "model": "WavLM", + "phonemes": "d͡ʒ z ə w ʌ n dɹ̩f ə l ɡ ɹowɪ ŋ b ɑ d iʌ v ɹ i sɹ̩t͡ʃɪ dd͡ʒʌ s t t ɡ ɪ v j u ə h ɪ n t ə vw ɛ ɹ w i ɑ ɹ h ɛ d ə d w ɪ ð ɪ s d͡ʒ s t ð ɪ s l æ s w i k ɑ z ə php pɹ̩p p ʌ b l ɪ t ɪ n n nt͡ʃ", + "ref_phonemes": "ðɪs ɪz ʌ wʌndɝfʌl ɡroʊɪŋ bɑdi ʌv risɝtʃ ʌnd dʒʌst tu ɡɪv ju ʌ hɪnt ʌv wɛr wi ɑr hɛdʌd wɪð ðɪs dʒʌst ðɪs læst wik ðɛr wɑz ʌ peɪpɝ pʌblɪʃt ɪn neɪtʃɝ ", + "duration": 0.7170331478118896, + "PER": 36.84210526315789, + "score": { + "S": 21, + "D": 13, + "I": 8, + "N": 114 + } + }, + { + "model": "WavLM", + "phonemes": "w ɪ z ð ə ejp ɛ k nt͡ʃd͡ʒɹ̩ ə l ʌ v f ɔ ɹ sajə t ɪ v ɪ k p ʌ l ɪ ʃ ɪ ŋ p ɹ ɹ m ɪ nɹd͡ʒɹ̩ ə l ɪ k s t ɹ i m l i s t ɹ ej n d͡ʒə n ə p pejp ʌ b ɪ ʃ ɪ dn nej t͡ʃɹ̩ p f", + "ref_phonemes": "wɪtʃ ɪz ðʌ eɪpɛks dʒɝnʌl fɔr saɪʌntɪfɪk pʌblɪʃɪŋ prɛmɪr dʒɝnʌl ɪkstrimli strɪndʒʌnt ʌ peɪpɝ pʌblɪʃt ɪn neɪtʃɝ ", + "duration": 0.5988266468048096, + "PER": 52.68817204301075, + "score": { + "S": 25, + "D": 9, + "I": 15, + "N": 93 + } + }, + { + "model": "WavLM", + "phonemes": "fɹ ʌ uə f u m ɑ l æ b æ t h ɑ ɹ v ɹ̩d m ɛ t ɪ k əl s k uə l ɛ k s p l ɔ ɹ d hawæ k j ə p ʌ ŋ kt͡ʃɹ̩æ æ n ɹ ə d u s ɪ m f l ə mejʃ ə n ɪ n ð ə b ɑ d i", + "ref_phonemes": "frʌm kjufu mɑz læb æt hɑrvɝd mɛdʌkʌl skul ɪksplɔrd haʊ ækjupʌŋktʃɝ kæn rʌdus ɪnflʌmeɪʃʌn ɪn ðʌ bɑdi ", + "duration": 0.574798583984375, + "PER": 33.734939759036145, + "score": { + "S": 21, + "D": 3, + "I": 4, + "N": 83 + } + }, + { + "model": "WavLM", + "phonemes": "æ n d w t ɪl d ɪ s k ɹajb ə s t ʌ d i ɪ n ə ɪ t m ɔ ɹ d ɪ tejl ʌ w ðej ɪ s k ʌ vɹ̩d ɑ z ð æ t bajs t ɪ m j ə lejt ɪ ŋ ə b ɑ d i ɪ n p ɹ t ɪ k j ə lɹ̩wejz æ t p t ɪ k əlɹ̩ ɹ sajd s ʌ ɑ m ð ə b ɑ d i", + "ref_phonemes": "ʌnd aɪ wɪl dɪskraɪb ðɪs stʌdi ɪn ʌ bɪt mɔr dɪteɪl leɪtɝ bʌt wʌt ðeɪ dɪskʌvɝd wɑz ðæt baɪ stɪmjʌleɪtɪŋ ðʌ bɑdi ɪn pɝtɪkjʌlɝ weɪz æt pɝtɪkjʌlɝ saɪts ɑn ðʌ bɑdi ", + "duration": 0.7999927997589111, + "PER": 37.79527559055118, + "score": { + "S": 25, + "D": 18, + "I": 5, + "N": 127 + } + }, + { + "model": "WavLM", + "phonemes": "ð ejt ə l t ə l ɪ bɹ̩ejt sɹ̩t ə n s ɛ l z æ n d m ɔ l ə k j u ə l z ð æ t ɪ n h ɛ n s ð ə f ʌ ŋ ʃ ə n ʌ v ðəɪ m j u n s ɪ s t ə m æ n d p ə t ɛ n ʃ ə l i k ə m j u z t ə k ɑ m b æ t", + "ref_phonemes": "ðeɪ wɝ eɪbʌl tu lɪbɝeɪt sɝtʌn sɛlz ʌnd mɑlʌkjulz ðæt ɛnhæns ðʌ fʌŋkʃʌn ʌv ðʌ ɪmjun sɪstʌm ʌnd pʌtɛnʃʌli kæn bi juzd tu kʌmbæt ", + "duration": 0.6667976379394531, + "PER": 34.31372549019608, + "score": { + "S": 24, + "D": 8, + "I": 3, + "N": 102 + } + }, + { + "model": "WavLM", + "phonemes": "f ɹ ə n tp s ʌ v ɪ n f ɛ k ʃ ə n æ n dd͡ʒ s i ɪ v j u ə n ʌ ðɹ̩l ɪ t ə l h ɪ n d ðejhi fawn d ð æ t ə p ɑ t ɪ k j ə lɹ̩t s hajp p ʌ v ɔ ɹ ɪ n t ɪ ʃ u k ɔ d f æ ʃ ə s ʌ m ʌ v j u mejh æ v hɹ̩d ʌ v f æ ʃ ɪ f", + "ref_phonemes": "dɪfɝʌnt taɪps ʌv ɪnfɛkʃʌn ʌnd dʒʌst tu ɡɪv ju ʌnʌðɝ lɪtʌl hɪnt ðeɪ faʊnd ðæt ʌ pɝtɪkjʌlɝ taɪp ʌv ɔrɡʌn tɪsju kɔld fɑʃiʌ sʌm ʌv ju meɪ hæv hɝd ʌv fɑʃiʌ ", + "duration": 0.6326031684875488, + "PER": 40.0, + "score": { + "S": 26, + "D": 13, + "I": 9, + "N": 120 + } + }, + { + "model": "WavLM", + "phonemes": "d͡ʒ æ ʃ ə s əɹ̩awn d z ɑ ɹm ʌ s ə l z s t t ə l ʊ k æ ɪ u majtk θ ɪ ŋ k ɪ t s ə k n n ə j u s l ə s t ɪ ʃ ɪ t s ɔ ɹ l kə k ə t d ɛ n s b æ ɡ ðæ t", + "ref_phonemes": "fɑʃiʌ sɝaʊndz aʊɝ mʌsʌlz dʒʌst tu lʊk æt ɪt ju maɪt θɪŋk ɪts ʌ kaɪnd ʌv juslʌs tɪsju ɪts sɔrt ʌv laɪk ʌ dɛns bæɡ ", + "duration": 0.41788315773010254, + "PER": 51.13636363636363, + "score": { + "S": 19, + "D": 17, + "I": 9, + "N": 88 + } + }, + { + "model": "WavLM", + "phonemes": "ɪ n wɪt͡ʃð ə m ʌ s ə l z ɑ ɹ k ə n tejn d w ɛ l tɹ̩n zawt ð æ ðowz d ɛ n s æ ɡ z ɹ m ʌt͡ʃk s m ɑ ɹ tɹ̩ð æ n w i θ ɔ t ðejd ɑ ɹn æ v ə majn d ʌ v ð ɛ ɹown b", + "ref_phonemes": "ɪn wɪtʃ ðʌ mʌsʌlz ɑr kʌnteɪnd wɛl ɪt tɝnz aʊt ðæt ðoʊz dɛns bæɡz ɑr mʌtʃ smɑrtɝ ðæn wi θɔt ðeɪ doʊnt hæv ʌ maɪnd ʌv ðɛr oʊn ", + "duration": 0.49857592582702637, + "PER": 31.25, + "score": { + "S": 19, + "D": 6, + "I": 5, + "N": 96 + } + }, + { + "model": "WavLM", + "phonemes": "bajs t ɪ m j ə lejt ɪ ŋ ð ə f æ ə ɪ n ə pɹ t ɪ k j ɹ̩lowkejʃ ə n ɑ n ð ə b ɑ d i ɛ ɹ z ə p æ θ wejt l i d ɪ ŋ t ʌ v ð æ t f æ ə d ɹ̩ ɹ k l i t ə n ɔ ɹ ŋn k ɔ l ð ə ə d ɹ i n ə m ə d ʌ ə", + "ref_phonemes": "bʌt baɪ stɪmjʌleɪtɪŋ ðʌ fɑʃiʌ ɪn ʌ pɝtɪkjʌlɝ loʊkeɪʃʌn ɑn ðʌ bɑdi ðɛrz ʌ pæθweɪ lidɪŋ aʊt ʌv ðæt fɑʃiʌ dɝɛktli tu æn ɔrɡʌn kɔld ðʌ ʌdrinʌl mɪdʌlʌ ", + "duration": 0.7681550979614258, + "PER": 41.52542372881356, + "score": { + "S": 32, + "D": 16, + "I": 1, + "N": 118 + } + }, + { + "model": "WavLM", + "phonemes": "æ l ɪ k s lejn ŋ ɛ n ɔ l ð ɪ s m i n z ð æ t k ʊ d l ɪ b ɹ̩ejt p ɹ ɪ t ɪ kjəlɹ̩k tk ɛ m ə k ə l z ð æ t h æ d ə pow t ə n d n tajæɪ n d f l æ m ə t ɔ ɹ i ɪ f ɛ k t w ɪ l w ʌ wɹ̩ɹb pejs ɪ ɡ l i s æ ŋ", + "ref_phonemes": "aɪl ɪkspleɪn wʌt ɔl ðɪs minz ðæt kʊd lɪbɝeɪt pɝtɪkjʌlɝ kɛmɪkʌlz ðæt hæd ʌ poʊtʌnt æntɪfʌndlʌmɪti ɪfɛkt soʊ wʌt wir beɪsɪkli seɪɪŋ ", + "duration": 0.5513260364532471, + "PER": 42.592592592592595, + "score": { + "S": 29, + "D": 6, + "I": 11, + "N": 108 + } + }, + { + "model": "WavLM", + "phonemes": "ð æ t ð ə nɹ̩v ə s ɪ s t ə m æ k s ɪæ z ə s ɛ t ʌ v hajwej wejz z b ɪ t w i n ð ə t ɪfɹ̩ə n t ɪ ʃ u z ʌ v j ɔ ɹ b ɑ d i k ɔ l ɪ ŋ ɪ n t u æ k ʃ ə n ð ə ɪ m j u n s ɪ s t ə m", + "ref_phonemes": "ɪz ðæt ðʌ nɝvʌs sɪstʌm ækts æz ʌ sɛt ʌv haɪweɪz bɪtwin ðʌ dɪfɝʌnt tɪsjuz ʌv jɔr bɑdi kɔlɪŋ ɪntu ækʃʌn ðʌ ɪmjun sɪstʌm ", + "duration": 0.600597620010376, + "PER": 30.851063829787233, + "score": { + "S": 16, + "D": 6, + "I": 7, + "N": 94 + } + }, + { + "model": "WavLM", + "phonemes": "l ɪ bɹ̩ejt ɪ ŋ pɹ t ɪ kjə lɹ̩m ɔ l ə k j u l z ð æ k æʌ m ɹ ə d u s ɪ n f mejʃ ə n æ n d l i d t ə f æ s tɹ̩h i l ɪ ŋ æ n d ajw ɪ ɪ k s p lejn hawɔl ɔ l ʌ v ð æ t wɹ̩k s", + "ref_phonemes": "lɪbɝeɪtɪŋ pɝtɪkjʌlɝ mɑlʌkjulz ðæt kæn rʌdus ɪnflʌmeɪʃʌn ʌnd lɛd tu fæstɝ hilɪŋ ʌnd aɪ wɪl ɪkspleɪn haʊ ɔl ʌv ðæt wɝks ", + "duration": 0.5858020782470703, + "PER": 32.98969072164948, + "score": { + "S": 21, + "D": 4, + "I": 7, + "N": 97 + } + }, + { + "model": "WavLM", + "phonemes": "w z w ɛ l ə s ʌ m ʌ ðɹ̩s n ʌ n æ k jə p ʌ ŋ kt͡ʃɹ̩ɹm ɛ θ ə d z f ɔ ɹ k t ə vejt ɪ ŋ ɪ n ɪ h æ n s ɪ ŋ ð ə f ʌ ŋ ə n ʌ v ð ə m j u n s ɪ s t ə m", + "ref_phonemes": "æz wɛl æz sʌm ʌðɝ nɑnʌkʌnstwɛk mɛθʌdz fɔr æktʌveɪtɪŋ ʌnd ɛnhænsɪŋ ðʌ fʌŋkʃʌn ʌv ðʌ ɪmjun sɪstʌm ", + "duration": 0.5109455585479736, + "PER": 43.037974683544306, + "score": { + "S": 20, + "D": 7, + "I": 7, + "N": 79 + } + }, + { + "model": "WavLM", + "phonemes": "sow ə dejw ɡ ɑ n b i t ɔ k ɪ ŋ ɔ l ə bawt h i l ɪ ŋ w ɪ θ ð ə majn d ɪ n ə k ə m p l i t l i n ɑ n m ɪ s t ɪ k ə l n ɑ n æ b s t ɹ æ k t s ɛ t s", + "ref_phonemes": "soʊ tʌdeɪ wir ɡoʊɪŋ tu bi tɔkɪŋ ɔl ʌbaʊt hilɪŋ wɪð ðʌ maɪnd ɪn ʌ kʌmplitli nɑnmɪstʌkʌl nɑnʌbæstrækt sɛns ", + "duration": 0.5785262584686279, + "PER": 29.069767441860467, + "score": { + "S": 17, + "D": 8, + "I": 0, + "N": 86 + } + }, + { + "model": "WavLM", + "phonemes": "b ɪ f ɔ ɹ w i b ɪ ɡ ɪ n dlajt t ə ɛ m f ə sajz ð æ t ð ɪ s p ɑɔ t k æ s t ɪ z s ɛ pɹ̩ə f ɹ ʌ majt it͡ʃ ɪ ŋ æ n ɹ i sɹ̩t͡ʃɪ w ɔ l z t s t æ m fɹ̩t ɪ t ɪ z hawɛ vɹ̩p ɑ ɹ t ʌ v majtd ɪ zajɹ̩i ɛ fɹ̩t", + "ref_phonemes": "bɪfɔr wi bɪɡɪn aɪd laɪk tu ɛmfʌsaɪz ðæt ðɪs poʊdkæst ɪz sɛpɝɪt frʌm maɪ titʃɪŋ ʌnd risɝtʃ roʊlz æt stænfɝd ɪt ɪz haʊɛvɝ pɑrt ʌv maɪ dɪzaɪɝ ʌnd ɛfɝt ", + "duration": 0.6302568912506104, + "PER": 37.81512605042017, + "score": { + "S": 32, + "D": 6, + "I": 7, + "N": 119 + } + }, + { + "model": "WavLM", + "phonemes": "t ə ɹ ɪ ŋ z ɪ ɹ ə k ɑ s t ə k ə n s u mɹ̩ m fɹ̩mejʃ ə n ə bawt sajə n s æ n d saj s ɹ ɪ lejt ə t u l z t ə ð əd͡ʒɛ nɹ̩ə p ʌ b l ɪ k ɪ n k i p ɪ ŋ w ɪ ð æ t θ i m", + "ref_phonemes": "tu brɪŋ zɪroʊ kɑst tu kʌnsumɝ ɪnfɝmeɪʃʌn ʌbaʊt saɪʌns ʌnd saɪʌnsɛrʌleɪtɪd tulz tu ðʌ dʒɛnɝʌl pʌblɪk ɪn kipɪŋ wɪð ðæt θim ", + "duration": 0.5141208171844482, + "PER": 37.0, + "score": { + "S": 27, + "D": 8, + "I": 2, + "N": 100 + } + }, + { + "model": "WavLM", + "phonemes": "ɹ lajk ð ə θ æ ŋ k ð ə s p ɑ n sɹ̩z ʌ v t ə dejz p ɑ d k æ s t ɑ ɹ fɹ̩s ɹ s p ɑ n sɹ̩ ɪ z ɹowkd ə ɹowk ə mej zaj ajɡ l æ s ə z æ n d s ʌ n ɡ l æ s ə z", + "ref_phonemes": "aɪd laɪk tu θæŋk ðʌ spɑnsɝz ʌv tʌdeɪz poʊdkæst aʊɝ fɝst spɑnsɝ ɪz roʊkʌ roʊkʌ meɪks aɪɡlæsʌz ʌnd sʌŋlæsɪz ", + "duration": 0.5893282890319824, + "PER": 43.67816091954023, + "score": { + "S": 28, + "D": 4, + "I": 6, + "N": 87 + } + }, + { + "model": "WavLM", + "phonemes": "ð d b s ə l u t s u pɹ̩b k w ɑ l ə t i v s ɛ n t ə lajf tajm wɹ̩k ɪ ŋ ɑ n ð ə v ɪ ʒ ə l s ɪ s t ə m æ n dajɪ æ n t ɛ l j u ð æ t ʌ n ʌ vð əmejd͡ʒɹ̩k ɪ ɪɹ ɪ ʃ zɑɹ", + "ref_phonemes": "ðæt ɑr æbsʌlut sʌbɝb kwɑlʌti aɪv spɛnt ʌ laɪftaɪm wɝkɪŋ ɑn ðʌ vɪʒʌwʌl sɪstʌm ʌnd aɪ kæn tɛl ju ðæt wʌn ʌv ðʌ meɪdʒɝ ɪʃuz ", + "duration": 0.6201605796813965, + "PER": 41.66666666666667, + "score": { + "S": 17, + "D": 12, + "I": 11, + "N": 96 + } + }, + { + "model": "WavLM", + "phonemes": "v v ɪ ʒ ə l s ɪ t ə m h æ s ð ə k ə n t ɛ n d w ɪ θ ɪ z hawt ə s i θ ɪ ŋ z k l ɪ ɹ l i ɪ n b ɹajt ɪ n vajɹ m ə n t s ɔ ɹ d ɪ mɹ̩ ɪ n vajɹ m ə n t s æ t s ɛ tɹ̩ə", + "ref_phonemes": "aʊɝ vɪʒʌwʌl sɪstʌm hæz tu kʌntɛnd wɪð ɪz haʊ tu si θɪŋz klɪrli ɪn braɪt ɪnvaɪrʌnmʌnts ɔr dɪmɝ ɪnvaɪrʌnmʌnts ɛt sɛtɝʌ ", + "duration": 0.6306734085083008, + "PER": 36.45833333333333, + "score": { + "S": 24, + "D": 9, + "I": 2, + "N": 96 + } + }, + { + "model": "WavLM", + "phonemes": "ɹ owt l ɪ l i ʌ n dɹ̩s t æ n d z ð ə sajn s ð ə v ɪ ʒ ə l s ɪ s t ə m b ɪ k ɔz z w ʌ n θ ɪ ŋ ð t s w ʌ n dɹ̩f ə l ə bawt ɛ ɹ s ʌ n ɡl ɔ s əɪ z ɪ z ð æ t j u k æ n b i ɪ n ə v ɛ ɹ i b ɹajt ɪ n vajɹ m ə n t", + "ref_phonemes": "roʊkʌ klɪrli ʌndɝstændz ðʌ saɪʌns ʌv ðʌ vɪʒʌwʌl sɪstʌm bɪkɔz wʌn θɪŋ ðæts wʌndɝfʌl ʌbaʊt ðɛr sʌŋlæsɪz ɪz ðæt ju kæn bi ɪn ʌ vɛri braɪt ɪnvaɪrʌnmʌnt ", + "duration": 0.5576746463775635, + "PER": 33.057851239669425, + "score": { + "S": 23, + "D": 12, + "I": 5, + "N": 121 + } + } +] \ No newline at end of file