diff --git "a/eval-results/phonemes_1760931179_HuBERT fine-tuned.json" "b/eval-results/phonemes_1760931179_HuBERT fine-tuned.json" new file mode 100644--- /dev/null +++ "b/eval-results/phonemes_1760931179_HuBERT fine-tuned.json" @@ -0,0 +1,6502 @@ +[ + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.7776634693145752, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðɛrɑr pipʌlhut rævʌl lɔŋdɪs tʌn sʌz tuʌʃʊr maɪkʌn tɪn judɛɡ zɪs tʌn s", + "ref_phonemes": "ðɛr ɑr pipʌl hu trævʌl lɔŋ dɪstʌnsʌz tu ʌʃʊr maɪ kʌntɪnjud ɛɡzɪstʌns ", + "duration": 0.3458883762359619, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2574305534362793, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2688024044036865, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "t rɪmɛk sɛs k leɪf rʌmʌraʊn d lɪpʌv moʊl dʌn d sɛtʌsaɪd waɪlʌsɛm bʌlɪŋlɪd", + "ref_phonemes": "trɪm ɛksɛs kleɪ frʌm ɝaʊnd lɪp ʌv moʊld ʌnd sɛt ʌsaɪd waɪl ʌsɛmbʌlɪŋ lɪd ", + "duration": 0.3655211925506592, + "PER": 3.389830508474576, + "score": { + "S": 1, + "D": 0, + "I": 1, + "N": 59 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.27793264389038086, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌaɪdiʌʌvʌsɛn t rʌl tæŋk wɪlaɪʌn z tuitʃhaʊsɪz nɑtɪnɪt sɛl fʌnɑvʌl ti", + "ref_phonemes": "ðʌ aɪdiʌ ʌv ʌ sɛntrʌl tæŋk wɪð laɪnz tu itʃ haʊs ɪz nɑt ɪn ɪtsɛlf ʌ nɑvʌlti ", + "duration": 0.2885303497314453, + "PER": 3.389830508474576, + "score": { + "S": 0, + "D": 1, + "I": 1, + "N": 59 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪf jujuz pɑr kɪŋʌtɛn dʌn t s kænðeɪbirip leɪs t baɪɔtʌmætɪk pɑr kɪŋɡeɪt s", + "ref_phonemes": "ɪf ju juz pɑrkɪŋ ʌtɛndʌnts kæn ðeɪ bi ripleɪst baɪ ɔtʌmætɪk pɑrkɪŋ ɡeɪts ", + "duration": 0.33306884765625, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 60 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðɛrɑr rɪzʌl t sʌs tʌdiʌv lɪtɝʌtʃɝf rid f rʌmðʌtɪrʌniʌvðʌkʌn tɛm pɝɛri", + "ref_phonemes": "ðɛr rɪzʌlts ʌ stʌdi ʌv lɪtɝʌtʃɝ frid frʌm ðʌ tɪrʌni ʌv ðʌ kʌntɛmpɝɛri ", + "duration": 0.29767823219299316, + "PER": 3.508771929824561, + "score": { + "S": 0, + "D": 0, + "I": 2, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌθɪkɛl m fɔrʌs t wɑz nɪr lioʊvɝwɛl m d baɪdʌtʃɛl m dɪziz", + "ref_phonemes": "ðʌ θɪk ɛlm fɔrʌst wɑz nɪrli oʊvɝwɛlmd baɪ dʌtʃ ɛlm dɪziz ", + "duration": 0.3240509033203125, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 46 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "bʌt tukʌn tɪn jutudɪvɔr sʌd væn s s tudʌn t s f rʌm riælʌtiɪzɪnɪk s k juzʌbʌl", + "ref_phonemes": "bʌt tu kʌntɪnju tu dɪvɔrs ʌdvænst studʌnts frʌm riælʌti ɪz ɪnɪkskjuzʌbʌl ", + "duration": 0.335235595703125, + "PER": 1.6129032258064515, + "score": { + "S": 0, + "D": 1, + "I": 0, + "N": 62 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.22455883026123047, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.25194787979125977, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2674391269683838, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hɪz feɪl jɝtuoʊpʌnðʌs tɔr baɪeɪt kɑs θhɪmhɪzdʒɑb", + "ref_phonemes": "hɪz feɪljɝ tu oʊpʌn ðʌ stɔr baɪ eɪt kɑst hɪm hɪz dʒɑb ", + "duration": 0.3000757694244385, + "PER": 2.380952380952381, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 42 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2590155601501465, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.3433527946472168, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "kʌmɑnhiwɪs pɝd f lɔr lɛvʌl zʌbaʊtθrifit daʊn soʊdoʊn t fɔl", + "ref_phonemes": "kʌmɑn hi wɪspɝd fɔr lɛvʌlz ʌbaʊt θri fit daʊn soʊ doʊnt fɔl ", + "duration": 0.29814887046813965, + "PER": 2.083333333333333, + "score": { + "S": 0, + "D": 0, + "I": 1, + "N": 48 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.30002379417419434, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hɪz kæp tʌn wɑzθɪnʌn ðhæɡɝdʌn ðhɪz b jutʌfʌl but s wɝwɔr nʌn dʃæbi", + "ref_phonemes": "hɪz kæptʌn wɑz θɪn ʌnd hæɡɝd ʌnd hɪz bjutʌfʌl buts wɝ wɔrn ʌnd ʃæbi ", + "duration": 0.33699631690979004, + "PER": 3.7037037037037033, + "score": { + "S": 2, + "D": 0, + "I": 0, + "N": 54 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2683095932006836, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪf nɛsʌsɛririp leɪs boʊθhæf sɑn ɡ ril sɪr kʌt sʌn dʌlɑtɛk s t rʌtaɪm", + "ref_phonemes": "ɪf nɛsʌsɛri tu ripleɪs boʊθ hævz ɑn ɡrɪl sɪr kʌts ʌnd ʌlɑt ɛkstrʌ taɪm ", + "duration": 0.3049764633178711, + "PER": 8.771929824561402, + "score": { + "S": 3, + "D": 2, + "I": 0, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "maɪdɪzaɪɝzɑr sɪm pʌl ɡɪv miwʌnɪn fɔr mʌtɪv pærʌɡ ræfɑnðʌsʌbdʒɪk t", + "ref_phonemes": "maɪ dɪzaɪɝz ɑr sɪmpʌl ɡɪv mi wʌn ɪnfɔrmʌtɪv pærʌɡræf ɑn ðʌ sʌbdʒɪkt ", + "duration": 0.2713584899902344, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 56 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2652618885040283, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.26399827003479004, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌs t rʌktʃɝʒhaʊsɪŋðʌʌpɑr t mʌn t sɑrʌv meɪsʌn riʌn d f reɪm kʌn s t rʌkʃʌn", + "ref_phonemes": "ðʌ strʌktʃɝz haʊzɪŋ ðʌ ʌpɑrtmʌnts ɑr ʌv meɪsʌnri ʌnd freɪm kʌnstrʌkʃʌn ", + "duration": 0.2626006603240967, + "PER": 3.3333333333333335, + "score": { + "S": 2, + "D": 0, + "I": 0, + "N": 60 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2733154296875, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2672712802886963, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dujulʌv turʌnʌpʌhɛm soʊɑn bʌtʌn z meɪk nit bʌtʌnhoʊl z", + "ref_phonemes": "du ju lʌv tu rʌn ʌp ʌ hɛm soʊ ɑn bʌtʌnz meɪk nit bʌtʌnhoʊlz ", + "duration": 0.31487345695495605, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 46 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.26454806327819824, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hiɪzʌmænʌv meɪdʒɝtælʌn t bʌtʌmænʌv sɑlʌtɛriʌn sɝtʌnɪm pʌl sɪz", + "ref_phonemes": "hi ɪz ʌ mæn ʌv meɪdʒɝ tælʌnt bʌt ʌ mæn ʌv sɑlʌtɛri ʌnsɝtʌn ɪmpʌlsɪz ", + "duration": 0.3075540065765381, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 54 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.18354296684265137, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2659318447113037, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.3340268135070801, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌn dɑk tʌl jʌnædʌm z naʊlɛtʌs siwɛrðɪs paʊɝkʌm z f rʌm", + "ref_phonemes": "æn ɑktɪljʌn ætʌmz naʊ lɛt ʌs si wɛr ðɪs paʊɝ kʌmz frʌm ", + "duration": 0.28738856315612793, + "PER": 9.30232558139535, + "score": { + "S": 3, + "D": 0, + "I": 1, + "N": 43 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌdɪteɪl d s tʌdiʌvðɪs lætɝfʌnɑmʌnɑn wɑz nɑtʌtɛm p tʌdɪnðɪs peɪpɝ", + "ref_phonemes": "ʌ dɪteɪld stʌdi ʌv ðɪs lætɝ fʌnɑmʌnɑn wɑz nɑt ʌtɛmptʌd ɪn ðɪs peɪpɝ ", + "duration": 0.3343033790588379, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 55 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðɛrɪz lɪtʌl daʊtðætðʌs tudʌn t s bɛnʌfɪt f rʌm voʊkeɪʃʌnʌlɛdʒʌkeɪʃʌn", + "ref_phonemes": "ðɛr ɪz lɪtʌl daʊt ðæt ðʌ studʌnts bɛnʌfɪt frʌm voʊkeɪʃʌnʌl ɛdʒʌkeɪʃʌn ", + "duration": 0.3275299072265625, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 59 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2496964931488037, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌkærɪdʒk rʌntʃt baɪɪt s dɪm laɪt s fɪl tɝɪŋθruðʌɡ lum", + "ref_phonemes": "ʌ kærɪdʒ krʌntʃt baɪ ɪts dɪm laɪts fɪltɝɪŋ θru ðʌ ɡlum ", + "duration": 0.25043678283691406, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 44 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "noʊp raɪsɪz tuhaɪwɛn t rulʌvɪzæt s teɪk", + "ref_phonemes": "noʊ praɪs ɪz tu haɪ wɛn tru lʌv ɪz æt steɪk ", + "duration": 0.250887393951416, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 33 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.24321985244750977, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.24486565589904785, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "peɪpɝweɪt meɪbipɝsɪnʌlaɪz dɑn bæk waɪl k leɪɪz lɛðɝhɑr d", + "ref_phonemes": "peɪpɝweɪt meɪ bi pɝsʌnʌlaɪzd ɑn bæk waɪl kleɪ ɪz lɛðɝ hɑrd ", + "duration": 0.316051721572876, + "PER": 2.083333333333333, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 48 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "haʊɛvɝðʌlɪtɝrɪmeɪn dɔɡ mɛn tʌd baɪsɛv rʌl dʌzʌn lʌntʃrum sʌpɝz", + "ref_phonemes": "haʊɛvɝ ðʌ lɪtɝ rɪmeɪnd ɑɡmɛntʌd baɪ sɛvrʌl dʌzʌn lʌntʃrum sʌpɝz ", + "duration": 0.34598755836486816, + "PER": 1.8518518518518516, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 54 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2996554374694824, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "æl rʌsiv dʌdʒɔɪn tʌpɔɪn t mʌn tɪnðʌbaɪɑlʌdʒiʌn dðʌɛndʒʌnɪrɪŋdɪpɑr t mʌn t s", + "ref_phonemes": "æl rʌsivd ʌ dʒɔɪnt ʌpɔɪntmʌnt ɪn ðʌ baɪɑlʌdʒi ʌnd ðʌ ɛndʒʌnɪrɪŋ dɪpɑrtmʌnts ", + "duration": 0.31675076484680176, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 64 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wikʌn ɡ rætʃʌleɪtðʌɪn taɪɝmɛm bɝʃɪpɑnɪt s rɛkɝdʌv ɡʊd lɛdʒʌs leɪʃʌn", + "ref_phonemes": "wi kʌŋrætʃʌleɪt ðʌ ɪntaɪɝ mɛmbɝʃɪp ɑn ɪts rɛkɝd ʌv ɡʊd lɛdʒʌsleɪʃʌn ", + "duration": 0.31624484062194824, + "PER": 3.508771929824561, + "score": { + "S": 1, + "D": 0, + "I": 1, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2618114948272705, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪt wʊd biwɛl tuʃoʊðʌpɑp jʌlʌʃhaʊwidil wɪðʌdʌl tɝɝz", + "ref_phonemes": "ɪt wʊd bi wɛl tu ʃoʊ ðʌ pɑpjʌlʌs haʊ wi dil wɪð ʌdʌltɝɝz ", + "duration": 0.31086182594299316, + "PER": 2.272727272727273, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 44 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌtuθfɛrifɝɡɑt tukʌm wɛn rɑdʒɝz tuθfɛlaʊt", + "ref_phonemes": "ðʌ tuθ fɛri fɝɡɑt tu kʌm wɛn rɑdʒɝz tuθ fɛl aʊt ", + "duration": 0.2529726028442383, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 37 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌhaɪʌs t reɪtʌd nɑn supɝvaɪzɝiɛndʒʌnɪrɪŋtaɪtʌlɪz risɝtʃɛndʒʌnɪr", + "ref_phonemes": "ðʌ haɪʌst reɪtʌd nɑn supɝvaɪzɝi ɛndʒʌnɪrɪŋ taɪtʌl ɪz risɝtʃ ɛndʒʌnɪr ", + "duration": 0.311398983001709, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 59 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "meɪbiɪt s teɪkɪŋlɔŋɡɝtuɡɛtθɪŋz s k wɛr dʌweɪðænðʌbæŋkɝzɪk s pɛk tʌd", + "ref_phonemes": "meɪbi ɪts teɪkɪŋ lɔŋɡɝ tu ɡɛt θɪŋz skwɛrd ʌweɪ ðæn ðʌ bæŋkɝz ɪkspɛktʌd ", + "duration": 0.33446812629699707, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 58 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌhɔn tʌðhaʊs wɑzʌhɪt dutuaʊt s tæn dɪŋɑdioʊvɪʒʌwʌlɪfɛk t s", + "ref_phonemes": "ðʌ hɔntʌd haʊs wɑz ʌ hɪt du tu aʊtstændɪŋ ɑdioʊ vɪʒʌwʌl ɪfɛkts ", + "duration": 0.3263378143310547, + "PER": 1.9607843137254901, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 51 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.25372910499572754, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌbɪɡ dɔɡ lʌv d tutʃuɑnðʌoʊl d ræɡ dɑl", + "ref_phonemes": "ðʌ bɪɡ dɔɡ lʌvd tu tʃu ɑn ðʌ oʊld ræɡ dɑl ", + "duration": 0.20824718475341797, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 31 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.26445603370666504, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌloʊɝpɔrʃʌn p rʌvaɪd zʌreɪtɪŋætɛnis teɪdʒbɪt winɪn fʌn siʌn dʌdʌl θhʊd", + "ref_phonemes": "ðʌ loʊɝ pɔrʃʌn prʌvaɪdz ʌ reɪtɪŋ æt ɛni steɪdʒ bɪtwin ɪnfʌnsi ʌnd ʌdʌlθhʊd ", + "duration": 0.3740055561065674, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 62 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.27276611328125, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hiɔl soʊrimaɪn dʌðhɪm sɛl fðæθhihædænʌn juʒʌwʌl nʌm bɝʌv pɑsʌbɪlʌtiz", + "ref_phonemes": "hi ɔlsoʊ rimaɪndʌd hɪmsɛlf ðæt hi hæd æn ʌnjuʒʌwʌl nʌmbɝ ʌv pɑsʌbɪlʌtiz ", + "duration": 0.322251558303833, + "PER": 3.3333333333333335, + "score": { + "S": 2, + "D": 0, + "I": 0, + "N": 60 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2556016445159912, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2693657875061035, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "rɪtʃlʊk t fɔr s pɑtʌðhaɪinʌzʌn ddʒæɡ wɑr zɑnðʌsʌfɑri", + "ref_phonemes": "rɪtʃ lʊkt fɔr spɑtʌd haɪinʌz ʌnd dʒæɡwɑrz ɑn ðʌ sʌfɑri ", + "duration": 0.25066685676574707, + "PER": 2.2222222222222223, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 45 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪtʊkhɝwɝd fɔrɪt bʌtɪzʃirɪliɡoʊɪŋwɪðju", + "ref_phonemes": "aɪ tʊk hɝ wɝd fɔr ɪt bʌt ɪz ʃi rɪli ɡoʊɪŋ wɪð ju ", + "duration": 0.27170252799987793, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 36 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪtʊkhɝwɝd fɔrɪt bʌtɪzʃirɪliɡoʊɪŋwɪðju", + "ref_phonemes": "aɪ tʊk hɝ wɝd fɔr ɪt bʌt ɪz ʃi rɪli ɡoʊɪŋ wɪð ju ", + "duration": 0.2542862892150879, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 36 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ræl f p ripɛr d rɛd s næpɝwɪðf rɛʃlɛmʌn sɔs fɔr dɪnɝ", + "ref_phonemes": "rælf pripɛrd rɛd snæpɝ wɪð frɛʃ lɛmʌn sɔs fɔr dɪnɝ ", + "duration": 0.2628040313720703, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 41 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.27045154571533203, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "poʊl t rirɪzʌl t sʌvɪreɪdieɪʃʌn tɛs t s wɪðpoʊl t rihæv bɪn k waɪt sʌk sɛs fʌl", + "ref_phonemes": "poʊltri rɪzʌlts ʌv ɪreɪdieɪʃʌn tɛsts wɪð poʊltri hæv bɪn kwaɪt sʌksɛsfʌl ", + "duration": 0.32950282096862793, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 62 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.24821686744689941, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2249443531036377, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɪsɛm bɝʌn ddʒæn juɛriɑr naɪs mʌnθs tus pɛn dɪn maɪæmi", + "ref_phonemes": "dɪsɛmbɝ ʌnd dʒænjuɛri ɑr naɪs mʌnθs tu spɛnd ɪn maɪæmi ", + "duration": 0.3350677490234375, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 45 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "jutuwɝʌs tupʌddʒækæsʌn tɪl jupɔɪzʌn d mi", + "ref_phonemes": "ju tu wɝ ʌ stupʌd dʒækæs ʌntɪl ju pɔɪzʌnd mi ", + "duration": 0.33400464057922363, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 35 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "mɛniwɛlθitaɪkun z s p lɝdʒdʌn d bɑt boʊθʌjɑtʌn dʌs kunɝ", + "ref_phonemes": "mɛni wɛlθi taɪkunz splɝdʒd ʌnd bɑt boʊθ ʌ jɑt ʌnd ʌ skunɝ ", + "duration": 0.4016087055206299, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 46 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.3681328296661377, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.305328369140625, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪf kærʌl kʌm z tumɑroʊhævhɝɝeɪndʒdfɔrʌmitɪŋæt tu", + "ref_phonemes": "ɪf kærʌl kʌmz tʌmɑroʊ hæv hɝ ɝeɪndʒ fɔr ʌ mitɪŋ æt tu ", + "duration": 0.32610440254211426, + "PER": 4.761904761904762, + "score": { + "S": 1, + "D": 0, + "I": 1, + "N": 42 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.3464031219482422, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.46920084953308105, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.4012136459350586, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪf pipʌl wɝmɔrdʒɛnɝʌsðɛr wʊd binoʊnid fɔr wɛl fɛr", + "ref_phonemes": "ɪf pipʌl wɝ mɔr dʒɛnɝʌs ðɛr wʊd bi noʊ nid fɔr wɛlfɛr ", + "duration": 0.45954060554504395, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 42 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.3254220485687256, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.4050173759460449, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ænʌdʌl t meɪl bæbun z tiθɑr nɑt sutʌbʌl fɔritɪŋʃɛl fɪʃ", + "ref_phonemes": "æn ʌdʌlt meɪl bæbunz tiθ ɑr nɑt sutʌbʌl fɔr itɪŋ ʃɛlfɪʃ ", + "duration": 0.41857409477233887, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 45 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃisɛdʃɑr k ʃhæv noʊboʊn zʌn dʃrɪm p s s wæm bæk wɝd", + "ref_phonemes": "ʃi sɛd ʃɑrks hæv noʊ boʊnz ʌnd ʃrɪmp swæm bækwɝd ", + "duration": 0.44524288177490234, + "PER": 5.128205128205128, + "score": { + "S": 1, + "D": 0, + "I": 1, + "N": 39 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.395979642868042, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2646629810333252, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.3710641860961914, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌsɛkʌn d t wɪtʃθhɪzʃɝt s livʌn ðhifɛl tʌb rif bɝnɑnhɪzʌpɝɑr m", + "ref_phonemes": "ʌ sɛkʌnd twɪtʃt hɪz ʃɝtsliv ʌnd hi fɛlt ʌ brif bɝn ɑn hɪz ʌpɝ ɑrm ", + "duration": 0.4988236427307129, + "PER": 3.9215686274509802, + "score": { + "S": 2, + "D": 0, + "I": 0, + "N": 51 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "kɔriʌn d t rɪʃp leɪd tæɡ wɪðbitʃbɔl z fɔraʊɝz", + "ref_phonemes": "kɔri ʌnd trɪʃ pleɪd tæɡ wɪð bitʃ bɔlz fɔr aʊɝz ", + "duration": 0.5800149440765381, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 37 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.33854079246520996, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.30297255516052246, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɪsɛm bɝʌn ddʒæn juɛriɑr naɪs mʌnθs tus pɛn dɪn maɪæmi", + "ref_phonemes": "dɪsɛmbɝ ʌnd dʒænjuɛri ɑr naɪs mʌnθs tu spɛnd ɪn maɪæmi ", + "duration": 0.46044373512268066, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 45 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.40424227714538574, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "sɛd juwɔr jɝsɛl faʊt k linɪŋɔlðizɛm p tirum z", + "ref_phonemes": "sɛd ju wɔr jɝsɛlf aʊt klinɪŋ ɔl ðiz ɛmpti rumz ", + "duration": 0.3458411693572998, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 37 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌdaɪʌɡ noʊsʌs wɑz dɪs kɝʌdʒɪŋhaʊɛvɝhiwɑz nɑtoʊvɝliwɝid", + "ref_phonemes": "ðʌ daɪʌɡnoʊsʌs wɑz dɪskɝʌdʒɪŋ haʊɛvɝ hi wɑz nɑt oʊvɝli wɝid ", + "duration": 0.4761066436767578, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 50 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌtɑr ɡʌttʃɑr t k wɪk liʌn d b rif litɛl z juwɪtʃædʌtɪv z duwʌt", + "ref_phonemes": "ðʌ tɑrɡʌt tʃɑrt kwɪkli ʌnd brifli tɛlz ju wɪtʃ ædʌtɪvz du wʌt ", + "duration": 0.33432722091674805, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 50 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.33656835556030273, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.3978149890899658, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hiɡeɪvʌʃɔr θhɑr d læfʌn d lʊk tæθhɝnoʊɪŋli", + "ref_phonemes": "hi ɡeɪv ʌ ʃɔrt hɑrd læf ʌnd lʊkt æt hɝ noʊɪŋli ", + "duration": 0.35310840606689453, + "PER": 5.555555555555555, + "score": { + "S": 2, + "D": 0, + "I": 0, + "N": 36 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɡ rɛɡɝiʌn d tɑmtʃoʊz tuwɑtʃkɑr tun zɪnðʌæf tɝnun", + "ref_phonemes": "ɡrɛɡɝi ʌnd tɑm tʃoʊz tu wɑtʃ kɑrtunz ɪn ðʌ æftɝnun ", + "duration": 0.38575267791748047, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 41 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "kɔriʌn d t rɪʃp leɪd tæɡ wɪðbitʃbɔl z fɔraʊɝz", + "ref_phonemes": "kɔri ʌnd trɪʃ pleɪd tæɡ wɪð bitʃ bɔlz fɔr aʊɝz ", + "duration": 0.4525783061981201, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 37 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪnoʊmaɪfæmdiʌʌn ddɪnðʌf jutʃɝaɪwɑn t tumeɪk maɪfʌn dɝp raʊd", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ pændʌz praʊd ", + "duration": 0.7225725650787354, + "PER": 20.754716981132077, + "score": { + "S": 7, + "D": 2, + "I": 2, + "N": 53 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪlʌv maɪfæmʌliʌn dʌn dɪnðʌf jutʃɝaɪwɑn t tumeɪk maɪfæmʌlib raʊ", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.8761904239654541, + "PER": 9.433962264150944, + "score": { + "S": 1, + "D": 1, + "I": 3, + "N": 53 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wiʃʊd rɪs pɛk tʌn d lʌvɔl mɛm bɝzʌvðʌfæmʌli", + "ref_phonemes": "wi ʃʊr rɪspɛkt ʌnd lʌv ɔl mɛmbɝz ʌv ðʌ fæmʌli ", + "duration": 0.35597681999206543, + "PER": 2.7777777777777777, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 36 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪdoʊnhæv taɪm tuɡoʊwɪðjoʊaɪn f leɪɪŋdiɡeɪt", + "ref_phonemes": "aɪ doʊnt hæv taɪm tu ɡoʊ wɪð ðʌ aɪm pleɪɪŋ krɪkʌt ", + "duration": 0.3717000484466553, + "PER": 28.205128205128204, + "score": { + "S": 9, + "D": 1, + "I": 1, + "N": 39 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪlʌvmaɪfæmʌliæn dæn dɪnðʌf jutʃɝaɪwɑn t tumeɪk maɪfæmʌlip raʊ", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.6088316440582275, + "PER": 9.433962264150944, + "score": { + "S": 1, + "D": 1, + "I": 3, + "N": 53 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "t wɛn tinaɪn tineɪtin sɛvʌn tin sɪk s tin fɪf tin fɔr tinsɝtinwʌnɪlɛvʌn tɛn naɪneɪtsɛvʌneɪtfaɪv fɔrθituwʌn", + "ref_phonemes": "twɛnti naɪntin eɪtin sɛvʌntin sɪkstin fɪftin fɔrtin θɝtin wʌn ɪlɛvʌn tɛn naɪn eɪt sɛvʌn sɪks faɪv fɔr θri tu wʌn ", + "duration": 0.7371363639831543, + "PER": 5.376344086021505, + "score": { + "S": 3, + "D": 2, + "I": 0, + "N": 93 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "neɪtʃɝɪzæz ɡeɪtɪŋæzɔr mʌðɝɪt sɔl weɪz s wit laɪkhɝ", + "ref_phonemes": "neɪtʃɝ ɪz dʒʌst ɡɛtɪŋ æz aʊɝ mʌðɝ ɪts ɔlweɪz swit laɪk hɝ ", + "duration": 0.34150171279907227, + "PER": 21.73913043478261, + "score": { + "S": 7, + "D": 3, + "I": 0, + "N": 46 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɑɡ zit boʊn z maɪk laɪk s baɪk sʌæl sʌbɑn teɪbʊkædʌm p leɪs bæs kʌt bɔ", + "ref_phonemes": "dɑk sid boʊnz mɪk laɪts baɪks ɛlsʌ wɑnt ʌ bʊk ædʌm pleɪz bæskʌtbɔl ", + "duration": 0.6122865676879883, + "PER": 22.22222222222222, + "score": { + "S": 8, + "D": 1, + "I": 3, + "N": 54 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪnðʌwɪn tɝwɛnɪt s noʊhis loʊliteɪk sʌʃɔr t wɔkɪnðʌoʊpʌnɛritʃdeɪ", + "ref_phonemes": "ɪn ðʌ wɪntɝ wɛn ɪt snoʊ hi sloʊli teɪks ʌ ʃɔrt wɔk ɪn ðʌ oʊpʌn ɛr itʃ deɪ ", + "duration": 0.3615591526031494, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 56 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌs tudʌn t wɛrtðʌjunʌfɔr mʌn d ɡoʊzθrus kul deɪli", + "ref_phonemes": "ðʌ studʌnt wɛr ðʌ junʌfɔrm ʌnd ɡoʊz θru skul daɪʌli ", + "duration": 0.44240593910217285, + "PER": 7.142857142857142, + "score": { + "S": 1, + "D": 1, + "I": 1, + "N": 42 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wiʃʊd rɪs pɛk tʌn d loʊɔl mɛm bɝzʌvðʌfæmʌli", + "ref_phonemes": "wi ʃʊd rɪspɛkt ʌnd ʌlaʊ aʊɝ mɛmbɝz ʌv ðʌ fæmʌli ", + "duration": 0.4199659824371338, + "PER": 13.157894736842104, + "score": { + "S": 3, + "D": 2, + "I": 0, + "N": 38 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌneɪtɝɪz vɛriæk rɛk tuʌn d fʊlʌv maɪfævɝaɪt ɡ rin kʌlɝ", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlɝ ", + "duration": 0.44040679931640625, + "PER": 18.75, + "score": { + "S": 5, + "D": 3, + "I": 1, + "N": 48 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "juwɪʃ tunoʊɔlʌbaʊt maɪɡ ræn d fɑðɝwɪlhiɪz nɪr linaɪn tiθrijɪr zoʊl d wɪðjʌlɔŋbɪr d", + "ref_phonemes": "juv mɪst tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛl hi ɪz nɪrli naɪntɪfri jɪrz oʊld wɪð ʌ lɔŋ bɪrd ", + "duration": 0.5284268856048584, + "PER": 11.267605633802818, + "score": { + "S": 5, + "D": 2, + "I": 1, + "N": 71 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðeɪʃʊd rɪs pɛk tæn lʌvɔl mɛm bɝzʌvðʌfæmʌli", + "ref_phonemes": "wi ʃʊd rɪspɛkt ʌnd lʌv ɔl mɛmbɝz ʌv ðʌ fæmʌli ", + "duration": 0.45360493659973145, + "PER": 13.88888888888889, + "score": { + "S": 3, + "D": 1, + "I": 1, + "N": 36 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "mɔnɪŋnætʌn daɪwʊdɛn ðʌfɝʌs teɪʃʌnædibʌt weɪtɪdaɪkɛnðʌbɝs t ɪl", + "ref_phonemes": "oʊ maɪ ɡɑd ʌnd aɪ wʊd laɪk tu fɝst steɪʃʌn bʌt raɪt ɪt æt ðʌ fɝst steɪʃʌn ", + "duration": 0.492739200592041, + "PER": 59.64912280701754, + "score": { + "S": 18, + "D": 9, + "I": 7, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɔɡit boʊn z maɪ laɪk baɪk tʌsʌvɔn teɪbʌlædʌm p leɪbæs kʌt bɔ", + "ref_phonemes": "dɔɡ it boʊnz laɪk baɪk ɛlsʌ wɑnt ʌ bʊk ædʌm pleɪ bæskʌtbɔl ", + "duration": 0.5258560180664062, + "PER": 25.53191489361702, + "score": { + "S": 7, + "D": 1, + "I": 4, + "N": 47 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hʌn d rʌd naɪn tinaɪn naɪn tieɪt naɪn tisɛvʌn naɪn tisɪk s naɪn tifaɪv naɪn tifɔr naɪn tiθri naɪn titunaɪn tiwʌn naɪn tieɪtinaɪneɪtieɪteɪtisɛvʌneɪtisɪk seɪtifaɪveɪtifɔreɪtiθrieɪtitueɪtiwʌneɪti", + "ref_phonemes": "wʌn hʌndrʌd naɪntaɪnti naɪntaɪt naɪntɪvsɪn naɪntɪkis naɪntɪfaɪtɝ naɪntwɪfɝ naɪntɪfri niɪntutioʊ naɪnʃeɪn naɪnti eɪtinaɪn aɪtit eɪtɪɡstʌn aɪtiksɪs eɪtaɪvɪf eɪtifʊr eɪtritɛr eɪtitwɑtoʊ eɪtiʌn eɪti ", + "duration": 1.1669044494628906, + "PER": 34.68208092485549, + "score": { + "S": 22, + "D": 21, + "I": 17, + "N": 173 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "itɪðʌoʊl dʌs t mɛm bɝʌv maɪfæmʌliɪz maɪk wɪn fɑðɝʌn dðʌjʌŋɡʌs t mɛm bɝʌv maɪfæmʌliɪz maɪbeɪbih rʌk", + "ref_phonemes": "ðʌ oʊldʌst mɛmbɝ ʌv maɪ fæmʌli ɪz maɪ frɛnd kæðɝ ʌnd ðʌ jʌŋɡʌst mɛmbɝ ʌv maɪ fæmʌli ɪz maɪ beɪbi bjurt ", + "duration": 0.6094794273376465, + "PER": 17.073170731707318, + "score": { + "S": 9, + "D": 2, + "I": 3, + "N": 82 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "juwɪʃtunoʊɔlʌbaʊt maɪɡ ræn d fɑðɝ waɪlhiɪz nɪr linaɪn tiθrir soʊl jɛθhistɪlθɪŋk sæz s wɪf t liæzɛvɝhid rʌsɛʃhɪm sɛl fɪn jænoʊl d b læk f rɑk koʊt juʒʌʌlisɛv rʌl bʌtʌn z mɪsɪŋʌlɔŋb reɪd k lɪŋz tuhɪztʃɪn ɡɪvɪŋðoʊʒhuʌb zɝvhɪmjir p rʌnaʊn sɝfilɪŋɔfðʌʌt moʊs t rɪs pɛk t wɛnhis pik ʃhɪz waɪʃhɪzdʒɛstʃɝbɪt k rækɝʌn dkɪvɪʌsʌbɪt", + "ref_phonemes": "ju wɪʃ tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛl hi ɪz nɪrli naɪntɪfri jɪrz oʊld jɛt hi stɪl θɪŋks hi hæz sɪftɪd æz ɛvɝ hi drɛsʌz hɪmsɛlf ɪn æn oʊld blæk rɑk kɔrt juʒʌwʌli sɛvrʌl bʌtʌnz mɪsɪŋ ʌ lɔŋ ɡreɪt klɪŋz tu hɪz tʃɪn ɡɪvɪŋ ðoʊz hu ʌbzɝv hɪm hir prʌnaʊns ðʌ filɪŋ ʌv ðʌ ʌtmoʊst rɪspɛkt ", + "duration": 2.304561138153076, + "PER": 35.11111111111111, + "score": { + "S": 19, + "D": 8, + "I": 52, + "N": 225 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "neɪtʃɝiɪʒhiæzʌɡeɪtæzaʊɝmʌðɝɪθɔl weɪztus pit laɪkhɝ", + "ref_phonemes": "neɪtʃɝ ɪz æz kɛr æz aʊɝ mʌðɝ ɪt ɔlweɪz fɪts laɪk hɝ ", + "duration": 0.41074633598327637, + "PER": 40.0, + "score": { + "S": 7, + "D": 1, + "I": 8, + "N": 40 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "neɪtʃɝɡɪv zʌs f rut s vɛdʒtʌbʌl zʌn d ɡ reɪn z tuit", + "ref_phonemes": "boʊθ jɔr ɡɪvz ʌs fruts vɛdʒtʌbʌlz ʌnd ɡreɪnz tu it ", + "duration": 0.25613856315612793, + "PER": 17.073170731707318, + "score": { + "S": 6, + "D": 1, + "I": 0, + "N": 41 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "mɔr mʌn raʊdaɪaɪwʌdætðʌbʌʃ teɪtʃʌnæt libʌtðʌweɪoʊðʌlæn daɪm tɪlðaʊwʌs t kɪn", + "ref_phonemes": "mɑm ʌnd dæd ʌnd aɪ wʊd æd ðʌ bʌs steɪʃʌnɝ liv ɪt tu hɝ ʌntɪl ðʌ bʌs keɪm ", + "duration": 0.4439575672149658, + "PER": 67.27272727272727, + "score": { + "S": 19, + "D": 3, + "I": 15, + "N": 55 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɑɡ zit boʊn z maɪk lɛɡ s baɪk sɛsʌwɑn t sʌbʊkædʌm p leɪz bæs kʌt bɔl", + "ref_phonemes": "dɑɡz it boʊlz maɪk laɪks baɪks æz ʌ wʌns ʌ bʊk ædʌm pleɪz bæskʌtbɔl ", + "duration": 0.4639289379119873, + "PER": 14.814814814814813, + "score": { + "S": 6, + "D": 1, + "I": 1, + "N": 54 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "juwɪʃtunoʊɔlʌbaʊt maɪɡ ræn d fɑðɝwɛlhiz nɪr linaɪn tiθrijɪr zoʊl d wɪððʌlɔŋbɪr d", + "ref_phonemes": "ju wɪʃ tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛr hi ɪz nɪrli naɪntɪfri jɪrz oʊld wɪð ʌ lɔŋ brɛθ ", + "duration": 0.4187312126159668, + "PER": 11.594202898550725, + "score": { + "S": 4, + "D": 2, + "I": 2, + "N": 69 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌneɪtʃɝɪz vɛriʌt ræk tɪvʌn d fʊlʌv maɪfæv jɝuaɪt ɡ rin kʌlɝ", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlɝ ", + "duration": 0.40871119499206543, + "PER": 10.416666666666668, + "score": { + "S": 1, + "D": 1, + "I": 3, + "N": 48 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "moʊmʌn dætɝaɪv ldætðʌbʌʃs teɪʃʌnɛd libʌt weɪtɪŋʌn tɪlðʌbʌs keɪm", + "ref_phonemes": "mɑm ʌnd dæd ɝaɪvd æt ðʌ bʌs steɪʃʌn ɝli bʌt weɪtɪŋ ʌntɪl ðʌ bʌs keɪm ", + "duration": 0.565222978591919, + "PER": 14.814814814814813, + "score": { + "S": 4, + "D": 1, + "I": 3, + "N": 54 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪdunɑθhæv taɪm tuɡoʊwɪðjuaɪp leɪʌn d k rɪkʌt", + "ref_phonemes": "aɪ du nɑt hæv taɪm tu ɡoʊ wɪð ju aɪ pleɪ ɪn krɪkʌt ", + "duration": 0.5037426948547363, + "PER": 7.894736842105263, + "score": { + "S": 2, + "D": 0, + "I": 1, + "N": 38 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪnðʌwɪn tɝwɪwɛnɪt s noʊhis loʊliteɪk ʃhɪzʃɔr t wɔkɪnðʌoʊpʌnɛritudeɪ", + "ref_phonemes": "ɪn ðʌ wɪntɝ wɛn ɪt snoʊ hi sloʊli teɪks ʌ ʃɔrt wɔk ɪn ðʌ oʊpʌn ɛriʌ itʃ deɪ ", + "duration": 0.44188499450683594, + "PER": 15.517241379310345, + "score": { + "S": 3, + "D": 2, + "I": 4, + "N": 58 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌs tudʌn t s wɛrdðʌjunʌfɔr mʌn d bɝs tɝs kul deɪli", + "ref_phonemes": "ðʌ studʌnts wɝ ðʌ junʌfɔrm ʌnd bɝst ðʌ skoʊld ɛriʌ ", + "duration": 0.3031747341156006, + "PER": 26.82926829268293, + "score": { + "S": 5, + "D": 3, + "I": 3, + "N": 41 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɔɡ z laɪk dɑɡ zit boʊn z maɪk laɪt s baɪt sɛl sʌwɑn tʌbʊkɑl dʌm p leɪs bæs kʌt bɔl", + "ref_phonemes": "dɑɡz it boʊts maɪk laɪks baɪks ɛlsʌ wɑnts ʌ bʊk ædʌm pleɪz bæskʌtbɔl ", + "duration": 0.506636381149292, + "PER": 28.57142857142857, + "score": { + "S": 6, + "D": 1, + "I": 9, + "N": 56 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪnðʌwɪn dɝwɛn mɪk s noʊʒhis loʊliteɪk sʌʃɔr t wɔkɪnnʌoʊl bɛneɪtitʃdeɪ", + "ref_phonemes": "ɪn ðʌ wɪntɝ wɛn mɪkst noʊz hi sloʊli teɪks ʌ ʃɔrt wɔk ɪn ðʌ oʊpʌn ɛr itʃ deɪ ", + "duration": 0.36728477478027344, + "PER": 16.94915254237288, + "score": { + "S": 7, + "D": 1, + "I": 2, + "N": 59 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "nitʌi js kædiɪŋnætzʌw maɪɡɝditaɪmɪʃhip leɪkhʌm", + "ref_phonemes": "neɪtʃɝ ɪz jɛs kæriɪŋ æz aʊɝ mʌðɝ it ðʌ hɑrvʌst wi teɪk hɝ ", + "duration": 0.583643913269043, + "PER": 68.88888888888889, + "score": { + "S": 18, + "D": 8, + "I": 5, + "N": 45 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "neɪtʃɝdɪz kɛnɪŋæzaʊɝmʌðɝɪtɔl weɪz s wit laɪk", + "ref_phonemes": "neɪtʃɝ ɪz kɛrɪŋ æz aʊɝ mʌðɝ ɪt ɔlweɪz wik laɪk hɝ ", + "duration": 0.2790393829345703, + "PER": 15.384615384615385, + "score": { + "S": 2, + "D": 2, + "I": 2, + "N": 39 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪlʌvmaɪfæmʌliʌn dɪn f jutʃɝaɪwɑn t tumeɪk maɪfæmʌlip raʊd", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.37912702560424805, + "PER": 3.7735849056603774, + "score": { + "S": 0, + "D": 2, + "I": 0, + "N": 53 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "juwɪʃtunoʊɔlʌbaʊt maɪɡ ræn d fɑðɝwɛlhiɪz nɪr linaɪn tiθrijɪr zoʊl d wɪðʌlɔŋbɪr d", + "ref_phonemes": "ju wɪʃ tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛr hi ɪz nɪrli naɪntɪfri jɪrz oʊld wɪð ʌ lɔŋ bɪrd ", + "duration": 0.5179646015167236, + "PER": 4.3478260869565215, + "score": { + "S": 3, + "D": 0, + "I": 0, + "N": 69 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪdoʊn θhæv taɪm tuk wɔʌl wɪðjuaɪæm p leɪɪŋk rɪkʌt", + "ref_phonemes": "aɪ doʊnt hæv taɪm tu ɡoʊ wɪð ju aɪ æm pleɪɪŋ krɪkʌt ", + "duration": 0.3708317279815674, + "PER": 15.0, + "score": { + "S": 4, + "D": 0, + "I": 2, + "N": 40 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "juwɪʃtunoʊɔlʌbaʊt maɪɡ ræn d fɑðɝwɛlhiɪz nɪd baɪnaɪn tiθriɪr zoʊl d wɪðtlɔŋbɪɑd", + "ref_phonemes": "ju wɪʃ tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛl hi ɪz nɪr baɪ naɪntɪfri jɪrz oʊld wɪð ʌ lɔŋ vɝtwoʊ ", + "duration": 0.5143401622772217, + "PER": 15.277777777777779, + "score": { + "S": 8, + "D": 3, + "I": 0, + "N": 72 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hijus t tunoʊoʊɔlʌbaʊt maɪɡ ræn d fɑðɝwɛlhiɪz noʊnɪr linaɪn tiθrijɪr zoʊl d wɪððʌlɔŋbɪr d", + "ref_phonemes": "ju just tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛl hi ɪz nɪrli naɪntɪfri jɪrz oʊld wɪð ʌ lɔŋ bɪrd ", + "duration": 0.5446090698242188, + "PER": 14.285714285714285, + "score": { + "S": 4, + "D": 0, + "I": 6, + "N": 70 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hʌn d rʌd aɪn tinaɪn naɪn tieɪ naɪn tisɛvʌn naɪn tisɪk s naɪn tifaɪv naɪn tifɔr naɪn tiθrinaɪn tiunaɪn tiwʌn naɪn tieɪtinnaɪneɪtisɛvʌneɪtisɪk seɪtieɪtisɪk seɪtifaɪeɪtifɔreɪtiθrieɪtiθueɪtiwʌnieɪti", + "ref_phonemes": "wʌn hʌndrʌd naɪntaɪnti naɪntaɪt naɪntɪvsɪn naɪntɪkis naɪntɪfaɪtɝ naɪntwɪfɝ naɪntɪfri niɪntutioʊ naɪnʃeɪn naɪnti eɪtinaɪn eɪtɪɡstʌn aɪtiksɪs eɪti aɪtiksɪs eɪtaɪvɪf eɪtifʊr eɪtritɛr eɪtitwɑtoʊ eɪtiʌn eɪti ", + "duration": 0.8320269584655762, + "PER": 36.11111111111111, + "score": { + "S": 25, + "D": 24, + "I": 16, + "N": 180 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪnðʌwɪn tɝwɛnɪt s noʊʒhis loʊliteɪk sʌʃɔr t wɔkɪnðʌoʊpʌnɛritʃdeɪ", + "ref_phonemes": "ɪn ðʌ wɪntɝ wɛn ɪt snoʊz hi sloʊli teɪks ʌ ʃɔrt wɔk ɪn ðʌ oʊpʌn ɛr itʃ deɪ ", + "duration": 0.4575214385986328, + "PER": 1.7543859649122806, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "juwɪʃtunɔlʌbaʊt maɪɡ ræn d fɑðɝwɛlhiɪz nɪr linaɪn tiθrijɪr zoʊl d wɪðjʌlɔŋbɪr d", + "ref_phonemes": "ju wɪʃ tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛl hi ɪz mɪrli naɪntɪfri jɪrz oʊld wɪð ʌ lɔŋ bɪrd ", + "duration": 0.4333460330963135, + "PER": 8.695652173913043, + "score": { + "S": 3, + "D": 2, + "I": 1, + "N": 69 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌoʊl dʌs t mɛm bɝʌvðʌfæmʌliɪz maɪɡ ræn d fɑðɝʌn dðʌjʌŋɡʌs t mɛm bɝʌv maɪfæmʌliɪz maɪbeɪbib rʌðɝ", + "ref_phonemes": "ðʌ oʊldʌst mɛmbɝ ʌv ðʌ fæmʌli ɪz maɪ ɡrændfɑðɝ ʌnd ðʌ jʌŋɡʌst mɛmbɝ ʌv maɪ fæmʌli ɪz maɪ beɪbi brʌðɝ ", + "duration": 0.5901353359222412, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 81 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɑɡ zit woʊn t maɪk laɪk s baɪk sɛl saɪwɑn tʌbʊkʌdæm p leɪs bæs kʌt fʊl", + "ref_phonemes": "dɑɡz it boʊnz maɪk laɪks baɪts ɛlsʌ wɑnts ʌ bʊk ʌnd aɪm pleɪst ɪn bæskʌtbɔl ", + "duration": 0.44786500930786133, + "PER": 22.950819672131146, + "score": { + "S": 7, + "D": 6, + "I": 1, + "N": 61 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪloʊmaɪfæmʌliʌn dɪnðʌf jutʃɝaɪwɑn t tumeɪk maɪfæmʌlip roʊ", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.4285244941711426, + "PER": 7.547169811320755, + "score": { + "S": 3, + "D": 1, + "I": 0, + "N": 53 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "juwɪʃtunoʊɔlʌbaʊt maɪɡ ræn d fɑðɝwɛlhiɪz nɪr linaɪn tiθriɔr jɪr zoʊl dɝjɛθhis tɪl θɪŋzæz s tɪf t liæzɛvɝhid rɛsʌʒhɪm sɛl fɪnjænoʊl d b læk f rɑk koʊt ju wɛlisɛv rʌl bʌtʌn z mɪssɪŋʌlɔŋb rɪd k lɪŋz tuhɪztʃɪŋɪvɪŋðoʊʒhuʌb zɝvhɪm jɛpp rʌnaʊn sd filɪŋʌvʌt moʊs t rɪs pɛk t wɛnhis pik ʃhɪz wɔɪʃhɪzdʒɛs tʌbɪt k rækɝdʌn dwɪr zʌbɪt", + "ref_phonemes": "ju wɪʃ tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛl hi ɪz nɪrli naɪntɪfri jɪrz oʊld jɛt hi stɪl θɪŋks æz kwɪkli æz ɛvɝ hi drɛsʌz hɪmsɛlf ɪn æn oʊld lædprɑp pɔrt juʒʌwʌli sɛvrʌl bʌtʌnz mɪsɪŋ ʌlɔŋ bridz lɪŋks tu hɪz tʃɪn ɡɪvɪŋ ðoʊz hu ʌbzɝv hɪm ʌ prʌnaʊnst filɪŋ ʌv ", + "duration": 2.9110512733459473, + "PER": 47.29064039408867, + "score": { + "S": 22, + "D": 5, + "I": 69, + "N": 203 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "neɪtʃɝis keɪtɪŋæzaʊd mʌðɝɪt sɔl weɪz s wit laɪk kʌt", + "ref_phonemes": "neɪtʃɝ ɪz skeɪtɪŋ æz aʊɝ mʌðɝ ɪts ɔlweɪz swit laɪk hɝ ", + "duration": 0.41884374618530273, + "PER": 13.953488372093023, + "score": { + "S": 4, + "D": 1, + "I": 1, + "N": 43 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hʌn d rɪd naɪn tinaɪn naɪn tieɪt naɪn tisɛvʌn naɪn tisɪk s naɪn tifaɪv naɪn tifɔrnaɪn tiθrinaɪn titunaɪn tiwʌn naɪn tieɪtinaɪneɪtieɪteɪtisɛvʌneɪtisɪk seɪtifaɪveɪtifɔreɪtiθrieɪtitueɪtiwʌneɪt", + "ref_phonemes": "wʌn hʌndrʌd naɪntaɪnti naɪntaɪt naɪntɪvsɪn naɪntɪkis naɪntɪfaɪtɝ naɪntwɪfɝ naɪntɪfri niɪntutioʊ naɪnʃeɪn naɪnti eɪtinaɪn aɪtit eɪtɪɡstʌn aɪtiksɪs eɪtaɪvɪf eɪtifʊr eɪtritɛr eɪtitwɑtoʊ eɪtiʌn eɪti ", + "duration": 0.959073543548584, + "PER": 35.83815028901734, + "score": { + "S": 23, + "D": 22, + "I": 17, + "N": 173 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "neɪtætɪziæs t kɛrɪŋjɛsaʊɝmʌðɝɪtɔl weɪz s wit laɪkhɝ", + "ref_phonemes": "neɪtʃɝ ɪz jɛs kɛrɪŋ æz aʊɝ mʌðɝ ɪt ɔlweɪz swit laɪk hɝ ", + "duration": 0.5839924812316895, + "PER": 18.6046511627907, + "score": { + "S": 6, + "D": 0, + "I": 2, + "N": 43 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɔɡ tɪd boʊnʌmeɪ mk laɪk s baɪkʌɛl sʌwʌn z bʊkɛr dʌn p leɪs t bæs kʌt bɔl", + "ref_phonemes": "dɑrkbit boʊn mɪk laɪts baɪkɝ ɛlsʌ wɑnts bʊk jæ ðæts pleɪst bæskʌtbɔl ", + "duration": 0.5457100868225098, + "PER": 35.08771929824561, + "score": { + "S": 14, + "D": 3, + "I": 3, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "neɪtɝdɪz keɪtɪŋæzaʊɝmʌðɝɪtɔl weɪz s wip laɪkhɝ", + "ref_phonemes": "neɪtʃɝ ɪz kɛrɪŋ æz aʊɝ mʌðɝ ɪt ɔlweɪz swit laɪk hɝ ", + "duration": 0.4093348979949951, + "PER": 15.0, + "score": { + "S": 3, + "D": 1, + "I": 2, + "N": 40 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪlaʊmaɪfæmʌliæn dɪnðʌf jutʃf jutʃɝaɪwɑn t tumeɪk maɪfæmʌlip raʊd", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.4401242733001709, + "PER": 15.09433962264151, + "score": { + "S": 3, + "D": 0, + "I": 5, + "N": 53 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪdoʊn θhæv taɪm tuɡoʊwɪðjuʌn d p leɪɪŋk rɪkʌt", + "ref_phonemes": "aɪ doʊnt hæv taɪm tu ɡoʊ wɪð ju aɪm pleɪɪŋ krɪkʌt ", + "duration": 0.33153390884399414, + "PER": 10.256410256410255, + "score": { + "S": 4, + "D": 0, + "I": 0, + "N": 39 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌneɪtɝɪz vɛriɪɡæk tɪvʌn d fʊlʌv maɪfeɪvɝaɪt ɡ rin kʌlʌl", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlaʊr ", + "duration": 0.30817723274230957, + "PER": 16.0, + "score": { + "S": 4, + "D": 3, + "I": 1, + "N": 50 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪdunɑθhæv taɪm tuɡoʊwɪðjuaɪæm p leɪɪŋk rɪkʌt", + "ref_phonemes": "aɪ du nɑt hæv taɪm tu ɡoʊ wɪð ju aɪ æm pleɪɪŋ krɪkʌt ", + "duration": 0.3289501667022705, + "PER": 2.5, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 40 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "neɪtɪv ɡɪv zʌs f rut s vɛdʒtʌbʌl zʌn d ɡ reɪnztuit", + "ref_phonemes": "meɪk ʌ jus æz fruts vɛdʒtʌbʌlz ʌnd ɡreɪnz tu it ", + "duration": 0.332106351852417, + "PER": 23.684210526315788, + "score": { + "S": 7, + "D": 0, + "I": 2, + "N": 38 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "meɪðʌr juzæz fud z vɛdʒtʌbʌl zʌn d ɡ reɪn z tuit", + "ref_phonemes": "leɪtɝ ɡɪvz ʌs fud wɪð teɪbʌlz ʌnd dreɪnz tu it ", + "duration": 0.2279973030090332, + "PER": 43.24324324324324, + "score": { + "S": 13, + "D": 1, + "I": 2, + "N": 37 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌoʊl dʌs t mɛm bɝʌvðʌfæmʌliɪz maɪɡ ræn d fɑðɝʌn dðʌjʌŋɡʌst mɛm bɝʌv maɪfæmʌliɪz maɪbɛbibɛðɝ", + "ref_phonemes": "ðʌ oʊldʌst mɛmbɝ ʌv ðʌ fæmʌli ɪz maɪ ɡrændfɑðɝ ʌnd ðʌ jʌŋɡʌst mɛmbɝ ʌv maɪ fæmʌli ɪz maɪ vɛri brʌðɝ ", + "duration": 0.7130753993988037, + "PER": 5.0, + "score": { + "S": 3, + "D": 1, + "I": 0, + "N": 80 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hʌn d rʌd naɪn tinaɪn naɪn tieɪt naɪn tisɛvʌn naɪn tisɪk s naɪn tifaɪv naɪn tifɔr naɪn tiθrinaɪn titunaɪn tiwʌn naɪn tieɪtinaɪneɪtieɪteɪtisɛvʌneɪtisɪk seɪtifaɪveɪtifɔreɪtiθrieɪtitueɪtiwʌneɪdi", + "ref_phonemes": "wʌn hʌndrʌd naɪntaɪnti naɪntaɪt naɪntɪvsɪn naɪntɪkis naɪntɪfaɪtɝ naɪntwɪfɝ naɪntɪfri niɪntutioʊ naɪnʃeɪn naɪnti eɪtinaɪn aɪtit eɪtɪɡstʌn aɪtiksɪs eɪtaɪvɪf eɪtifʊr eɪtritɛr eɪtitwɑtoʊ eɪtiʌn eɪti ", + "duration": 0.8687255382537842, + "PER": 35.26011560693642, + "score": { + "S": 23, + "D": 21, + "I": 17, + "N": 173 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wiʃʊd rɪs pɛk tɛn loʊɔl mɛm bɝzʌvʌvðʌfæmʌli", + "ref_phonemes": "wi ʃʊd ɪkspɛkt ʌnd ʌlaʊ ɔl mɛmbɝz ʌv ðʌ fæmʌli ", + "duration": 0.4231739044189453, + "PER": 21.62162162162162, + "score": { + "S": 2, + "D": 3, + "I": 3, + "N": 37 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪnðʌwɪn doʊwɛnɪt s noʊʒhis loʊliteɪk sʌʃɔr t wɔkɪnðʌoʊpʌnɛritʃdeɪ", + "ref_phonemes": "ɪn ðʌ wɪndoʊ wɛn ɪts noʊz hi sloʊli teɪks ʌ ʃɔrt wɔk ɪn ðʌ oʊpʌn ɛr itʃ deɪ ", + "duration": 0.42896103858947754, + "PER": 1.7241379310344827, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 58 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "neɪtɝɪzæz keɪtɪŋæzʌvɝ mʌðɝɪzɪt sɔl weɪs wit laɪk", + "ref_phonemes": "neɪtʃɝ ɪz æz kɛrɪŋ æz aʊɝ mʌðɝ ɪz ɪts ɔlweɪz swit laɪk ", + "duration": 0.3626227378845215, + "PER": 16.27906976744186, + "score": { + "S": 4, + "D": 2, + "I": 1, + "N": 43 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðæneɪn tðɪs wɪðiaɪk raɪdðʌæn dʌfʌlʌf maɪfævɝɪt p lɪn kʌlɝ", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlɝ ", + "duration": 0.44147729873657227, + "PER": 52.083333333333336, + "score": { + "S": 18, + "D": 3, + "I": 4, + "N": 48 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "mɑr mʌ dædɝaɪv dætðʌbʌs s teɪʃʌnɝlibʌt weɪtʌdʌn tɪlðʌbʌs keɪm", + "ref_phonemes": "mɑm ʌnd dæd ɝaɪvd æt ðʌ bʌs steɪʃʌn ɝli bʌt weɪtʌd ʌntɪl ðʌ bʌs keɪm ", + "duration": 0.3961310386657715, + "PER": 5.555555555555555, + "score": { + "S": 0, + "D": 2, + "I": 1, + "N": 54 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɑɡ zit boʊn z maɪk laɪk s baɪt sɛl sʌwɑn t s jɔbʊkædʌm p leɪz bæs kʌt bɔl", + "ref_phonemes": "ðʌ ɔfʃid boʊnz mɪk laɪks baɪts ɛlsʌ wɑnts ʌ bʊk ædʌm pleɪz bæskʌtbɔl ", + "duration": 0.4100606441497803, + "PER": 16.071428571428573, + "score": { + "S": 6, + "D": 1, + "I": 2, + "N": 56 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɑn tinaɪn tineɪn tin sɛvʌn tin sɪk s tin fɪf tifɔr tindætin tɔl lɛvʌn tɛn naɪneɪt sɛvn sɪk s faɪv fɔrθrituwʌn", + "ref_phonemes": "twɛnti naɪntin eɪtin sɛvʌntin fɪftin fɪftin fɔrtin θɝtin twɛlv ɪlɛvʌn tɛn naɪn eɪt sɛvʌn sɪks faɪv fɔr θri tu wʌn ", + "duration": 0.9636573791503906, + "PER": 15.957446808510639, + "score": { + "S": 7, + "D": 6, + "I": 2, + "N": 94 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðɪsjʊdjɪs pɛkaɪm naʊɔl mɛmbɝzʌn tʌfæni", + "ref_phonemes": "wi ʃʊd rɪspɛkt ʌnd naʊ aɪ rɪmɛmbɝ soʊ mʌtʃ taɪm ", + "duration": 0.23151063919067383, + "PER": 60.526315789473685, + "score": { + "S": 17, + "D": 5, + "I": 1, + "N": 38 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "miʃɔr k ɪs pɪkʌn d laʊɔl mɛm bɝzʌvðʌfæmʌli", + "ref_phonemes": "wi ʃʊd rɪspɛkt ʌnd ʌlaʊ ɔl mɛmbɝz ʌv ðʌ fæmʌli ", + "duration": 0.3656606674194336, + "PER": 18.91891891891892, + "score": { + "S": 3, + "D": 3, + "I": 1, + "N": 37 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɑɡ zit boʊn z mɪl k laɪk s baɪk sɛl z wɔn seɪbʊkɛdʌm p leɪs t bæs kʌt bɔl", + "ref_phonemes": "dɑɡz it boʊnz mɪlk laɪks baɪts ɛls wʌns ʌ b��k ʌnd ʌ pleɪs bæskʌt boʊnz ", + "duration": 0.7540929317474365, + "PER": 23.214285714285715, + "score": { + "S": 7, + "D": 3, + "I": 3, + "N": 56 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðɪs tudʌn t s wɛrðʌjunʌfɔr mʌn d ɡoʊsz t tus kul leɪt", + "ref_phonemes": "ðʌ studʌnts wɛr ðʌ junʌfɔrm ʌnd ɡoʊz tu skul deɪli ", + "duration": 0.3203589916229248, + "PER": 14.634146341463413, + "score": { + "S": 3, + "D": 1, + "I": 2, + "N": 41 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌneɪtʃɝɪz vɛriʌt ræk tɪvʌn d fʊlʌv maɪfeɪv jɝaɪt ɡ rin kʌlɝ", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlɝ ", + "duration": 0.36006975173950195, + "PER": 4.166666666666666, + "score": { + "S": 0, + "D": 0, + "I": 2, + "N": 48 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪdunaɪdunɑθhæv taɪm tuɡoʊwɪðjuaɪæm p leɪɪŋk rɪkʌt", + "ref_phonemes": "aɪ du nɑt hæv taɪm tu ɡoʊ wɪð ju aɪ æm pleɪɪŋ krɪkʌt ", + "duration": 0.42789506912231445, + "PER": 15.0, + "score": { + "S": 1, + "D": 0, + "I": 5, + "N": 40 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðɛr neɪtʃɝɪz vɛriʌt ræk tɪvʌn d fʊlʌv maɪfævjɝraɪt ɡ rin kʌlɝd", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlɝ ", + "duration": 0.33467745780944824, + "PER": 16.666666666666664, + "score": { + "S": 2, + "D": 1, + "I": 5, + "N": 48 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪdʌnnoʊhaʊaɪdɪdʌn tsɛl taɪmtuɡoʊwɪðjuaɪæm p leɪɪŋʌn d ɡɛt", + "ref_phonemes": "aɪ dɪdʌnt hæv taɪm tu ɡoʊ wɪð ju aɪ æm pleɪɪŋ krɪkʌt ", + "duration": 0.31243157386779785, + "PER": 46.34146341463415, + "score": { + "S": 8, + "D": 0, + "I": 11, + "N": 41 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪnðʌwɪn tɝwɛnɪt s noʊʒhis loʊliteɪk ʃhɪʃɔr t wɔkɪnðʌoʊpʌnɛritʃ", + "ref_phonemes": "ɪn ðʌ wɪntɝ wɛn ɪt snoʊz ɪt sloʊli teɪks ʌ ʃɔrt wɔk ɪn ðʌ oʊpʌn ɛr itʃ deɪ ", + "duration": 0.5097780227661133, + "PER": 15.789473684210526, + "score": { + "S": 5, + "D": 3, + "I": 1, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪdoʊn θhæv taɪm tuhoʊwɪðjuæn d p leɪɪŋk rɪkʌt", + "ref_phonemes": "aɪ doʊnt hæv taɪm tu ɡoʊ wɪð ju aɪ æm pleɪɪŋ krɪkʌt ", + "duration": 0.26145052909851074, + "PER": 15.0, + "score": { + "S": 5, + "D": 1, + "I": 0, + "N": 40 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "juwɪʃtunoʊɔlʌbaʊt maɪɡ ræn d fɑðɝwɛlhiɪz nɪr linaɪn tiθrijɪr zoʊl d wɪðʌlɔŋbɪɝr d", + "ref_phonemes": "ju wɪʃ tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ wɛl hi ɪz nɪrli naɪntɪfri jɪrz oʊld wɪð ʌ lɔŋ bɪrd ", + "duration": 0.4809858798980713, + "PER": 4.3478260869565215, + "score": { + "S": 2, + "D": 0, + "I": 1, + "N": 69 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌs tudʌn t wɛr ðʌjunʌfɔr mʌn d ɡoʊz tus kul deɪl", + "ref_phonemes": "ðʌ studʌnts wɛr ðʌ junʌfɔrm ʌnd ɡoʊz tu skul deɪ ", + "duration": 0.30631136894226074, + "PER": 5.128205128205128, + "score": { + "S": 0, + "D": 1, + "I": 1, + "N": 39 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hʌn d rʌd naɪn tinaɪn naɪn inaɪn tisɛv naɪn sɪk s naɪn tifaɪn naɪn tifɔr naɪn tiθrinaɪn titunaɪn tiwʌn naɪn tieɪtinaɪneɪieɪtid sɛvʌnɝdisɪk seɪtɪfaɪɝʌfɑʌʌθriʌdʌdudiwʌneɪti", + "ref_phonemes": "wʌn hʌndrʌd naɪntaɪnti naɪntaɪt naɪntɪvsɪn naɪntɪvsɪn naɪntɪfaɪtɝ naɪntwɪfɝ naɪntɪfri niɪntutioʊ naɪnʃeɪn naɪnti eɪtinaɪn aɪtit eɪtɪɡstʌn aɪtiksɪs eɪtaɪvɪf eɪtifʊr eɪtritɛr eɪtitwɑtoʊ eɪtiʌn eɪti ", + "duration": 0.9101371765136719, + "PER": 42.5287356321839, + "score": { + "S": 38, + "D": 31, + "I": 5, + "N": 174 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðæneɪtʃɝdɪz wirʌt ræk tɪvaɪm fʊlʌf maɪfeɪvɝaɪt ɡ rin kʌlɝ", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlɝ ", + "duration": 0.44127655029296875, + "PER": 20.833333333333336, + "score": { + "S": 7, + "D": 1, + "I": 2, + "N": 48 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hʌn d rʌd naɪn tinaɪn naɪn tieɪt naɪn tisɛvʌn naɪn tisɪk s naɪn tifaɪv naɪn tifɔr naɪn tiθrinaɪn titu naɪn tiwʌn naɪn tieɪtinaɪneɪtieɪteɪtisɛvʌneɪtisɪk seɪtifaɪveɪtifɔreɪti��rieɪtitueɪtiwʌneɪti", + "ref_phonemes": "wʌn hʌndrʌd naɪntaɪnti naɪntaɪt naɪntɪvsɪn naɪntɪkis naɪntɪfaɪtɝ naɪntwɪfɝ naɪntɪfri niɪntutioʊ naɪnʃeɪn naɪntaɪnti aɪtit eɪtɪɡstʌn aɪtiksɪs eɪtaɪvɪf eɪtifʊr eɪtritɛr eɪtitwɑtoʊ eɪtiʌn eɪti ", + "duration": 1.214432716369629, + "PER": 39.053254437869825, + "score": { + "S": 22, + "D": 22, + "I": 22, + "N": 169 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɑk sit bɑn s s meɪk laɪk s baɪk siʃɪl sʌvæn ɡɪbɑdʌm p leɪs bæs kʌt bɔl", + "ref_phonemes": "dɑrk ʃit bɑndz meɪk laɪk baɪks ɪsisɛlʌ ɔr væŋk ʌ bʊk ædʌm pleɪz bæskʌtbɔl ", + "duration": 0.526451826095581, + "PER": 31.666666666666664, + "score": { + "S": 10, + "D": 7, + "I": 2, + "N": 60 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪlʌvmaɪfæmʌliʌn dɪnðʌf jutʃɝaɪwɑn t tumeɪk maɪfæmʌlip raʊd", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.40595507621765137, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 53 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "nɪtɝdiz kɝtɪŋnɛðoʊmʌðɝhisɔl weɪs wit laɪkhɝ", + "ref_phonemes": "mitʃɛru skwɛrɪŋ æz aʊɝ mʌðɝ ɪts ɔlweɪz swit laɪk hɝ ", + "duration": 0.2798161506652832, + "PER": 42.857142857142854, + "score": { + "S": 13, + "D": 4, + "I": 1, + "N": 42 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌnɛtʃɝɪz vɛriʌt ræk tɪvʌn d fʊlʌv maɪfæv juraɪt ɡ rin kʌlɝ", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlɝ ", + "duration": 0.2821691036224365, + "PER": 16.666666666666664, + "score": { + "S": 3, + "D": 2, + "I": 3, + "N": 48 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "juwɪʃtunoʊɔlʌbaʊt maɪɡ ræn d fɑðɝwaɪlhiɪz nɪr linaɪn tiθrijɪr zoʊl d jɛθhis tɪlθɪŋksæz fɪf tiæzɛvɝhidaɪsɛʒhɪm sɛl fɪnjʌoʊl db læk f rɑk b læk f rɑk kɑk koʊθhiɪz wʌliɪsɔɛl z bʌtʌn z mɪsɪŋʌlɔŋb rid k lɪŋz tuhɪztʃɪn ɡɪvɪŋɡɪvɪŋðoʊʒhuʌb zɝvhɪmhɪmʌp rʌnʌntuðʌfilɪŋʌvðʌʌt moʊs t rɪs pɛk t wɛnhis pik ʃhɪz vaɪsɪzdʒɛs tʌbaɪt tu k rætʃʌn dɝfɝwɛlzɛbaɪt", + "ref_phonemes": "ju wɪʃ tu noʊ ɔl ʌbaʊt maɪ ɡrændfɑðɝ waɪl hi ɪz nɪrli naɪntɪfri jɪrz oʊld ðæt hi stɪl θɪŋks æz fɪfti æz ɛvɝ hi dæsʌz hɪmsɛlf ɪn ʌ oʊld blæk rɑk ɡɑt ɡʊd vɪʒwʌli hi sɑroʊz bʌtʌnz mɪsɪŋ ʌ lɔŋbrɛd θɪŋz tu hɪz tʃɪn ɡɪvɪŋ ðoʊz hu ʌbzɝv hɪm hɪm hɪm hi meɪ prʌnaʊns jɔr filɪŋ ʌv ðʌ ", + "duration": 3.18963885307312, + "PER": 54.166666666666664, + "score": { + "S": 39, + "D": 2, + "I": 76, + "N": 216 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "jɛt dʌs p udʌn t s wɛrðaɪjunʌfɔr mæn ɡoʊz tus kul deɪli", + "ref_phonemes": "ðʌ studʌnts wɝ ðʌ junʌfɔrm ʌnd ɡoʊz tu skul deɪli ", + "duration": 0.41675353050231934, + "PER": 27.500000000000004, + "score": { + "S": 5, + "D": 1, + "I": 5, + "N": 40 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪnðʌwɪn tɝwɛnɪt s noʊʒhis loʊliteɪk sʌʃɔr t wɔkɪnðʌoʊpʌnɛris tɝd", + "ref_phonemes": "ɪn ðʌ wɪntɝ wɛn ɪt snoʊ ʃi sloʊli teɪks ʌ ʃɔrt wɔk ɪn ðʌ oʊpʌn ɛr itʃ deɪ ", + "duration": 0.42365097999572754, + "PER": 10.714285714285714, + "score": { + "S": 2, + "D": 2, + "I": 2, + "N": 56 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌlaʊmaɪfæmʌliʌn dɪn f jutʃɝaɪwɑn t tumeɪk maɪfæmʌlip raʊd", + "ref_phonemes": "ʌlaʊ maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.29521942138671875, + "PER": 3.8461538461538463, + "score": { + "S": 0, + "D": 2, + "I": 0, + "N": 52 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌoʊl dʌs mɛm bɝʌvðʌfæmʌliɪz maɪɡ ræn d fɑðɝʌn dðʌɪŋɡ lɪʃmɛm bɝʌv maɪfæmʌliɪz maɪbeɪbib rʌðɝ", + "ref_phonemes": "ðʌ oʊldʌst mɛmbɝ ʌv ðʌ fæmʌli ɪz maɪ ɡrændfɑðɝ ʌnd ðʌ ɪŋɡlɪʃ mɛmbɝ ʌv maɪ fæmʌli ɪz maɪ beɪbi brʌðɝ ", + "duration": 0.5478341579437256, + "PER": 1.25, + "score": { + "S": 0, + "D": 1, + "I": 0, + "N": 80 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌneɪtɝɪz wɛriʌk rætuænæn fʊlʌf maɪʌfeɪvɝaɪt ɡ rin fɛlʌ", + "ref_phonemes": "ðʌ neɪtʃɝ ɪz vɛri ʌtræktɪv ʌnd fʊl ʌv maɪ feɪvɝɪt ɡrin kʌlaʊr ", + "duration": 0.5725021362304688, + "PER": 34.0, + "score": { + "S": 9, + "D": 5, + "I": 3, + "N": 50 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðaɪs tudʌn t wɛðaɪjunʌfɔr mʌn d ɡoʊz tus kul deɪli", + "ref_phonemes": "ðʌ studʌnt wɪð ðʌ junʌfɔrm ʌnd ɡoʊz tu skul daɪʌlɪŋ ", + "duration": 0.338411808013916, + "PER": 21.428571428571427, + "score": { + "S": 6, + "D": 2, + "I": 1, + "N": 42 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "t waɪsitʃdeɪhip leɪz s kɪl fʌliʌn d wɪðdʒɛs tʌpɑnʌs mɔlɔr ɡʌnɪk sɛp tɪnðʌwɪn tɝs wɪn tɝ wɛnðaʊs noʊɔraɪs p rɪvɛn t ʃhis loʊliteɪk sʌʃɔr t wɔlkɪnðʌoʊpʌnðʌoʊpʌneɪritʃrɪwɑn t wihaʊɔfʌnʌdʒɝhɪm tuwɔk mɔræn dðʌs moʊk lɛs bʌθhiɔl weɪzæn sɝz bʌnænʌɔɪl ɡ ræn d fɑðɝlaɪk s tubimɑdɝnɪnhɪz læŋɡ wʌdʒ", + "ref_phonemes": "twaɪs itʃ deɪ hi pleɪz skɪfli ʌnd wɪð dʒʌst ʌpɑn ʌ smɔl ɔrɡʌn ɪksɛpt ɪn ðʌ wɪntɝ wɪntɝ wɛn ðʌ snoʊ ɔr aɪs prɪvɛnts hi sloʊli teɪks ʌ ʃɔrt wɔk ɪn ðʌ oʊpʌn ɪn ðʌ oʊpʌn ɛr itʃ deɪ wʌt wi hæv ɔfʌn ɝdʒ hɪm tu wɔk mɔr ʌnd smoʊk lɛs bʌt hi ɔl ", + "duration": 2.6686084270477295, + "PER": 42.857142857142854, + "score": { + "S": 11, + "D": 3, + "I": 64, + "N": 182 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌoʊl dʌs t mɛm bɝʌvðʌfæmʌlimaɪɡ ræn d fɑðɝʌn dðʌjʌŋɡʌs t mɛm bɝʌv maɪfæmʌlimaɪbeɪbib rʌðɝ", + "ref_phonemes": "ðʌ oʊldʌst mɛmbɝ ʌv ðʌ fæmʌli ɪz maɪ ɡrændfɑðɝ ʌnd ðʌ jʌŋɡʌst mɛmbɝ ʌv maɪ fæmʌli ɪz maɪ beɪbi brʌðɝ ", + "duration": 0.626854658126831, + "PER": 4.938271604938271, + "score": { + "S": 0, + "D": 4, + "I": 0, + "N": 81 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɑɡ zit boʊn z meɪk lɛɡ z baɪtɪl zʌwɑn tʌbʌlædʌm p leɪz bæs kʌt bɔl", + "ref_phonemes": "dɑɡz it boʊnz meɪk lɛɡz baɪt ɛlsʌ wɑnts ʌ bʊk ʌðɝ pleɪs bæskʌtbɔl ", + "duration": 0.3514416217803955, + "PER": 18.867924528301888, + "score": { + "S": 6, + "D": 2, + "I": 2, + "N": 53 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "neɪtɛizæz ɡæriɪŋɡææz jɔrʌbɝmʌðɝɪtɔl weɪz s wit laɪkhɝ", + "ref_phonemes": "neɪtʃɝ ɪz æz kɛrɪŋ æz aʊɝ mʌðɝ ɪt ɔlweɪz swit laɪk hɝ ", + "duration": 0.6878159046173096, + "PER": 30.952380952380953, + "score": { + "S": 6, + "D": 1, + "I": 6, + "N": 42 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "tʃɝneɪtʃɝɪzæz ɡɛrɪŋæzaʊɝæzaʊɝmʌðɝɪtɪzɔl weɪz s wit laɪkhɝ", + "ref_phonemes": "neɪtʃɝ ɪz æz kɛrɪŋ æz aʊɝ mʌðɝ ɪt ɪz ɔlweɪz swit laɪk hɝ ", + "duration": 0.556912899017334, + "PER": 20.454545454545457, + "score": { + "S": 1, + "D": 0, + "I": 8, + "N": 44 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪloʊnʌfæmʌliʌn d lɪnðʌf juætaɪwɑn t tumeɪk maɪfæmʌlip raʊd", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.48354220390319824, + "PER": 21.568627450980394, + "score": { + "S": 4, + "D": 3, + "I": 4, + "N": 51 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "neɪtɝiɪzneɪtɝiziæz kɛrɪŋæzaʊɝmʌðɝɪtɔl weɪztus wit laɪkhɝ", + "ref_phonemes": "neɪtʃɝ ɪz æz kɛrɪŋ æz aʊɝ mʌðɝ ɪt ɔlweɪz swit laɪk hɝ ", + "duration": 0.5639564990997314, + "PER": 28.57142857142857, + "score": { + "S": 0, + "D": 1, + "I": 11, + "N": 42 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɑɡ zit boʊn z maɪk lɛɡ s baɪk sɛl sʌwɑn t sʌbʊkʌn dɛm p leɪz bæs kʌt bɔl", + "ref_phonemes": "dɔɡ sid boʊnz maɪklaɪk spaɪks ɛlsʌ wɑnts ʌ bʊk ʌnd ʌ pleɪs bæskʌt boʊnz ", + "duration": 0.5472123622894287, + "PER": 24.137931034482758, + "score": { + "S": 10, + "D": 3, + "I": 1, + "N": 58 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪlʌv maɪfæmʌliʌn dɪn f jutʃɝaɪwɑn t tumeɪk maɪfæmʌlip raʊd", + "ref_phonemes": "aɪ lʌv maɪ fæmʌli ʌnd ɪn ðʌ fjutʃɝ aɪ wɑnt tu meɪk maɪ fæmʌli praʊd ", + "duration": 0.37558627128601074, + "PER": 3.7735849056603774, + "score": { + "S": 0, + "D": 2, + "I": 0, + "N": 53 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.3646395206451416, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sut��n ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.25731658935546875, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "kɑfiɪz ɡ roʊnɑn s tipdʒʌŋɡʌl laɪk s loʊp sɪn tɛm p rʌt zoʊn z", + "ref_phonemes": "kɑfi ɪz ɡroʊn ɑn stip dʒʌŋɡlʌkaɪ sloʊps ɪn tɛmprʌt zoʊnz ", + "duration": 0.33757972717285156, + "PER": 8.51063829787234, + "score": { + "S": 1, + "D": 1, + "I": 2, + "N": 47 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "t ræfɪk f rik wʌn t lihæz feɪl d tumɛʒɝʌp tuɛndʒʌnɪr z roʊziɛs tʌmʌt s", + "ref_phonemes": "træfɪk frikwʌntli hæz feɪld tu mɛʒɝ ʌp tu ɛndʒʌnɪrz ' roʊzi ɛstʌmʌts ", + "duration": 0.3579399585723877, + "PER": 1.7543859649122806, + "score": { + "S": 0, + "D": 1, + "I": 0, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "mɛniwɛlθitaɪkun z s p lɝdʒdʌn d bɑt boʊθʌjɑtʌn dʌs kunɝ", + "ref_phonemes": "mɛni wɛlθi taɪkunz splɝdʒd ʌnd bɑt boʊθ ʌ jɑt ʌnd ʌ skunɝ ", + "duration": 0.34041881561279297, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 46 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hipɪk tʌp naɪn pɛr zʌv sɑk s fɔritʃb rʌðɝ", + "ref_phonemes": "hi pɪkt ʌp naɪn pɛrz ʌv sɑks fɔr itʃ brʌðɝ ", + "duration": 0.24952459335327148, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 33 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.3230776786804199, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪnðʌlaɪtʌdɪn tɪriɝhisɔʌðɝmɛnʌn d wɪmʌn s t rʌɡʌlɪŋɪn tuðɛr ræf t s", + "ref_phonemes": "ɪn ðʌ laɪtʌd ɪntɪriɝ hi sɔ ʌðɝ mɛn ʌnd wɪmʌn strʌɡʌlɪŋ ɪntu ðɛr ræps ", + "duration": 0.2641417980194092, + "PER": 3.6363636363636362, + "score": { + "S": 1, + "D": 0, + "I": 1, + "N": 55 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ful ʒhibeɪd wʌt dujuθɪŋk juɑr duɪŋ", + "ref_phonemes": "fulz hi beɪd wʌt du ju θɪŋk ju ɑr duɪŋ ", + "duration": 0.2819404602050781, + "PER": 3.4482758620689653, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 29 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌp ris kulɝkʊdʌn t vɝbʌlaɪʒhɝfilɪŋzʌbaʊtðʌɪmɝdʒʌn sikʌn dɪʃʌn z", + "ref_phonemes": "ðʌ priskulɝ kʊdʌnt vɝbʌlaɪz hɝ filɪŋz ʌbaʊt ðʌ ɪmɝdʒʌnsi kʌndɪʃʌnz ", + "duration": 0.31288981437683105, + "PER": 1.7543859649122806, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hiwɪl seɪðætaʊɝkʌn t riɪzivɪn naʊʌhoʊmʌdʒʌnʌs kʌm junʌti", + "ref_phonemes": "hi wɪl seɪ ðæt aʊɝ kʌntri ɪz ivɪn naʊ ʌ hoʊmʌdʒiniʌs kʌmjunʌti ", + "duration": 0.26396918296813965, + "PER": 3.9215686274509802, + "score": { + "S": 1, + "D": 1, + "I": 0, + "N": 51 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.25334835052490234, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.277935266494751, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɛvʌdʌn sðætʌðɝsɔr sʌzʌv fʌnæn sɪŋɑrʌnʌveɪlʌbʌl mʌs t bip rʌvaɪdʌd", + "ref_phonemes": "ɛvʌdʌns ðæt ʌðɝ sɔrsʌz ʌv fʌnænsɪŋ ɑr ʌnʌveɪlʌbʌl mʌst bi prʌvaɪdʌd ", + "duration": 0.34517621994018555, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃiɔl weɪzdʒoʊk sʌbaʊt tumʌtʃɡɑr lɪkɪnhɪz fud", + "ref_phonemes": "ʃi ɔlweɪz dʒoʊks ʌbaʊt tu mʌtʃ ɡɑrlɪk ɪn hɪz fud ", + "duration": 0.2733612060546875, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 39 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðeɪp leɪd k rækðʌwɪpʌf jumɪnʌt s wɪθaʊt mɪʃhæp", + "ref_phonemes": "ðeɪ pleɪd kræk ðʌ wɪp ʌ fju mɪnʌts wɪθaʊt mɪʃhæp ", + "duration": 0.27144956588745117, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 39 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2582509517669678, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.3343315124511719, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌdaɪʌɡ noʊsʌs wɑz dɪs kɝʌdʒɪŋhaʊɛvɝhiwɑz nɑtoʊvɝliwɝid", + "ref_phonemes": "ðʌ daɪʌɡnoʊsʌs wɑz dɪskɝʌdʒɪŋ haʊɛvɝ hi wɑz nɑt oʊvɝli wɝid ", + "duration": 0.2868340015411377, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 50 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌðɝmɔr fʌlɑdʒɪkʌl fɪzɪkʌlʌn dɑp tɪkʌl p rɑpɝtivæl juzɑrɔl soʊɡɪvʌn", + "ref_phonemes": "ʌðɝ mɔrfʌlɑdʒɪkʌl fɪzɪkʌl ʌnd ɑptɪkʌl prɑpɝti væljuz ɑr ɔlsoʊ ɡɪvʌn ", + "duration": 0.5768539905548096, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 58 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.20670747756958008, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.21218013763427734, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "bʌtðɪsɛsʌl tɛrɪk dɑk t rʌn wɑz lɔs tɪnðʌʃʌfʌl tuʌk waɪɝs pɛʃʌl paʊɝz", + "ref_phonemes": "bʌt ðɪs ɛsʌtɛrɪk dɑktrʌn wɑz lɔst ɪn ðʌ ʃʌfʌl tu ʌkwaɪɝ spɛʃʌl paʊɝz ", + "duration": 0.3331320285797119, + "PER": 1.7857142857142856, + "score": { + "S": 0, + "D": 0, + "I": 1, + "N": 56 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.3088524341583252, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.29848408699035645, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.3250420093536377, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2686800956726074, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.25521373748779297, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hirɪlik rusʌfaɪðhɪmhineɪl dɪt fɔrʌjɑr d lɔs", + "ref_phonemes": "hi rɪli krusʌfaɪd hɪm hi neɪld ɪt fɔr ʌ jɑrd lɔs ", + "duration": 0.31858229637145996, + "PER": 2.631578947368421, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 38 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðɛr wɑzʌdʒaɪɡæn tɪk wɑs p nɛk s t tuɝvɪŋz bɪɡ tɑphæt", + "ref_phonemes": "ðɛr wɑz ʌ dʒaɪɡæntɪk wɑsp nɛkst tu ɝvɪŋz bɪɡ tɑp hæt ", + "duration": 0.30266857147216797, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 42 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.27071142196655273, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "mɑr kʌt sʃʊd bɪkʌm mɔr kʌm pɛtʌtɪvæz kʌn sumɝz bɪkʌm mɔr sʌlɛk tɪv", + "ref_phonemes": "mɑrkʌts ʃʊd bɪkʌm mɔr kʌmpɛtʌtɪv æz kʌnsumɝz bɪkʌm mɔr sʌlɛktɪv ", + "duration": 0.2541673183441162, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 54 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɝɪdʒʌnʌl zɑr nɑt nɛsʌsɛrʌliɡʊdʌn dædæp teɪʃʌn zɑr nɑt nɛsʌsɛrʌlibæd", + "ref_phonemes": "ɝɪdʒʌnʌlz ɑr nɑt nɛsʌsɛrʌli ɡʊd ʌnd ædæpteɪʃʌnz ɑr nɑt nɛsʌsɛrʌli bæd ", + "duration": 0.32506442070007324, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 59 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2699563503265381, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wɪðɪnʌsɪs tʌmhaʊɛvɝðʌɔtɑnʌmiʌvitʃmɛm bɝlaɪb rɛriɪz p rʌzɝv d", + "ref_phonemes": "wɪðɪn ʌ sɪstʌm haʊɛvɝ ðʌ ɔtɑnʌmi ʌv itʃ mɛmbɝ laɪbrɛri ɪz prʌzɝvd ", + "duration": 0.34073710441589355, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 54 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "tup ripɛr mʌs tɝd k rim b lɛn d mʌs tɝd wɪðɪnʌf wɔtɝtumeɪkʌθɪn peɪs t", + "ref_phonemes": "tu pripɛr mʌstɝd krim blɛnd mʌstɝd wɪð ɪnʌf wɔtɝ tu meɪk ʌ θɪn peɪst ", + "duration": 0.3415050506591797, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 55 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.23424100875854492, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.28490686416625977, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hɪz feɪl jɝtuoʊpʌnðʌs tɔr baɪeɪt kɑs θhɪmhɪzdʒɑb", + "ref_phonemes": "hɪz feɪljɝ tu oʊpʌn ðʌ stɔr baɪ eɪt kɑst hɪm hɪz dʒɑb ", + "duration": 0.2961854934692383, + "PER": 2.380952380952381, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 42 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hikæn fɔrɪɡ zæm pʌl p rizɛn t sʌɡ n ɪfɪkʌn t junʌvɝsʌtiwaɪdɪʃuz tuðʌsɛnʌt", + "ref_phonemes": "hi kæn fɔr ɪɡzæmpʌl prɛzʌnt sʌɡnɪfɪkʌnt junʌvɝstʌfaɪtɝ ɪʃuz tu ðʌ sɛnʌt ", + "duration": 0.35698723793029785, + "PER": 11.475409836065573, + "score": { + "S": 5, + "D": 1, + "I": 1, + "N": 61 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.29200267791748047, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.29054856300354004, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌɡ raʊn ðhɑɡ k lɪr lisɔhɪzʃædoʊbʌt s teɪdaʊtoʊn liʌmoʊmʌn t", + "ref_phonemes": "ðʌ ɡraʊnðhɑɡ klɪrli sɔ hɪz ʃædoʊ bʌt steɪd aʊt oʊnli ʌ moʊmʌnt ", + "duration": 0.302931547164917, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 51 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃih��d jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2468574047088623, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.25621819496154785, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðɛrʃʊd binoʊrizʌn tumɪsɪn tɝp rʌtɔrɪɡ nɔrðʌɪn tɛn tʌvðɪs lɛtɝ", + "ref_phonemes": "ðɛr ʃʊd bi noʊ rizʌn tu mɪsɪntɝprʌt ɔr ɪɡnɔr ðʌ ɪntɛnt ʌv ðɪs lɛtɝ ", + "duration": 0.32408952713012695, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 53 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.26096630096435547, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌdɛd s pɪrʌt sɑk jʌpaɪdʌp rɑmʌnʌn t p leɪsɪnɛvɝihoʊpʌn dɪnɛvɝifɪr", + "ref_phonemes": "ðʌ dɛd spɪrʌts ɑkjʌpaɪd ʌ prɑmʌnʌnt pleɪs ɪn ɛvɝi hoʊp ʌnd ɪn ɛvɝi fɪr ", + "duration": 0.3547379970550537, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌθɪkɛl m fɔrʌs t wɑz nɪr lioʊvɝwɛl m d baɪdʌtʃɛl m dɪziz", + "ref_phonemes": "ðʌ θɪk ɛlm fɔrʌst wɑz nɪrli oʊvɝwɛlmd baɪ dʌtʃ ɛlm dɪziz ", + "duration": 0.37575507164001465, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 46 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.27382397651672363, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.24404120445251465, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.28731369972229004, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.25509142875671387, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðɪs p rɑsɛsɪzʌs pɛʃlidɪfʌkʌl t sɪn sdʒaɪroʊd rɪf tɪŋɪz tɪpɪkʌliræn dʌm", + "ref_phonemes": "ðɪs prɑsɛs ɪz ʌspɛʃli dɪfʌkʌlt sɪns dʒaɪroʊ drɪftɪŋ ɪz tɪpɪkli rændʌm ", + "duration": 0.3543276786804199, + "PER": 1.694915254237288, + "score": { + "S": 0, + "D": 0, + "I": 1, + "N": 59 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.30155444145202637, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌwɔtɝkʌn teɪn d tumʌtʃk lɔrinʌn d s tʌŋhɪzaɪz", + "ref_phonemes": "ðʌ wɔtɝ kʌnteɪnd tu mʌtʃ klɔrin ʌnd stʌŋ hɪz aɪz ", + "duration": 0.25768113136291504, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 39 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "waɪdoʊn tðeɪtɛl miðɛm sɛl v zɪfɪt bɑðɝzðɛm", + "ref_phonemes": "waɪ doʊnt ðeɪ tɛl mi ðɛmsɛlvz ɪf ɪt bɑðɝz ðɛm ", + "duration": 0.2756073474884033, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 36 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.17646169662475586, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "sɔl idɛpʌzɪʃʌnɪzɪvæl jueɪtʌd baɪwɑʃɪŋk lin s wɑtʃɪz wɪððʌdɝtiwʌn z", + "ref_phonemes": "sɔɪl ridɛpʌzɪʃʌn ɪz ɪvæljueɪtʌd baɪ wɑʃɪŋ klin swɑtʃʌz wɪð ðʌ dɝti wʌnz ", + "duration": 0.4310646057128906, + "PER": 5.0, + "score": { + "S": 1, + "D": 2, + "I": 0, + "N": 60 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "s mæʃlaɪt bʌl b zʌn dðɛr kæʃvæl juwɪl dɪmɪnɪʃtunʌθɪŋ", + "ref_phonemes": "smæʃ laɪtbʌlbz ʌnd ðɛr kæʃ vælju wɪl dɪmɪnɪʃ tu nʌθɪŋ ", + "duration": 0.2521669864654541, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 44 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2617511749267578, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðɛrɪz lɪtʌl daʊtðætðʌs tudʌn t s bɛnʌfɪt f rʌm voʊkeɪʃʌnʌlɛdʒʌkeɪʃʌn", + "ref_phonemes": "ðɛr ɪz lɪtʌl daʊt ðæt ðʌ studʌnts bɛnʌfɪt frʌm voʊkeɪʃʌnʌl ɛdʒʌkeɪʃʌn ", + "duration": 0.30736708641052246, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 59 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2971651554107666, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænʌɡliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.27147865295410156, + "PER": 6.25, + "score": { + "S": 2, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌsɪɡɝɛt sɪnðʌk leɪæʃt reɪoʊvɝf loʊdɑn tuðʌoʊk teɪbʌl", + "ref_phonemes": "ðʌ sɪɡɝɛts ɪn ðʌ kleɪ æʃtreɪ oʊvɝfloʊd ɑntu ðʌ oʊk teɪbʌl ", + "duration": 0.30188918113708496, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 47 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.28130507469177246, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2899038791656494, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2941591739654541, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.34290504455566406, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.278261661529541, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "sʌmʌb zɝvɝz s pɛk jʌleɪtʌdðætðɪs maɪt bihɪz rivɛndʒɑnhɪʒhoʊm taʊn", + "ref_phonemes": "sʌm ʌbzɝvɝz spɛkjʌleɪtʌd ðæt ðɪs maɪt bi hɪz rivɛndʒ ɑn hɪz hoʊm taʊn ", + "duration": 0.34465479850769043, + "PER": 1.7543859649122806, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.24314117431640625, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2811732292175293, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.2977883815765381, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænoʊliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.18869495391845703, + "PER": 6.25, + "score": { + "S": 2, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wɪððʌs p rɪŋreɪn zðʌf loʊroʊz ræpʌd lidutuɪn fɪl t reɪʃʌnɪnoʊpʌn suɝz", + "ref_phonemes": "wɪð ðʌ sprɪŋ reɪnz ðʌ floʊ roʊz ræpʌdli du tu ɪnfɪltreɪʃʌn ɪn oʊpʌn suɝz ", + "duration": 0.3584012985229492, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 59 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "baɪðʌlʊkʌvhɪmhiwɑzʌn tðæt fɑr ɡɔn", + "ref_phonemes": "baɪ ðʌ lʊk ʌv hɪm hi wɑzʌnt ðæt fɑr ɡɔn ", + "duration": 0.21589446067810059, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 30 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2893800735473633, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.27084851264953613, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "his lɪp taʊt saɪðhʌɡɪŋðʌwɔl zʌv bɪl dɪŋzʌn d dɑdʒɪŋɪn tudɔr weɪz", + "ref_phonemes": "hi slɪpt aʊtsaɪd hʌɡɪŋ ðʌ wɔlz ʌv bɪldɪŋz ʌnd dɑdʒɪŋ ɪntu dɔrweɪz ", + "duration": 0.38501715660095215, + "PER": 1.8518518518518516, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 54 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2932872772216797, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "k waɪtɔfʌnhʌnibiz fɔr mʌmʌdʒɔrʌtiɑnðʌwɪloʊkæt kɪn z", + "ref_phonemes": "kwaɪt ɔfʌn hʌnibiz fɔrm ʌ mʌdʒɔrʌti ɑn ðʌ wɪloʊ kætkʌnz ", + "duration": 0.23620915412902832, + "PER": 2.1739130434782608, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 46 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪf jujuz pɑr kɪŋʌtɛn dʌn t s kænðeɪbirip leɪs t baɪɔtʌmætɪk pɑr kɪŋɡeɪt s", + "ref_phonemes": "ɪf ju juz pɑrkɪŋ ʌtɛndʌnts kæn ðeɪ bi ripleɪst baɪ ɔtʌmætɪk pɑrkɪŋ ɡeɪts ", + "duration": 0.3262803554534912, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 60 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "kæn jɔrɪnʃʊrʌn s kʌm pʌnieɪd juɪn rʌdusɪŋʌd mɪnɪs t reɪtɪv kɑs t s", + "ref_phonemes": "kæn jɔr ɪnʃʊrʌns kʌmpʌni eɪd ju ɪn rʌdusɪŋ ʌdmɪnʌstreɪtɪv kɑsts ", + "duration": 0.31185197830200195, + "PER": 1.8518518518518516, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 54 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.27300024032592773, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.229661226272583, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wikʌn ɡ rætʃʌleɪtðʌɪn taɪɝmɛm bɝʃɪpɑnɪt s rɛkɝdʌv ɡʊd lɛdʒʌs leɪʃʌn", + "ref_phonemes": "wi kʌŋrætʃʌleɪt ðʌ ɪntaɪɝ mɛmbɝʃɪp ɑn ɪts rɛkɝd ʌv ɡʊd lɛdʒʌsleɪʃʌn ", + "duration": 0.33844947814941406, + "PER": 3.508771929824561, + "score": { + "S": 1, + "D": 0, + "I": 1, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.259232759475708, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃihæd jɔr dɑr k sutɪn ɡ risiwɑʃwɔtɝɔl jɪr", + "ref_phonemes": "ʃi hæd jɔr dɑrk sut ɪn ɡrisi wɑʃ wɔtɝ ɔl jɪr ", + "duration": 0.27231812477111816, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "æt noʊtaɪm wɝældʒifaʊn dɪnðʌmɪk s t lɪkɝ", + "ref_phonemes": "æt noʊ taɪm wɝ ældʒi faʊnd ɪn ðʌ mɪkst lɪkɝ ", + "duration": 0.2942821979522705, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 34 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "æzʌp rikɔʃʌnðʌaʊt lɔz bɑt ɡʌn paʊdɝfɔrðɛr s t rɔŋhoʊl d", + "ref_phonemes": "æz ʌ prikɔʃʌn ðʌ aʊtlɔz bɑt ɡʌnpaʊdɝ fɔr ðɛr strɔŋhoʊld ", + "duration": 0.3215196132659912, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 46 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌvaʊdeɪθiʌs t sɔr f riθɪŋkɝzɑr soʊrɛræz tubiʌk jʊriɑsʌti", + "ref_phonemes": "ʌvaʊd eɪθiʌsts ɔr friθɪŋkɝz ɑr soʊ rɛr æz tu bi ʌ kjʊriɑsʌti ", + "duration": 0.3504617214202881, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 49 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "laɪkɪnʌf wilɔl biʌpɑn tɑp baɪsʌn daʊn", + "ref_phonemes": "laɪk ɪnʌf wil ɔl bi ʌp ɑn tɑp baɪ sʌndaʊn ", + "duration": 0.23646807670593262, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.25362658500671387, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "mɛniwɛlθitaɪkun z s p lɝdʒdʌn d bɑt boʊθʌjɑtʌn dʌs kunɝ", + "ref_phonemes": "mɛni wɛlθi taɪkunz splɝdʒd ʌnd bɑt boʊθ ʌ jɑt ʌnd ʌ skunɝ ", + "duration": 0.3415830135345459, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 46 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "s mæʃlaɪt bʌl b zʌn dðɛr kæʃvæl juwɪl dɪmɪnɪʃtunʌθɪŋ", + "ref_phonemes": "smæʃ laɪtbʌlbz ʌnd ðɛr kæʃ vælju wɪl dɪmɪnɪʃ tu nʌθɪŋ ", + "duration": 0.29656004905700684, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 44 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪnðʌlɔŋrʌnɪt peɪz tubaɪk wɑlʌtik loʊðɪŋ", + "ref_phonemes": "ɪn ðʌ lɔŋ rʌn ɪt peɪz tu baɪ kwɑlʌti kloʊðɪŋ ", + "duration": 0.34152650833129883, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 35 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2894899845123291, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌp ris kulɝkʊdʌn t vɝbʌlaɪʒhɝfilɪŋnzʌbaʊtðʌɪmɝdʒʌn sikʌn dɪʃʌn z", + "ref_phonemes": "ðʌ priskulɝ kʊdʌnt vɝbʌlaɪz hɝ filɪŋz ʌbaʊt ðʌ ɪmɝdʒʌnsi kʌndɪʃʌnz ", + "duration": 0.29825735092163086, + "PER": 3.508771929824561, + "score": { + "S": 1, + "D": 0, + "I": 1, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "doʊn tæs k mitukæriænɔɪliræɡ laɪkðæt", + "ref_phonemes": "doʊnt æsk mi tu kæri æn ɔɪli ræɡ laɪk ðæt ", + "duration": 0.2092297077178955, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌɪŋɡ lɪʃfɔr wɝdɪd tuðʌf rɛntʃbæs kʌt sʌv f la��ɝzʌv wɪtʃðeɪhæd meɪdʌp lɛn tʌfʌl p rʌvɪʒʌn tuɡ ritðʌɝaɪvʌlʌvðʌjʌŋp rɪn sɛsðʌf rɛntʃɪn rɪtɝnɪn vaɪtʌdðʌɪŋɡ lɪʃtuʌsʌpɝwɪtʃwɑz tubiɡɪvʌnðʌnɛk s t deɪ", + "ref_phonemes": "ðʌ ɪŋɡlɪʃ fɔrwɝdɪd tu ðʌ frɛntʃ bæskʌts ʌv flaʊɝz ʌv wɪtʃ ðeɪ hæd meɪd ʌ plɛntʌfʌl prʌvɪʒʌn tu ɡrit ðʌ ɝaɪvʌl ʌv ðʌ jʌŋ prɪnsɛs ðʌ frɛntʃ ɪn rɪtɝn ɪnvaɪtʌd ðʌ ɪŋɡlɪʃ tu ʌ sʌpɝ wɪtʃ wɑz tu bi ɡɪvʌn ðʌ nɛkst deɪ ", + "duration": 1.0153682231903076, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 167 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "kʌn ɡ rætʃʌleɪʃʌn z wɝpɔr dɪnʌpɑnðʌp rɪn sɛsɛv riwɛr dʊrɪŋhɝdʒɝni", + "ref_phonemes": "kʌŋrætʃʌleɪʃʌnz wɝ pɔrd ɪn ʌpɑn ðʌ prɪnsɛs ɛvriwɛr dʊrɪŋ hɝ dʒɝni ", + "duration": 0.3153502941131592, + "PER": 3.6363636363636362, + "score": { + "S": 1, + "D": 0, + "I": 1, + "N": 55 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "f rʌmðʌrɪs pɛk t peɪðhɝɑnɔl saɪd zʃisim d laɪkʌk winʌn d f rʌmðʌædɝeɪʃʌn wɪðwɪtʃʃiwɑz t ritʌd baɪtuɔrθriʃiʌpɪr dænʌbdʒɛk tʌv wɝʃʌpðʌk win mʌðɝɡeɪvðʌf rɛntʃðʌmoʊs tʌfɛkʃʌnʌt rɪsɛpʃʌn f ræn s wɑʒhɝneɪtɪv kʌn t riʌn dʃihæd sʌfɝd tumʌtʃʌnhæpinʌsɪnɪŋɡ lʌn d fɔrɪŋɡ lʌn d tuhæv meɪðhɝfɝɡɛt f ræn s", + "ref_phonemes": "frʌm ðʌ rɪspɛkt peɪd hɝ ɑn ɔl saɪdz ʃi simd laɪk ʌ kwin ʌnd frʌm ðʌ ædɝeɪʃʌn wɪð wɪtʃ ʃi wɑz tritʌd baɪ tu ɔr θri ʃi ʌpɪrd æn ʌbdʒɛkt ʌv wɝʃʌp ðʌ kwin mʌðɝ ɡeɪv ðʌ frɛntʃ ðʌ moʊst ʌfɛkʃʌnʌt rɪsɛpʃʌn fræns wɑz hɝ neɪtɪv kʌntri ʌnd ʃi hæd sʌfɝd tu mʌtʃ ʌnhæpinɪs ɪn ɪŋɡlʌnd fɔr ɪŋɡlʌnd tu hæv meɪd hɝ fɝɡɛt fræns ", + "duration": 1.8581867218017578, + "PER": 1.6194331983805668, + "score": { + "S": 4, + "D": 0, + "I": 0, + "N": 247 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃitɔθhɝdɔtɝðɛn baɪhɝoʊnʌfɛkʃʌn fɔrɪtðæt lʌv fɔrʌkʌn t riwɛrðeɪhæd boʊθbɪnhɑs pɪtʌb lirʌsiv dʌn d wɛrʌb rɪl jʌn t f jutʃɝoʊpʌn d fɔrðɛm", + "ref_phonemes": "ʃi tɔt hɝ dɔtɝ ðɛn baɪ hɝ oʊn ʌfɛkʃʌn fɔr ɪt ðæt lʌv fɔr ʌ kʌntri wɛr ðeɪ hæd boʊθ bɪn hɑspʌtʌbli rʌsivd ʌnd wɛr ʌ brɪljʌnt fjutʃɝ oʊpʌnd bɪfɔr ðɛm ", + "duration": 0.7474658489227295, + "PER": 3.418803418803419, + "score": { + "S": 2, + "D": 2, + "I": 0, + "N": 117 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌkaʊn θhædθroʊnhɪm sɛl f bækɑnhɪz sit linɪŋhɪzʃoʊl dɝzʌɡɛn s tðʌpɑr tɪʃʌnʌvðʌtɛn tʌn d rɪmeɪn dðʌʃhɪz feɪs bɛridɪnhɪʒhæn d z wɪðhivɪŋtʃɛs tʌn d rɛs t lʌs lɪm z", + "ref_phonemes": "ðʌ kaʊnt hæd θroʊn hɪmsɛlf bæk ɑn hɪz sit linɪŋ hɪz ʃoʊldɝz ʌɡɛnst ðʌ pɑrtɪʃʌn ʌv ðʌ tɛnt ʌnd rɪmeɪnd ðʌs hɪz feɪs bɛrid ɪn hɪz hændz wɪð hivɪŋ tʃɛst ʌnd rɛstlʌs lɪmz ", + "duration": 0.99153733253479, + "PER": 2.2388059701492535, + "score": { + "S": 3, + "D": 0, + "I": 0, + "N": 134 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðɪʃhæzɪn did bɪnʌhɝæsɪŋdeɪkʌn tɪn judðʌjʌŋmænhɪzaɪz fɪk s tʌpɑnhɪz f rɛn d", + "ref_phonemes": "ðɪs hæz ɪndid bɪn ʌ hɝæsɪŋ deɪ kʌntɪnjud ðʌ jʌŋ mæn hɪz aɪz fɪkst ʌpɑn hɪz frɛnd ", + "duration": 0.39222264289855957, + "PER": 1.5625, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 64 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "kæn juɪmædʒʌn waɪbʌkɪŋhæmhæz bɪn soʊvaɪʌlʌn taɪsʌs pɛk t", + "ref_phonemes": "kæn ju ɪmædʒʌn waɪ bʌkɪŋhæm hæz bɪn soʊ vaɪʌlʌnt aɪ sʌspɛkt ", + "duration": 0.33504462242126465, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 49 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪtɪz juhuɑr mɪs teɪkʌn raʊlaɪhæv rɛðhɪz dɪs t rɛsɪnhɪzaɪzɪnhɪzɛvɝidʒɛstʃɝʌn dækʃʌnðʌhoʊl deɪ", + "ref_phonemes": "ɪt ɪz ju hu ɑr mɪsteɪkʌn rɑul aɪ hæv rɛd hɪz dɪstrɛs ɪn hɪz aɪz ɪn hɪz ɛvɝi dʒɛstʃɝ ʌnd ækʃʌn ðʌ hoʊl deɪ ", + "duration": 0.5443277359008789, + "PER": 3.6585365853658534, + "score": { + "S": 3, + "D": 0, + "I": 0, + "N": 82 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪæm kʌn vɪn s tʌv wʌtaɪseɪsɛdðʌkaʊn t", + "ref_phonemes": "aɪ æm kʌnvɪnst ʌv wʌt aɪ seɪ sɛd ðʌ kaʊnt ", + "duration": 0.2603292465209961, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 32 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "bʌt kʌn tɪn jud raʊ nɑtɪn tɝʌp tɪd baɪðɪs muv mʌn tʌvhɪz f rɛn ðhɛvʌn bip reɪz dðʌf rɛntʃhuɑr p rʌnaʊn s t tubiθɔt lʌsʌn dɪn dɪs k rit rɛk lʌsivɪnɑr keɪpʌbʌlʌv b rɪŋɪŋʌkɑmʌn d saʊn ddʒʌdʒmʌn t tubɛrɑn mætɝzʌv sʌtʃhaɪɪm pɔr tʌn s", + "ref_phonemes": "bʌt kʌntɪnjud rɑul nɑt ɪntɝʌptɪd baɪ ðɪs muvmʌnt ʌv hɪz frɛnd hɛvʌn bi preɪzd ðʌ frɛntʃ hu ɑr prʌnaʊnst tu bi θɔtlʌs ʌnd ɪndɪskrit rɛklʌs ivɪn ɑr keɪpʌbʌl ʌv brɪŋɪŋ ʌ kɑm ʌnd saʊnd dʒʌdʒmʌnt tu bɛr ɑn mætɝz ʌv sʌtʃ haɪ ɪmpɔrtʌns ", + "duration": 1.055006742477417, + "PER": 2.1505376344086025, + "score": { + "S": 3, + "D": 1, + "I": 0, + "N": 186 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌsɪtɪzðætðʌhʌnɝʌvθriɪz seɪv daʊɝkʌn t riaʊɝmæs tɝzʌn daʊɝoʊn", + "ref_phonemes": "ðʌs ɪt ɪz ðæt ðʌ ɑnɝ ʌv θri ɪz seɪvd aʊɝ kʌntriz aʊɝ mæstɝz ʌnd aʊɝ oʊn ", + "duration": 0.45667195320129395, + "PER": 5.454545454545454, + "score": { + "S": 1, + "D": 1, + "I": 1, + "N": 55 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "jɛsaɪnid ripoʊz mɛniθɪŋʒhævædʒʌteɪtʌd mitudeɪboʊθɪn maɪn dʌn d bɑdiwɛn jurɪtɝn tumɑroʊaɪʃæl noʊlɔŋɡɝbiðʌseɪm mæn", + "ref_phonemes": "jɛs aɪ nid ripoʊz mɛni θɪŋz hæv ædʒʌteɪtʌd mi tu deɪ boʊθ ɪn maɪnd ʌnd bɑdi wɛn ju rɪtɝn tu mɑroʊ aɪ ʃæl noʊ lɔŋɡɝ bi ðʌ seɪm mæn ", + "duration": 0.6459617614746094, + "PER": 0.9900990099009901, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 101 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "bʌtɪnðɪs f rɛn d lip rɛʃɝrælkʊd dɪtɛk tðʌnɝvʌsædʒʌteɪʃʌnʌvʌɡ reɪtɪn tɝnʌl kɑn f lɪk t", + "ref_phonemes": "bʌt ɪn ðɪs frɛndli prɛʃɝ rɑul kʊd dɪtɛkt ðʌ nɝvʌs ædʒʌteɪʃʌn ʌv ʌ ɡreɪt ɪntɝnʌl kɑnflɪkt ", + "duration": 0.46155285835266113, + "PER": 2.73972602739726, + "score": { + "S": 1, + "D": 1, + "I": 0, + "N": 73 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌnaɪt wɑz k lɪr s tɑr lɪtʌn d s p lɛn dʌdðʌtɛm pʌs θhæd pæs tʌweɪʌn dðʌs witɪn f luʌn sɪzʌvðʌiv nɪŋhæd rɪs tɔr d laɪf pisʌn d sɪk jʊrʌtiɛv riwɛr", + "ref_phonemes": "ðʌ naɪt wɑz klɪr stɑrlɪt ʌnd splɛndʌd ðʌ tɛmpʌst hæd pæst ʌweɪ ʌnd ðʌ swit ɪnfluʌnsɪz ʌv ðʌ ivnɪŋ hæd rɪstɔrd laɪf pis ʌnd sɪkjʊrʌti ɛvriwɛr ", + "duration": 0.7665653228759766, + "PER": 0.8695652173913043, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 115 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌpɑnðʌlɑrdʒs k wɛrɪn f rʌn tʌvðʌhoʊtɛlðʌʃædoʊzʌvðʌtɛn t sɪn tɝsɛk tɪd baɪðʌɡoʊl dʌn mun bim z fɔr m dæzɪt wɝʌhjudʒmoʊzeɪɪkʌvdʒɛtʌn d jɛloʊf læɡ s toʊn z", + "ref_phonemes": "ʌpɑn ðʌ lɑrdʒ skwɛr ɪn frʌnt ʌv ðʌ hoʊtɛl ðʌ ʃædoʊz ʌv ðʌ tɛnts ɪntɝsɛktɪd baɪ ðʌ ɡoʊldʌn munbimz fɔrmd æz ɪt wɝ ʌ hjudʒ moʊzeɪɪk ʌv dʒɛt ʌnd jɛloʊ flæɡstoʊnz ", + "duration": 0.7941620349884033, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 128 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "b ræɡʌlʌn wɑtʃt fɔr sʌm taɪmðʌkɑn dʌk tʌvðʌtulʌvɝz lɪsʌn d tuðʌlaʊdʌn dʌn sɪvʌl s lʌm bɝzʌv mænɪkɛm phus nɔr dæzɪm pɪriʌs liæzðoʊhiwɑz wɛrɪŋhɪz b luʌn d ɡoʊl dɪn s tɛdʌvhɪz vaɪʌlɪt sut", + "ref_phonemes": "bræɡʌloʊn wɑtʃt fɔr sʌm taɪm ðʌ kɑndʌkt ʌv ðʌ tu lʌvɝz lɪsʌnd tu ðʌ laʊd ʌnd ʌnsɪvʌl slʌmbɝz ʌv mænɪkæmp hu snɔrd æz ɪmpɪriʌsli æz ðoʊ hi wɑz wɛrɪŋ hɪz blu ʌnd ɡoʊld ɪnstɛd ʌv hɪz vaɪʌlɪt sut ", + "duration": 0.9825656414031982, + "PER": 1.948051948051948, + "score": { + "S": 2, + "D": 1, + "I": 0, + "N": 154 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðeɪwɝsɝtʌn linoʊnɪrɝðʌsʌluʃʌnʌvðɛr p rɑb lʌm", + "ref_phonemes": "ðeɪ wɝ sɝtʌnli noʊ nɪrɝ ðʌ sʌluʃʌn ʌv ðɛr prɑblʌm ", + "duration": 0.23743629455566406, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 40 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌpʊr lɪtʌlθɪŋz k raɪd sɪnθiʌθɪŋkʌvðɛmhævɪŋbɪn tɝn d tuðʌwɔlɔlðiz jɪr z", + "ref_phonemes": "ðʌ pʊr lɪtʌl θɪŋz kraɪd sɪnθiʌ θɪŋk ʌv ðɛm hævɪŋ bɪn tɝnd tu ðʌ wɔl ɔl ðiz jɪrz ", + "duration": 0.3935403823852539, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 62 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "naʊwʌt��zðʌsɛn sʌvɪt tuɪnʌsʌn t beɪbiz laɪkðæt", + "ref_phonemes": "naʊ wʌt wɑz ðʌ sɛns ʌv ɪt tu ɪnʌsʌnt beɪbiz laɪk ðæt ", + "duration": 0.2882883548736572, + "PER": 4.878048780487805, + "score": { + "S": 1, + "D": 1, + "I": 0, + "N": 41 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "bʌtdʒɔɪʃhæd nɑt bɪn lɪsʌnɪŋɔlæt wʌn sʃipʊt daʊnhɝkæn dʌlɑnðʌteɪbʌlʌn d feɪs θhɝkʌm pæn jʌn", + "ref_phonemes": "bʌt dʒɔɪs hæd nɑt bɪn lɪsʌnɪŋ ɔl æt wʌns ʃi pʊt daʊn hɝ kændʌl ɑn ðʌ teɪbʌl ʌnd feɪst hɝ kʌmpænjʌn ", + "duration": 0.4698948860168457, + "PER": 2.564102564102564, + "score": { + "S": 2, + "D": 0, + "I": 0, + "N": 78 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌt wɪn b rʌðɝdɪd sʌmθɪŋʃidɪdʌn t laɪkʌn dʃitɝn ðhɪz pɪktʃɝtuðʌwɔl", + "ref_phonemes": "ðʌ twɪn brʌðɝ dɪd sʌmθɪŋ ʃi dɪdʌnt laɪk ʌnd ʃi tɝnd hɪz pɪktʃɝ tu ðʌ wɔl ", + "duration": 0.3589966297149658, + "PER": 1.7543859649122806, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hɝʒhæpʌn d tubiɑnðʌseɪm f reɪm tubʌtʃiɛvʌdʌn t lidɪdʌn t kɛrʌbaʊtɪt", + "ref_phonemes": "hɝz hæpʌnd tu bi ɪn ðʌ seɪm freɪm tu bʌt ʃi ɛvʌdʌntli dɪdʌnt kɛr ʌbaʊt ðæt ", + "duration": 0.35890769958496094, + "PER": 6.779661016949152, + "score": { + "S": 3, + "D": 1, + "I": 0, + "N": 59 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪθɔt wiwɝs tʌm p tʌɡɛn wɛnaɪfɝs t sɔðæt pɪktʃɝbʌtɪt s bɪnʌv sʌm jusæf tɝɔl", + "ref_phonemes": "aɪ θɔt wi wɝ stʌmpt ʌɡɛn wɛn aɪ fɝst sɔ ðæt pɪktʃɝ bʌt ɪts bɪn ʌv sʌm jus æftɝ ɔl ", + "duration": 0.418790340423584, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 62 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dujusʌpoʊzðʌmɪniʌtʃɝwɑzʌkɑpiʌvðʌseɪmθɪŋ", + "ref_phonemes": "du ju sʌpoʊz ðʌ mɪniʌtʃʊr wɑz ʌ kɑpi ʌv ðʌ seɪm θɪŋ ", + "duration": 0.31195497512817383, + "PER": 5.0, + "score": { + "S": 1, + "D": 1, + "I": 0, + "N": 40 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðeɪwɝimitɛrʌb liʌn d bɪsaɪd zaɪd laɪk tusiwʌtðɪs lʌv lifɝnɪtʃɝlʊk s laɪk wɪθaʊt sʌtʃk wɑn tʌtizʌv dʌs tɔloʊvɝɪt ɡʊd s kim sɪn", + "ref_phonemes": "ðeɪ wɝi mi tɛrʌbli ʌnd bɪsaɪdz aɪd laɪk tu si wʌt ðɪs lʌvli fɝnɪtʃɝ lʊks laɪk wɪθaʊt sʌtʃ kwɑntʌtiz ʌv dʌst ɔl oʊvɝ ɪt ɡʊd skim sɪn ", + "duration": 0.6554384231567383, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 105 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wil kʌmɪnhirðɪsæf tɝnun wɪðoʊl d k loʊðzɑnʌn ðhævʌrɛɡ jʌlɝhaʊs k linɪŋ", + "ref_phonemes": "wil kʌm ɪn hir ðɪs æftɝnun wɪð oʊld kloʊðz ɑn ʌnd hæv ʌ rɛɡjʌlɝ haʊs klinɪŋ ", + "duration": 0.34357285499572754, + "PER": 1.6666666666666667, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 60 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪt kæn θhɝtɛniθɪŋaɪmʃʊr fɔr wiwoʊn t dɪs tɝbθɪŋzætɔl", + "ref_phonemes": "ɪt kænt hɝt ɛniθɪŋ aɪm ʃʊr fɔr wi woʊnt dɪstɝb θɪŋz æt ɔl ", + "duration": 0.32655882835388184, + "PER": 2.2222222222222223, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 45 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðɪsθɔθhaʊɛvɝdɪd nɑtɛn tɝðʌhɛd zʌvðʌɪnθuziæs tɪk pɛr", + "ref_phonemes": "ðɪs θɔt haʊɛvɝ dɪd nɑt ɛntɝ ðʌ hɛdz ʌv ðʌ ɪnθuziæstɪk pɛr ", + "duration": 0.3425126075744629, + "PER": 2.1739130434782608, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 46 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "s mʌɡʌlɪŋðʌhaʊs k linɪŋpɛrʌfɝneɪl jʌɪn tuðʌsɛlɝwɪn doʊʌnʌb s ɝv dðætæf tɝnun p ruv d noʊizitæs k fɔr sɪnθiʌhædædʌdʌwɪs k b rumʌn d dʌs t pæn tuðʌaʊt fɪt", + "ref_phonemes": "smʌɡlɪŋ ðʌ haʊs klinɪŋ pɛrʌfʌneɪljʌ ɪntu ðʌ sɛlɝ wɪndoʊ ʌnʌbʌstɝvd ðæt æftɝnun pruvd noʊ izi tæsk fɔr sɪnθiʌ hæd ædʌd ʌ wɪsk brum ʌnd dʌst pæn tu ðʌ aʊtfɪt ", + "duration": 0.7541806697845459, + "PER": 3.149606299212598, + "score": { + "S": 1, + "D": 2, + "I": 1, + "N": 127 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌlʊr p ruv d tumʌtʃfɔrhɪmʌn ðhikeɪm s pɔr tɪŋæf tɝɪtæz f rɪs k liæzʌjʌŋkɪtʌn mʌtʃtusɪnθiʌz dɪlaɪt wɛnʃikɑt saɪtʌvhɪm", + "ref_phonemes": "ðʌ lʊr pruvd tu mʌtʃ fɔr hɪm ʌnd hi keɪm spɔrtɪŋ æftɝ ɪt æz frɪskʌli æz ʌ jʌŋ kɪtʌn mʌtʃ tu sɪnθiʌz dɪlaɪt wɛn ʃi kɑt saɪt ʌv hɪm ", + "duration": 0.7212660312652588, + "PER": 1.9801980198019802, + "score": { + "S": 1, + "D": 1, + "I": 0, + "N": 101 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "oʊlɛθhɪm kʌmʌlɔŋʃiɝdʒdaɪdulʌv tusihɪmʌbaʊtðætoʊl ðhaʊs", + "ref_phonemes": "oʊ lɛt hɪm kʌm ʌlɔŋ ʃi ɝdʒd aɪ du lʌv tu si hɪm ʌbaʊt ðæt oʊld haʊs ", + "duration": 0.4254567623138428, + "PER": 3.9215686274509802, + "score": { + "S": 2, + "D": 0, + "I": 0, + "N": 51 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "jɛt lɪtʌlæzɪt wɑzɪθhædɔl rɛdimeɪdʌvæs t dɪfɝʌn sɪnðʌæs pɛk tʌvðʌrum", + "ref_phonemes": "jɛt lɪtʌl æz ɪt wɑz ɪt hæd ɔlrɛdi meɪd ʌ væst dɪfɝʌns ɪn ðʌ æspɛkt ʌv ðʌ rum ", + "duration": 0.32015037536621094, + "PER": 1.694915254237288, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 59 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "sɝfʌs dʌs tæt lis θhæd bɪn rimuv dʌn dðʌfaɪnoʊl d fɝnɪtʃɝɡeɪvʌhɪn tʌvɪt s rilɛlʌɡʌn sʌn d pɑlɪʃ", + "ref_phonemes": "sɝfʌs dʌst æt list hæd bɪn rimuvd ʌnd ðʌ faɪn oʊld fɝnɪtʃɝ ɡeɪv ʌ hɪnt ʌv ɪts ril ɛlʌɡʌns ʌnd pɑlɪʃ ", + "duration": 0.49976563453674316, + "PER": 1.2658227848101267, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 79 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌn d maɪpɑkʌt mʌniɪz ɡɛtɪŋloʊʌɡɛnʌn d juhævʌn tɛnilɛf tæz juʒʌwʌl", + "ref_phonemes": "ʌnd maɪ pɑkʌt mʌni ɪz ɡɛtɪŋ loʊ ʌɡɛn ʌnd ju hævʌnt ɛni lɛft æz juʒʌwʌl ", + "duration": 0.3765230178833008, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 56 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðeɪseɪɪlumʌneɪʃʌn baɪkæn dʌl laɪtɪzðʌp rɪtiʌs tɪnðʌwɝl d", + "ref_phonemes": "ðeɪ seɪ ɪlumʌneɪʃʌn baɪ kændʌl laɪt ɪz ðʌ prɪtiʌst ɪn ðʌ wɝld ", + "duration": 0.3529036045074463, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 50 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "waɪɪt s ɡʌlaɪʌθæz juʒʌwʌlðeɪboʊθk raɪd pirɪŋɪn", + "ref_phonemes": "waɪ ɪts ɡʌlaɪʌθ æz juʒʌwʌl ðeɪ boʊθ kraɪd pirɪŋ ɪn ", + "duration": 0.32969069480895996, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 41 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "fɝɡɛtɪŋɔlðɛr wɪrinʌsðeɪsiz dðɛr kæn dʌl zʌn d s kɝidθruðʌhaʊs faɪn dɪŋɑnʌkeɪʒʌnʌl peɪpɝtʌk tʌweɪɪn sʌmɑd kɔr nɝ", + "ref_phonemes": "fɝɡɛtɪŋ ɔl ðɛr wɪrinʌs ðeɪ sizd ðɛr kændʌlz ʌnd skɝid θru ðʌ haʊs faɪndɪŋ æn ʌkeɪʒʌnʌl peɪpɝ tʌkt ʌweɪ ɪn sʌm ɑd kɔrnɝ ", + "duration": 0.5624287128448486, + "PER": 1.0416666666666665, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 96 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wɛlaɪm kʌn vɪn s tðætðʌbɔr dʌdʌphaʊs mɪs tɝihæpʌn d nɑtɝliɝðæneɪp rʌl sɪk s tinθeɪtin sɪk s tiwʌnʌn d p rɑbʌb linɑt mʌtʃleɪtɝ", + "ref_phonemes": "wɛl aɪm kʌnvɪnst ðæt ðʌ bɔrdʌd ʌp haʊs mɪstɝi hæpʌnd nɑt ɝliɝ ðæn eɪprʌl sɪkstinθ eɪtin sɪksti wʌn ʌnd prɑbʌbli nɑt mʌtʃ leɪtɝ ", + "duration": 0.7402865886688232, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 104 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "noʊwɝd z wɝs poʊkʌn noʊlæŋɡ wʌdʒwɑzʌtɝd seɪvðætʌv weɪlɪŋʌn ðhɪsɪŋʌn dðæt sʌmhaʊwɑzɪn dɪs tɪŋk tæzɪfɪtɪɡ zɪs tʌdɪn fæn siʌn d nɑtɪn riælʌti", + "ref_phonemes": "noʊ wɝdz wɝ spoʊkʌn noʊ læŋɡwʌdʒ wɑz ʌtɝd seɪv ðæt ʌv weɪlɪŋ ʌnd hɪsɪŋ ʌnd ðæt sʌmhaʊ wɑz ɪndɪstɪŋkt æz ɪf ɪt ɪɡzɪstʌd ɪn fænsi ʌnd nɑt ɪn riælʌti ", + "duration": 0.9701550006866455, + "PER": 0.847457627118644, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 118 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪhɝdʌnɔɪz bɪhaɪn daɪtɝn dʌn d sɔkæfɝhɪz b lækaɪzʃaɪnɪŋ waɪlɪnhɪʒhæn ðhihɛl dʌɡ limɪŋnaɪfhilɪf tʌdɪtʌbʌvhɪʒhɛdæzɪf tus t raɪk bʌtaɪhædðʌs t rɛŋkθʌv tɛn mɛnʌn daɪhɝl ðhɪm f rʌm mi", + "ref_phonemes": "aɪ hɝd ʌ nɔɪz bɪhaɪnd aɪ tɝnd ʌnd sɔ kæfɝ hɪz blæk aɪz ʃaɪnɪŋ waɪl ɪn hɪz hænd hi hɛld ʌ ɡlimɪŋ naɪf hi lɪftʌd ɪt ʌbʌv hɪz hɛd æz ɪf tu straɪk bʌt aɪ hæd ðʌ strɛŋkθ ʌv tɛn mɛn ʌnd aɪ hɝld hɪm frʌm mi ", + "duration": 1.2227182388305664, + "PER": 2.6143790849673203, + "score": { + "S": 4, + "D": 0, + "I": 0, + "N": 153 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌs tɔriʌvɪt sivʌlɪn f luʌn s keɪm bæk tumiʌn dɪn maɪbɪwɪl dɝd kʌn dɪʃʌnaɪwʌn dɝd wɛðɝðɛr wɑz nɑt sʌm t ruθɪn wʌθhæd bɪn sɛd", + "ref_phonemes": "ðʌ stɔri ʌv ɪts ivʌl ɪnfluʌns keɪm bæk tu mi ʌnd ɪn maɪ bɪwɪldɝd kʌndɪʃʌn aɪ wʌndɝd wɛðɝ ðɛr wɑz nɑt sʌm truθ ɪn wʌt hæd bɪn sɛd ", + "duration": 0.7046661376953125, + "PER": 0.9900990099009901, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 101 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wʌtðɛnʌhjumʌnhæn d lɑrdʒʌn dʃeɪp liʌpɪr d dɪs tɪŋk t liɑnðʌsɝfʌsʌvðʌpɑn d", + "ref_phonemes": "wʌt ðɛn ʌ hjumʌn hænd lɑrdʒ ʌnd ʃeɪpli ʌpɪrd dɪstɪŋktli ɑn ðʌ sɝfʌs ʌv ðʌ pɑnd ", + "duration": 0.5205509662628174, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 63 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "nʌθɪŋmɔr nɑtivɪnðʌrɪs t tuwɪtʃɪt maɪt biʌtætʃt", + "ref_phonemes": "nʌθɪŋ mɔr nɑt ivɪn ðʌ rɪst tu wɪtʃ ɪt maɪt bi ʌtætʃt ", + "duration": 0.3416154384613037, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 41 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪt dɪd nɑt bɛkʌnɔrɪn did muvætɔlɪt wɑzæz s tɪlæzðʌhæn dʌv dɛθ", + "ref_phonemes": "ɪt dɪd nɑt bɛkʌn ɔr ɪndid muv æt ɔl ɪt wɑz æz stɪl æz ðʌ hænd ʌv dɛθ ", + "duration": 0.43433713912963867, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 51 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪʌwoʊk tukɑnʃʌs nʌs faɪtɪŋæt fɝs tɪt sim dæzɪfaɪwɑz faɪtɪŋwɪððʌfæn tʌm bʌt ɡ rædʒuʌlimaɪʌpoʊnʌn t bɪkeɪm mɔr ril tumiɪt wɑz kæfɝ", + "ref_phonemes": "aɪ ʌwoʊk tu kɑnʃʌsnʌs faɪtɪŋ æt fɝst ɪt simd æz ɪf aɪ wɑz faɪtɪŋ wɪð ʌ fæntʌm bʌt ɡrædʒuʌli maɪ ʌpoʊnʌnt bɪkeɪm mɔr ril tu mi ɪt wɑz kæfɝ ", + "duration": 0.8653082847595215, + "PER": 0.9174311926605505, + "score": { + "S": 0, + "D": 0, + "I": 1, + "N": 109 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪhæd s kɛr s linoʊn wʌtaɪhæd bɪn seɪɪŋɔr duɪŋʌp tuðɪs taɪm bʌtæʒhis poʊkaɪlʊk tæt maɪhæn d", + "ref_phonemes": "aɪ hæd skɛrsli noʊn wʌt aɪ hæd bɪn seɪɪŋ ɔr duɪŋ ʌp tu ðɪs taɪm bʌt æz hi spoʊk aɪ lʊkt æt maɪ hænd ", + "duration": 0.5413336753845215, + "PER": 1.3157894736842104, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 76 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪnðʌlaɪtʌvðʌmunaɪsɔʌnaɪf rɛd wɪðb lʌdʌn d maɪhæn d tuwɑzɔl soʊdɪs kʌlɝd", + "ref_phonemes": "ɪn ðʌ laɪt ʌv ðʌ mun aɪ sɔ ʌ naɪf rɛd wɪð blʌd ʌnd maɪ hænd tu wɑz ɔlsoʊ dɪskʌlɔrd ", + "duration": 0.5419461727142334, + "PER": 3.1746031746031744, + "score": { + "S": 1, + "D": 1, + "I": 0, + "N": 63 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "voʊl tʃɛ pɪk tʌp sʌmθɪŋf rʌmðʌɡ raʊn dʌn d lʊk tætɪt", + "ref_phonemes": "voʊltɛr pɪkt ʌp sʌmθɪŋ frʌm ðʌ ɡraʊnd ʌnd lʊkt æt ɪt ", + "duration": 0.2697868347167969, + "PER": 4.761904761904762, + "score": { + "S": 0, + "D": 1, + "I": 1, + "N": 42 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪseɪjudunoʊwʌtðɪs min zʌn d jumʌs t tɛlʌs", + "ref_phonemes": "aɪ seɪ ju du noʊ wʌt ðɪs minz ʌnd ju mʌst tɛl ʌs ", + "duration": 0.3508741855621338, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 36 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪhædʌɡɛn bɪnæk tɪŋʌn dɝðʌɪn f luʌn sʌvðɪs mæn z paʊɝ", + "ref_phonemes": "aɪ hæd ʌɡɛn bɪn æktɪŋ ʌndɝ ðʌ ɪnfluʌns ʌv ðɪs mænz paʊɝ ", + "duration": 0.27144885063171387, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 44 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "pɝtʃæn s tukæfɝz dɛθmaɪt sɝvhɪmɪn ɡʊd s tɛd", + "ref_phonemes": "pɝtʃæns tu kæfɝz dɛθ maɪt sɝv hɪm ɪn ɡʊd stɛd ", + "duration": 0.35928916931152344, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 36 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "maɪtʌŋrʌf juz d tuɑr tɪk jʌleɪt maɪpaʊɝʌv s pitʃlɛf t mi", + "ref_phonemes": "maɪ tʌŋ rʌfjuzd tu ɑrtɪkjʌlʌt maɪ paʊɝ ʌv spitʃ lɛft mi ", + "duration": 0.3728628158569336, + "PER": 4.444444444444445, + "score": { + "S": 1, + "D": 0, + "I": 1, + "N": 45 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "nɑt wɪθs tæn dɪŋðʌhaɪrɛzʌluʃʌnʌvhɔkaɪhifʊlikɑm p rihɛn dʌdɔlðʌdɪfʌkʌl tizʌn d deɪndʒɝhiwɑzʌbaʊt tuɪn kɝ", + "ref_phonemes": "nɑtwɪθstændɪŋ ðʌ haɪ rɛzʌluʃʌn ʌv hɔkaɪ hi fʊli kɑmprɪhɛndɪd ɔl ðʌ dɪfʌkʌltiz ʌnd deɪndʒɝ hi wɑz ʌbaʊt tu ɪnkɝ ", + "duration": 0.6169147491455078, + "PER": 2.1739130434782608, + "score": { + "S": 2, + "D": 0, + "I": 0, + "N": 92 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪnhɪz rɪtɝn tuðʌkæm phɪzʌk jutʌn d p ræk tʌs tɪn tʌlɛk t s wɝɪn tɛn t liɛn ɡeɪdʒdɪn dɪvaɪzɪŋmin z tukaʊn tɝæk tʌwɑtʃfʌl nʌsʌn d sʌs pɪʃʌnɑnðʌpɑr tʌvhɪzɛnʌmizðæθhinuwɝɪn noʊdɪɡ riɪn fɪriɝtuhɪzoʊn", + "ref_phonemes": "ɪn hɪz rɪtɝn tu ðʌ kæmp hɪz ʌkjut ʌnd præktʌst ɪntʌlɛkts wɝ ɪntɛntli ɛŋeɪdʒd ɪn dɪvaɪzɪŋ minz tu kaʊntɝækt ʌ wɑtʃfʌlnʌnz ʌnd sʌspɪʃʌn ɑn ðʌ pɑrt ʌv hɪz ɛnʌmiz ðæt hi nu wɝ ɪn noʊ dɪɡri ɪnfɪriɝ tu hɪz oʊn ", + "duration": 0.7900381088256836, + "PER": 3.048780487804878, + "score": { + "S": 3, + "D": 1, + "I": 1, + "N": 164 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪnʌðɝwɝd z waɪlhihædɪm p lɪsʌt feɪθɪnðʌʌbɪlʌtiʌv beɪlʌm zæs tus pikhiwɑz sʌm wʌt sɛp tɪkʌlɑnðʌsʌbdʒɪk tʌvʌbɛr z sɪŋɪŋʌn d jɛθhihæd bɪnʌʃʊr dʌvðʌlætɝɑnðʌtɛs tʌmoʊniʌvhɪzoʊnɛk s k wʌzʌtɔr ɡʌn z", + "ref_phonemes": "ɪn ʌðɝ wɝdz waɪl hi hæd ɪmplɪsʌt feɪθ ɪn ðʌ ʌbɪlʌti ʌv bælʌmz æs tu spik hi wɑz sʌmwʌt skɛptʌkʌl ɑn ðʌ sʌbdʒɪkt ʌv ʌ bɛrz sɪŋɪŋ ʌnd jɛt hi hæd bɪn ʌʃʊrd ʌv ðʌ lætɝ ɑn ðʌ tɛstʌmoʊni ʌv hɪz oʊn ɛkskwʌzʌt ɔrɡʌnz ", + "duration": 0.9376177787780762, + "PER": 3.0303030303030303, + "score": { + "S": 3, + "D": 1, + "I": 1, + "N": 165 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðɛr wɑz sʌmθɪŋɪnhɪzɛrʌn d mænɝðæt bɪt reɪd tuðʌs kaʊtðʌʌtɝkʌn f juʒʌnʌvðʌs teɪtʌvhɪz maɪn d", + "ref_phonemes": "ðɛr wɑz sʌmθɪŋ ɪn hɪz ɛr ʌnd mænɝ ðæt bɪtreɪd tu ðʌ skaʊt ðʌ ʌtɝ kʌnfjuʒʌn ʌv ðʌ steɪt ʌv hɪz maɪnd ", + "duration": 0.4674856662750244, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 78 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌɪndʒin jʌʃhɔkaɪhurɪkɔl dðʌheɪs timænɝɪn wɪtʃðʌʌðɝhædʌbæn dʌn ðhɪz poʊs tætðʌbɛd saɪdʌvðʌsɪk wʊmʌn wɑz nɑt wɪθaʊθhɪz sʌs pɪʃʌn z kʌn sɝnɪŋðʌsʌbdʒɪk tʌv soʊmʌtʃsɑlʌm dɪlɪbɝeɪʃʌn", + "ref_phonemes": "ðʌ ɪndʒinjʌs hɔkaɪ hu rɪkɔld ðʌ heɪsti mænɝ ɪn wɪtʃ ðʌ ʌðɝ hæd ʌbændʌnd hɪz poʊst æt ðʌ bɛdsaɪd ʌv ðʌ sɪk wʊmʌn wɑz nɑt wɪθaʊt hɪz sʌspɪʃʌnz kʌnsɝnɪŋ ðʌ sʌbdʒɪkt ʌv soʊ mʌtʃ sɑlʌm dɪlɪbɝeɪʃʌn ", + "duration": 0.9302494525909424, + "PER": 1.9230769230769231, + "score": { + "S": 3, + "D": 0, + "I": 0, + "N": 156 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌbɛrʃʊkhɪzʃæɡisaɪd zʌn dðɛnʌwɛl noʊn vɔɪs rɪp laɪd", + "ref_phonemes": "ðʌ bɛr ʃʊk hɪz ʃæɡi saɪdz ʌnd ðɛn ʌ wɛl noʊn vɔɪs rɪplaɪd ", + "duration": 0.35232090950012207, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 45 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "kænðizθɪŋz birɪtɝn d deɪvɪd b riðɪŋmɔr f riliæzðʌt ruθbɪɡæn tudɔnʌpɑnhɪm", + "ref_phonemes": "kæn ðiz θɪŋz bi rɪtɝnd deɪvɪd briðɪŋ mɔr frili æz ðʌ truθ bɪɡæn tu dɔn ʌpɑn hɪm ", + "duration": 0.4311559200286865, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 63 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "kʌm kʌm rɪtɝn ðhɔkaɪʌn keɪsɪŋhɪzɑnʌs t kaʊn tʌnʌn sðʌbɛtɝtuʌʃʊrðʌweɪvɝɪŋkɑn fʌdʌn sʌvhɪz kʌm pæn jʌn jumeɪsiʌs kɪn wɪtʃɪfɪt binɑtæz waɪtæz wʌnʌvðʌdʒɛn tʌl wʌn ʒhæz noʊtɪndʒʌv rɛd tuɪtðætðʌwɪn d zʌvðʌhɛvʌnʌn dðʌsʌnhæv nɑt bɪs toʊd naʊlɛtʌs tubɪz nʌs", + "ref_phonemes": "kʌm kʌm rɪtɝnd hɔkaɪ ʌnkeɪsɪŋ hɪz ɑnʌst kaʊntʌnʌns ðʌ bɛtɝ tu ʌʃʊr ðʌ weɪvɝɪŋ kɑnfʌdʌns ʌv hɪz kʌmpænjʌn ju meɪ si ʌ skɪn wɪtʃ ɪf ɪt bi nɑt æz waɪt æz wʌn ʌv ðʌ dʒɛntʌl wʌnz hæz noʊ tɪndʒ ʌv rɛd tu ɪt ðæt ðʌ wɪndz ʌv ðʌ hɛvʌn ʌnd ðʌ sʌn hæv nɑt bɪstoʊd naʊ lɛt ʌs tu bɪznʌs ", + "duration": 1.369077444076538, + "PER": 0.9345794392523363, + "score": { + "S": 2, + "D": 0, + "I": 0, + "N": 214 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌjʌŋmænɪzɪn bɑn dɪdʒʌn d mʌtʃaɪfɪrhɪz dɛθɪz dɪk rid", + "ref_phonemes": "ðʌ jʌŋ mæn ɪz ɪn bɑndɪdʒ ʌnd mʌtʃ aɪ fɪr hɪz dɛθ ɪz dɪkrid ", + "duration": 0.313701868057251, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 45 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪɡ reɪt limɔr nðæt wʌn soʊwɛl dɪs poʊz dʃʊd daɪɪnhɪzɪɡ nɝʌn sʌn daɪhæv sɔtʌɡʊd lihɪm kæn julɛd mituhɪm", + "ref_phonemes": "aɪ ɡreɪtli mɔrn ðæt wʌn soʊ wɛl dɪspoʊzd ʃʊd daɪ ɪn hɪz ɪɡnɝʌns ʌnd aɪ hæv sɔt ʌ ɡʊdli hɪm kæn ju lɛd mi tu hɪm ", + "duration": 0.5496425628662109, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 86 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌtæs k wɪl nɑt bidɪfʌkʌl t rɪtɝn d deɪvɪðhɛzɪteɪtɪŋðoʊaɪɡ reɪt lifɪr jɔr p rɛzʌn s wʊd ræðɝɪn k risðæn mɪtʌɡeɪθhɪzʌnhæpifɔrtʃʌn z", + "ref_phonemes": "ðʌ tæsk wɪl nɑt bi dɪfʌkʌlt rɪtɝnd deɪvɪd hɛzʌteɪtɪŋ ðoʊ aɪ ɡreɪtli fɪr jɔr prɛzʌns wʊd ræðɝ ɪnkris ðæn mɪtʌɡeɪt hɪz ʌnhæpi fɔrtʃʌnz ", + "duration": 0.6123270988464355, + "PER": 2.727272727272727, + "score": { + "S": 3, + "D": 0, + "I": 0, + "N": 110 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌlɑdʒɪn wɪtʃʌŋkʌs wɑz kʌn faɪn d wɑzɪnðʌvɛrisɛn tɝʌvðʌvɪlʌdʒʌn dɪnʌsɪtʃueɪʃʌn pɝhæp s mɔr dɪfʌkʌl tðænɛniʌðɝtuʌp roʊtʃɔr liv wɪθaʊtɑb zɝveɪʃʌn", + "ref_phonemes": "ðʌ lɑdʒ ɪn wɪtʃ ʌŋkʌz wɑz kʌnfaɪnd wɑz ɪn ðʌ vɛri sɛntɝ ʌv ðʌ vɪlʌdʒ ʌnd ɪn ʌ sɪtʃueɪʃʌn pɝhæps mɔr dɪfʌkʌlt ðæn ɛni ʌðɝ tu ʌproʊtʃ ɔr liv wɪθaʊt ɑbzɝveɪʃʌn ", + "duration": 0.7892212867736816, + "PER": 0.7936507936507936, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 126 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "fɔrɔr faɪvʌvðʌlætɝoʊn lilɪŋɡɝdʌbaʊtðʌdɔrʌvðʌp rɪzʌnʌvʌŋkʌs wɛribʌt k loʊsʌb zɝvɝzʌvðʌmænɝʌvðɛr kæp tɪv", + "ref_phonemes": "fɔr ɔr faɪv ʌv ðʌ lætɝ oʊnli lɪŋɡɝd ʌbaʊt ðʌ dɔr ʌv ðʌ prɪzʌn ʌv ʌŋkʌz wɛri bʌt kloʊs ʌbzɝvɝz ʌv ðʌ mænɝ ʌv ðɛr kæptɪv ", + "duration": 0.6110684871673584, + "PER": 1.0752688172043012, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 93 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɪlɪvɝdɪnʌs t rɔŋtoʊnʌvʌsɛn tʌnaʊn s tðʌɡ rætʌfʌkeɪʃʌnðʌsævʌdʒwʊd rʌsivɪn wɪt nʌsɪŋsʌtʃænɛk sʌbɪʃʌnʌv wik nʌsɪnænɛnʌmisoʊlɔŋheɪtʌdʌn d soʊmʌtʃfɪr d", + "ref_phonemes": "dɪlɪvɝd ɪn ʌ strɔŋ toʊn ʌv ʌsɛnt ʌnaʊnst ðʌ ɡrætʌfʌkeɪʃʌn ðʌ sævʌdʒ wʊd rʌsiv ɪn wɪtnʌsɪŋ sʌtʃ æn ɛksʌbɪʃʌn ʌv wiknʌs ɪn æn ɛnʌmi soʊ lɔŋ heɪtʌd ʌnd soʊ mʌtʃ fɪrd ", + "duration": 0.7816107273101807, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 132 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðeɪd rubækʌlɪtʌl f rʌmðʌɛn t rʌn sʌn d moʊʃʌn d tuðʌsʌpoʊz d kɑndʒɝɝtuɛn tɝ", + "ref_phonemes": "ðeɪ dru bæk ʌ lɪtʌl frʌm ðʌ ɛntrʌns ʌnd moʊʃʌnd tu ðʌ sʌpoʊzd kɑndʒɝɝ tu ɛntɝ ", + "duration": 0.3389894962310791, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 62 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "bʌtðʌbɛrɪn s tɛdʌvoʊbeɪɪŋmeɪn teɪn dðʌsitɪθhæd teɪkʌnʌn d ɡ raʊl d", + "ref_phonemes": "bʌt ðʌ bɛr ɪnstɛd ʌv oʊbeɪɪŋ meɪnteɪnd ðʌ sit ɪt hæd teɪkʌn ʌnd ɡraʊld ", + "duration": 0.3531529903411865, + "PER": 1.7543859649122806, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 57 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌkʌnɪŋmænɪzʌf reɪdðæθhɪz b rɛθwɪl b loʊʌpɑnhɪz b rʌðɝzʌn d teɪkʌweɪðɛr kɝʌdʒtukʌn tɪn jud deɪvɪdɪm p ruvɪŋðʌhɪn θhirʌsiv dðeɪmʌs t s tæn d fɝðɝɔf", + "ref_phonemes": "ðʌ kʌnɪŋ mæn ɪz ʌfreɪd ðæt hɪz brɛθ wɪl bloʊ ʌpɑn hɪz brʌðɝz ʌnd teɪk ʌweɪ ðɛr kɝʌdʒ tu kʌntɪnjud deɪvɪd ɪmpruvɪŋ ðʌ hɪnt hi rʌsivd ðeɪ mʌst stænd fɝðɝ ɔf ", + "duration": 0.7444944381713867, + "PER": 1.6129032258064515, + "score": { + "S": 2, + "D": 0, + "I": 0, + "N": 124 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðɛnæzɪf sætʌs faɪdʌvðɛr seɪf tiðʌs kaʊt lɛf θhɪz pʌzɪʃʌnʌn d s loʊliɛn tɝdðʌp leɪs", + "ref_phonemes": "ðɛn æz ɪf sætʌsfaɪd ʌv ðɛr seɪfti ðʌ skaʊt lɛft hɪz pʌzɪʃʌn ʌnd sloʊli ɛntɝd ðʌ pleɪs ", + "duration": 0.37670016288757324, + "PER": 1.4492753623188406, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 69 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪt wɑz saɪlʌn tʌn d ɡ lumibiɪŋtɛnʌn tɪd soʊl libaɪðʌkæp tɪvʌn d laɪtʌd baɪðʌdaɪɪŋɛm bɝzʌvʌfaɪɝwɪtʃhæd bɪn juz d fɔrðʌpɝpʌsʌv kʊkɝi", + "ref_phonemes": "ɪt wɑz saɪlʌnt ʌnd ɡlumi biɪŋ tɛnʌntɪd soʊlli baɪ ðʌ kæptɪv ʌnd laɪtʌd baɪ ðʌ daɪɪŋ ɛmbɝz ʌv ʌ faɪɝ wɪtʃ hæd bɪn juzd fɔr ðʌ pɝpʌst ʌv kʊkɝi ", + "duration": 0.6672601699829102, + "PER": 0.8928571428571428, + "score": { + "S": 0, + "D": 1, + "I": 0, + "N": 112 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌŋkʌsɑk jʌpaɪdʌdɪs tʌn t kɔr nɝɪnʌrɪk laɪnɪŋætʌtud biɪŋrɪdʒʌd libaʊn d boʊθhæn d zʌn d fit baɪs t rɔŋʌn d peɪn fʌl wɪdðs", + "ref_phonemes": "ʌŋkʌz ɑkjʌpaɪd ʌ dɪstʌnt kɔrnɝ ɪn ʌ rɪklaɪnɪŋ ætʌtud biɪŋ rɪdʒɪdli baʊnd boʊθ hændz ʌnd fit baɪ strɔŋ ʌnd peɪnfʌl wɪðz ", + "duration": 0.5618233680725098, + "PER": 4.081632653061225, + "score": { + "S": 3, + "D": 0, + "I": 1, + "N": 98 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌs kaʊθhuhæd lɛf t deɪvɪdætðʌdɔr tuæsɝteɪnðeɪwɝnɑtʌb zɝv dθɔtɪt p rudʌn t tup rʌzɝvhɪz dɪs ɡaɪzʌn tɪlʌʃʊr dʌvðɛr p raɪvʌsi", + "ref_phonemes": "ðʌ skaʊt hu hæd lɛft deɪvɪd æt ðʌ dɔr tu æsɝteɪn ðeɪ wɝ nɑt ʌbzɝvd θɔt ɪt prudʌnt tu prʌzɝv hɪz dɪsɡaɪz ʌntɪl ʌʃʊrd ʌv ðɛr praɪvʌsi ", + "duration": 0.6226785182952881, + "PER": 0.9523809523809524, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 105 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wʌtʃæl widuwɪððʌmɪŋɡoʊzætðʌdɔrðeɪkaʊn t sɪk sʌn dðʌsɪŋɝɪzæz ɡʊdæz nʌθɪŋ", + "ref_phonemes": "wʌt ʃæl wi du wɪð ðʌ mɪŋɡoʊz æt ðʌ dɔr ðeɪ kaʊnt sɪks ʌnd ðɪs sɪŋɝ ɪz æz ɡʊd æz nʌθɪŋ ", + "duration": 0.4109313488006592, + "PER": 3.076923076923077, + "score": { + "S": 1, + "D": 1, + "I": 0, + "N": 65 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌdɛlʌwɛr zɑrtʃɪl d rʌnʌvðʌtɔr tʌsʌn dðeɪaʊt s t rɪpðʌdɪr", + "ref_phonemes": "ðʌ dɛlʌwɛrz ɑr tʃɪldrʌn ʌv ðʌ tɔrtʌs ʌnd ðeɪ aʊtstrɪp ðʌ dɪr ", + "duration": 0.22959423065185547, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 49 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌŋkʌʃhuhædɔl rɛdiʌp roʊtʃtðʌdɔrɪn rɛdinʌs tulɛdðʌweɪnaʊrikɔɪl dʌn d p leɪs θhɪm sɛl f wʌn s mɔrɪnðʌbɑtʌmʌvðʌlɑdʒ", + "ref_phonemes": "ʌŋkʌz hu hæd ɔlrɛdi ʌproʊtʃt ðʌ dɔr ɪn rɛdinʌs tu lɛd ðʌ weɪ naʊ rikɔɪld ʌnd pleɪst hɪmsɛlf wʌns mɔr ɪn ðʌ bɑtʌm ʌv ðʌ lɑdʒ ", + "duration": 0.565105676651001, + "PER": 2.0408163265306123, + "score": { + "S": 2, + "D": 0, + "I": 0, + "N": 98 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "bʌθhɔkaɪhuwɑz tumʌtʃɑk jʌpaɪd wɪðhɪzoʊnθɔt s tunoʊtðʌmuv mʌn t kʌn tɪn jud s pikɪŋmɔr tuhɪm sɛl fðæn tuhɪz kʌm pæn jʌn", + "ref_phonemes": "bʌt hɔkaɪ hu wɑz tu mʌtʃ ɑkjʌpaɪd wɪð hɪz oʊn θɔts tu noʊt ðʌ muvmʌnt kʌntɪnjud spikɪŋ mɔr tu hɪmsɛlf ðæn tu hɪz kʌmpænjʌn ", + "duration": 0.5269057750701904, + "PER": 1.0101010101010102, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 99 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "soʊʌŋkʌs juhæd bɛtɝteɪkðʌlɛd waɪlaɪwɪl pʊtɑnðʌs kɪnʌɡɛnʌn d t rʌs t tukʌnɪŋfɔr wɑn tʌv s pid", + "ref_phonemes": "soʊ ʌŋkʌz ju hæd bɛtɝ teɪk ðʌ lɛd waɪl aɪ wɪl pʊt ɑn ðʌ skɪn ʌɡɛn ʌnd trʌst tu kʌnɪŋ fɔr wɑnt ʌv spid ", + "duration": 0.4471476078033447, + "PER": 1.282051282051282, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 78 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wɛl wʌt kæn t bidʌn baɪmeɪn kɝʌdʒɪn wɔr mʌs t bidʌn baɪsɝkʌm vɛnʃʌn", + "ref_phonemes": "wɛl wʌt kænt bi dʌn baɪ meɪn kɝʌdʒ ɪn wɔr mʌst bi dʌn baɪ sɝkʌmvɛntʃʌn ", + "duration": 0.4338233470916748, + "PER": 1.7857142857142856, + "score": { + "S": 0, + "D": 1, + "I": 0, + "N": 56 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "æz sunæzðiz dɪs pʌzɪʃʌn z wɝmeɪdðʌs kaʊt tɝn d tudeɪvɪdʌn d ɡeɪvhɪmhɪz pɑr tɪŋɪn s t rʌkʃʌn z", + "ref_phonemes": "æz sun æz ðiz dɪspʌzɪʃʌnz wɝ meɪd ðʌ skaʊt tɝnd tu deɪvɪd ʌnd ɡeɪv hɪm hɪz pɑrtɪŋ ɪnstrʌkʃʌnz ", + "duration": 0.3737614154815674, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 76 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "maɪpɝsut sɑr pis fʌlʌn d maɪtɛm pɝaɪhʌm b lit rʌs tɪz ɡ reɪt liɡɪvʌn tumɝsiʌn d lʌv rɪtɝn d deɪvɪdʌlɪtʌl nɛtʌl dæt soʊdɝɛk tænʌtækɑnhɪz mænhʊd bʌtðɛrɑr nʌnhukæn seɪðætaɪhævɛvɝfɝɡɑtʌn maɪfeɪθɪnðʌlɔr divɪnɪnðʌɡ reɪtʌs t s t reɪt s", + "ref_phonemes": "maɪ pɝsuts ɑr pisfʌl ʌnd maɪ tɛmpɝ aɪ hʌmbli trʌst ɪz ɡreɪtli ɡɪvʌn tu mɝsi ʌnd lʌv rɪtɝnd deɪvɪd ʌ lɪtʌl nɛtʌld æt soʊ dɝɛkt æn ʌtæk ɑn hɪz mænhʊd bʌt ðɛr ɑr nʌn hu kæn seɪ ðæt aɪ hæv ɛvɝ fɝɡɑtʌn maɪ feɪθ ɪn ðʌ lɔrd ivɪn ɪn ðʌ ɡreɪtʌst streɪts ", + "duration": 0.9869449138641357, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 193 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪf juɑr nɑtðɛn nɑk tɑnðʌhɛd jɔr biɪŋʌnɑn kʌm pɑsɝwɪl p rʌtɛk t juʌn d julðɛnhævʌɡʊd rizʌn tuɪk s pɛk t tudaɪɪn jɔr bɛd", + "ref_phonemes": "ɪf ju ɑr nɑt ðɛn nɑkt ɑn ðʌ hɛd jɔr biɪŋ ʌ nɑn kʌmpɑsɝ wɪl prʌtɛkt ju ʌnd jul ðɛn hæv ʌ ɡʊd rizʌn tu ɪkspɛkt tu daɪ ɪn jɔr bɛd ", + "duration": 0.5675628185272217, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 96 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "soʊtʃuz fɔr jɝsɛl f tumeɪkʌrʌʃɔr tærihir", + "ref_phonemes": "soʊ tʃuz fɔr jɝsɛlf tu meɪk ʌ rʌʃ ɔr tɛri hir ", + "duration": 0.31586790084838867, + "PER": 2.857142857142857, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 35 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "b reɪv liʌn ddʒɛnɝʌs lihæʒhibætʌl dɪn maɪbɪhæfʌn dðɪsʌn d mɔr wɪlaɪdɛrɪnhɪz sɝvʌs", + "ref_phonemes": "breɪvli ʌnd dʒɛnɝʌsli hæz hi bætʌld ɪn maɪ bɪhæf ʌnd ðɪs ʌnd mɔr wɪl aɪ dɛr ɪn hɪz sɝvʌs ", + "duration": 0.4260861873626709, + "PER": 1.4285714285714286, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 70 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "kip saɪlʌn tæz lɔŋæz meɪbiʌn dɪt wʊd biwaɪz wɛn judus pik tub reɪkaʊt sʌdʌn liɪn wʌnʌv jɔrʃaʊtɪŋz wɪtʃwɪl sɝv turimaɪn dðʌɪn diʌn zðæt juɑr nɑtɔl tʌɡɛðɝæz ris pɑn sʌbʌlæz mɛnʃʊd bi", + "ref_phonemes": "kip saɪlʌnt æz lɔŋ æz meɪ bi ʌnd ɪt wʊd bi waɪz wɛn ju du spik tu breɪk aʊt sʌdʌnli ɪn wʌn ʌv jɔr ʃaʊtɪŋz wɪtʃ wɪl sɝv tu rimaɪnd ðʌ ɪndiʌnz ðæt ju ɑr nɑt ɔltʌɡɛðɝ æz rispɑnsʌbʌl æz mɛn ʃʊd bi ", + "duration": 0.5728750228881836, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 150 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪfhaʊɛvɝðeɪteɪk jɔr s kæl pæzaɪt rʌs tʌn d bɪlivðeɪwɪl nɑt dɪpɛn dɑnɪtʌŋkʌsʌn daɪwɪl nɑt fɝɡɛtðʌdid bʌt rivɛndʒɪtæz bɪkʌm z t ruwɔriɝzʌn d t rʌs tif rɛn d z", + "ref_phonemes": "ɪf haʊɛvɝ ðeɪ teɪk jɔr skælp æz aɪ trʌst ʌnd bɪliv ðeɪ wɪl nɑt dɪpɛnd ɑn ɪt ʌŋkʌz ʌnd aɪ wɪl nɑt fɝɡɛt ðʌ did bʌt rivɛndʒ ɪt æz bɪkʌmz tru wɔriɝz ʌnd trʌsti frɛndz ", + "duration": 0.658043384552002, + "PER": 0.7751937984496124, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 129 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hoʊl d sɛd deɪvɪd pɝsivɪŋðæt wɪððɪsʌʃʊrʌn sðeɪwɝʌbaʊt tulivhɪmaɪæmænʌn wɝðiʌn ðhʌm bʌl fɑloʊɝʌv wʌnhutɔt nɔtðʌdæm nʌbʌl p rɪn sʌpʌlʌv rivɛndʒ", + "ref_phonemes": "hoʊld sɛd deɪvɪd pɝsivɪŋ ðæt wɪð ðɪs ʌʃʊrʌns ðeɪ wɝ ʌbaʊt tu liv hɪm aɪ æm æn ʌnwɝði ʌnd hʌmbʌl fɑloʊɝ ʌv wʌn hu tɔt nɑt ðʌ dæmnʌbʌl prɪnsʌpʌl ʌv rivɛndʒ ", + "duration": 0.6510789394378662, + "PER": 1.6260162601626018, + "score": { + "S": 2, + "D": 0, + "I": 0, + "N": 123 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðɛnhivɪŋʌhɛvisaɪp rɑbʌb liʌmʌŋðʌlæs θhiɛvɝd ruɪn paɪnɪŋfɔrʌkʌn dɪʃʌnhihæd soʊlɔŋʌbæn dʌn ðhiædʌdɪtɪz wʌtaɪwʊd wɪʃtup ræk tʌs maɪsɛl fæz wʌn wɪθaʊtʌk rɔsʌv b lʌdðoʊɪtɪz nɑtɔl weɪzizitudil wɪðænɪn diʌnæz juwʊd wɪðʌfɛloʊk rɪstʃʌn", + "ref_phonemes": "ðɛn hivɪŋ ʌ hɛvi saɪ prɑbʌbli ʌmʌŋ ðʌ læst hi ɛvɝ dru ɪn paɪnɪŋ fɔr ʌ kʌndɪʃʌn hi hæd soʊ lɔŋ ʌbændʌnd hi ædʌd ɪt ɪz wʌt aɪ wʊd wɪʃ tu præktaɪz maɪsɛlf æz wʌn wɪθaʊt ʌ krɔs ʌv blʌd ðoʊ ɪt ɪz nɑt ɔlweɪz izi tu dil wɪð æn ɪndiʌn æz ju wʊd wɪð ʌ fɛloʊ krɪstʃʌn ", + "duration": 1.2845687866210938, + "PER": 2.5, + "score": { + "S": 4, + "D": 1, + "I": 0, + "N": 200 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɡɑd b lɛs juf rɛn daɪdubɪliv jɔr sɛn tɪz nɑt ɡ reɪt lirɔŋwɛnðʌmætɝɪz dulikʌn sɪdɝdʌn d kipɪŋɪtɝnʌtibɪfɔrðʌaɪzðoʊmʌtʃdɪpɛn d zɑnðʌnætʃɝʌl ɡɪf t sʌn dðʌfɔr sʌv tɛm teɪʃʌn", + "ref_phonemes": "ɡɑd blɛs ju frɛnd aɪ du bɪliv jɔr sɛnt ɪz nɑt ɡreɪtli rɔŋ wɛn ðʌ mætɝ ɪz duli kʌnsɪdɝd ʌnd kipɪŋ ɪtɝnʌti bɪfɔr ðʌ aɪz ðoʊ mʌtʃ dɪpɛndz ɑn ðʌ nætʃɝʌl ɡɪfts ʌnd ðʌ fɔrs ʌv tɛmteɪʃʌn ", + "duration": 0.6936440467834473, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 143 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌdɛlʌwɛr dɔɡhisɛd linɪŋfɔr wɝdʌn d pirɪŋθruðʌdɪm laɪt tukætʃðʌɪk s p rɛʃʌnʌvðʌʌðɝz fitʃɝzɪʒhiʌf reɪd", + "ref_phonemes": "ðʌ dɛlʌwɛr dɔɡ hi sɛd linɪŋ fɔrwɝd ʌnd pirɪŋ θru ðʌ dɪm laɪt tu kætʃ ðʌ ɪksprɛʃʌn ʌv ðʌ ʌðɝz fitʃɝz ɪz hi ʌfreɪd ", + "duration": 0.5528101921081543, + "PER": 1.1235955056179776, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 89 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌmoʊhikʌn s tɑr tʌdɑnhɪz fitʌn dʃʊkhɪzʃæɡikʌvɝɪŋæzðoʊðʌænʌmʌlhikaʊn tɝfɪtɪd wɑzʌbaʊt tumeɪk sʌm dɛs p rɪtɛfɝt", + "ref_phonemes": "ðʌ moʊhikʌn stɑrtʌd ɑn hɪz fit ʌnd ʃʊk hɪz ʃæɡi kʌvɝɪŋ æz ðoʊ ðʌ ænʌmʌl hi kaʊntɝfɪtɪd wɑz ʌbaʊt tu meɪk sʌm dɛsprɪt ɛfɝt ", + "duration": 0.5169446468353271, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 98 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hihæd noʊʌkeɪʒʌn tudɪleɪfɔrætðʌnɛk s tɪn s tʌn tʌbɝs tʌv k raɪz fɪl dðʌaʊtɝɛrʌn d rænʌlɔŋðʌhoʊlɪk s tɛn tʌvðʌvɪlʌdʒ", + "ref_phonemes": "hi hæd noʊ ʌkeɪʒʌn tu dɪleɪ fɔr æt ðʌ nɛkst ɪnstʌnt ʌ bɝst ʌv kraɪz fɪld ðʌ aʊtɝ ɛr ʌnd ræn ʌlɔŋ ðʌ hoʊl ɪkstɛnt ʌv ðʌ vɪlʌdʒ ", + "duration": 0.5987515449523926, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 98 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌŋkʌs kæs θhɪz s kɪnʌn d s tɛp t fɔrθɪnhɪzoʊn b jutʌfʌl p rʌpɔrʃʌn z", + "ref_phonemes": "ʌŋkʌz kæst hɪz skɪn ʌnd stɛpt fɔrθ ɪn hɪz oʊn bjutʌfʌl prʌpɔrʃʌnz ", + "duration": 0.3342907428741455, + "PER": 3.7037037037037033, + "score": { + "S": 2, + "D": 0, + "I": 0, + "N": 54 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "sɪn sðʌpɪriʌdʌvaʊɝteɪlðʌæk tɪv s pɪrʌtʌvðʌkʌn t rihæz sɝaʊn dʌdɪt wɪðʌbɛl tʌv rɪtʃʌn dθraɪvɪŋsɛtʌl mʌn t sðoʊnʌn bʌtðʌhʌn tɝɔrðʌsævʌdʒɪzɛvɝnoʊnivɪn naʊtupɛnʌt reɪtɪt s waɪl d risɛsʌz", + "ref_phonemes": "sɪns ðʌ pɪriʌd ʌv aʊɝ teɪl ðʌ æktɪv spɪrʌt ʌv ðʌ kʌntri hæz sɝaʊndʌd ɪt wɪð ʌ bɛlt ʌv rɪtʃ ʌnd θraɪvɪŋ sɛtʌlmʌnts ðoʊ nʌn bʌt ðʌ hʌntɝ ɔr ðʌ sævʌdʒ ɪz ɛvɝ noʊn ivɪn naʊ tu pɛnʌtreɪt ɪts waɪld risɛsʌz ", + "duration": 0.8139874935150146, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 159 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌduz wɝsʌfɝd tuɛk ʃheɪlʌn dðʌsʌnhæd dɪs pɝs tðʌmɪs t sʌn d wɑzʃɛdɪŋʌs t rɔŋʌn d k lɪr laɪtɪnðʌfɔrʌs t s wɛnðʌt rævʌlɝz rɪzum dðɛrdʒɝni", + "ref_phonemes": "ðʌ duz wɝ sʌfɝd tu ɛkʃheɪl ʌnd ðʌ sʌn hæd dɪspɝst ðʌ mɪsts ʌnd wɑz ʃɛdɪŋ ʌ strɔŋ ʌnd klɪr laɪt ɪn ðʌ fɔrʌst wɛn ðʌ trævʌlɝz rɪzumd ðɛr dʒɝni ", + "duration": 0.7023882865905762, + "PER": 0.9009009009009009, + "score": { + "S": 0, + "D": 0, + "I": 1, + "N": 111 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "æf tɝp rʌsidɪŋʌf jumaɪl zðʌp rɑɡ rɛsʌvhɔkaɪhulɛdðʌʌd væn s bɪkeɪm mɔr dɪlɪbɝʌtʌn d wɑtʃfʌl", + "ref_phonemes": "æftɝ prʌsidɪŋ ʌ fju maɪlz ðʌ prɑɡrɛs ʌv hɔkaɪ hu lɛd ðʌ ʌdvæns bɪkeɪm mɔr dɪlɪbɝʌt ʌnd wɑtʃfʌl ", + "duration": 0.4677140712738037, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 77 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hiɔfʌn s tɑp t tuɪɡ zæmɪnðʌt riz nɔr dɪðhik rɔsʌrɪv jʌlʌt wɪθaʊtʌtɛn tɪv likʌn sɪdɝɪŋðʌk wɑn tʌtiðʌvʌlɑsʌtiʌn dðʌkʌlɝʌvɪt s wɔtɝz", + "ref_phonemes": "hi ɔfʌn stɑpt tu ɪɡzæmɪn ðʌ triz nɔr dɪd hi krɔs ʌ rɪvjʌlt wɪθaʊt ʌtɛntɪvli kʌnsɪdɝɪŋ ðʌ kwɑntʌti ðʌ vʌlɑsʌti ʌnd ðʌ kʌlɝ ʌv ɪts wɔtɝz ", + "duration": 0.7436251640319824, + "PER": 1.834862385321101, + "score": { + "S": 1, + "D": 0, + "I": 1, + "N": 109 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɪs t rʌs tɪŋhɪzoʊndʒʌdʒmʌn θhɪzʌpil z tuðʌʌpɪn jʌnʌvtʃɪŋɡɑtʃkuk wɝf rik wʌn tʌn dɝnɪs t", + "ref_phonemes": "dɪstrʌstɪŋ hɪz oʊn dʒʌdʒmʌnt hɪz ʌpilz tu ðʌ ʌpɪnjʌn ʌv tʃɪŋdʌkaʊtʃ wɝ frikwʌnt ʌnd ɝnɪst ", + "duration": 0.490293025970459, + "PER": 10.666666666666668, + "score": { + "S": 8, + "D": 0, + "I": 0, + "N": 75 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "jɛθhirɑr wiwɪðɪnʌʃɔr t reɪndʒʌvðʌs kɝrun zʌn d nɑtʌsaɪnʌvʌt reɪlhæv wik rɔs t", + "ref_phonemes": "jɛt hir ɑr wi wɪðɪn ʌ ʃɔrt reɪndʒ ʌv ðʌ skɛrʌnz ʌnd nɑt ʌ saɪn ʌv ʌ treɪl hæv wi krɔst ", + "duration": 0.45402956008911133, + "PER": 4.545454545454546, + "score": { + "S": 3, + "D": 0, + "I": 0, + "N": 66 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "lɛtʌs rit reɪsaʊɝs tɛp sʌn dɪɡ zæmɪnæz wiɡoʊwɪðkinɝaɪz", + "ref_phonemes": "lɛt ʌs ritreɪs aʊɝ stɛps ʌnd ɪɡzæmɪn æz wi ɡoʊ wɪð kinɝ aɪz ", + "duration": 0.28613853454589844, + "PER": 0.0, + "score": { + "S": 0, + "D": 0, + "I": 0, + "N": 47 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪm vɪkiwɪtʌmɔraɪmʌp roʊɡ ræm dɝɛk tɝætðʌnæʃʌnʌlɪn s tɪtut sʌv nʊrʌlɑdʒɪkʌl dɪsɔr dɝzʌn d s t roʊkʌn dʌp roʊɡ ræm dɝɛk tɝhuoʊvɝsiz", + "ref_phonemes": "aɪm vɪki wɪtmɔr aɪm ʌ proʊɡræm dɝɛktɝ æt ðʌ næʃʌnʌl ɪnstʌtuts ʌv nʊrʌlɑdʒɪkʌl dɪsɔrdɝz ʌnd stroʊk ʌnd ʌ proʊɡræm dɝɛktɝ hu oʊvɝsiz ", + "duration": 0.6882309913635254, + "PER": 1.834862385321101, + "score": { + "S": 1, + "D": 0, + "I": 1, + "N": 109 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɛmisiɛfɛs risɝtʃɡ ræn t sʌn d wɝk s tʌɡɛðɝk loʊs liwɪðdɑk tɝkɔrʌʃʌt s tukoʊɔr dʌneɪtðʌɛmisiɛfɛs t ræn zɛneɪtʃɛmisiʌfɛ wɝkɪŋɡ rup soʊɪt s maɪp lɛʒɝtuwɛl kʌm jutuðʌfɝs tɪn", + "ref_phonemes": "mɛksf risɝtʃ ɡrænts ʌnd wɝks tʌɡɛðɝ kloʊsli wɪð draɪv kɔrʌsɛts tu koʊɔrdʌneɪt ðʌ mɛksf trænznɪh mɛksf wɝkɪŋ ɡrup ɪts maɪ plɛʒɝ tu wɛlkʌm ju tu ðʌ fɝst ɪn ", + "duration": 1.0296258926391602, + "PER": 25.396825396825395, + "score": { + "S": 11, + "D": 2, + "I": 19, + "N": 126 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "sɛvʌn pɑr t sɪrizʌv wɛbʌnɝzðætɑr biɪŋɔr ɡʌnaɪz dɪnɔr dɝtudɪvɛlʌpʌrisɝtʃroʊd mæp fɔrɛmisiɛfɛsðʌsɛvʌn wɛbʌnɝrz wɪl teɪk p leɪs", + "ref_phonemes": "ʌ sɛvʌpɝtæp sɪriz ʌv wɛbnɝʌnz ðæt ɑr biɪŋ ɔrɡʌnaɪzd ɪn ɔrdɝ tu dɪvɛlʌp ʌ risɝtʃ roʊdmæp fɔr mɛksf ðʌ sɛvʌn wɛbnɝʌnz wɪl teɪk pleɪs ", + "duration": 0.6772060394287109, + "PER": 17.75700934579439, + "score": { + "S": 3, + "D": 7, + "I": 9, + "N": 107 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "bɪt win naʊʌn d dɪsɛm bɝʌn dðʌdɪlɪvɝʌbʌl f rʌmɔlʌvðɪsɛfɝt wɪl biʌripɔr t tuðʌɛnʌɛnʌɛnʌɛn diʌsæd vaɪzɝikaʊn sʌlætðɛr meɪt wɛn tit wɛn tifɔrθmitɪŋ", + "ref_phonemes": "bɪtwin naʊ ʌnd dɪsɛmbɝ ʌnd ðʌ dɪlɪvɝʌbʌl frʌm ɔl ʌv ðɪs ɛfɝt wɪl bi ʌ ripɔrt tu ðʌ nændz ædvaɪzɝi kaʊnsʌl æt ðɛr meɪ twɛnti twɛntifʊr mitɪŋ ", + "duration": 0.7238314151763916, + "PER": 12.389380530973451, + "score": { + "S": 3, + "D": 0, + "I": 11, + "N": 113 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌɡoʊlʌvðʌrisɝtʃroʊd mæp p rɑsɛsɪz tuʌsɛs kɝʌn tɛmisifɛs t risɝtʃʌn daɪdɛn tʌfaɪɡæpɛriʌzɔrɑpɝtunʌtiz tumuvðʌfil d tʌwɔr d t ræn z leɪʃʌnʌl risɝtʃ", + "ref_phonemes": "ðʌ ɡoʊl ʌv ðʌ risɝtʃ roʊdmæp prɑsɛs ɪz tu ʌsɛs kɝʌnt mɛksf risɝtʃ ʌnd aɪdɛntʌfaɪ ɡæp ɛriʌz ɔr ɑpɝtunʌtiz tu muv ðʌ fild tʌwɔrd trænsleɪʃʌnʌl risɝtʃ ", + "duration": 0.7792346477508545, + "PER": 6.557377049180328, + "score": { + "S": 2, + "D": 1, + "I": 5, + "N": 122 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "t ræn z leɪʃʌnʌl s tʌdizʌn dɪn tuk lɪnɪkʌl t raɪʌl z tudɪvɛlʌp t rit mʌn t s fɔrɛmisiɛfɛsðʌrisɝtʃp raɪɔrʌtizaɪdɛn tʌfaɪd wɪl bijuz d tuɡaɪd risɝtʃʌk rɔsðʌkʌm junʌti", + "ref_phonemes": "trænsleɪʃʌnʌl stʌdiz ʌnd ɪntu klɪnʌkʌl traɪʌlz tu dɪvɛlʌp tritmʌnts fɔr mɛksf ðʌ risɝtʃ praɪɔrʌtiz aɪdɛntʌfaɪd wɪl bi juzd tu ɡaɪd risɝtʃ ʌkrɔs ðʌ kʌmjunʌti ", + "duration": 0.7016212940216064, + "PER": 6.7669172932330826, + "score": { + "S": 3, + "D": 1, + "I": 5, + "N": 133 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "nɑtdʒʌs t baɪðʌnæʃʌnʌlɪn s tɪtut sʌvhɛlθðʌɛmisiɛfɛs risɝtʃɑm wɝkɪŋɡ rup kæn jup lizʌd væn s maɪs laɪd z", + "ref_phonemes": "nɑt dʒʌst baɪ ðʌ næʃʌnʌl ɪnstʌtuts ʌv hɛlθ ðʌ mɛksf risɝtʃ wɝkɪŋ ɡrup kæn ju pliz ʌdvæns maɪ slaɪdz ", + "duration": 0.7134566307067871, + "PER": 12.345679012345679, + "score": { + "S": 2, + "D": 1, + "I": 7, + "N": 81 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪdoʊn t sihaʊtuduðætθæŋk jusoʊðʌɛnaɪɛn diɛsɛmisiʌfʌs wɝkɪŋɡ rupʌv kaʊn sʌlɪz kʌm poʊz dʌv daɪvɝz s teɪkhoʊl dɝz", + "ref_phonemes": "aɪ doʊnt si haʊ tu du ðæt θæŋk ju ðʌ nændz mɛksf wɝkɪŋ ɡrup ʌv kaʊnsʌl ɪz kʌmpoʊzd ʌv daɪvɝs steɪkhoʊldɝz ", + "duration": 0.8351013660430908, + "PER": 20.0, + "score": { + "S": 5, + "D": 0, + "I": 12, + "N": 85 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "risɝtʃɝzʌn d k lʌnɪʃʌn z nɑn p rɑfʌtæd vʌkʌsiɔr ɡʌnʌzeɪʃʌn lidɝzʌn dðʌb rɔdɝɛmʌsiʌfɛs t kʌm junʌtiɪn k ludɪŋɪn dʌvɪdʒʌwʌl z wɪðlaɪv dɪk s pɪriʌn s", + "ref_phonemes": "risɝtʃɝz ʌnd klɪnɪʃʌnz nɑnprɑfʌt ædvʌkʌsi ɔrɡʌnʌzeɪʃʌn lidɝz ʌnd ðʌ brɔdɝ mɛksf kʌmjunʌti ɪnkludɪŋ ɪndʌvɪdʒʌwʌlz wɪð laɪvd ɪkspɪriʌns ", + "duration": 0.6980006694793701, + "PER": 7.6923076923076925, + "score": { + "S": 2, + "D": 1, + "I": 6, + "N": 117 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪn k ludɪŋɪn dʌvɪdʒʌwʌl ʒhuhævɛmsiʌfʌʌn d kɛr ɡɪvɝz soʊðʌwɝkɪŋɡ rupɪn k lud z faɪvɪn dʌvɪdʒʌwʌl z wɪðlaɪv dɪk s pɪriʌn sʌn d wivɪn vaɪtʌdænʌdɪʃʌnʌl t wɛn tisɛvʌnɪn dʌvɪdʒʌwʌl ʒhuʌm pɑr tɪsʌpeɪtɪnðʌvɛriʌs wɛbʌnɑrp lænɪŋɡ rup s", + "ref_phonemes": "ɪnkludɪŋ ɪndʌvɪdʒʌwʌlz hu hæv mɛksf ʌnd kɛrɡɪvɝz ðʌ wɝkɪŋ ɡrup ɪnkludz faɪv ɪndʌvɪdʒʌwʌlz wɪð laɪvd ɪkspɪriʌns ʌnd wiv ɪnvaɪtʌd æn ʌdɪʃʌnʌl twɛntisɛvʌn ɪndʌvɪdʒʌwʌlz tu pɑrtɪsʌpeɪt ɪn ðʌ vɛriʌs wɛbɪnɑr plænɪŋ ɡrups ", + "duration": 1.2580897808074951, + "PER": 7.608695652173914, + "score": { + "S": 5, + "D": 1, + "I": 8, + "N": 184 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðizɪn dʌvɪdʒʌwʌl z sɛl f nɑmʌneɪtʌdθruʌp rɑsɛsðæt wiɪnɪʃieɪtʌdɝliðɪs jɪrʌn d wid laɪk tuθæŋkɔlʌvðɛmɔlʌvðʌɪn dʌvɪdʒʌwʌl zʌvðʌwɝkɪŋɡ rupʌv kaʊn sʌl", + "ref_phonemes": "ðiz ɪndʌvɪdʒʌwʌl ɑr sɛlfnʌmeɪʃʌnt θru ʌ prɑsɛs ðæt wi ɪnɪʃieɪtʌd ɝli ðɪs jɪr wid laɪk tu θæŋk ɔl ʌv ðɛm ɔl ʌv ðʌ ɪndʌvɪdʒʌwʌlz ʌv ðʌ wɝkɪŋ ɡrup ʌv kaʊnsʌl ", + "duration": 0.5389463901519775, + "PER": 8.799999999999999, + "score": { + "S": 4, + "D": 2, + "I": 5, + "N": 125 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "æz wɛlæzðʌɪn dʌvɪdʒʌwʌl z wɪðlaɪv dɪk s pɪriʌn s fɔr pɑr tɪsʌpeɪtɪŋɪnɪnðʌdɪvɛlʌp mʌn tʌvðʌrisɝtʃroʊd mæp soʊðʌs wɛbʌnɝ z biɪŋrʌkɔr dʌdʌn dðʌrɪkɔr dɪŋʌn d t ræn s k rɪp t wɪl bi", + "ref_phonemes": "æz wɛl æz ðʌ ɪndʌvɪdʒʌwʌlz wɪð laɪvd ɪkspɪriʌns fɔr pɑrtɪsʌpeɪtɪŋ ɪn ðʌ dɪvɛlʌpmʌnt ʌv ðʌ risɝtʃ roʊdmæp ðɪs wɛbɪnɑr ɪz biɪŋ rʌkɔrdʌd ʌnd ðʌ rʌkɔrdɪŋ ʌnd trænskrɪpt wɪl bi ", + "duration": 0.8726036548614502, + "PER": 7.6923076923076925, + "score": { + "S": 4, + "D": 2, + "I": 5, + "N": 143 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "poʊs tʌd fɔrðʌpʌb lɪkʌn d wɪl sɛn daʊtænʌnaʊn s mʌn t wɛnðætɪz rɛdiwʌn sðʌrisɝtʃp raɪɔrtizɑraɪdɛn tʌfaɪdʌk rɔsɔlʌvðʌwɛbʌnɝzðʌðʌwɝkɪŋɡ rupʌv kaʊn sʌl wɪl pʊtðɛmɔl tʌɡɛðɝɪn tu", + "ref_phonemes": "poʊstɪd fɔr ðʌ pʌblɪk ʌnd aɪl sɛnd aʊt æn ʌnaʊnsmʌnt wɛn ðæt ɪz rɛdi wʌns ðʌ risɝtʃ praɪɔrʌtiz ɑr aɪdɛntʌfaɪd ʌkrɔs ɔl ʌv ðʌ wɛbnɝʌnz ðʌ wɝkɪŋ ɡrup ʌv kaʊnsʌl wɪl pʊt ðɛm ɔl tʌɡɛðɝ ɪntu ", + "duration": 0.8507750034332275, + "PER": 4.666666666666667, + "score": { + "S": 5, + "D": 1, + "I": 1, + "N": 150 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "faɪnʌl ripɔr t fɔrðʌkaʊn sʌlɪn meɪʌf nɛk s t jɪrɪnðʌmin taɪmæf tɝitʃʌvðiz wɛbʌnɝz", + "ref_phonemes": "ʌ faɪnʌl ripɔrt fɔr ðʌ kaʊnsʌl ɪn meɪ ʌv nɛkst jɪr ɪn ðʌ mintaɪm æftɝ itʃ ʌv ðiz wɛbnɝʌnz ", + "duration": 0.6086018085479736, + "PER": 7.042253521126761, + "score": { + "S": 1, + "D": 3, + "I": 1, + "N": 71 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wiwɪl bipoʊs tɪŋðʌrisɝtʃp raɪɔrʌtizɑnʌk raʊd sɔr sɪŋp læt fɔr m kɔl daɪdiʌs keɪlðæt wiwɪlɔl soʊsɛn daʊtænʌnaʊn s mʌn tʌbaʊt", + "ref_phonemes": "wi wɪl bi poʊstɪŋ ðʌ risɝtʃ praɪɔrʌtiz ɑn ʌ kraʊdsɔrɪŋ plætfɔrm kɔld aɪdisɑkʌl ðæt wi wɪl ɔlsoʊ sɛnd aʊt æn ʌnaʊnsmʌnt ʌbaʊt ", + "duration": 0.6696164608001709, + "PER": 4.854368932038835, + "score": { + "S": 1, + "D": 1, + "I": 3, + "N": 103 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌɪn dʌvɪdʒʌwʌl z f rʌmðʌnɝvʌs sɪs tʌm wɛbʌnɑrp lænɪŋɡ ruphævdʒɔɪn dʌsʌlɔŋwɪððʌkoʊtʃɛrzʌvðʌwɝkɪŋɡ rupʌv kaʊn sʌl dɑk tɝz mɔrinhæn sʌnʌn d sɪn dibeɪt mʌn", + "ref_phonemes": "ðʌ ɪndʌvɪdʒʌwʌlz frʌm ðʌ nɝvʌs sɪstʌm wɛbɪnɑr plænɪŋ ɡrup hæv dʒɔɪnd ʌs ʌlɔŋ wɪð ðʌ koʊhɛrz ʌv ðʌ wɝkɪŋ ɡrup ʌv kaʊnsʌl dɑktɝz mɔrin hænsʌn ʌnd sɪndi beɪtmʌn ", + "duration": 0.825300931930542, + "PER": 2.307692307692308, + "score": { + "S": 2, + "D": 0, + "I": 1, + "N": 130 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪd laɪk turɛkʌɡ naɪzɔlʌvðʌmɛm bɝzʌvðɪs p læntɪŋɡ rup s pʌsɪfɪk lidʒɛrʌd jʌŋɡɝfɔrɔlðʌwɝkðæt juv dʌn tuɔr ɡʌnaɪzðɪs fɝs t wɛbʌnɑr", + "ref_phonemes": "aɪd laɪk tu rɛkʌɡnaɪz ɔl ʌv ðʌ mɛmbɝz ʌv ðɪs plænɪŋ ɡrup spʌsɪfɪkli dʒɑrd jʌŋɡɝ fɔr ɔl ðʌ wɝk ðæt juv dʌn tu ɔrɡʌnaɪz ðɪs fɝst wɛbɪnɑr ", + "duration": 0.6624867916107178, + "PER": 3.7037037037037033, + "score": { + "S": 2, + "D": 0, + "I": 2, + "N": 108 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪdɔl soʊlaɪk tuθæŋkðʌɛnaɪɛn diɛs timɪfaɪkʊðhævðʌnɛk s t s laɪd p liʒhuz wɝk t bɪhaɪn dðʌsin z tuɡɛtɔlʌv", + "ref_phonemes": "aɪd ɔlsoʊ laɪk tu θæŋk ðʌ nɪndz tim ɪf aɪ kʊd hæv ðʌ nɛkst slaɪd pliz huz wɝkt bɪhaɪnd ðʌ sinz tu ɡɛt ɔl ʌv ", + "duration": 0.6831099987030029, + "PER": 9.63855421686747, + "score": { + "S": 3, + "D": 0, + "I": 5, + "N": 83 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪsɔr ɡʌnaɪz dʌn d tuwɝk wɪðɔlʌvðiz wɝkɪŋɡ rup sæz wɛlæzaʊɝhɑliraɪliʌn daʊɝtimætɑrɛleɪhuɑr p rʌvaɪdɪŋðʌlʌdʒɪs tɪk sʌn ðhævhɛl p tʌs", + "ref_phonemes": "ðɪs ɔrɡʌnaɪzd ʌnd tu wɝk wɪð ɔl ʌv ðiz wɝkɪŋ ɡrups æz wɛl æz aʊɝ hɑli raɪli ʌnd aʊɝ tim æt rlɑ hu ɑr prʌvaɪdɪŋ ðʌ lʌdʒɪstɪks ʌnd hæv hɛlpt ʌs ", + "duration": 0.7298989295959473, + "PER": 5.405405405405405, + "score": { + "S": 2, + "D": 1, + "I": 3, + "N": 111 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wɪðɔlvðʌɔr ɡʌnʌzeɪʃʌnʌp tuðɪs pɔɪn t soʊɛv iwʌn z wɛl kʌmæz julɪsʌn tuðʌp rɛzʌn teɪʃʌn z tuɛn tɝjɔr k wɛstʃʌn zɪn tuðʌk juʌneɪ", + "ref_phonemes": "wɪð ɔl ʌv ðʌ ɔrɡʌnʌzeɪʃʌn ʌp tu ðɪs pɔɪnt ɛvriwʌnz wɛlkʌm æz ju lɪsʌn tu ðʌ prɛzʌnteɪʃʌnz tu ɛntɝ jɔr kwɛstʃʌnz ɪntu ðʌ kɑ ", + "duration": 0.7626791000366211, + "PER": 11.11111111111111, + "score": { + "S": 1, + "D": 2, + "I": 8, + "N": 99 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "baɪsʌlɛk tɪŋðʌk juʌnʌbʌtʌnætðʌbɑtʌmʌvðʌs k rinʌn d wiwɪl biæt teɪkɪŋðoʊz k wɛstʃʌn z soʊɪf juhævʌk wɛstʃʌn s pʌsɪfɪk tuʌs pikɝ", + "ref_phonemes": "baɪ sʌlɛktɪŋ ðʌ kɑ bʌtʌn æt ðʌ bɑtʌm ʌv ðʌ skrin wi wɪl bi teɪkɪŋ ðoʊz kwɛstʃʌnz ɪf ju hæv ʌ kwɛstʃʌn spʌsɪfɪk tu ʌ spikɝ ", + "duration": 0.7107248306274414, + "PER": 13.541666666666666, + "score": { + "S": 1, + "D": 0, + "I": 12, + "N": 96 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "p lizɪn dʌkeɪtðætʌn d wil biteɪkɪŋsʌm k wɛstʃʌn s pʌsɪfɪk tuitʃs pikɝraɪtæf tɝitʃʌvðɛr tɔk sɪfðɛr z taɪmʌn dðɛn wil jutʌlaɪzðoʊz k wɛstʃʌn zæz wɛlætðʌvɛriɛn dʌv", + "ref_phonemes": "pliz ɪndʌkeɪt ðæt ʌnd wil bi teɪkɪŋ sʌm kwɛstʃʌnz spʌsɪfɪk tu itʃ spikɝ raɪt æftɝ itʃ ʌv ðɛr tɔks ɪf ðɛrz taɪm ðɛn wil jutʌlaɪz ðoʊz kwɛstʃʌnz æz wɛl æt ðʌ vɛri ɛnd ʌv ", + "duration": 0.7261383533477783, + "PER": 2.9850746268656714, + "score": { + "S": 0, + "D": 1, + "I": 3, + "N": 134 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wɛbʌnɑrfɔrðoʊðʌlɔŋɡɝdɪsaʊɝlɔŋdɪs kʌʃʌn soʊwɪððætɪn t rʌdʌkʃʌnaɪlaɪk tuteɪkðɪsɑpɝtunʌtunʌtituɪn t rʌdusðʌtʃɛr", + "ref_phonemes": "ðʌ wɛbɪnɑr fɔr aʊɝ lɔŋ dɪskʌʃʌn wɪð ðæt ɪntrʌdʌkʃʌn aɪd laɪk tu teɪk ðɪs ɑpɝtunʌti tu ɪntrʌdus ðʌ tʃɛr ʌv ", + "duration": 0.7098805904388428, + "PER": 30.23255813953488, + "score": { + "S": 1, + "D": 5, + "I": 20, + "N": 86 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌnɝvʌs sɪs tʌm wɛbʌnɑr m p læn ɪŋɡ rupʌn dðʌmɑdɝeɪtɝfɔr tudeɪz wɛpʌnɑr m dɑk tɝdʒɛrʌd jʌŋɡɝdʒɛrʌdɪzðʌtɪzʌp rʌfɛsɝɪnðʌdɪpɑr t mʌn tʌv saɪkɑlʌdʒiætðʌjunʌvɝsʌtiʌvælʌbæmʌ", + "ref_phonemes": "ðʌ nɝvʌs sɪstʌm wɛbɪnɑr plænɪŋ ɡrup ʌnd ðʌ mɑdɝeɪtɝ fɔr tʌdeɪz wɛbɪnɑr draɪv dʒɑrd jʌŋɡɝ dʒɑrd ɪz ʌ prʌfɛsɝ ɪn ðʌ dɪpɑrtmʌnt ʌv saɪkɑlʌdʒi æt ðʌ junʌvɝsʌti ʌv ælʌbæmʌ ", + "duration": 0.8169817924499512, + "PER": 13.768115942028986, + "score": { + "S": 10, + "D": 0, + "I": 9, + "N": 138 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "bɝmɪŋhæm wɪðsɛkʌn dɛriʌpɔɪn t mʌn t sɪnænʌsθiziɑlʌdʒiʌn d rumʌtɑlʌdʒihizɔl soʊðʌdɝɛk tɝʌvðʌnɝɪn f lʌmeɪʃʌn peɪnʌn d fʌtiɡ læb rʌtɔriʌn dʌmɛm bɝʌvðʌjuʌbipeɪn kʌlɛk tɪv", + "ref_phonemes": "bɝmɪŋhæm wɪð sɛkʌndɛri ʌpɔɪntmʌnts ɪn ænʌsθiziɑlʌdʒi ʌnd rumʌtɑlʌdʒi hiz ɔlsoʊ ðʌ dɝɛktɝ ʌv ðʌ nʊrʌfʌlænʃmʌnʌn peɪn ʌnd fʌtiɡ læbrʌtɔri ʌnd ʌ mɛmbɝ ʌv ðʌ juv peɪn kʌlɛktɪv ", + "duration": 0.912384033203125, + "PER": 8.96551724137931, + "score": { + "S": 7, + "D": 3, + "I": 3, + "N": 145 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "hiz kɝʌn t lifʌn dʌd baɪɛnaɪeɪtʃʌn dðʌdɪpɑr t mʌn tʌv dɪfɛn s tus tʌdinutɛk nik s fɔr daɪʌɡ noʊsɪŋʌn d t ritɪŋnɛrɪn f lʌmeɪʃʌn wɪððætaɪl tɝnɪtoʊvɝtujudʒɛrʌdθæŋk ju", + "ref_phonemes": "hiz kɝʌntli fʌndʌd baɪ ni ʌnd ðʌ dɪpɑrtmʌnt ʌv dɪfɛns tu stʌdi nu tɛkniks fɔr daɪʌɡnoʊsɪŋ ʌnd tritɪŋ nʊrʌfʌlænʃmʌnʌn wɪð ðæt aɪl tɝn ɪt oʊvɝ tu ju dʒɑrd θæŋk ju ", + "duration": 0.6355912685394287, + "PER": 14.50381679389313, + "score": { + "S": 7, + "D": 3, + "I": 9, + "N": 131 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "θæŋk s fɪɡiʌn daɪæm ɡoʊɪŋtudʒʌs t ɡoʊraɪtɪnʌn dɪn t rʌdus sʌm wʌnɛl sðæt soʊn liduɪŋʌmoʊs tʌv tʌdeɪ", + "ref_phonemes": "dʒɑrd jʌŋɡɝ θæŋks vɪki aɪ æm ɡoʊɪŋ tu dʒʌst ɡoʊ raɪt ɪn ʌnd ɪntrʌdus sʌmwʌn ɛls ðæts wʌt aɪm oʊnli duɪŋ moʊst ʌv tʌdeɪ ", + "duration": 0.6093814373016357, + "PER": 23.157894736842106, + "score": { + "S": 2, + "D": 16, + "I": 4, + "N": 95 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wiv ɡɑtʌlɪs tʌv s pikɝzðæt wɑz rɪliaʊɝwɪʃlɪs tʌn d wiɡɑtaʊɝɪn taɪɝwɪʃlɪs tʌn d soʊwir vɛriʌɡ reɪt fʌlðætɛv riwʌnʌɡ rid tutɔk", + "ref_phonemes": "wiv ɡɑt ʌ lɪst ʌv spikɝz ðæt wɑz rɪli aʊɝ wɪʃ lɪst ʌnd wi ɡɑt aʊɝ ɪntaɪɝ wɪʃ lɪst soʊ wir vɛri ɡreɪtfʌl ðæt ɛvriwʌn ʌɡrid tu tɔk ", + "duration": 0.6886608600616455, + "PER": 3.9603960396039604, + "score": { + "S": 0, + "D": 0, + "I": 4, + "N": 101 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðizɑrðʌpipʌlætðʌtɑpʌvðɛr fil d soʊðɪsɪz ɡoʊŋtubiʌɡʊdʌhæf deɪaɪkʊdʌɡoʊɑnʌn dɑn wɪðæk nɑlɪdʒmʌn t s fɔritʃs pikɝ", + "ref_phonemes": "ðiz ɑr ðʌ pipʌl æt ðʌ tɑp ʌv ðɛr fildz ðɪs ɪz ɡoʊɪŋ tu bi ʌ ɡʊd hæfdi aɪ kʊd ɡoʊ ɑn ʌnd ɑn wɪð æknɑlmʌdɪnts fɔr itʃ spikɝ ", + "duration": 0.6884758472442627, + "PER": 13.978494623655912, + "score": { + "S": 2, + "D": 3, + "I": 8, + "N": 93 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "bʌtɛvɝisɛkʌn daɪsiðʌs poʊlθɪŋzjʊr ɡoʊŋtutɔkʌbaʊt sʌmɛnuvɛrib rif liɪn t rʌdusitʃs pikɝʌn d wir ɡoʊŋtus tɑr t wɪðʌt rɪʃʌfɪʃɝʌn dʃiz ɡoʊɪŋtuɡɪvðʌfɝs t tɔk wɪtʃɪzðʌlaɪv dɪk s pɪriʌn s tɔk", + "ref_phonemes": "bʌt ɛvɝi sɛkʌnd ðɛrz ɔl θɪŋz wir ɡoʊɪŋ tu tɔk ʌbaʊt aɪm ɡoʊɪŋ tu vɛri brifli ɪntrʌdus itʃ spikɝ ʌnd wir ɡoʊɪŋ tu stɑrt wɪð trɪʃʌ fɪʃɝ ʌnd ʃiz ɡoʊɪŋ tu ɡɪv ðʌ fɝst tɔk wɪtʃ ɪz ðʌ laɪvd ɪkspɪriʌns tɔk ", + "duration": 1.0833814144134521, + "PER": 13.924050632911392, + "score": { + "S": 10, + "D": 6, + "I": 6, + "N": 158 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪnsaɪʌn tɪs t s wiwikɑr vʌpæθʌn d wihoʊpðætðætɛn d zɪnʌp leɪs wɛr wikænɪfɛk tɪv limitðʌnid zʌv peɪʃʌn sʌn d soʊwiɑr vɛriɡ reɪt fʌl fɔrðʌɪn dʌvɪdʒʌwʌl zðæt kæn", + "ref_phonemes": "saɪʌntɪsts wi kɑrv ʌ pæθ ʌnd wi hoʊp ðæt ðæt ɛndz ɪn ʌ pleɪs wɛr wi kæn ɪfɛktɪvli mit ðʌ nidz ʌv peɪʃʌnts ʌnd soʊ wir vɛri ɡreɪtfʌl fɔr ðʌ ɪndʌvɪdʒʌwʌlz ðæt kæn ", + "duration": 0.8760693073272705, + "PER": 4.6875, + "score": { + "S": 0, + "D": 1, + "I": 5, + "N": 128 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɑr tɪk jʌleɪtðʌɪk s pɪriʌn sʌvɛmisiɛfɛsæz vɛridɪfʌkʌl tæzðætɪz sʌt rɪʃʌhæzaɪθɪŋkɔl moʊs tθɝdijɪr zʌv laɪv dɪk s pɪriʌn s wɪðɛmisiɛfɛs", + "ref_phonemes": "ɑrtɪkjʌlʌt ðʌ ɪkspɪriʌns ʌv mɛksf æz vɛri dɪfʌkʌlt æz ðæt ɪz trɪʃʌ hæz aɪ θɪŋk ɔlmoʊst θɝdi jɪrz ʌv laɪvd ɪkspɪriʌns wɪð mɛksf ", + "duration": 0.7682247161865234, + "PER": 17.307692307692307, + "score": { + "S": 3, + "D": 2, + "I": 13, + "N": 104 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌn dðɛr wɝrɪlɛn t lʌsɛfɝt sʌvhɝmʌðɝʌn dðʌnudʒɝziɛn isiʌfɛs tʌsoʊsieɪʃʌnʌn dθruðɛrɛfɝt sʃiwɑz daɪʌɡ noʊs tætðʌeɪdʒʌv t wɛl v wɪðɛmisiʌfɛs", + "ref_phonemes": "ʌnd ðɛr wɝ rɪlɛntlɪs ɛfɝts ʌv hɝ mʌðɝ ʌnd ðʌ nu dʒɝzi mɛksf ʌsoʊsieɪʃʌn θru ðɛr ɛfɝts ʃi wɑz daɪʌɡnoʊst æt ðʌ eɪdʒ ʌv twɛlv wɪð mɛksf ", + "duration": 0.6951873302459717, + "PER": 17.75700934579439, + "score": { + "S": 3, + "D": 2, + "I": 14, + "N": 107 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌn dʃimʌtʃleɪtɝkʌn tɪn juz tumitðoʊztʃælʌndʒɪzæʃizʌwaɪf mʌðɝʌv tutʃɪl d rʌnʌn dðʌt rɛʒɝʌv", + "ref_phonemes": "ʌnd ʃi mʌtʃ leɪtɝ kʌntɪnjuz tu mit ðoʊz tʃælʌndʒɪz ʃiz ʌ waɪf mʌðɝ ʌv tu tʃɪldrʌn ʌnd ðʌ trɛʒɝɝ ʌv ", + "duration": 0.6333308219909668, + "PER": 2.5316455696202533, + "score": { + "S": 0, + "D": 1, + "I": 1, + "N": 79 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "nujɔr k sɪtibeɪs tʌp raɪvʌp raɪvʌtɛk wʌtifɝmʌn dʃizɔl soʊʌɡɪf tʌd kʌm junʌkeɪtɝsʌm vɛrimʌtʃlʊkɪŋfɔr wɝd tuhirɪŋhɝp ɝs pɛk tɪvɑnðʌf jutʃɝrisɝtʃɪnɛmisiɛfɛs", + "ref_phonemes": "ʌ nu jɔrk sɪti beɪst praɪvʌt ɛkwʌti fɝm ʌnd ʃiz ɔlsoʊ ʌ ɡɪftʌd kʌmjunʌkeɪtɝ aɪm vɛri mʌtʃ lʊkɪŋ fɔrwɝd tu hirɪŋ hɝ pɝspɛktɪv ɑn ðʌ fjutʃɝ risɝtʃ ɪn mɛksf ", + "duration": 0.742694616317749, + "PER": 13.600000000000001, + "score": { + "S": 3, + "D": 2, + "I": 12, + "N": 125 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "soʊaɪwɪl tɝnɪtoʊvɝtut rɪʃʌfɔrðʌlaɪv dɪk s pɪriʌn s tɔkθæŋk juaɪæm maɪneɪmɪz k rɪpʌpipoʊkɪkɝaɪm fɔr tijɪr zoʊl dɑ", + "ref_phonemes": "aɪ wɪl tɝn ɪt oʊvɝ tu trɪʃʌ fɔr ðʌ laɪvd ɪkspɪriʌns tɔk trɪʃʌ fɪʃɝ θæŋk ju maɪ neɪm ɪz trɪʃʌ fɪʃɝ aɪm fɔrti jɪrz oʊld ", + "duration": 0.7665371894836426, + "PER": 27.956989247311824, + "score": { + "S": 4, + "D": 9, + "I": 13, + "N": 93 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɡʊd mɔr nɪŋɛvɝiwʌnɪt sɝmæmk rɪs tʌfɝk lɪm sʌn", + "ref_phonemes": "noʊt ðʌ kæpʃʌnz ɑr aɪ dʒɛnɝeɪtʌd ʌnd meɪ kʌnteɪn ɛrɝz ɡʊd mɔrnɪŋ ɛvriwʌn ɪts ʌm aɪm krɪstʌfɝ klɛmʌnsʌn ", + "duration": 0.6554243564605713, + "PER": 60.0, + "score": { + "S": 4, + "D": 47, + "I": 0, + "N": 85 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌɡ rub liðæt sɛn tɝfɔr beɪsɪk mɛt ʌpɑlɪk risɝtʃʌn dɪt s maɪɡ reɪt p lɛʒɝʌn ðhʌnɝtuɪn t rʌdusðʌnɛk s t s pikɝɛm p rʌfɛsɝlɔrisɛl sɝf rʌm kʌlʌm biʌjunʌvɝsʌtisoʊ", + "ref_phonemes": "ðʌ ɡrup lidɝ æt sɛntɝ fɔr beɪsɪk mɛtʌbɑlɪk risɝtʃ ʌnd ɪts maɪ ɡreɪt plɛʒɝ ʌnd hʌnɝ tu ɪntrʌdus ðʌ nɛkst spikɝ prʌfɛsɝ lɔri zɛltsɝ frʌm kʌlʌmbiʌ junʌvɝsʌti soʊ ", + "duration": 0.8487632274627686, + "PER": 7.633587786259542, + "score": { + "S": 5, + "D": 3, + "I": 2, + "N": 131 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "lɔriɡ rædʒueɪtɪd f rʌm p rɪn s tʌn junʌvɝsʌtidiðʌpiʌ s tiæt rɑkʌfɛlɝjunʌvɝsʌtidɪd poʊs tɑk s ʌl wɝkæt kɪŋz kɑlɪdʒlʌn dʌnʌn d rɪtɝn d tukʌlʌm biʌjunʌvɝsʌtiʌn ðhɪz", + "ref_phonemes": "lɔri ɡrædʒueɪtɪd frʌm prɪnstʌn junʌvɝsʌti ʌnd dɪd ʌ fɪdz æt rɑkʌfɛlɝ junʌvɝsʌti dɪd poʊstdɑktɝʌl wɝk æt kɪŋz kɑlɪdʒ lʌndʌn ʌnd rɪtɝnd tu kʌlʌmbiʌ junʌvɝsʌti ʌnd ʃiz ", + "duration": 0.7745053768157959, + "PER": 11.510791366906476, + "score": { + "S": 13, + "D": 3, + "I": 0, + "N": 139 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dʌn t rʌmɛn dʌs wɝk fɔr mɪniɪsɑn pɝɪfɝib reɪn k rɔs tɔk mɛkʌnɪzʌm z pɝteɪnɪŋtuɛnɝdʒihoʊmioʊs tʌsʌs fidɪŋbɪheɪv jɝʌn dðɛm risʌn t lilɔriwɑzɔl soʊp rʌmoʊtʌd tufʊl", + "ref_phonemes": "dʌn trʌmɛndʌs wɝk fɔr mɛni jɪrz ɑn pɝɪfɝi breɪn krɔs tɔk mɛkʌnɪzʌmz pɝteɪnɪŋ tu ɛnɝdʒi hoʊmioʊsteɪsʌs fidɪŋ bɪheɪvjɝ ʌnd risʌntli lɔri wɑz ɔlsoʊ prʌmoʊtʌd tu fʊl ", + "duration": 1.4417462348937988, + "PER": 6.61764705882353, + "score": { + "S": 3, + "D": 3, + "I": 3, + "N": 136 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "rʌfɛsɝsoʊðɪsʌlɪtʌl bɪtʌvænʌp deɪt tuðʌɪn t rʌdʌkʃʌnɛmʌn d kʌn ɡ rætʃʌleɪʃʌn zʌn d tudeɪwir ɡaɪnuhirʌbaʊt sʌmɝɪn t rʌs tɪŋwɝkʌn daɪlʊk fɔr ɝd tuhirɪŋʌbaʊt s", + "ref_phonemes": "prʌfɛsɝ soʊ ðɪs lɪtʌl bɪt ʌv æn ʌpdeɪt tu ðʌ ɪntrʌdʌkʃʌn ʌnd kʌŋrætʃʌleɪʃʌnz ʌnd tʌdeɪ wir ɡoʊɪŋ tu hir ʌbaʊt sʌm ɪntrʌstɪŋ wɝk ʌnd aɪ lʊk fɔrwɝd tu hirɪŋ ʌbaʊt ", + "duration": 0.6553902626037598, + "PER": 10.687022900763358, + "score": { + "S": 4, + "D": 4, + "I": 6, + "N": 131 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪm pʌθɛtɪk nɝvʌs sɪs tʌm rɛɡ jʌleɪʃʌnʌv b raʊnaɪdʌpoʊz tɪs jufʌŋkʃʌn soʊp liz lɔriðʌs teɪt sɪz jʊr z soʊaɪd laɪk tuθæŋkðʌɔr ɡʌnaɪzɝz fɔrɪn vaɪtɪŋmi", + "ref_phonemes": "sɪmpʌθɛtɪk nɝvʌs sɪstʌm rɛɡjʌleɪʃʌn ʌv braʊn ædʌpoʊs tɪsju fʌŋkʃʌn soʊ pliz lɔri ðʌ steɪdʒ ɪz jʊrz soʊ aɪd laɪk tu θæŋk ðʌ ɔrɡʌnaɪzɝz fɔr ɪnvaɪtɪŋ mi ", + "duration": 0.7081990242004395, + "PER": 4.838709677419355, + "score": { + "S": 4, + "D": 1, + "I": 1, + "N": 124 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "tudeɪɪt s rɪliʌp lɛʒɝɑm soʊmaɪ læbdʒɛnɝʌlis tʌdiz nɝʌl sɝkʌt sðæt rɛɡ jʌleɪtæpʌtaɪtʌn d mʌtæbʌlɪzʌm fɔrðʌlɑrdʒpɑr t maɪlæbhæz rɪlibɪn foʊkʌsɪŋɑn sɛn t rʌl", + "ref_phonemes": "tʌdeɪ ɪts rɪli ʌ plɛʒɝ soʊ maɪ læb dʒɛnɝʌli stʌdiz nʊrʌl sɝkʌts ðæt rɛɡjʌleɪt æpʌtaɪt ʌnd mʌtæbʌlɪzʌm fɔr ðʌ lɑrdʒ pɑrt maɪ læb hæz rɪli bɪn foʊkʌsɪŋ ɑn sɛntrʌl ", + "duration": 0.7597057819366455, + "PER": 3.787878787878788, + "score": { + "S": 2, + "D": 1, + "I": 2, + "N": 132 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "sɝkʌt saɪm bʌt tudeɪaɪm ɡoʊɪŋtutɔkʌbaʊtʌkʌm p lit linuɛriʌʌv risɝtʃfɔr maɪlæb wir s tɪl dɪvɛlʌpɪŋʌlɑtʌvðʌtul zɑn wɪtʃfoʊkʌsɪzɑnðʌpɝɪfɝisoʊnʌθɪŋɪz", + "ref_phonemes": "sɝkʌts bʌt tʌdeɪ aɪm ɡoʊɪŋ tu tɔk ʌbaʊt ʌ kʌmplitli nu ɛriʌ ʌv risɝtʃ fɔr maɪ læb wir stɪl dɪvɛlʌpɪŋ ʌ lɑt ʌv ðʌ tulz wɪtʃ foʊkʌsɪz ɑn ðʌ pɝɪfɝi soʊ nʌθɪŋ ɪz ", + "duration": 0.6351938247680664, + "PER": 4.8, + "score": { + "S": 1, + "D": 0, + "I": 5, + "N": 125 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌb lɪʃðætaɪm tɔkɪŋʌbaʊt tudeɪɑmʌn d wʌtaɪwɑn t tutɔk tubɪkɔzðɪsɪzʌp rɪtidaɪvɝsɑdiʌn s wɪtʃaɪm supɝɪk saɪtʌdʌbaʊtaɪwɑn t tutɔk tuʌlɪtʌl bɪtʌbaʊt", + "ref_phonemes": "pʌblɪʃt ðæt aɪm tɔkɪŋ ʌbaʊt tʌdeɪ ʌnd wʌt aɪ wɑnt tu tɔk tu ju bɪkɔz ðɪs ɪz ʌ prɪti daɪvɝs ɑdiʌns wɪtʃ aɪm supɝ ɪksaɪtʌd ʌbaʊt aɪ wɑnt tu tɔk tu ju ʌ lɪtʌl bɪt ʌbaʊt ", + "duration": 0.7179651260375977, + "PER": 6.923076923076923, + "score": { + "S": 1, + "D": 6, + "I": 2, + "N": 130 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "waɪɪt s boʊθɪn t rʌs tɪŋʌn d k lɪnɪkʌlirɛlʌvʌn t pʌtɛnʃʌlitus tʌdisɪm pʌθɛtɪk rɛɡ jʌleɪʃʌnʌv mʌtæbʌlɪzʌm foʊkʌsɪŋɑn b rænætʌpoʊs t tɪs juɔr bætʌn daɪm ɡɪŋtuɔl soʊtɔk tujuʌbaʊt", + "ref_phonemes": "waɪ ɪts boʊθ ɪntrʌstɪŋ ʌnd klɪnɪkʌli rɛlʌvʌnt pʌtɛnʃʌli tu stʌdi sɪmpʌθɛtɪk rɛɡjʌleɪʃʌn ʌv mʌtæbʌlɪzʌm foʊkʌsɪŋ ɑn braʊn ædʌpoʊs tɪsju ɔr bæt ʌnd aɪm ɡoʊɪŋ tu ɔlsoʊ tɔk tu ju ʌbaʊt ", + "duration": 0.9842815399169922, + "PER": 3.9735099337748347, + "score": { + "S": 2, + "D": 3, + "I": 1, + "N": 151 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌt raɪʌl zʌn d t rɪb jʌleɪʃʌn zʌn d p rɑɡ rɛsðæt wiv meɪdɪn dɪvɛlʌpɪŋðʌtul zʌn dɛseɪzðætɑræktʃʌwʌlinidʌd tus tʌdiðɪsʌmʌp roʊp riʌt lisoʊaɪdoʊn t nid tuɪn t rʌdusðɪs", + "ref_phonemes": "ðʌ traɪʌlz ʌnd trɪbjʌleɪʃʌnz ʌnd prɑɡrɛs ðæt wiv meɪd ɪn dɪvɛlʌpɪŋ ðʌ tulz ʌnd ʌseɪz ðæt ɑr æktʃʌwʌli nidʌd tu stʌdi ðɪs ʌproʊpriɪtli soʊ aɪ doʊnt nid tu ɪntrʌdus ðɪs ", + "duration": 0.8679783344268799, + "PER": 3.64963503649635, + "score": { + "S": 2, + "D": 1, + "I": 2, + "N": 137 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "laɪdɪnðɪs rum bʌtdʒʌs t tuseɪðætðɪsɪzðʌs tɑr tɪŋpɔɪn tɑmʌn d wʌtɪn t rɪɡ d miʌbaʊtðʌb raʊnætʌpoʊs t tɪs jusɪs tʌm wɑzaʊs tʌdizðæt wɝdʌn juzɪŋʌpɛtɪmʌdʒɪŋwɪðʌ", + "ref_phonemes": "slaɪd ɪn ðɪs rum bʌt dʒʌst tu seɪ ðæt ðɪs ɪz ʌ stɑrtɪŋ pɔɪnt ʌnd wʌt ɪntriɡd mi ʌbaʊt ðʌ braʊn ædʌpoʊs tɪsju sɪstʌm wɑz stʌdiz ðæt wɝ dʌn juzɪŋ pɛt ɪmɪdʒɪŋ wɪð ʌ ", + "duration": 1.0389914512634277, + "PER": 8.59375, + "score": { + "S": 3, + "D": 1, + "I": 7, + "N": 128 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "reɪdioʊleɪbʌl d ɡ lukoʊs t reɪsɝɪndʒɛk tʌdɪn tupeɪʃʌn s wɛrɪt wɑz noʊtʌs tðæt koʊl d z s tɪm jʌleɪt s tɪm jʌleɪtʌd b rænʌtʌpoʊs ttɪsʌɡ lukoʊzʌp teɪkʌn d b rænʌtʌpoʊs tɪs juɪn linɪn dʌvɪdʒʌwʌl zʌn d", + "ref_phonemes": "reɪdioʊ leɪbʌl ɡlukoʊs treɪsɝ ɪndʒɛktʌd ɪntu peɪʃʌnts wʌt wɑz noʊtʌst ðæt koʊld stɪmjʌleɪt stɪmjʌleɪtʌd braʊn ædʌpoʊs tɪsju ɡlukoʊs ʌpteɪk ɪn braʊn ædʌpoʊs tɪsju ɪn lin ɪndʌvɪdʒʌwʌlz ʌnd ", + "duration": 0.8744871616363525, + "PER": 12.5, + "score": { + "S": 10, + "D": 4, + "I": 6, + "N": 160 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪs koʊl d s tɪm jʌleɪtʌd ɡ lusʌk ɡ lukʌsʌp teɪk wɑz dɪk ris tɪn pipʌl wɪðʌmʌɛlʌveɪtʌd biʌmaɪʌnoʊbisʌtiʌn d soʊðɪs taɪpʌv", + "ref_phonemes": "ðɪs koʊl stɪmjʌleɪtʌd ɡlukoʊs ɡlukoʊs ʌpteɪk wɑz dɪkrist ɪn pipʌl wɪð ɛlʌveɪtɪd bimi ʌnd oʊbisʌti ʌnd soʊ ðɪs taɪp ʌv ", + "duration": 0.7209563255310059, + "PER": 16.3265306122449, + "score": { + "S": 6, + "D": 4, + "I": 6, + "N": 98 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɑb zɝveɪʃʌn rɪlisɛtɔfʌhoʊl kɑtʌdʒkɑtʌdʒɪn dʌs t riʌv pipʌlhuwɝlʊkɪŋtujuzʌbætæk tʌveɪtɝzæzθɛrʌp jutɪkæn tibisʌtitɑr ɡʌt sʌn d boʊθðʌk lɪnɪkʌl", + "ref_phonemes": "ɑbzɝveɪʃʌn rɪli sɛt ɔf ʌ hoʊl kɑtʌdʒ kɑtʌdʒ ɪndʌstri ʌv pipʌl hu wɝ lʊkɪŋ tu juz bæt æktʌveɪtɝz æz θɛrʌpjutɪk ænti oʊbisʌti tɑrɡʌts ʌnd boʊθ ðʌ klɪnʌkʌl ", + "duration": 0.9998283386230469, + "PER": 3.1746031746031744, + "score": { + "S": 1, + "D": 2, + "I": 1, + "N": 126 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "eɪtʌʌn dðʌbeɪsɪk risɝtʃdeɪtʌsɔr tʌvʃoʊdoʊvɝtaɪmðætðɪs rileɪʃʌnʃɪpɪz mʌtʃmɔr kɑm p lɛk sʌn daɪθɪŋk rɪliðʌbɛs t weɪʌvhaɪlaɪtɪŋðɪsɪzʌrisʌn t s tʌdiðæt wɑz", + "ref_phonemes": "deɪtʌ ʌnd ðʌ beɪsɪk risɝtʃ deɪtʌ sɔrt ʌv ʃoʊd oʊvɝ taɪm ðæt ðɪs rileɪʃʌnʃɪp ɪz mʌtʃ mɔr kɑmplɛks ʌnd aɪ θɪŋk rɪli ðʌ bɛst weɪ ʌv haɪlaɪtɪŋ ðɪs ɪz ʌ risʌnt stʌdi ðæt wɑz ", + "duration": 0.8344237804412842, + "PER": 0.7407407407407408, + "score": { + "S": 0, + "D": 1, + "I": 0, + "N": 135 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌb lɪʃtʌmlæsʌkʌpʌl jɪr zʌɡoʊnaʊbaɪpɔl koʊʌnæt rɑkʌfɛlɝʌn d wʌθhidɪdɪzðeɪdɪdʌhjudʒrɛt rʌs pɛk tɪv s tʌdiʌvoʊvɝfɪf tiθaʊzʌn d pɛt s kæn z fɔr kæn sɝ", + "ref_phonemes": "pʌblɪʃt læst ʌ kʌpʌl jɪrz ʌɡoʊ naʊ baɪ pɔl koʊʌn æt rɑkʌfɛlɝ ʌnd wʌt hi dɪd ɪz ðeɪ dɪd ʌ hjudʒ rɛnt rɛtrʌspɛktɪv stʌdi ʌv oʊvɝ fɪfti θaʊzʌnd pɛt skænz fɔr kænsɝ ", + "duration": 1.0727267265319824, + "PER": 6.976744186046512, + "score": { + "S": 1, + "D": 6, + "I": 2, + "N": 129 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "eɪʃʌn t sʌn d soʊðiz peɪʃʌn t s wɝnɑt koʊl dɪk s poʊz dðɪs wɑzdʒʌs t beɪs laɪn b raʊnætʌpoʊs t tɪsuæk tɪvʌtiʌn d wʌθhidɪd wɑʒhibeɪsɪkʌlis t rætʌfaɪdɔlʌvðʌpeɪʃʌn sɪn tubæt", + "ref_phonemes": "peɪʃʌnts ʌnd soʊ ðiz peɪʃʌnts wɝ nɑt koʊld ɪkspoʊzd ðɪs ɪz dʒʌst beɪslaɪn braʊn ædʌpoʊs tɪsju æktɪvʌti ʌnd wʌt hi dɪd wɑz hi beɪsɪkli strætʌfaɪd ɔl ʌv ðʌ peɪʃʌnts ɪntu bæd ", + "duration": 0.7666685581207275, + "PER": 7.801418439716312, + "score": { + "S": 5, + "D": 3, + "I": 3, + "N": 141 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɑzʌtɪvɔr bæt nɛɡʌtɪv peɪʃʌn sʌn dðɛnænʌlaɪz dʌhoʊl bʌntʃʌv dɪfɝʌn t mɛtʌbɑlɪk p roʊfaɪl zʌn d wʌθhifaʊn dɪz soʊðʌpeɪʃʌn sðæθhædðʌʌmp rɛzʌn sʌvʌæk tɪv bætʃ", + "ref_phonemes": "pɑzʌtɪv ɔr bæd nɛɡʌtɪv peɪʃʌnts ʌnd ðɛn ænʌlaɪzd ʌ hoʊl bʌntʃ ʌv dɪfɝʌnt mɛtʌbɑlɪk proʊfaɪlz ʌnd wʌt hi faʊnd ɪz soʊ ðʌ peɪʃʌnts ðæt hæd ðʌ prɛzʌns ʌv æktɪv bæt ", + "duration": 1.1155200004577637, + "PER": 7.633587786259542, + "score": { + "S": 3, + "D": 3, + "I": 4, + "N": 131 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃoʊnhirɪn b raʊn soʊðeɪhæd loʊɝɡ lukoʊsɛbeɪs laɪn naʊðɪsɪfɛk tɑn ɡ laɪsimiʌwɑz rɪlip rɪtimɑdʌs t bʌt wɛn", + "ref_phonemes": "ʃoʊn hir ɪn braʊn soʊ ðeɪ hæd loʊɝ ɡlukoʊs æt beɪslaɪn naʊ ðɪs ɪfɛkt ɑn ɡlaɪkeɪmiʌ wɑz rɪli prɪti mɑdʌst bʌt wɛn ", + "duration": 0.6056215763092041, + "PER": 5.4945054945054945, + "score": { + "S": 3, + "D": 2, + "I": 0, + "N": 91 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "s t rætʌfaɪd baɪbiɛmaɪnaʊjukæn siænɪn tɝækʃʌn bɪt winðʌbætʌn dðʌɛlʌveɪtʌd biɛmaɪwɛrætʌmæt loʊbiʌmaɪsʌju", + "ref_phonemes": "hi strætʌfaɪd baɪ bimi naʊ ju kæn si æn ɪntɝækʃʌn bɪtwin ðʌ bæt ʌnd ðʌ ɛlʌveɪtɪd bimi wir æt æt loʊ bimi aɪz ju ", + "duration": 0.7244853973388672, + "PER": 18.181818181818183, + "score": { + "S": 5, + "D": 3, + "I": 8, + "N": 88 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "oʊn lijudoʊn t rɪlisiɛniɪfɛk tʌvðʌb rænʌtʌpoʊs tɪs juæk tɪvʌtibʌtætðʌhaɪbiɛmaɪz naʊjus tɑr t tusiʌp rʌtɛk tɪvɪfɛk tɑn wɛrðoʊzʌmɪn dʌvɪdʒʌwʌl ʒhæd loʊɝɡ laɪsimiʌ", + "ref_phonemes": "oʊnli si ju doʊnt rɪli si ɛni ɪfɛkt ʌv ðʌ braʊn ædʌpoʊs tɪsju æktɪvʌti bʌt æt ðʌ haɪ bimi naʊ ju wɪl stɑrt tu si ʌ prʌtɛktɪv ɪfɛkt wɛr ðoʊz ɪndʌvɪdʒʌwʌlz hæd loʊɝ ɡlaɪsɛmiʌ ", + "duration": 1.0047948360443115, + "PER": 13.66906474820144, + "score": { + "S": 6, + "D": 6, + "I": 7, + "N": 139 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌn dðɪsɔl soʊt ræk tθruðʌp rɛvʌlʌn sʌv taɪudaɪʌbitiz soʊɔl soʊðʌɪn dʌvɪdʒʌwʌl z jukʊd sisʌm mɑdʌs t p rʌtɛkʃʌnʌmʌv ɡ lukoʊzɪn tɑlɝʌn sɪnðʌɪnðʌ", + "ref_phonemes": "ʌnd ðɪs ɔlsoʊ trækt θru ðʌ prɛvʌlʌns ʌv taɪp tu daɪʌbitiz soʊ ɔlsoʊ ðʌ ɪndʌvɪdʒʌwʌlz ju kʊd si sʌm mɑdʌst prʌtɛkʃʌn ʌv ɡlukoʊs ɪntɑlɝʌns ɪn ðʌ ɪn ðʌ ", + "duration": 0.8040943145751953, + "PER": 4.132231404958678, + "score": { + "S": 1, + "D": 2, + "I": 2, + "N": 121 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "eɪʃʌn t sðæθhæd b raʊnætʌpoʊs t tɪʃoʊæk tɪvʌtibʌt jurɪlis tɑr t tusiʌlɑrdʒɪfɛk t saɪzɪnðʌkɑn tɛk s tʌvʌbiʌmaɪzoʊvɝθɝdiʌn d soʊðɪs reɪzʌzðʌpɑsʌbɪlʌtiðæt meɪbiaɪm k lɪr li", + "ref_phonemes": "peɪʃʌnts ðæt hæd braʊn ædʌpoʊs tɪsju æktɪvʌti bʌt ju rɪli stɑrt tu si ʌ lɑrdʒ ɪfɛkt saɪz ɪn ðʌ kɑntɛkst ʌv ʌ bimi ɪz oʊvɝ θɝdi ʌnd soʊ ðɪs reɪzʌz ðʌ pɑsʌbɪlʌti ðæt meɪbi klɪrli ", + "duration": 0.9099242687225342, + "PER": 8.450704225352112, + "score": { + "S": 6, + "D": 1, + "I": 5, + "N": 142 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "b ræt b raʊnætʌpoʊs t tɪsuæk tɪveɪtɝzɑr nɑt sʌfɪʃʌn t tuʌp rɪvɛn toʊbisʌtiæz jukʊd siðɛr wɝp lɛn tiʌv pipʌlhuhæd biʌmaɪzoʊvɝθɝdiðætɪn fæk tɔl soʊhædæk tɪv bæt bʌtɪt meɪ", + "ref_phonemes": "braʊn braʊn ædʌpoʊs tɪsju æktʌveɪtɝz ɑr nɑt sʌfɪʃʌnt tu prɪvɛnt oʊbisʌti æz ju kæn si ðɛr ɑr plɛnti ʌv pipʌl hu hæd bimi oʊvɝ θɝdi ðæt ɪn fækt ɔlsoʊ hæv æktɪv fæt bʌt ɪt meɪ ", + "duration": 1.0343899726867676, + "PER": 12.949640287769784, + "score": { + "S": 11, + "D": 2, + "I": 5, + "N": 139 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "rɪlijus fʌlæzʌtɑr ɡʌt tuɪm p ruv mɛtæbʌlɪzʌmaɪmɪnðʌkɑn tɛk s tʌvoʊbisʌtiʌn d soʊaɪmaɪʃoʊd jubɪfɔrðʌpɛt taɪp", + "ref_phonemes": "bi rɪli jusfʌl æz ʌ tɑrɡʌt tu ɪmpruv mʌtæbʌlɪzʌm ɪn ðʌ kɑntɛkst ʌv oʊbisʌti ʌnd soʊ aɪ ʃoʊd ju bɪfɔr ðʌ pɛt taɪp ", + "duration": 0.9105074405670166, + "PER": 10.0, + "score": { + "S": 1, + "D": 2, + "I": 6, + "N": 90 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "vʌʌp roʊtʃtus tʌdiʌɡ ukʌsʌp teɪkæzʌsɪɡ nʌlʌvæk tɪv bætʌnʌðɝweɪðætʌmpipʌlhæv s tʌdidæk tɪveɪtʌd bætɪnhjumʌn zɪz baɪdɝɛk tʌθɝmɑɡ rʌfibɪkɔz wɛn bæt", + "ref_phonemes": "ʌv ʌproʊtʃ tu stʌdi ɡlukoʊs ʌpteɪk æz ʌ sɪɡnʌl ʌv æktɪv bæt ʌnʌðɝ weɪ ðæt pipʌl hæv stʌdid æktʌveɪtʌd bæt ɪn hjumʌnz ɪz baɪ dɝɛkt θɝmʌɡrʌfi bɪkɔz wɛn bæd ", + "duration": 1.0588557720184326, + "PER": 9.6, + "score": { + "S": 4, + "D": 3, + "I": 5, + "N": 125 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "æk tɪveɪtʌdɪtɔl soʊdʒɛnɝeɪt ʃhitʌn d soʊðɪʃhæzɔl soʊbɪn juz d bʌt waɪlʌmðiz s tʌdiʒhæv bɪn rɪliɪn t rʌs tɪŋʌn dʌɪn t rɪɡɪŋɪnhjumʌn zɪnðʌɛn dɪf jurɪliwɑn tʌ", + "ref_phonemes": "ɪz æktʌveɪtʌd ɪt ɔlsoʊ dʒɛnɝeɪts hit ʌnd soʊ ðɪs ɪz ɔlsoʊ bɪn juzd bʌt waɪl ðiz stʌdiz hæv bɪn rɪli ɪntrʌstɪŋ ʌnd ɪntriɡɪŋ ɪn hjumʌnz ɪn ðʌ ɛnd ɪf ju rɪli wɑnt tu ", + "duration": 0.8380434513092041, + "PER": 10.76923076923077, + "score": { + "S": 7, + "D": 3, + "I": 4, + "N": 130 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "dɝs tæn d wʌt s ɡoʊɪŋɑnʌn d wʌtɪzðʌrileɪʃʌnʃɪp bɪt winʌmoʊbisʌtiʌn d mɛtʌbʌlʌdʌs fʌŋkʃʌnʌn d b raʊnætʌpoʊs t tɪs jujurɪlinid tuɡɛt tuʌmɔr mɛkʌnɪs tɪk mɑdʌl", + "ref_phonemes": "ʌndɝstænd wʌts ɡoʊɪŋ ɑn ʌnd wʌt ɪz ðʌ rileɪʃʌnʃɪp bɪtwin oʊbisʌti ʌnd mɛtʌbɑlɪk dɪsfʌŋkʃʌn ʌnd braʊn ædʌpoʊs tɪsju ju rɪli nid tu ɡɛt tu ʌ mɔr mɛkʌnɪstɪk mɑdʌl ", + "duration": 0.6316015720367432, + "PER": 7.575757575757576, + "score": { + "S": 4, + "D": 3, + "I": 3, + "N": 132 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wɪtʃb rɪŋzʌs turoʊdʌn sʌn d soʊðɪsɪz beɪsɪk liʌsʌmɝiʌv wʌtɪz noʊnʌbaʊtðʌsɝkʌt s rɛɡ jʌleɪtɪŋʌθɝmʌl rɛɡ jʌleɪʃʌnʌn d b rɛnʌtʌpoʊs tɪs uθɝmʌdʒɛnʌsʌsɪn roʊdʌn s", + "ref_phonemes": "wɪtʃ brɪŋz ʌs tu roʊdʌnts ʌnd soʊ ðɪs ɪz beɪsɪkli ʌ sʌmɝi ʌv wʌt ɪz noʊn ʌbaʊt ðʌ sɝkʌts rɛɡjʌleɪtɪŋ θɝmʌl rɛɡjʌleɪʃʌn ʌnd braʊn ædʌpoʊs tɪsju θɝmʌdʒʌnisʌz ɪn roʊdʌnts ", + "duration": 0.7193620204925537, + "PER": 7.913669064748201, + "score": { + "S": 6, + "D": 4, + "I": 1, + "N": 139 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðizɑr p rɪtiwɛl mæp taʊt baɪmɛnidɪfɝʌn t læb zɑmʌn d soʊwʌθhæpʌn zɪzʌθɝmʌl sɛn sɝiɪn fɝmeɪʃʌn soʊboʊθhitʌn d wɔr mɪn fɝmeɪʃʌnɪz rileɪdʌn d p rɑsɛs tɪnðʌ", + "ref_phonemes": "soʊ ðiz ɑr prɪti wɛl mæpt aʊt baɪ mɛni dɪfɝʌnt læbz ʌnd soʊ wʌt hæpʌnz ɪz θɝmʌl sɛnsɝi ɪnfɝmeɪʃʌn soʊ boʊθ hit ʌnd wɔrm ɪnfɝmeɪʃʌn ɪz rileɪd ʌnd prɑsɛst ɪn ðʌ ", + "duration": 1.133971929550171, + "PER": 5.46875, + "score": { + "S": 1, + "D": 3, + "I": 3, + "N": 128 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "haɪpʌθælʌmʌsðɪs sðiz sɪɡ nʌl zðɛn ɡɛt rileɪdɪn tuðʌɑmhaɪn d p reɪnʌn daʊtθruðʌmɪn tɝmidiʌt lætɝʌl kɑlʌm", + "ref_phonemes": "haɪpʌθɑlʌzʌm ðɪs ðiz sɪɡnʌlz ðɛn ɡɛt rileɪd ɪntu ðʌ hɪndbreɪn ʌnd aʊt θru ðʌ ɪntɝmidiɪt lætɝʌl kɑlʌm ", + "duration": 0.7116918563842773, + "PER": 11.904761904761903, + "score": { + "S": 5, + "D": 0, + "I": 5, + "N": 84 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðʌs paɪnʌl kɔr dʌn dɪn tuðʌsɪm pʌθɛtɪk ɡæŋɡ liʌn wɪtʃfaɪnʌlijuhævðʌsɪm pʌθɛtɪk nɝrʌn zðætðɛn p rʌdʒɛk taʊt tub raʊnætʌpoʊs t tɪs junaʊðʌvæs t mʌdʒɔrʌtiʌv risɝtʃsɛt s", + "ref_phonemes": "ʌv ðʌ spaɪnʌl kɔrd ʌnd ɪntu ðʌ sɪmpʌθɛtɪk ɡæŋɡlʌn wɪtʃ faɪnʌli ju hæv ðʌ sɪmpʌθɛtɪk nʊrɑnz ðæt ðɛn prɑdʒɛkt aʊt tu braʊn ædʌpoʊs tɪsju naʊ ðʌ væst mʌdʒɔrʌti ʌv risɝtʃ ðæts ", + "duration": 0.7637672424316406, + "PER": 7.092198581560284, + "score": { + "S": 6, + "D": 2, + "I": 2, + "N": 141 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪndʌnɪnθɝmʌrɛɡ jʌlʌtɔrisɝkʌt ʃhæziðɝfoʊkʌs tɑnðʌsɝkʌt sɪnðʌb reɪn wɪtʃhæv bɪn naʊðʌpɑp jʌleɪʃʌn zɪn sʌm pɑp jʌleɪʃʌn z rɛɡ jʌleɪtɪŋɑnθɝmʌl kʌn t roʊlɔr", + "ref_phonemes": "bɪn dʌn ɪn θɝmoʊ rɛɡjʌlʌtɔri sɝkʌts hæz iðɝ foʊkʌst ɑn ðʌ sɝkʌts ɪn ðʌ breɪn wɪtʃ hæv bɪn rɪtʌn naʊ ðʌ pɑpjʌleɪʃʌnz ɪn sʌm pɑpjʌleɪʃʌnz rɛɡjʌleɪtɪŋ θɝmʌl kʌntroʊl ɑr ", + "duration": 0.7406878471374512, + "PER": 8.75912408759124, + "score": { + "S": 3, + "D": 7, + "I": 2, + "N": 137 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪlik waɪt naɪs lidɪfaɪn dɔrðeɪv foʊkʌs taʊtɪnðʌb rænætʌpoʊs tɪsudipoʊɪt sɛl fʌn d wʌt maɪɡ rupɪz foʊkʌsɪŋɑnɪz", + "ref_phonemes": "rɪli kwaɪt naɪsli dɪfaɪnd ɔr ðeɪ foʊkʌst aʊt ɪn ðʌ braʊn ædʌpoʊs tɪsju dipoʊ ɪtsɛlf ʌnd wʌt maɪ ɡrup ɪz foʊkʌsɪŋ ɑn ɪz ", + "duration": 0.7072248458862305, + "PER": 6.25, + "score": { + "S": 2, + "D": 3, + "I": 1, + "N": 96 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ræðɝðʌp rʌdʒɛkʃʌn f rʌmðʌsɪm pʌθɛtɪkɡæŋɡliʌnaʊt tub raʊnætʌpoʊs t tɪsuʌn d soʊðɛr d bɪn bɪkɔzʌvðɪs lɪŋk bɪt win biɛmaɪɛlʌveɪtʌd biɛmaɪdaɪbitizɪm pɛr d b raʊnætʌpoʊs t", + "ref_phonemes": "ræðɝ ðʌ prʌdʒɛkʃʌn frʌm ðʌ sɪmpʌθɛtɪk ɡæŋɡlʌn aʊt tu braʊn ædʌpoʊs tɪsju ʌnd soʊ ðɛr hæv bɪn bɪkɔz ʌv ðɪs lɪŋk bɪtwin bimi ɛlʌveɪtɪd bimi daɪʌbitiz ɪmpɛrd braʊn ædʌpoʊs ", + "duration": 1.0613641738891602, + "PER": 12.142857142857142, + "score": { + "S": 6, + "D": 4, + "I": 7, + "N": 140 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʃufʌŋkʃʌnɪŋsoʊðɛrv bɪn mɛniɡ rup sðæθhæv juz dænʌmʌl mɑdʌl z tut raɪtuʌn dɝs tæn d wʌtɪzðʌlɪŋk bɪt winɛlʌveɪtʌd biɛmaɪʌn dɑmɪm pɛr dæɪm pɛr dʌb rɛn", + "ref_phonemes": "tɪsju fʌŋkʃʌnɪŋ soʊ ðɛr hæv bɪn mɛni ɡrups ðæt hæv juzd ænʌmʌl mɑdʌlz tu traɪ tu ʌndɝstænd wʌt ɪz ðʌ lɪŋk bɪtwin ɛlʌveɪtɪd bimi ʌnd ɪmpɛrd æt ɪmpɛrd braʊn ", + "duration": 0.9303829669952393, + "PER": 13.492063492063492, + "score": { + "S": 5, + "D": 7, + "I": 5, + "N": 126 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌpoʊs tɪsufʌŋkʃʌnʌn d beɪsɪk liɑm dɪpɛn dɪŋɑn wɛr julʊkðɛrhæv bɪn mɛnidɪfɝʌn t sɛl taɪp sʌn d mɛkʌnɪzʌm zɪm p lʌkeɪtʌdʌn d soʊðʌb rɛnætʌpoʊs tɪs juɪzʌ", + "ref_phonemes": "ædʌpoʊs tɪsju fʌŋkʃʌn ʌnd beɪsɪkli dɪpɛndɪŋ ɑn wɛr ju lʊk ðɛr hæv bɪn mɛni dɪfɝʌnt sɛl taɪps ʌnd mɛkʌnɪzʌmz ɪmplɪkeɪtɪd ʌnd soʊ ðʌ braʊn ædʌpoʊs tɪsju ɪz ʌ ", + "duration": 0.8274374008178711, + "PER": 7.8125, + "score": { + "S": 4, + "D": 4, + "I": 2, + "N": 128 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "wɛl kʌm tuðʌhjubɝmʌn læppɑd kæs t wɛr widɪs kʌs saɪʌn sʌn d saɪʌn s beɪs tul z fɔrɛv rideɪlaɪfaɪmeɪdʒɔrhjubɝmʌnʌn daɪmʌp rʌfɛsɝʌv nʊrʌbɑldʒi", + "ref_phonemes": "wɛlkʌm tu ðʌ hubɝmʌn læb poʊdkæst wɛr wi dɪskʌs saɪʌns ʌnd saɪʌnsbeɪst tulz fɔr ɛvrideɪ laɪf aɪm ændru hubɝmʌn ʌnd aɪm ʌ prʌfɛsɝ ʌv nʊroʊbaɪɑlʌdʒi ", + "duration": 0.6731712818145752, + "PER": 13.114754098360656, + "score": { + "S": 5, + "D": 7, + "I": 4, + "N": 122 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɑp tʌmɑlʌdʒiæt s tæm fɝd s kulʌv mɛdʌsʌn tudeɪwiɑr dɪs kʌsɪŋðʌɪm jun sɪs tʌmʌn d wiɑrɔl soʊdɪs kʌsɪŋðʌnɝvʌs sɪs tʌm", + "ref_phonemes": "ʌnd ɑpθʌmɑlʌdʒi æt stænfɝd skul ʌv mɛdʌsʌn tʌdeɪ wi ɑr dɪskʌsɪŋ ðʌ ɪmjun sɪstʌm ʌnd wi ɑr ɔlsoʊ dɪskʌsɪŋ ðʌ nɝvʌs sɪstʌm ", + "duration": 0.6602332592010498, + "PER": 6.0606060606060606, + "score": { + "S": 3, + "D": 3, + "I": 0, + "N": 99 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪtʃɪzðʌb reɪn s paɪnʌl kɔr dʌn dðʌkʌnɛkʃʌn zʌvðʌb reɪnʌn d s paɪnʌl kɔr d wɪðɔlðʌɔr ɡʌn zʌvðʌbɑdiwiɑrɔl soʊɡoʊɪŋtudɪs kʌʃhaʊðʌnɝvʌs sɪs tʌm kæn bi", + "ref_phonemes": "wɪtʃ ɪz ðʌ breɪn spaɪnʌl kɔrd ʌnd ðʌ kʌnɛkʃʌnz ʌv ðʌ breɪn ʌnd spaɪnʌl kɔrd wɪð ɔl ðʌ ɔrɡʌnz ʌv ðʌ bɑdi wi ɑr ɔlsoʊ ɡoʊɪŋ tu dɪskʌs haʊ ðʌ nɝvʌs sɪstʌm kæn bi ", + "duration": 0.6163160800933838, + "PER": 1.6, + "score": { + "S": 1, + "D": 1, + "I": 0, + "N": 125 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "uz d tuæk tɪveɪtʌn d kʌn t roʊlðʌɪm jun sɪs tʌm naʊʌbaʊt tɛn t wɛn tijɪr zʌɡoʊɪf sʌm bɑdisɛdðætðʌmaɪn d kʊd kʌn t roʊl", + "ref_phonemes": "juzd tu æktʌveɪt ʌnd kʌntroʊl ðʌ ɪmjun sɪstʌm naʊ ʌbaʊt tɛn twɛnti jɪrz ʌɡoʊ ɪf sʌmbɑdi sɛd ðæt ðʌ maɪnd kʊd kʌntroʊl ", + "duration": 0.6416995525360107, + "PER": 2.083333333333333, + "score": { + "S": 1, + "D": 1, + "I": 0, + "N": 96 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪm jun sɪs tʌmɪt p rɑbʌb liɡɛt læf taʊtʌv moʊs tækʌdɛmɪk kɑn fɝʌn sɪzʌn d sɝtʌn liðʌwɝk wʊdʌn t bipʌb lɪʃtɪn k wɑlʌtidʒɝnʌl z bʌt naʊʌdeɪzðɛrɑr dʌzʌn z", + "ref_phonemes": "ðʌ ɪmjun sɪstʌm ðeɪd prɑbʌbli ɡɛt læft aʊt ʌv moʊst ækʌdɛmɪk kɑnfɝʌnsʌz ʌnd sɝtʌnli ðʌ wɝk wʊdʌnt bi pʌblɪʃt ɪn kwɑlʌti dʒɝnʌlz bʌt naʊʌdeɪz ðɛr ɑr dʌzʌnz ", + "duration": 0.519967794418335, + "PER": 4.6875, + "score": { + "S": 2, + "D": 4, + "I": 0, + "N": 128 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "nɑθhʌn d rʌd zʌv k wɑlʌtipʊr riv jud s tʌdizɑnhaʊðʌmaɪn dʌn ðhaʊðʌnɝvʌs sɪs tʌm kæn kʌn t roʊlæk tɪveɪʃʌnʌvðʌɪm jun sɪs tʌm", + "ref_phonemes": "ɪf nɑt hʌndrʌdz ʌv kwɑlʌti pɪrʌvɝid stʌdiz ɑn haʊ ðʌ maɪnd ʌnd haʊ ðʌ nɝvʌs sɪstʌm kæn kʌntroʊl æktʌveɪʃʌn ʌv ðʌ ɪmjun sɪstʌm ", + "duration": 0.6744656562805176, + "PER": 9.70873786407767, + "score": { + "S": 7, + "D": 2, + "I": 1, + "N": 103 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪzʌwʌn dɝfʌl ɡ roʊɪŋbɑdiʌv risɝtʃʌn ddʒʌs t tuɡɪv juʌhɪn tʌv wɛr wiɑrhɛdʌd wɪððɪsdʒʌs tðɪs læs t wikðɛr wɑzʌpeɪpɝpʌb lɪʃtɪn neɪtʃɝ", + "ref_phonemes": "ðɪs ɪz ʌ wʌndɝfʌl ɡroʊɪŋ bɑdi ʌv risɝtʃ ʌnd dʒʌst tu ɡɪv ju ʌ hɪnt ʌv wɛr wi ɑr hɛdʌd wɪð ðɪs dʒʌst ðɪs læst wik ðɛr wɑz ʌ peɪpɝ pʌblɪʃt ɪn neɪtʃɝ ", + "duration": 0.7575032711029053, + "PER": 2.631578947368421, + "score": { + "S": 0, + "D": 3, + "I": 0, + "N": 114 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪtʃɪzðʌeɪpɛk sdʒɝnʌl fɔr saɪʌn tɪfɪk pʌb lɪʃɪŋp rɪmɪrdʒɝnʌlɪk s t rim lis t rɪndʒʌn tʌpeɪpɝpʌb lɪʃtɪn neɪtʃɝ", + "ref_phonemes": "wɪtʃ ɪz ðʌ eɪpɛks dʒɝnʌl fɔr saɪʌntɪfɪk pʌblɪʃɪŋ prɛmɪr dʒɝnʌl ɪkstrimli strɪndʒʌnt ʌ peɪpɝ pʌblɪʃt ɪn neɪtʃɝ ", + "duration": 0.5118510723114014, + "PER": 2.1505376344086025, + "score": { + "S": 1, + "D": 1, + "I": 0, + "N": 93 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "rʌmtʃufumɑz læbæθhɑr vɝd mɛdʌkʌl s kulɪk s p lɔr ðhaʊækʌpʌŋktʃɝkæn rʌdusɪn f lʌmeɪʃʌnɪnðʌbɑdi", + "ref_phonemes": "frʌm kjufu mɑz læb æt hɑrvɝd mɛdʌkʌl skul ɪksplɔrd haʊ ækjupʌŋktʃɝ kæn rʌdus ɪnflʌmeɪʃʌn ɪn ðʌ bɑdi ", + "duration": 0.623298168182373, + "PER": 8.433734939759036, + "score": { + "S": 5, + "D": 2, + "I": 0, + "N": 83 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ʌn daɪwɪl dɪs k raɪbðʌs tʌdiɪnʌbɪt mɔr dɪteɪl leɪtɝbʌt wʌtðeɪdɪs kʌvɝd wɑzðæt baɪs tɪm jʌleɪtɪŋðʌbɑdiɪn pɝtɪk jʌlɝweɪzæt pɝtɪk jʌlɝsaɪt sɑnðʌbɑdi", + "ref_phonemes": "ʌnd aɪ wɪl dɪskraɪb ðɪs stʌdi ɪn ʌ bɪt mɔr dɪteɪl leɪtɝ bʌt wʌt ðeɪ dɪskʌvɝd wɑz ðæt baɪ stɪmjʌleɪtɪŋ ðʌ bɑdi ɪn pɝtɪkjʌlɝ weɪz æt pɝtɪkjʌlɝ saɪts ɑn ðʌ bɑdi ", + "duration": 0.7624337673187256, + "PER": 1.574803149606299, + "score": { + "S": 1, + "D": 1, + "I": 0, + "N": 127 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðeɪwɝeɪbʌl tulɪbɝeɪt sɝtʌn sɛl zʌn d mɑlʌk jul zðætɛnhæn s tðʌfʌŋkʃʌnʌvðʌɪm jun sɪs tʌmʌn d pʌtɛnʃʌlikæn bijuz d tukɑm bæt", + "ref_phonemes": "ðeɪ wɝ eɪbʌl tu lɪbɝeɪt sɝtʌn sɛlz ʌnd mɑlʌkjulz ðæt ɛnhæns ðʌ fʌŋkʃʌn ʌv ðʌ ɪmjun sɪstʌm ʌnd pʌtɛnʃʌli kæn bi juzd tu kʌmbæt ", + "duration": 0.5106832981109619, + "PER": 1.9607843137254901, + "score": { + "S": 1, + "D": 0, + "I": 1, + "N": 102 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "f ʌn t taɪp sʌvɪn fɛkʃʌnʌn ddʒʌs t tuɡɪv juʌnʌðɝlɪtʌlhɪn tðeɪfaʊn dðætʌpɝtɪk jʌlɝtaɪpʌvɔr ɡʌn tɪs jukɔl d fæʃʌsʌmʌv jumeɪhævhɝdʌv fæʃʌ", + "ref_phonemes": "dɪfɝʌnt taɪps ʌv ɪnfɛkʃʌn ʌnd dʒʌst tu ɡɪv ju ʌnʌðɝ lɪtʌl hɪnt ðeɪ faʊnd ðæt ʌ pɝtɪkjʌlɝ taɪp ʌv ɔrɡʌn tɪsju kɔld fɑʃiʌ sʌm ʌv ju meɪ hæv hɝd ʌv fɑʃiʌ ", + "duration": 0.6843860149383545, + "PER": 5.833333333333333, + "score": { + "S": 2, + "D": 5, + "I": 0, + "N": 120 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "æʃʌsɝaʊn d zaʊɝmʌsʌl zdʒʌs t tulʊkætɪt jumaɪtθɪŋkɪt sʌkaɪn dʌv jus lʌs tɪs juɪt sɔr tʌv laɪkʌdɛn s bæɡðʌ", + "ref_phonemes": "fɑʃiʌ sɝaʊndz aʊɝ mʌsʌlz dʒʌst tu lʊk æt ɪt ju maɪt θɪŋk ɪts ʌ kaɪnd ʌv juslʌs tɪsju ɪts sɔrt ʌv laɪk ʌ dɛns bæɡ ", + "duration": 0.5258910655975342, + "PER": 6.8181818181818175, + "score": { + "S": 1, + "D": 3, + "I": 2, + "N": 88 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪn wɪtʃðʌmʌsʌl zɑr kʌn teɪn d wɛlɪt tɝn zaʊtðætðoʊz dɛn s bæɡ zɑr mʌtʃs mɑr tɝðæn wiθɔtðeɪdoʊn θhævʌmaɪn dʌvðɛroʊn", + "ref_phonemes": "ɪn wɪtʃ ðʌ mʌsʌlz ɑr kʌnteɪnd wɛl ɪt tɝnz aʊt ðæt ðoʊz dɛns bæɡz ɑr mʌtʃ smɑrtɝ ðæn wi θɔt ðeɪ doʊnt hæv ʌ maɪnd ʌv ðɛr oʊn ", + "duration": 0.481795072555542, + "PER": 1.0416666666666665, + "score": { + "S": 1, + "D": 0, + "I": 0, + "N": 96 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "baɪs tɪm jʌleɪtɪŋðʌfæʃʌɪnʌpɝtɪk jʌlɝloʊkeɪʃʌnɑnðʌbɑdiðɛr zʌpæθweɪlidɪŋaʊtʌvðæt fæʃʌdɝɛk t lituænɔr ɡʌn kɔl dðʌɪd rinʌmʌdʌlʌ", + "ref_phonemes": "bʌt baɪ stɪmjʌleɪtɪŋ ðʌ fɑʃiʌ ɪn ʌ pɝtɪkjʌlɝ loʊkeɪʃʌn ɑn ðʌ bɑdi ðɛrz ʌ pæθweɪ lidɪŋ aʊt ʌv ðæt fɑʃiʌ dɝɛktli tu æn ɔrɡʌn kɔld ðʌ ʌdrinʌl mɪdʌlʌ ", + "duration": 0.7554316520690918, + "PER": 8.47457627118644, + "score": { + "S": 4, + "D": 6, + "I": 0, + "N": 118 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "aɪlɪk s p leɪn wʌtɔlðɪs min zðæt kʊd lɪbɝeɪt pɝtɪk jʌlɝkɛmʌkʌl zðæθhædʌpoʊtʌn tæn tiɪn f læmʌtɔriɪfɛk twʌ wʌt wibeɪsɪkʌliseɪɪŋ", + "ref_phonemes": "aɪl ɪkspleɪn wʌt ɔl ðɪs minz ðæt kʊd lɪbɝeɪt pɝtɪkjʌlɝ kɛmɪkʌlz ðæt hæd ʌ poʊtʌnt æntɪfʌndlʌmɪti ɪfɛkt soʊ wʌt wir beɪsɪkli seɪɪŋ ", + "duration": 0.5529844760894775, + "PER": 13.88888888888889, + "score": { + "S": 7, + "D": 4, + "I": 4, + "N": 108 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ðætðʌnɝvʌs sɪs tʌmæk t sæzʌsɛtʌvhaɪweɪz bɪt winðʌdɪfɝʌn t tɪs juzʌv jɔr bɑdikɔlɪŋɪn tuækʃʌnðʌɪm jun sɪs tʌm", + "ref_phonemes": "ɪz ðæt ðʌ nɝvʌs sɪstʌm ækts æz ʌ sɛt ʌv haɪweɪz bɪtwin ðʌ dɪfɝʌnt tɪsjuz ʌv jɔr bɑdi kɔlɪŋ ɪntu ækʃʌn ðʌ ɪmjun sɪstʌm ", + "duration": 0.569286584854126, + "PER": 2.127659574468085, + "score": { + "S": 0, + "D": 2, + "I": 0, + "N": 94 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "lɪbɝeɪtɪŋpɝtɪk jʌlɝmɑlʌk jul zðæt kæn rʌdusɪn f lʌmeɪʃʌnʌn d lɛd tufæs tɝhilɪŋʌn daɪwɪlɪk s p leɪnhaʊɔlvðæt wɝk s", + "ref_phonemes": "lɪbɝeɪtɪŋ pɝtɪkjʌlɝ mɑlʌkjulz ðæt kæn rʌdus ɪnflʌmeɪʃʌn ʌnd lɛd tu fæstɝ hilɪŋ ʌnd aɪ wɪl ɪkspleɪn haʊ ɔl ʌv ðæt wɝks ", + "duration": 0.6461203098297119, + "PER": 1.0309278350515463, + "score": { + "S": 0, + "D": 1, + "I": 0, + "N": 97 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "z wɛlæz sʌmʌðɝnɑnækʌpʌŋktʃɝmɛθʌd z fɔræk tɪveɪtɪŋʌn dɛnhæn sɪŋðʌfʌŋkʃʌnʌvðʌm jun sɪs tʌm", + "ref_phonemes": "æz wɛl æz sʌm ʌðɝ nɑnʌkʌnstwɛk mɛθʌdz fɔr æktʌveɪtɪŋ ʌnd ɛnhænsɪŋ ðʌ fʌŋkʃʌn ʌv ðʌ ɪmjun sɪstʌm ", + "duration": 0.47069787979125977, + "PER": 13.924050632911392, + "score": { + "S": 6, + "D": 3, + "I": 2, + "N": 79 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "soʊtudeɪwir ɡoʊŋtubitɔkɪŋɔlʌbaʊθhilɪŋwɪððʌmaɪn dɪnʌkʌm p lit linɑn mɪs tɪkʌl nɑnæb s t ræk t sɛn s", + "ref_phonemes": "soʊ tʌdeɪ wir ɡoʊɪŋ tu bi tɔkɪŋ ɔl ʌbaʊt hilɪŋ wɪð ðʌ maɪnd ɪn ʌ kʌmplitli nɑnmɪstʌkʌl nɑnʌbæstrækt sɛns ", + "duration": 0.6115849018096924, + "PER": 6.976744186046512, + "score": { + "S": 4, + "D": 2, + "I": 0, + "N": 86 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɪfɔr wibɪɡɪnaɪd laɪk tuɛm fʌsaɪzðætðɪs pɔd kæs tɪz sɛpɝɪt f rʌm maɪtitʃɪŋʌn d risɝtʃroʊl zæt s tæm fɝdɪtɪʒhaʊɛvɝpɑr tʌv maɪdɪzaɪɝʌn dɛfɝt", + "ref_phonemes": "bɪfɔr wi bɪɡɪn aɪd laɪk tu ɛmfʌsaɪz ðæt ðɪs poʊdkæst ɪz sɛpɝɪt frʌm maɪ titʃɪŋ ʌnd risɝtʃ roʊlz æt stænfɝd ɪt ɪz haʊɛvɝ pɑrt ʌv maɪ dɪzaɪɝ ʌnd ɛfɝt ", + "duration": 0.5911626815795898, + "PER": 4.201680672268908, + "score": { + "S": 3, + "D": 2, + "I": 0, + "N": 119 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "b rɪŋzɪroʊks t tukʌn sumɝɪn fɝmeɪʃʌnʌbaʊt saɪʌn sʌn d saɪʌn s rɪleɪtɪd tul z tuðʌdʒɛnɝʌl pʌb lɪkɪn kipɪŋwɪððætθim", + "ref_phonemes": "tu brɪŋ zɪroʊ kɑst tu kʌnsumɝ ɪnfɝmeɪʃʌn ʌbaʊt saɪʌns ʌnd saɪʌnsɛrʌleɪtɪd tulz tu ðʌ dʒɛnɝʌl pʌblɪk ɪn kipɪŋ wɪð ðæt θim ", + "duration": 0.5159361362457275, + "PER": 5.0, + "score": { + "S": 1, + "D": 4, + "I": 0, + "N": 100 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "laɪk tuθæŋkðʌs pɑn sɝzʌv tudeɪz pɔd kæs taʊɝfɝs t s pɑn sɝɪz roʊkʌroʊkʌmeɪk saɪɡ læsʌzʌn d sʌn ɡ læsɪz", + "ref_phonemes": "aɪd laɪk tu θæŋk ðʌ spɑnsɝz ʌv tʌdeɪz poʊdkæst aʊɝ fɝst spɑnsɝ ɪz roʊkʌ roʊkʌ meɪks aɪɡlæsʌz ʌnd sʌŋlæsɪz ", + "duration": 0.5679464340209961, + "PER": 9.195402298850574, + "score": { + "S": 3, + "D": 4, + "I": 1, + "N": 87 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ætɑrʌvæb sʌlut sʊpɝb k wɑlʌtiaɪv s pɛn tʌlaɪf taɪm wɝkɪŋɑnðʌvɪʒʌwʌl sɪs tʌmʌn daɪkæn tɛl juðæt wʌnʌvðʌmeɪdʒɝɪʃuz", + "ref_phonemes": "ðæt ɑr æbsʌlut sʌbɝb kwɑlʌti aɪv spɛnt ʌ laɪftaɪm wɝkɪŋ ɑn ðʌ vɪʒʌwʌl sɪstʌm ʌnd aɪ kæn tɛl ju ðæt wʌn ʌv ðʌ meɪdʒɝ ɪʃuz ", + "duration": 0.5675010681152344, + "PER": 5.208333333333334, + "score": { + "S": 2, + "D": 1, + "I": 2, + "N": 96 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "ɝvɪʒʌwʌl sɪs tʌmhæz tukʌn tɛn d wɪðɪʒhaʊtusiθɪŋz k lɪr liɪn b raɪtɪn vaɪrʌn mʌn t sɔr dɪmɝɪn vaɪrʌn mʌn t sɛt sɛtɝʌ", + "ref_phonemes": "aʊɝ vɪʒʌwʌl sɪstʌm hæz tu kʌntɛnd wɪð ɪz haʊ tu si θɪŋz klɪrli ɪn braɪt ɪnvaɪrʌnmʌnts ɔr dɪmɝ ɪnvaɪrʌnmʌnts ɛt sɛtɝʌ ", + "duration": 0.6079168319702148, + "PER": 3.125, + "score": { + "S": 1, + "D": 2, + "I": 0, + "N": 96 + } + }, + { + "model": "HuBERT fine-tuned", + "phonemes": "roʊkoʊk lɪr liʌn dɝs tæn d zðʌsaɪn sʌvðʌvɪʒʌwʌl sɪs tʌm bɪkɔz wʌnθɪŋðæt s wʌn dɝfʌlʌbaʊtðɛr sʌn ɡ læsʌzɪzðæt jukæn biɪnʌvɛrib raɪtɪn vaɪrʌn mʌn t", + "ref_phonemes": "roʊkʌ klɪrli ʌndɝstændz ðʌ saɪʌns ʌv ðʌ vɪʒʌwʌl sɪstʌm bɪkɔz wʌn θɪŋ ðæts wʌndɝfʌl ʌbaʊt ðɛr sʌŋlæsɪz ɪz ðæt ju kæn bi ɪn ʌ vɛri braɪt ɪnvaɪrʌnmʌnt ", + "duration": 0.5231845378875732, + "PER": 4.958677685950414, + "score": { + "S": 3, + "D": 1, + "I": 2, + "N": 121 + } + } +] \ No newline at end of file