Newer
Older
" <td>tak</td>\n",
" <td>ADV</td>\n",
" <td>tak</td>\n",
" <td>ADV</td>\n",
" <td>samo</td>\n",
" <td>NUM</td>\n",
" <td>czterdziestu</td>\n",
" <td>VERB</td>\n",
" <td>dziękuję</td>\n",
" <td>NUM</td>\n",
" <td>trzech</td>\n",
" <td>NOUN</td>\n",
" <td>panu</td>\n",
" <td>NOUN</td>\n",
" <td>stoczni</td>\n",
" </tr>\n",
" <tr>\n",
" <th>47</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>NOUN</td>\n",
" <td>dobranoc</td>\n",
" <td>kieruje</td>\n",
" </tr>\n",
" <tr>\n",
" <th>48</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>proszę</td>\n",
" <td>PRON</td>\n",
" <td>się</td>\n",
" <td>ADV</td>\n",
" <td>bardzo</td>\n",
" <td>ADP</td>\n",
" <td>dobranoc</td>\n",
" </tr>\n",
" <tr>\n",
" <th>51</th>\n",
" <td>INSERTION</td>\n",
" <td></td>\n",
" <td></td>\n",
" <td>SPACE</td>\n",
" <td></td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" step_type reference_word_pos reference_word_text hypothesis_word_pos \\\n",
2076
2077
2078
2079
2080
2081
2082
2083
2084
2085
2086
2087
2088
2089
2090
2091
2092
2093
2094
2095
2096
2097
2098
2099
2100
2101
2102
2103
2104
2105
2106
2107
2108
2109
2110
2111
2112
2113
2114
2115
2116
2117
2118
2119
2120
2121
2122
2123
2124
2125
2126
2127
"0 CORRECT ADJ dobry ADJ \n",
"1 CORRECT NOUN wieczór NOUN \n",
"2 DELETION PRON xxx \n",
"3 DELETION VERB słucham \n",
"4 SUBSTITUTION ADJ dobry ADP \n",
"5 CORRECT NOUN wieczór NOUN \n",
"6 SUBSTITUTION NOUN panu CCONJ \n",
"7 SUBSTITUTION VERB mam PART \n",
"8 SUBSTITUTION ADP do PART \n",
"9 SUBSTITUTION NOUN pana PUNCT \n",
"10 SUBSTITUTION NOUN prośbę X \n",
"11 SUBSTITUTION VERB proszę PUNCT \n",
"12 SUBSTITUTION VERB zobaczyć ADV \n",
"13 SUBSTITUTION ADP z SCONJ \n",
"14 SUBSTITUTION NOUN pętli DET \n",
"15 CORRECT ADJ Szczęśliwickiej ADJ \n",
"16 INSERTION DET \n",
"17 CORRECT NUM sto NUM \n",
"18 INSERTION DET \n",
"19 INSERTION PUNCT \n",
"20 CORRECT NOUN osiemdziesiąt NOUN \n",
"21 SUBSTITUTION NUM cztery PUNCT \n",
"22 SUBSTITUTION ADV jutro AUX \n",
"23 SUBSTITUTION ADP w DET \n",
"24 CORRECT NOUN sobotę NOUN \n",
"25 INSERTION PUNCT \n",
"26 INSERTION PUNCT \n",
"27 SUBSTITUTION ADP o X \n",
"28 SUBSTITUTION ADJ dwunastej PUNCT \n",
"29 SUBSTITUTION CCONJ i PUNCT \n",
"30 SUBSTITUTION ADJ trzynastej PROPN \n",
"31 SUBSTITUTION VERB proszę PUNCT \n",
"32 SUBSTITUTION VERB podać PUNCT \n",
"33 CORRECT NOUN rozkład NOUN \n",
"34 SUBSTITUTION ADJ dwunasta PUNCT \n",
"35 SUBSTITUTION NUM dwie DET \n",
"36 SUBSTITUTION ADV tak VERB \n",
"37 SUBSTITUTION NUM dwadzieścia DET \n",
"38 SUBSTITUTION NUM dwie NOUN \n",
"39 CORRECT ADV tak ADV \n",
"40 SUBSTITUTION NUM czterdzieści ADV \n",
"41 SUBSTITUTION NUM dwie ADP \n",
"42 CORRECT NOUN trzynasta NOUN \n",
"43 CORRECT ADV tak ADV \n",
"44 SUBSTITUTION ADV samo NUM \n",
"45 SUBSTITUTION VERB dziękuję NUM \n",
"46 CORRECT NOUN panu NOUN \n",
"47 SUBSTITUTION NOUN dobranoc VERB \n",
"48 SUBSTITUTION VERB proszę PRON \n",
"49 SUBSTITUTION ADV bardzo ADP \n",
"50 CORRECT NOUN dobranoc NOUN \n",
"51 INSERTION SPACE \n",
2130
2131
2132
2133
2134
2135
2136
2137
2138
2139
2140
2141
2142
2143
2144
2145
2146
2147
2148
2149
2150
2151
2152
2153
2154
2155
2156
2157
2158
2159
2160
2161
2162
2163
2164
2165
2166
2167
2168
2169
2170
2171
2172
2173
2174
2175
2176
2177
2178
2179
2180
2181
"0 dobry \n",
"1 wieczór \n",
"2 \n",
"3 \n",
"4 w \n",
"5 sali \n",
"6 oraz \n",
"7 tak \n",
"8 naprawdę \n",
"9 < \n",
"10 unk \n",
"11 > \n",
"12 tak \n",
"13 jak \n",
"14 ten \n",
"15 nieszczęśliwi \n",
"16 ta \n",
"17 osiemdziesiąt \n",
"18 te \n",
"19 < \n",
"20 unk \n",
"21 > \n",
"22 to \n",
"23 taka \n",
"24 zabawa \n",
"25 - \n",
"26 < \n",
"27 unk \n",
"28 > \n",
"29 < \n",
"30 unk \n",
"31 > \n",
"32 < \n",
"33 unk \n",
"34 > \n",
"35 ta \n",
"36 sięga \n",
"37 tej \n",
"38 szepeta \n",
"39 stąd \n",
"40 tak \n",
"41 od \n",
"42 pieszczot \n",
"43 tak \n",
"44 czterdziestu \n",
"45 trzech \n",
"46 stoczni \n",
"47 kieruje \n",
"48 się \n",
"49 na \n",
"50 dobranoc \n",
"51 "
]
},
"metadata": {},
"output_type": "display_data"
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"--------------------------------------------------------------\n",
"--------------------------------------------------------------\n",
"--------------------------------------------------------------\n",
"record_id: LUNA.PL__KIEDY__KIEPSKAJAKOSC__M__1_2007-03-23_15_29_03__1_2007-03-23_15_29_03\n",
"properties_confiog: AJN ASR\n",
"gold transcript: xxx dzień dobry dzień dobry proszę pana chciałbym się dowiedzieć o której będzie siedemset osiem siedemset dwadzieścia sześć z Placu Wilsona najbliższy siedemset osiem piętnasta pięćdziesiąt aha a linia siedemset dwadzieścia sześć o dopiero szesnasta dwana~ zero dwa aha czy i piętnasta pięćdziesiąt dobra dziękuję bardzo proszę bardzo\n",
"asr transcript: dobre dobre szkoła uczą się trudnej sztuki o przyszłość przeszedł płatów ono najbliższe <unk> siedemset osiem jedenasta pięćdziesiąt a linia siedemset dwadzieścia sześć <unk> dopiero szesnasto dwa zero dwa - od do w m2 \n",
2204
2205
2206
2207
2208
2209
2210
2211
2212
2213
2214
2215
2216
2217
2218
2219
2220
2221
2222
2223
2224
2225
2226
2227
2228
2229
2230
2231
2232
2233
2234
2235
"\n"
]
},
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>step_type</th>\n",
" <th>reference_word_text</th>\n",
" <th>hypothesis_word_text</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>DELETION</td>\n",
" <td>xxx</td>\n",
" <td></td>\n",
" <td>DELETION</td>\n",
" <td>dzień</td>\n",
" <td></td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>DELETION</td>\n",
" <td></td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>DELETION</td>\n",
" <td>dzień</td>\n",
" <td></td>\n",
" <td>DELETION</td>\n",
" <td>dobry</td>\n",
" <td></td>\n",
" <td>DELETION</td>\n",
" <td>proszę</td>\n",
" <td></td>\n",
" <td>DELETION</td>\n",
" <td>pana</td>\n",
" <td></td>\n",
" </tr>\n",
" <tr>\n",
" <th>7</th>\n",
" <td>DELETION</td>\n",
" <td></td>\n",
" </tr>\n",
" <tr>\n",
" <th>8</th>\n",
" <td>DELETION</td>\n",
" <td>się</td>\n",
" <td></td>\n",
" <td>DELETION</td>\n",
" <td>dowiedzieć</td>\n",
" <td></td>\n",
" <td>DELETION</td>\n",
" <td>o</td>\n",
" <td></td>\n",
" <td>DELETION</td>\n",
" <td>której</td>\n",
" <td></td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>będzie</td>\n",
" <td>{'id': '97706128-6c06-49b2-bd0d-289d267b9eaf',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>siedemset</td>\n",
" <td>{'id': 'cf76ee40-5c88-401c-9ee8-bf379c54e1ff',...</td>\n",
" </tr>\n",
" <td>SUBSTITUTION</td>\n",
" <td>osiem</td>\n",
" <td>{'id': '10ac0766-ed02-46da-83bf-fb83b41bf306',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>siedemset</td>\n",
" <td>{'id': '93fd858e-33f2-47a1-99ca-0eef8bf041e7',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>dwadzieścia</td>\n",
" <td>{'id': 'ed3e6703-68c4-45ed-8ffc-2e62e3a58f59',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>sześć</td>\n",
" <td>{'id': '45832f9f-f294-4dfe-85d5-6aece2f44a8b',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>z</td>\n",
" <td>{'id': '784cc894-079c-4d2b-a88e-50bed8a0fdcc',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>Placu</td>\n",
" <td>{'id': '3a490c81-6e2b-4bf5-ae74-665ab0da46fe',...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>20</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>Wilsona</td>\n",
" <td>{'id': 'b789258a-6c14-41a6-b297-07f088250996',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>najbliższy</td>\n",
" <td>{'id': '67837002-ca71-44ff-ac1b-9ed040d7be19',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>siedemset</td>\n",
" <td>{'id': '01eea712-2c8f-4240-9a92-e28339209bad',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>osiem</td>\n",
" <td>{'id': 'e2e7e72c-5b62-42b6-8d2d-7ee667bc962b',...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>24</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>piętnasta</td>\n",
" <td>{'id': '40e58b70-3895-4478-a716-2618ab4188cb',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>pięćdziesiąt</td>\n",
" <td>{'id': '0264cb00-774c-407b-a1d6-09b14c3d40d7',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>aha</td>\n",
" <td>{'id': 'ad04606b-f48d-4101-863d-0c3e228d5b20',...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>27</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>a</td>\n",
" <td>{'id': 'c11b8f03-dcf3-4bad-9980-d0d4bcbb05d6',...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>28</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>linia</td>\n",
" <td>{'id': '6cb9d96c-e03c-4200-adc6-504081776716',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>siedemset</td>\n",
" <td>{'id': 'c1be6d7d-6e31-42cf-b487-dadfb813b949',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>dwadzieścia</td>\n",
" <td>{'id': '7546b817-909f-40cf-a99b-1c3e38e6b71e',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>sześć</td>\n",
" <td>{'id': '83dc5c76-c19a-4fcf-afc5-91c1af848aa8',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>o</td>\n",
" <td>{'id': '06521db4-6f76-4df2-acac-abf09216c23c',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>dopiero</td>\n",
" <td>{'id': 'b5c87393-9250-408b-9b7e-87a6a63270b9',...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>34</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>szesnasta</td>\n",
" <td>{'id': '51a9e4d4-59ee-4c49-8bf7-631c14dd81df',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>dwana~</td>\n",
" <td>{'id': 'dfa946ba-5afd-466a-805a-0b0304992887',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>zero</td>\n",
" <td>{'id': 'e4a7a144-d356-4690-b467-ee9664c72541',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>dwa</td>\n",
" <td>{'id': '1712bf77-0159-4ac4-9f1c-9188722435a2',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>aha</td>\n",
" <td>{'id': '3fe15df0-90f8-42b9-b944-5fa1d4d68acf',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>czy</td>\n",
" <td>{'id': '3995879e-cfe7-4c6d-8c6c-f9cc7b60c8ba',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>i</td>\n",
" <td>{'id': '0673baac-5122-4d7c-89ae-7fa3cb6a85bd',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>piętnasta</td>\n",
" <td>{'id': 'bbecbad1-e7f2-4d74-a407-0965471ff77a',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>pięćdziesiąt</td>\n",
" <td>{'id': '02751a1c-1066-454b-8bc9-1366c8a123f8',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>dobra</td>\n",
" <td>{'id': '2af896fd-271d-4d13-865a-de5f1c019870',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>dziękuję</td>\n",
" <td>{'id': '16310151-713a-445b-809b-f4c145c2ded0',...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>45</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>bardzo</td>\n",
" <td>{'id': '1565f3f6-7646-4039-9b0d-a983c9251152',...</td>\n",
" <td>SUBSTITUTION</td>\n",
" <td>proszę</td>\n",
" <td>{'id': '43027b2b-d799-451e-8d3a-dbfb46c88796',...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>47</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>bardzo</td>\n",
" <td>{'id': '64449d2e-d139-4a2b-b8a0-f2003e3a61d4',...</td>\n",
2522
2523
2524
2525
2526
2527
2528
2529
2530
2531
2532
2533
2534
2535
2536
2537
2538
2539
2540
2541
2542
2543
2544
2545
2546
2547
2548
2549
2550
2551
2552
2553
2554
2555
2556
2557
2558
2559
2560
2561
2562
2563
2564
2565
2566
2567
2568
2569
2570
2571
2572
2573
2574
2575
2576
2577
2578
2579
2580
2581
2582
2583
2584
2585
2586
2587
2588
2589
2590
2591
2592
2593
2594
2595
2596
2597
2598
2599
2600
2601
2602
2603
2604
2605
2606
2607
2608
2609
2610
2611
2612
2613
2614
2615
2616
2617
2618
2619
2620
2621
2622
2623
2624
2625
2626
2627
2628
2629
2630
2631
2632
2633
2634
2635
2636
2637
2638
2639
2640
2641
2642
2643
2644
2645
2646
2647
2648
2649
2650
2651
2652
2653
2654
2655
2656
2657
2658
2659
2660
2661
2662
2663
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" step_type reference_word_text \\\n",
"0 DELETION xxx \n",
"1 DELETION dzień \n",
"2 DELETION dobry \n",
"3 DELETION dzień \n",
"4 DELETION dobry \n",
"5 DELETION proszę \n",
"6 DELETION pana \n",
"7 DELETION chciałbym \n",
"8 DELETION się \n",
"9 DELETION dowiedzieć \n",
"10 DELETION o \n",
"11 DELETION której \n",
"12 SUBSTITUTION będzie \n",
"13 SUBSTITUTION siedemset \n",
"14 SUBSTITUTION osiem \n",
"15 SUBSTITUTION siedemset \n",
"16 SUBSTITUTION dwadzieścia \n",
"17 SUBSTITUTION sześć \n",
"18 SUBSTITUTION z \n",
"19 SUBSTITUTION Placu \n",
"20 SUBSTITUTION Wilsona \n",
"21 SUBSTITUTION najbliższy \n",
"22 SUBSTITUTION siedemset \n",
"23 SUBSTITUTION osiem \n",
"24 SUBSTITUTION piętnasta \n",
"25 SUBSTITUTION pięćdziesiąt \n",
"26 SUBSTITUTION aha \n",
"27 SUBSTITUTION a \n",
"28 SUBSTITUTION linia \n",
"29 SUBSTITUTION siedemset \n",
"30 SUBSTITUTION dwadzieścia \n",
"31 SUBSTITUTION sześć \n",
"32 SUBSTITUTION o \n",
"33 SUBSTITUTION dopiero \n",
"34 SUBSTITUTION szesnasta \n",
"35 SUBSTITUTION dwana~ \n",
"36 SUBSTITUTION zero \n",
"37 SUBSTITUTION dwa \n",
"38 SUBSTITUTION aha \n",
"39 SUBSTITUTION czy \n",
"40 SUBSTITUTION i \n",
"41 SUBSTITUTION piętnasta \n",
"42 SUBSTITUTION pięćdziesiąt \n",
"43 SUBSTITUTION dobra \n",
"44 SUBSTITUTION dziękuję \n",
"45 SUBSTITUTION bardzo \n",
"46 SUBSTITUTION proszę \n",
"47 SUBSTITUTION bardzo \n",
"\n",
" hypothesis_word_text \n",
"0 \n",
"1 \n",
"2 \n",
"3 \n",
"4 \n",
"5 \n",
"6 \n",
"7 \n",
"8 \n",
"9 \n",
"10 \n",
"11 \n",
"12 {'id': '97706128-6c06-49b2-bd0d-289d267b9eaf',... \n",
"13 {'id': 'cf76ee40-5c88-401c-9ee8-bf379c54e1ff',... \n",
"14 {'id': '10ac0766-ed02-46da-83bf-fb83b41bf306',... \n",
"15 {'id': '93fd858e-33f2-47a1-99ca-0eef8bf041e7',... \n",
"16 {'id': 'ed3e6703-68c4-45ed-8ffc-2e62e3a58f59',... \n",
"17 {'id': '45832f9f-f294-4dfe-85d5-6aece2f44a8b',... \n",
"18 {'id': '784cc894-079c-4d2b-a88e-50bed8a0fdcc',... \n",
"19 {'id': '3a490c81-6e2b-4bf5-ae74-665ab0da46fe',... \n",
"20 {'id': 'b789258a-6c14-41a6-b297-07f088250996',... \n",
"21 {'id': '67837002-ca71-44ff-ac1b-9ed040d7be19',... \n",
"22 {'id': '01eea712-2c8f-4240-9a92-e28339209bad',... \n",
"23 {'id': 'e2e7e72c-5b62-42b6-8d2d-7ee667bc962b',... \n",
"24 {'id': '40e58b70-3895-4478-a716-2618ab4188cb',... \n",
"25 {'id': '0264cb00-774c-407b-a1d6-09b14c3d40d7',... \n",
"26 {'id': 'ad04606b-f48d-4101-863d-0c3e228d5b20',... \n",
"27 {'id': 'c11b8f03-dcf3-4bad-9980-d0d4bcbb05d6',... \n",
"28 {'id': '6cb9d96c-e03c-4200-adc6-504081776716',... \n",
"29 {'id': 'c1be6d7d-6e31-42cf-b487-dadfb813b949',... \n",
"30 {'id': '7546b817-909f-40cf-a99b-1c3e38e6b71e',... \n",
"31 {'id': '83dc5c76-c19a-4fcf-afc5-91c1af848aa8',... \n",
"32 {'id': '06521db4-6f76-4df2-acac-abf09216c23c',... \n",
"33 {'id': 'b5c87393-9250-408b-9b7e-87a6a63270b9',... \n",
"34 {'id': '51a9e4d4-59ee-4c49-8bf7-631c14dd81df',... \n",
"35 {'id': 'dfa946ba-5afd-466a-805a-0b0304992887',... \n",
"36 {'id': 'e4a7a144-d356-4690-b467-ee9664c72541',... \n",
"37 {'id': '1712bf77-0159-4ac4-9f1c-9188722435a2',... \n",
"38 {'id': '3fe15df0-90f8-42b9-b944-5fa1d4d68acf',... \n",
"39 {'id': '3995879e-cfe7-4c6d-8c6c-f9cc7b60c8ba',... \n",
"40 {'id': '0673baac-5122-4d7c-89ae-7fa3cb6a85bd',... \n",
"41 {'id': 'bbecbad1-e7f2-4d74-a407-0965471ff77a',... \n",
"42 {'id': '02751a1c-1066-454b-8bc9-1366c8a123f8',... \n",
"43 {'id': '2af896fd-271d-4d13-865a-de5f1c019870',... \n",
"44 {'id': '16310151-713a-445b-809b-f4c145c2ded0',... \n",
"45 {'id': '1565f3f6-7646-4039-9b0d-a983c9251152',... \n",
"46 {'id': '43027b2b-d799-451e-8d3a-dbfb46c88796',... \n",
"47 {'id': '64449d2e-d139-4a2b-b8a0-f2003e3a61d4',... "
]
},
"metadata": {},
"output_type": "display_data"
},
{
"name": "stdout",
"output_type": "stream",
"text": [
"\n"
]
},
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>step_type</th>\n",
" <th>reference_word_pos</th>\n",
" <th>reference_word_text</th>\n",
" <th>hypothesis_word_pos</th>\n",
" <th>hypothesis_word_text</th>\n",
" <th>0</th>\n",
" <td>DELETION</td>\n",
" <td>PRON</td>\n",
" <td>xxx</td>\n",
" <td></td>\n",
" <th>1</th>\n",
" <td>DELETION</td>\n",
" <td>NOUN</td>\n",
" <td>dzień</td>\n",
" <td></td>\n",
" <th>2</th>\n",
" <td>CORRECT</td>\n",
" <td>ADJ</td>\n",
" <td>dobry</td>\n",
" <td>ADJ</td>\n",
" <td>dobre</td>\n",
" <th>3</th>\n",
" <td>DELETION</td>\n",
" <td>NOUN</td>\n",
" <td>dzień</td>\n",
" <td></td>\n",
" <td></td>\n",
" <td>ADJ</td>\n",
" <td>dobry</td>\n",
" <td>ADJ</td>\n",
" <td>dobre</td>\n",
" <td>VERB</td>\n",
" <td>proszę</td>\n",
" <td></td>\n",
" <th>6</th>\n",
" <td>CORRECT</td>\n",
" <td>NOUN</td>\n",
" <td>pana</td>\n",
" <td>NOUN</td>\n",
" <td>szkoła</td>\n",
" <td>VERB</td>\n",
" <td>chciałbym</td>\n",
" <td>VERB</td>\n",
" <td>uczą</td>\n",
" <td>PRON</td>\n",
" <td>się</td>\n",
" <td>PRON</td>\n",
" <td>się</td>\n",
" <th>9</th>\n",
" <td>INSERTION</td>\n",
" <td></td>\n",
" <td></td>\n",
" <td>ADJ</td>\n",
" <td>trudnej</td>\n",
" <td>VERB</td>\n",
" <td>dowiedzieć</td>\n",
" <td>NOUN</td>\n",
" <td>sztuki</td>\n",
" <td>ADP</td>\n",
" <td>o</td>\n",
" <td>ADP</td>\n",
" <td>o</td>\n",
" <th>12</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>DET</td>\n",
" <td>której</td>\n",
" <td>NOUN</td>\n",
" <td>przyszłość</td>\n",
" <td>VERB</td>\n",
" <td>będzie</td>\n",
" <td>VERB</td>\n",
" <td>przeszedł</td>\n",
" <th>14</th>\n",
" <td>DELETION</td>\n",
" <td>NUM</td>\n",
" <td>siedemset</td>\n",
" <td></td>\n",
" <td></td>\n",
" <th>15</th>\n",
" <td>DELETION</td>\n",
" <td>NUM</td>\n",
" <td>osiem</td>\n",
" <td></td>\n",
" <td></td>\n",
" </tr>\n",
" <tr>\n",
" <th>16</th>\n",
" <td>NOUN</td>\n",
" <td>siedemset</td>\n",
" <td>NOUN</td>\n",
" <td>płatów</td>\n",
" <th>17</th>\n",
" <td>DELETION</td>\n",
" <td>NUM</td>\n",
" <td>dwadzieścia</td>\n",
" <td></td>\n",
" <td></td>\n",
" </tr>\n",
" <tr>\n",
" <th>18</th>\n",
" <td>DELETION</td>\n",
" <td>NUM</td>\n",
" <td>sześć</td>\n",
" <td></td>\n",
" <td></td>\n",
" </tr>\n",
" <tr>\n",
" <th>19</th>\n",
" <td>ADP</td>\n",
" <td>z</td>\n",
" <td>PRON</td>\n",
" <td>ono</td>\n",
" <th>20</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>PROPN</td>\n",
" <td>Placu</td>\n",
" <td>ADJ</td>\n",
" <td>najbliższe</td>\n",
" <th>21</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>PROPN</td>\n",
" <td>Wilsona</td>\n",
" <td>PUNCT</td>\n",
" <td><</td>\n",
" <th>22</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>ADJ</td>\n",
" <td>najbliższy</td>\n",
" <td>NOUN</td>\n",
" <td>unk</td>\n",
" <th>23</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>NUM</td>\n",
" <td>siedemset</td>\n",
" <td>PUNCT</td>\n",
" <td>></td>\n",
" <th>24</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>NUM</td>\n",
" <td>osiem</td>\n",
" <td>NOUN</td>\n",
" <td>siedemset</td>\n",
" <td>ADJ</td>\n",
" <td>piętnasta</td>\n",
" <td>ADJ</td>\n",
" <td>osiem</td>\n",
" <td>NOUN</td>\n",
" <td>pięćdziesiąt</td>\n",
" <td>VERB</td>\n",
" <td>jedenasta</td>\n",
" <th>27</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>NOUN</td>\n",
" <td>CCONJ</td>\n",
" <td>a</td>\n",
" <td>CCONJ</td>\n",
" <td>a</td>\n",
" <td>NOUN</td>\n",
" <td>linia</td>\n",
" <td>NOUN</td>\n",
" <td>linia</td>\n",
" <th>30</th>\n",
" <td>CORRECT</td>\n",
" <td>NUM</td>\n",
" <td>siedemset</td>\n",
" <td>NUM</td>\n",
" <td>siedemset</td>\n",
" <td>NUM</td>\n",
" <td>dwadzieścia</td>\n",
" <td>NUM</td>\n",
" <td>dwadzieścia</td>\n",
" <td>NUM</td>\n",
" <td>sześć</td>\n",
" <td>NUM</td>\n",
" <td>sześć</td>\n",
" <td></td>\n",
" <td></td>\n",
" </tr>\n",
" <tr>\n",
" <td>PART</td>\n",
" <td>dopiero</td>\n",
" <td>PUNCT</td>\n",
" <td><</td>\n",
" <td>NOUN</td>\n",
" <td>szesnasta</td>\n",
" <td>NOUN</td>\n",
" <td>unk</td>\n",
" <th>36</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>ADJ</td>\n",
" <td>dwana</td>\n",
" <td>PUNCT</td>\n",
" <td>></td>\n",
" <th>37</th>\n",
" <td>SUBSTITUTION</td>\n",
" <td>NOUN</td>\n",
" <td>~</td>\n",
" <td>PART</td>\n",
" <td>dopiero</td>\n",
" <td>NOUN</td>\n",
" <td>zero</td>\n",
" <td>ADV</td>\n",
" <td>szesnasto</td>\n",
" <td>NUM</td>\n",
" <td>dwa</td>\n",
" <td>NUM</td>\n",
" <td>dwa</td>\n",
" <td>NOUN</td>\n",
" <td>aha</td>\n",
" <td></td>\n",
" <th>41</th>\n",
" <td>DELETION</td>\n",
" <td>CCONJ</td>\n",
" <td>czy</td>\n",
" <td></td>\n",