Skip to content

Commit 5be37dc

Browse files
committed
created cache file for corrections to corpus
1 parent 8d68377 commit 5be37dc

7 files changed

Lines changed: 620 additions & 118 deletions
Lines changed: 15 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,15 @@
1+
,doc_offset,corpus_span,correct_span,error_type
2+
0,15.0,"[41, 51): 'CUNNINGHAM'","(33, 51]: 'RANDALL CUNNINGHAM'",Token
3+
1,15.0,"[41, 51): 'CUNNINGHAM'","(33,51] 'RANDALL CUNNINGHAM'",Token
4+
2,15.0,"[15, 40): 'AMERICAN FOOTBALL-RANDALL'","[15, 32): 'AMERICAN FOOTBALL'",Token
5+
3,15.0,"[15, 40): 'AMERICAN FOOTBALL-RANDALL'","[33, 40): 'RANDALL'",Token
6+
4,15.0,"[41, 51): 'CUNNINGHAM'","[33,51): 'RANDALL CUNNINGHAM'",Token
7+
5,39.0,"[11, 23): 'Boxing-Bruno'","[18, 23): 'Bruno'",Token
8+
6,39.0,,"[18, 23): 'Bruno' ",Token
9+
7,60.0,"[1358, 1371): 'Tripoli-based'","[1358, 1365): 'Tripoli'",Token
10+
8,65.0,"[1125, 1134): 'asset-St.'","[1131, 1146): 'St. Louis based'",Token
11+
9,65.0,"[592, 607): 'St. Louis-based'","[592, 601): 'St. Louis'",Token
12+
10,65.0,"[1125, 1134): 'asset-St.'",,Token
13+
11,175.0,"[252, 264): 'London-based'","[252, 258): 'London'",Token
14+
12,181.0,"[1761, 1774): 'Moscow-backed'","[1761, 1767): 'Moscow'",Token
15+
13,198.0,"[39, 47): 'aid-U.N.'","[43, 47): 'U.N.'",Token
Lines changed: 45 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,45 @@
1+
,doc_offset,corpus_span,correct_span,error_type
2+
0,3.0,"[21, 37): 'SKIING-WORLD CUP'","[28, 37): 'WORLD CUP'",Token
3+
1,3.0,"[21, 37): 'SKIING-WORLD CUP'","[28,37)'WORLD CUP'",Token
4+
2,22.0,"[19, 23): 'ARAB'","[19, 35): 'ARAB CONTRACTORS'",Token
5+
3,27.0,"[565, 573): 'X-DENVER'","[567, 573): 'DENVER'",Token
6+
4,27.0,,"[567, 573): 'DENVER'",Token
7+
5,27.0,"[889, 900): 'Y-GREEN BAY'","[891, 900): 'GREEN BAY'",Token
8+
6,29.0,"[25, 44): 'FOOTBALL-OHIO STATE'","[34, 44): 'OHIO STATE'",Token
9+
7,29.0,"[25, 44): 'FOOTBALL-OHIO STATE'","[34,44): 'OHIO STATE'",Token
10+
8,39.0,"[1158, 1175): 'AbelardoFernandez'","[1158, 1175): 'Abelardo Fernandez'",Token
11+
9,54.0,"[1145, 1152): 'Boxmeer'","[1141, 1152): 'van Boxmeer'",Token
12+
10,54.0,"[11, 27): 'INTERVIEW-ZYWIEC'","[21, 27): 'ZYWIEC'",Token
13+
11,54.0,"[2594, 2601): 'Boxmeer'","[2590, 2601): 'van Boxmeer'",Token
14+
12,54.0,"[3231, 3241): 'Full Light'","[3224, 3241): 'Zywiec Full Light'",Token
15+
13,54.0,"[3421, 3428): 'Boxmeer'","[3417, 3428): 'van Boxmeer'",Token
16+
14,54.0,,"[?, 27): 'ZYWIEC'",Token
17+
15,56.0,"[11, 16): 'UK-US'","[11, 13): 'UK'",Token
18+
16,56.0,"[11, 16): 'UK-US'","[11,13) 'UK'",Token
19+
17,56.0,"[11, 16): 'UK-US'","[14, 16): 'US'",Token
20+
18,56.0,"[11, 16): 'UK-US'","[14,16) 'UK'",Token
21+
19,60.0,"[345, 363): 'Trade and Industry'","[345, 373): 'Trade and Industry Secretary'",Token
22+
20,63.0,"[19, 39): 'office-Conservatives'","[26, 39): 'Conservatives' ",Token
23+
21,63.0,"[19, 39): 'office-Conservatives'","[27, 39): 'Conservatives'",Token
24+
22,68.0,"[11, 19): 'Canadian'","[11, 30): 'Canadian West Coast'",Token
25+
23,68.0,"[157, 165): 'Canadian'",,Token
26+
24,70.0,"[177, 197): 'New York Commodities'","[177, 202): 'New York Commodities Desk'",Token
27+
25,71.0,"[153, 173): 'New York Commodities'","[153, 178): 'New York Commodities Desk'",Token
28+
26,75.0,"[2736, 2752): 'Newmont-Santa Fe'","[2736, 2743): 'Newmont'",Token
29+
27,75.0,"[2736, 2752): 'Newmont-Santa Fe'","[2744, 2752): 'Santa Fe'",Token
30+
28,114.0,"[11, 17): 'Iowa-S'","[11, 15): 'Iowa'",Token
31+
29,114.0,"[11, 17): 'Iowa-S'","[11, 15): 'Iowa' ",Token
32+
30,114.0,"[51, 61): 'sales-USDA'","[57, 61): 'USDA'",Token
33+
31,114.0,"[51, 61): 'sales-USDA'",,Token
34+
32,123.0,"[11, 17): 'Iowa-S'","[11, 15): 'Iowa' ",Token
35+
33,178.0,"[951, 960): 'then-U.S.'","[956, 960): 'U.S.'",Token
36+
34,183.0,"[18, 35): 'SKIING-GLADISHIVA'","[25, 35): 'GLADISHIVA'",Token
37+
35,186.0,,"[1398, 1405): 'Austria'",Token
38+
36,188.0,"[18, 34): 'SKIING-WORLD CUP'","[25, 34): 'WORLD CUP'",Token
39+
37,190.0,"[11, 27): 'BOBSLEIGH-SHIMER'","[21, 27): 'SHIMER'",Token
40+
38,190.0,"[11, 27): 'BOBSLEIGH-SHIMER'",,Token
41+
39,191.0,"[11, 25): 'SKIING-CHINESE'","[18, 25): 'CHINESE'",Token
42+
40,192.0,"[11, 30): 'BOBSLEIGH-WORLD CUP'","[21, 30): 'WORLD CUP'",Token
43+
41,194.0,"[21, 37): 'SKIING-WORLD CUP'","[28, 37): 'WORLD CUP'",Token
44+
42,195.0,"[21, 37): 'SKIING-WORLD CUP'","[28, 37): 'WORLD CUP'",Token
45+
43,214.0,"[243, 262): 'Saturday'sWorld Cup'","[253, 262): 'World Cup'",Token
Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,20 @@
1+
,doc_offset,corpus_span,correct_span,error_type
2+
0,80.0,,"[44, 59): 'Interfax'",Token
3+
1,80.0,,"[51, 59): 'Interfax'",Token
4+
2,115.0,,"[23, 27): 'News'",Token
5+
3,163.0,"[220, 232): 'x-AEK Athens'","[222, 232): 'AEK Athens'",Token
6+
4,163.0,"[271, 283): 'x-Olympiakos'","[273, 283): 'Olympiakos'",Token
7+
5,163.0,"[308, 313): 'x-PAO'","[310, 313): 'PAO'",Token
8+
6,169.0,"[50, 61): 'trip-Canada'","[55, 61): 'Canada'",Token
9+
7,298.0,"[49, 60): '1997--Ruehe'","[55, 60): 'Ruehe'",Token
10+
8,343.0,"[11, 31): 'AUSTRALIAN RULES-AFL'","[11, 21): 'AUSTRALIAN'",Token
11+
9,343.0,"[11, 31): 'AUSTRALIAN RULES-AFL'","[11, 27): 'AUSTRALIAN RULES'",Token
12+
10,343.0,"[11, 31): 'AUSTRALIAN RULES-AFL'","[28, 31): 'AFL'",Token
13+
11,343.0,"[11, 31): 'AUSTRALIAN RULES-AFL'","[11, 21): 'AUSTRALIAN'",Token
14+
12,422.0,"[236, 246): 'Videoton(*'","[236, 244): 'Videoton'",Token
15+
13,593.0,"[45, 57): 'France-Juppe'","[45, 51): 'France'",Token
16+
14,593.0,"[45, 57): 'France-Juppe'","[52, 57): 'Juppe'",Token
17+
15,626.0,"[42, 59): 'disarmament-China'","[42, 59): 'disarmament-China'",Token
18+
16,701.0,"[17, 30): 'union-England'","[23, 30): 'England'",Token
19+
17,918.0,"[11, 24): 'INTERVIEW-T&N'","[11, 24): 'INTERVIEW-T&N'",Token
20+
18,918.0,"[11, 24): 'INTERVIEW-T&N'","[21, 24): 'T&N'",Token
Lines changed: 196 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,196 @@
1+
,fold,line_no,doc_offset,corpus_span,correct_span,correct_line
2+
0,test,1131.0,3.0,"[21, 37): 'SKIING-WORLD CUP'","[28, 37): 'WORLD CUP'","SKIING NNP I-NP I-MISC
3+
- : O I-MISC
4+
WORLD NNP I-NP I-MISC"
5+
1,test,1131.0,3.0,"[21, 37): 'SKIING-WORLD CUP'","[28,37)'WORLD CUP'",
6+
2,test,5174.0,22.0,"[19, 23): 'ARAB'","[19, 35): 'ARAB CONTRACTORS'",
7+
3,test,6545.0,27.0,"[565, 573): 'X-DENVER'","[567, 573): 'DENVER'","X IN I-PP O
8+
- : O O
9+
DENVER NNP I-NP I-MISC"
10+
4,test,-2.0,27.0,,"[567, 573): 'DENVER'",
11+
5,test,6640.0,27.0,"[889, 900): 'Y-GREEN BAY'","[891, 900): 'GREEN BAY'","Y NNP I-NP O
12+
- : O O
13+
GREEN NNP I-NP I-MISC"
14+
6,test,6851.0,29.0,"[25, 44): 'FOOTBALL-OHIO STATE'","[34, 44): 'OHIO STATE'","FOOTBALL NNP I-NP O
15+
- : O O
16+
OHIO NNP I-NP I-MISC"
17+
7,test,6851.0,29.0,"[25, 44): 'FOOTBALL-OHIO STATE'","[34,44): 'OHIO STATE'","FOOTBALL NNP I-NP O
18+
- : O O
19+
OHIO NNP I-NP I-MISC"
20+
8,test,8644.0,39.0,"[1158, 1175): 'AbelardoFernandez'","[1158, 1175): 'Abelardo Fernandez'","Abelardo NNS I-NP I-PER
21+
Fernandez NNS I-NP I-PER"
22+
9,test,12284.0,54.0,"[1145, 1152): 'Boxmeer'","[1141, 1152): 'van Boxmeer'",
23+
10,test,12068.0,54.0,"[11, 27): 'INTERVIEW-ZYWIEC'","[21, 27): 'ZYWIEC'","INTERVIEW NNP I-NP O
24+
- : O O
25+
ZYWIEC NNP I-NP I-MISC"
26+
11,test,12555.0,54.0,"[2594, 2601): 'Boxmeer'","[2590, 2601): 'van Boxmeer'",
27+
12,test,12682.0,54.0,"[3231, 3241): 'Full Light'","[3224, 3241): 'Zywiec Full Light'",
28+
13,test,12720.0,54.0,"[3421, 3428): 'Boxmeer'","[3417, 3428): 'van Boxmeer'",
29+
14,test,-2.0,54.0,,"[?, 27): 'ZYWIEC'",
30+
15,test,13001.0,56.0,"[11, 16): 'UK-US'","[11, 13): 'UK'","UK NNP I-NP I-MISC
31+
- : O O
32+
US NNP I-NP I-MISC"
33+
16,test,13001.0,56.0,"[11, 16): 'UK-US'","[11,13) 'UK'","UK NNP I-NP I-MISC
34+
- : O O
35+
US NNP I-NP I-MISC"
36+
17,test,13001.0,56.0,"[11, 16): 'UK-US'","[14, 16): 'US'","UK NNP I-NP I-MISC
37+
- : O O
38+
US NNP I-NP I-MISC"
39+
18,test,13001.0,56.0,"[11, 16): 'UK-US'","[14,16) 'UK'","UK NNP I-NP I-MISC
40+
- : O O
41+
US NNP I-NP I-MISC"
42+
19,test,13447.0,60.0,"[345, 363): 'Trade and Industry'","[345, 373): 'Trade and Industry Secretary'",
43+
20,test,14467.0,63.0,"[19, 39): 'office-Conservatives'","[26, 39): 'Conservatives' ","office NNP I-NP O
44+
- : O O
45+
Conservatives JJ I-NP I-MISC"
46+
21,test,14467.0,63.0,"[19, 39): 'office-Conservatives'","[27, 39): 'Conservatives'","office NNP I-NP O
47+
- : O O
48+
Conservatives JJ I-NP I-MISC"
49+
22,test,15155.0,68.0,"[11, 19): 'Canadian'","[11, 30): 'Canadian West Coast'",
50+
23,test,15183.0,68.0,"[157, 165): 'Canadian'",,
51+
24,test,15337.0,70.0,"[177, 197): 'New York Commodities'","[177, 202): 'New York Commodities Desk'",
52+
25,test,15380.0,71.0,"[153, 173): 'New York Commodities'","[153, 178): 'New York Commodities Desk'",
53+
26,test,16319.0,75.0,"[2736, 2752): 'Newmont-Santa Fe'","[2736, 2743): 'Newmont'","Newmont NNP I-NP I-ORG
54+
- : O O
55+
Santa NNP I-NP I-ORG"
56+
27,test,16319.0,75.0,"[2736, 2752): 'Newmont-Santa Fe'","[2744, 2752): 'Santa Fe'","Newmont NNP I-NP I-ORG
57+
- : O O
58+
Santa NNP I-NP I-ORG"
59+
28,test,26720.0,114.0,"[11, 17): 'Iowa-S'","[11, 15): 'Iowa'","Iowa NNP I-NP I-LOC
60+
- : O O
61+
S NNP I-NP I-LOC"
62+
29,test,26720.0,114.0,"[11, 17): 'Iowa-S'","[11, 15): 'Iowa' ","Iowa NNP I-NP I-LOC
63+
- : O O
64+
S NNP I-NP I-LOC"
65+
30,test,26728.0,114.0,"[51, 61): 'sales-USDA'","[57, 61): 'USDA'","sales NNP I-NP O
66+
- : O O
67+
USDA NN I-NP I-MISC"
68+
31,test,26728.0,114.0,"[51, 61): 'sales-USDA'",,"sales NNP I-NP O
69+
- : O O
70+
USDA NN I-NP I-MISC"
71+
32,test,28718.0,123.0,"[11, 17): 'Iowa-S'","[11, 15): 'Iowa' ","Iowa NNP I-NP I-LOC
72+
- : O O
73+
S NNP I-NP I-LOC"
74+
33,test,38688.0,178.0,"[951, 960): 'then-U.S.'","[956, 960): 'U.S.'","then RB I-ADVP O
75+
- : O O
76+
U.S. JJ I-NP I-MISC"
77+
34,test,39979.0,183.0,"[18, 35): 'SKIING-GLADISHIVA'","[25, 35): 'GLADISHIVA'","SKIING NNP I-NP O
78+
- : O O
79+
GLADISHIVA NNP I-NP I-MISC"
80+
35,test,-2.0,186.0,,"[1398, 1405): 'Austria'",
81+
36,test,41169.0,188.0,"[18, 34): 'SKIING-WORLD CUP'","[25, 34): 'WORLD CUP'","SKIING NNP I-NP O
82+
- : O O
83+
WORLD NNP I-NP I-MISC"
84+
37,test,41413.0,190.0,"[11, 27): 'BOBSLEIGH-SHIMER'","[21, 27): 'SHIMER'","BOBSLEIGH NNP I-NP O
85+
- : O O
86+
SHIMER NNP I-NP I-MISC"
87+
38,test,41413.0,190.0,"[11, 27): 'BOBSLEIGH-SHIMER'",,"BOBSLEIGH NNP I-NP O
88+
- : O O
89+
SHIMER NNP I-NP I-MISC"
90+
39,test,41595.0,191.0,"[11, 25): 'SKIING-CHINESE'","[18, 25): 'CHINESE'","SKIING NNP I-NP O
91+
- : O O
92+
CHINESE JJ I-NP I-MISC"
93+
40,test,41850.0,192.0,"[11, 30): 'BOBSLEIGH-WORLD CUP'","[21, 30): 'WORLD CUP'","BOBSLEIGH NNP I-NP O
94+
- : O O
95+
WORLD NNP I-NP I-MISC"
96+
41,test,42385.0,194.0,"[21, 37): 'SKIING-WORLD CUP'","[28, 37): 'WORLD CUP'","SKIING NNP I-NP O
97+
- : O O
98+
WORLD NNP I-NP I-MISC"
99+
42,test,-1.0,195.0,"[21, 37): 'SKIING-WORLD CUP'","[28, 37): 'WORLD CUP'",
100+
43,test,46987.0,214.0,"[243, 262): 'Saturday'sWorld Cup'","[253, 262): 'World Cup'","Saturday NNP I-NP O
101+
's POS B-NP O
102+
World NNP B-NP I-MISC"
103+
44,dev,4120.0,15.0,"[41, 51): 'CUNNINGHAM'","(33, 51]: 'RANDALL CUNNINGHAM'","FOOTBALL NNP I-NP O
104+
- : O O
105+
RANDALL NNP I-NP I-MISC"
106+
45,dev,4120.0,15.0,"[41, 51): 'CUNNINGHAM'","(33,51] 'RANDALL CUNNINGHAM'","FOOTBALL NNP I-NP O
107+
- : O O
108+
RANDALL NNP I-NP I-MISC"
109+
46,dev,4118.0,15.0,"[15, 40): 'AMERICAN FOOTBALL-RANDALL'","[15, 32): 'AMERICAN FOOTBALL'","FOOTBALL NNP I-NP O
110+
- : O O
111+
RANDALL NNP I-NP I-MISC"
112+
47,dev,4118.0,15.0,"[15, 40): 'AMERICAN FOOTBALL-RANDALL'","[33, 40): 'RANDALL'","FOOTBALL NNP I-NP O
113+
- : O O
114+
RANDALL NNP I-NP I-MISC"
115+
48,dev,4120.0,15.0,"[41, 51): 'CUNNINGHAM'","[33,51): 'RANDALL CUNNINGHAM'","FOOTBALL NNP I-NP O
116+
- : O O
117+
RANDALL NNP I-NP I-MISC"
118+
49,dev,10619.0,39.0,"[11, 23): 'Boxing-Bruno'","[18, 23): 'Bruno'","Boxing NNP I-NP O
119+
- : O O
120+
Bruno NN I-NP I-MISC"
121+
50,dev,-2.0,39.0,,"[18, 23): 'Bruno' ",
122+
51,dev,15911.0,60.0,"[1358, 1371): 'Tripoli-based'","[1358, 1365): 'Tripoli'","Tripoli NNP I-NP I-LOC
123+
- : O O
124+
based JJ I-NP I-MISC"
125+
52,dev,19233.0,65.0,"[1125, 1134): 'asset-St.'","[1131, 1146): 'St. Louis based'","asset NNP I-NP O
126+
- : O O
127+
St NN I-NP I-MISC"
128+
53,dev,19130.0,65.0,"[592, 607): 'St. Louis-based'","[592, 601): 'St. Louis'","Louis NNP I-NP I-LOC
129+
- : O O
130+
based JJ I-NP I-MISC"
131+
54,dev,19233.0,65.0,"[1125, 1134): 'asset-St.'",,"asset NNP I-NP O
132+
- : O O
133+
St NN I-NP I-MISC"
134+
55,dev,44837.0,175.0,"[252, 264): 'London-based'","[252, 258): 'London'","London NNP I-NP I-LOC
135+
- : O O
136+
based JJ I-NP I-MISC"
137+
56,dev,46457.0,181.0,"[1761, 1774): 'Moscow-backed'","[1761, 1767): 'Moscow'","Moscow NNP I-NP I-ORG
138+
- : O O
139+
backed JJ I-NP I-MISC"
140+
57,dev,50964.0,198.0,"[39, 47): 'aid-U.N.'","[43, 47): 'U.N.'","aid NN I-NP O
141+
- . O O
142+
U.N. NN I-NP I-ORG"
143+
58,train,17719.0,80.0,,"[44, 59): 'Interfax'","rebels NNP I-PP O
144+
- . O O
145+
Interfax NN I-NP O"
146+
59,train,-2.0,80.0,,"[51, 59): 'Interfax'",
147+
60,train,-2.0,115.0,,"[23, 27): 'News'",
148+
61,train,37914.0,163.0,"[220, 232): 'x-AEK Athens'","[222, 232): 'AEK Athens'","x NNP I-NP O
149+
- . O O
150+
AEK IN I-NP I-ORG"
151+
62,train,37926.0,163.0,"[271, 283): 'x-Olympiakos'","[273, 283): 'Olympiakos'","x NNP I-NP O
152+
- . O O
153+
Olympiakos NNS I-NP I-ORG"
154+
63,train,37933.0,163.0,"[308, 313): 'x-PAO'","[310, 313): 'PAO'","x NNP I-NP O
155+
- . O O
156+
PAO JJ I-NP I-ORG"
157+
64,train,38844.0,169.0,"[50, 61): 'trip-Canada'","[55, 61): 'Canada'","trip NNP I-NP O
158+
- . O O
159+
Canada NN I-NP I-MISC"
160+
65,train,65636.0,298.0,"[49, 60): '1997--Ruehe'","[55, 60): 'Ruehe'","1997 CD I-NP O
161+
-- : O O
162+
Ruehe CD I-NP I-MISC"
163+
66,train,75410.0,343.0,"[11, 31): 'AUSTRALIAN RULES-AFL'","[11, 21): 'AUSTRALIAN'","RULES NNP I-NP O
164+
- : O O
165+
AFL NNP I-NP I-MISC"
166+
67,train,75410.0,343.0,"[11, 31): 'AUSTRALIAN RULES-AFL'","[11, 27): 'AUSTRALIAN RULES'","RULES NNP I-NP O
167+
- . O O
168+
AFL NNP I-NP I-MISC"
169+
68,train,75410.0,343.0,"[11, 31): 'AUSTRALIAN RULES-AFL'","[28, 31): 'AFL'","RULES NNP I-NP O
170+
- : O O
171+
AFL NNP I-NP I-MISC"
172+
69,train,75410.0,343.0,"[11, 31): 'AUSTRALIAN RULES-AFL'","[11, 21): 'AUSTRALIAN'","RULES NNP I-NP O
173+
- : O O
174+
AFL NNP I-NP I-MISC"
175+
70,train,95553.0,422.0,"[236, 246): 'Videoton(*'","[236, 244): 'Videoton'","Videoton NN I-NP I-ORG
176+
( ( O O
177+
* SYM O O"
178+
71,train,139024.0,593.0,"[45, 57): 'France-Juppe'","[45, 51): 'France'","France NNP I-NP I-LOC
179+
- . O O
180+
Juppe JJ I-NP I-PER"
181+
72,train,139024.0,593.0,"[45, 57): 'France-Juppe'","[52, 57): 'Juppe'","France NNP I-NP I-LOC
182+
- . O O
183+
Juppe JJ I-NP I-PER"
184+
73,train,146605.0,626.0,"[42, 59): 'disarmament-China'","[42, 59): 'disarmament-China'","disarmament NNP I-NP O
185+
- . O O
186+
China NN I-NP I-LOC"
187+
74,train,164709.0,701.0,"[17, 30): 'union-England'","[23, 30): 'England'","union NNP I-NP O
188+
- . O O
189+
England JJ I-NP I-ORG"
190+
75,train,213462.0,918.0,"[11, 24): 'INTERVIEW-T&N'","[11, 24): 'INTERVIEW-T&N'","INTERVIEW NNP I-NP O
191+
- . O O
192+
T&N NNP I-NP I-MISC"
193+
76,train,213462.0,918.0,"[11, 24): 'INTERVIEW-T&N'","[21, 24): 'T&N'","INTERVIEW NNP I-NP O
194+
- . O O
195+
T&N NNP I-NP I-MISC"
196+
77,,,,,,

corrected_labels/token_edits.csv

Lines changed: 78 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,78 @@
1+
,fold,line_no,doc_offset,corpus_span,correct_span,correct_line
2+
0,test,1131,3.0,"[21, 37): 'SKIING-WORLD CUP'","[28, 37): 'WORLD CUP'",
3+
1,test,1131,3.0,"[21, 37): 'SKIING-WORLD CUP'","[28,37)'WORLD CUP'",
4+
2,test,5174,22.0,"[19, 23): 'ARAB'","[19, 35): 'ARAB CONTRACTORS'",
5+
3,test,6545,27.0,"[565, 573): 'X-DENVER'","[567, 573): 'DENVER'",
6+
4,test,-2,27.0,,"[567, 573): 'DENVER'",
7+
5,test,6640,27.0,"[889, 900): 'Y-GREEN BAY'","[891, 900): 'GREEN BAY'",
8+
6,test,6851,29.0,"[25, 44): 'FOOTBALL-OHIO STATE'","[34, 44): 'OHIO STATE'",
9+
7,test,6851,29.0,"[25, 44): 'FOOTBALL-OHIO STATE'","[34,44): 'OHIO STATE'",
10+
8,test,8644,39.0,"[1158, 1175): 'AbelardoFernandez'","[1158, 1175): 'Abelardo Fernandez'",
11+
9,test,12284,54.0,"[1145, 1152): 'Boxmeer'","[1141, 1152): 'van Boxmeer'",
12+
10,test,12068,54.0,"[11, 27): 'INTERVIEW-ZYWIEC'","[21, 27): 'ZYWIEC'",
13+
11,test,12555,54.0,"[2594, 2601): 'Boxmeer'","[2590, 2601): 'van Boxmeer'",
14+
12,test,12682,54.0,"[3231, 3241): 'Full Light'","[3224, 3241): 'Zywiec Full Light'",
15+
13,test,12720,54.0,"[3421, 3428): 'Boxmeer'","[3417, 3428): 'van Boxmeer'",
16+
14,test,-2,54.0,,"[?, 27): 'ZYWIEC'",
17+
15,test,13001,56.0,"[11, 16): 'UK-US'","[11, 13): 'UK'",
18+
16,test,13001,56.0,"[11, 16): 'UK-US'","[11,13) 'UK'",
19+
17,test,13001,56.0,"[11, 16): 'UK-US'","[14, 16): 'US'",
20+
18,test,13001,56.0,"[11, 16): 'UK-US'","[14,16) 'UK'",
21+
19,test,13447,60.0,"[345, 363): 'Trade and Industry'","[345, 373): 'Trade and Industry Secretary'",
22+
20,test,14467,63.0,"[19, 39): 'office-Conservatives'","[26, 39): 'Conservatives' ",
23+
21,test,14467,63.0,"[19, 39): 'office-Conservatives'","[27, 39): 'Conservatives'",
24+
22,test,15155,68.0,"[11, 19): 'Canadian'","[11, 30): 'Canadian West Coast'",
25+
23,test,15183,68.0,"[157, 165): 'Canadian'",,
26+
24,test,15337,70.0,"[177, 197): 'New York Commodities'","[177, 202): 'New York Commodities Desk'",
27+
25,test,15380,71.0,"[153, 173): 'New York Commodities'","[153, 178): 'New York Commodities Desk'",
28+
26,test,16319,75.0,"[2736, 2752): 'Newmont-Santa Fe'","[2736, 2743): 'Newmont'",
29+
27,test,16319,75.0,"[2736, 2752): 'Newmont-Santa Fe'","[2744, 2752): 'Santa Fe'",
30+
28,test,26720,114.0,"[11, 17): 'Iowa-S'","[11, 15): 'Iowa'",
31+
29,test,26720,114.0,"[11, 17): 'Iowa-S'","[11, 15): 'Iowa' ",
32+
30,test,26728,114.0,"[51, 61): 'sales-USDA'","[57, 61): 'USDA'",
33+
31,test,26728,114.0,"[51, 61): 'sales-USDA'",,
34+
32,test,28718,123.0,"[11, 17): 'Iowa-S'","[11, 15): 'Iowa' ",
35+
33,test,38688,178.0,"[951, 960): 'then-U.S.'","[956, 960): 'U.S.'",
36+
34,test,39979,183.0,"[18, 35): 'SKIING-GLADISHIVA'","[25, 35): 'GLADISHIVA'",
37+
35,test,-2,186.0,,"[1398, 1405): 'Austria'",
38+
36,test,41169,188.0,"[18, 34): 'SKIING-WORLD CUP'","[25, 34): 'WORLD CUP'",
39+
37,test,41413,190.0,"[11, 27): 'BOBSLEIGH-SHIMER'","[21, 27): 'SHIMER'",
40+
38,test,41413,190.0,"[11, 27): 'BOBSLEIGH-SHIMER'",,
41+
39,test,41595,191.0,"[11, 25): 'SKIING-CHINESE'","[18, 25): 'CHINESE'",
42+
40,test,41850,192.0,"[11, 30): 'BOBSLEIGH-WORLD CUP'","[21, 30): 'WORLD CUP'",
43+
41,test,42385,194.0,"[21, 37): 'SKIING-WORLD CUP'","[28, 37): 'WORLD CUP'",
44+
42,test,-1,195.0,"[21, 37): 'SKIING-WORLD CUP'","[28, 37): 'WORLD CUP'",
45+
43,test,46987,214.0,"[243, 262): 'Saturday'sWorld Cup'","[253, 262): 'World Cup'",
46+
0,dev,4120,15.0,"[41, 51): 'CUNNINGHAM'","(33, 51]: 'RANDALL CUNNINGHAM'",
47+
1,dev,4120,15.0,"[41, 51): 'CUNNINGHAM'","(33,51] 'RANDALL CUNNINGHAM'",
48+
2,dev,4118,15.0,"[15, 40): 'AMERICAN FOOTBALL-RANDALL'","[15, 32): 'AMERICAN FOOTBALL'",
49+
3,dev,4118,15.0,"[15, 40): 'AMERICAN FOOTBALL-RANDALL'","[33, 40): 'RANDALL'",
50+
4,dev,4120,15.0,"[41, 51): 'CUNNINGHAM'","[33,51): 'RANDALL CUNNINGHAM'",
51+
5,dev,10619,39.0,"[11, 23): 'Boxing-Bruno'","[18, 23): 'Bruno'",
52+
6,dev,-2,39.0,,"[18, 23): 'Bruno' ",
53+
7,dev,15911,60.0,"[1358, 1371): 'Tripoli-based'","[1358, 1365): 'Tripoli'",
54+
8,dev,19233,65.0,"[1125, 1134): 'asset-St.'","[1131, 1146): 'St. Louis based'",
55+
9,dev,19130,65.0,"[592, 607): 'St. Louis-based'","[592, 601): 'St. Louis'",
56+
10,dev,19233,65.0,"[1125, 1134): 'asset-St.'",,
57+
11,dev,44837,175.0,"[252, 264): 'London-based'","[252, 258): 'London'",
58+
12,dev,46457,181.0,"[1761, 1774): 'Moscow-backed'","[1761, 1767): 'Moscow'",
59+
13,dev,50964,198.0,"[39, 47): 'aid-U.N.'","[43, 47): 'U.N.'",
60+
0,train,17719,80.0,,"[44, 59): 'Interfax'",
61+
1,train,-2,80.0,,"[51, 59): 'Interfax'",
62+
2,train,-2,115.0,,"[23, 27): 'News'",
63+
3,train,37914,163.0,"[220, 232): 'x-AEK Athens'","[222, 232): 'AEK Athens'",
64+
4,train,37926,163.0,"[271, 283): 'x-Olympiakos'","[273, 283): 'Olympiakos'",
65+
5,train,37933,163.0,"[308, 313): 'x-PAO'","[310, 313): 'PAO'",
66+
6,train,38844,169.0,"[50, 61): 'trip-Canada'","[55, 61): 'Canada'",
67+
7,train,65636,298.0,"[49, 60): '1997--Ruehe'","[55, 60): 'Ruehe'",
68+
8,train,75410,343.0,"[11, 31): 'AUSTRALIAN RULES-AFL'","[11, 21): 'AUSTRALIAN'",
69+
9,train,75410,343.0,"[11, 31): 'AUSTRALIAN RULES-AFL'","[11, 27): 'AUSTRALIAN RULES'",
70+
10,train,75410,343.0,"[11, 31): 'AUSTRALIAN RULES-AFL'","[28, 31): 'AFL'",
71+
11,train,75410,343.0,"[11, 31): 'AUSTRALIAN RULES-AFL'","[11, 21): 'AUSTRALIAN'",
72+
12,train,95553,422.0,"[236, 246): 'Videoton(*'","[236, 244): 'Videoton'",
73+
13,train,139024,593.0,"[45, 57): 'France-Juppe'","[45, 51): 'France'",
74+
14,train,139024,593.0,"[45, 57): 'France-Juppe'","[52, 57): 'Juppe'",
75+
15,train,146605,626.0,"[42, 59): 'disarmament-China'","[42, 59): 'disarmament-China'",
76+
16,train,164709,701.0,"[17, 30): 'union-England'","[23, 30): 'England'",
77+
17,train,213462,918.0,"[11, 24): 'INTERVIEW-T&N'","[11, 24): 'INTERVIEW-T&N'",
78+
18,train,213462,918.0,"[11, 24): 'INTERVIEW-T&N'","[21, 24): 'T&N'",

0 commit comments

Comments
 (0)