BIG Reorganize examples (#4213)
* Created using Colaboratory * [examples] reorganize files * remove run_tpu_glue.py as superseded by TPU support in Trainer * Bugfix: int, not tuple * move files around
This commit is contained in:
7
tests/fixtures/tests_samples/.gitignore
vendored
Normal file
7
tests/fixtures/tests_samples/.gitignore
vendored
Normal file
@@ -0,0 +1,7 @@
|
||||
*.*
|
||||
cache*
|
||||
temp*
|
||||
!*.txt
|
||||
!*.tsv
|
||||
!*.json
|
||||
!.gitignore
|
||||
202
tests/fixtures/tests_samples/GermEval/dev.txt
vendored
Normal file
202
tests/fixtures/tests_samples/GermEval/dev.txt
vendored
Normal file
@@ -0,0 +1,202 @@
|
||||
Gleich O
|
||||
darauf O
|
||||
entwirft O
|
||||
er O
|
||||
seine O
|
||||
Selbstdarstellung O
|
||||
" O
|
||||
Ecce B-OTH
|
||||
homo I-OTH
|
||||
" O
|
||||
in O
|
||||
enger O
|
||||
Auseinandersetzung O
|
||||
mit O
|
||||
diesem O
|
||||
Bild O
|
||||
Jesu B-PER
|
||||
. O
|
||||
|
||||
1980 O
|
||||
kam O
|
||||
der O
|
||||
Crown B-OTH
|
||||
als O
|
||||
Versuch O
|
||||
von O
|
||||
Toyota B-ORG
|
||||
, O
|
||||
sich O
|
||||
in O
|
||||
der O
|
||||
Oberen O
|
||||
Mittelklasse O
|
||||
zu O
|
||||
etablieren O
|
||||
, O
|
||||
auch O
|
||||
nach O
|
||||
Deutschland B-LOC
|
||||
. O
|
||||
|
||||
– O
|
||||
4:26 O
|
||||
# O
|
||||
Sometime B-OTH
|
||||
Ago/La I-OTH
|
||||
Fiesta I-OTH
|
||||
– O
|
||||
23:18 O
|
||||
Alle O
|
||||
Stücke O
|
||||
wurden O
|
||||
von O
|
||||
Corea B-PER
|
||||
komponiert O
|
||||
mit O
|
||||
Ausnahme O
|
||||
der O
|
||||
einleitenden O
|
||||
Improvisation O
|
||||
zu O
|
||||
Sometime B-OTH
|
||||
Ago I-OTH
|
||||
. O
|
||||
|
||||
Bis O
|
||||
2013 O
|
||||
steigen O
|
||||
die O
|
||||
Mittel O
|
||||
aus O
|
||||
dem O
|
||||
EU-Budget B-ORGpart
|
||||
auf O
|
||||
rund O
|
||||
120 O
|
||||
Millionen O
|
||||
Euro B-OTH
|
||||
. O
|
||||
|
||||
Daraus O
|
||||
entwickelte O
|
||||
sich O
|
||||
im O
|
||||
Rokoko B-OTH
|
||||
die O
|
||||
Sitte O
|
||||
des O
|
||||
gemeinsamen O
|
||||
Weinens O
|
||||
im O
|
||||
Theater O
|
||||
, O
|
||||
das O
|
||||
die O
|
||||
Standesgrenzen O
|
||||
innerhalb O
|
||||
des O
|
||||
Publikums O
|
||||
überbrücken O
|
||||
sollte O
|
||||
. O
|
||||
|
||||
Die O
|
||||
Spinne O
|
||||
hatte O
|
||||
sie O
|
||||
mit O
|
||||
Seidenfäden O
|
||||
an O
|
||||
ihrem O
|
||||
Schwanz O
|
||||
gefesselt O
|
||||
und O
|
||||
nach O
|
||||
oben O
|
||||
gezogen O
|
||||
. O
|
||||
|
||||
In O
|
||||
Deutschland B-LOC
|
||||
ist O
|
||||
nach O
|
||||
StGB O
|
||||
eine O
|
||||
Anwerbung O
|
||||
für O
|
||||
die O
|
||||
Fremdenlegion O
|
||||
strafbar O
|
||||
. O
|
||||
|
||||
Am O
|
||||
Donnerstag O
|
||||
wird O
|
||||
sich O
|
||||
zeigen O
|
||||
, O
|
||||
ob O
|
||||
die O
|
||||
Idee O
|
||||
der O
|
||||
DLR-Forscher B-ORGpart
|
||||
funktioniert O
|
||||
. O
|
||||
|
||||
Der O
|
||||
sechste O
|
||||
Lauf O
|
||||
der O
|
||||
ADAC B-ORG
|
||||
GT I-ORG
|
||||
Mastersstand O
|
||||
ganz O
|
||||
klar O
|
||||
im O
|
||||
Mittelpunkt O
|
||||
des O
|
||||
Motorsport-Wochenendes O
|
||||
auf O
|
||||
dem O
|
||||
Eurospeedway B-ORG
|
||||
Lausitz I-ORG
|
||||
. O
|
||||
|
||||
Nach O
|
||||
den O
|
||||
schwächeren O
|
||||
Vorgaben O
|
||||
der O
|
||||
Wall B-ORG
|
||||
Street I-ORG
|
||||
vom O
|
||||
Vortag O
|
||||
setzten O
|
||||
die O
|
||||
deutschen B-LOCderiv
|
||||
Standardwerte O
|
||||
ihren O
|
||||
Konsolidierungskurs O
|
||||
fort O
|
||||
. O
|
||||
|
||||
Kolb B-PER
|
||||
war O
|
||||
seit O
|
||||
1986 O
|
||||
im O
|
||||
Turnverein O
|
||||
als O
|
||||
Leiter O
|
||||
tätig O
|
||||
, O
|
||||
darunter O
|
||||
elf O
|
||||
Jahre O
|
||||
als O
|
||||
Hauptleiter O
|
||||
in O
|
||||
der O
|
||||
Männerriege O
|
||||
. O
|
||||
25
tests/fixtures/tests_samples/GermEval/labels.txt
vendored
Normal file
25
tests/fixtures/tests_samples/GermEval/labels.txt
vendored
Normal file
@@ -0,0 +1,25 @@
|
||||
B-LOC
|
||||
B-LOCderiv
|
||||
B-LOCpart
|
||||
B-ORG
|
||||
B-ORGderiv
|
||||
B-ORGpart
|
||||
B-OTH
|
||||
B-OTHderiv
|
||||
B-OTHpart
|
||||
B-PER
|
||||
B-PERderiv
|
||||
B-PERpart
|
||||
I-LOC
|
||||
I-LOCderiv
|
||||
I-LOCpart
|
||||
I-ORG
|
||||
I-ORGderiv
|
||||
I-ORGpart
|
||||
I-OTH
|
||||
I-OTHderiv
|
||||
I-OTHpart
|
||||
I-PER
|
||||
I-PERderiv
|
||||
I-PERpart
|
||||
O
|
||||
200
tests/fixtures/tests_samples/GermEval/train.txt
vendored
Normal file
200
tests/fixtures/tests_samples/GermEval/train.txt
vendored
Normal file
@@ -0,0 +1,200 @@
|
||||
Schartau B-PER
|
||||
sagte O
|
||||
dem O
|
||||
" O
|
||||
Tagesspiegel B-ORG
|
||||
" O
|
||||
vom O
|
||||
Freitag O
|
||||
, O
|
||||
Fischer B-PER
|
||||
sei O
|
||||
" O
|
||||
in O
|
||||
einer O
|
||||
Weise O
|
||||
aufgetreten O
|
||||
, O
|
||||
die O
|
||||
alles O
|
||||
andere O
|
||||
als O
|
||||
überzeugend O
|
||||
war O
|
||||
" O
|
||||
. O
|
||||
|
||||
Firmengründer O
|
||||
Wolf B-PER
|
||||
Peter I-PER
|
||||
Bree I-PER
|
||||
arbeitete O
|
||||
Anfang O
|
||||
der O
|
||||
siebziger O
|
||||
Jahre O
|
||||
als O
|
||||
Möbelvertreter O
|
||||
, O
|
||||
als O
|
||||
er O
|
||||
einen O
|
||||
fliegenden O
|
||||
Händler O
|
||||
aus O
|
||||
dem O
|
||||
Libanon B-LOC
|
||||
traf O
|
||||
. O
|
||||
|
||||
Ob O
|
||||
sie O
|
||||
dabei O
|
||||
nach O
|
||||
dem O
|
||||
Runden O
|
||||
Tisch O
|
||||
am O
|
||||
23. O
|
||||
April O
|
||||
in O
|
||||
Berlin B-LOC
|
||||
durch O
|
||||
ein O
|
||||
pädagogisches O
|
||||
Konzept O
|
||||
unterstützt O
|
||||
wird O
|
||||
, O
|
||||
ist O
|
||||
allerdings O
|
||||
zu O
|
||||
bezweifeln O
|
||||
. O
|
||||
|
||||
Bayern B-ORG
|
||||
München I-ORG
|
||||
ist O
|
||||
wieder O
|
||||
alleiniger O
|
||||
Top- O
|
||||
Favorit O
|
||||
auf O
|
||||
den O
|
||||
Gewinn O
|
||||
der O
|
||||
deutschen B-LOCderiv
|
||||
Fußball-Meisterschaft O
|
||||
. O
|
||||
|
||||
Dabei O
|
||||
hätte O
|
||||
der O
|
||||
tapfere O
|
||||
Schlussmann O
|
||||
allen O
|
||||
Grund O
|
||||
gehabt O
|
||||
, O
|
||||
sich O
|
||||
viel O
|
||||
früher O
|
||||
aufzuregen O
|
||||
. O
|
||||
|
||||
ARD-Programmchef B-ORGpart
|
||||
Günter B-PER
|
||||
Struve I-PER
|
||||
war O
|
||||
wegen O
|
||||
eines O
|
||||
vierwöchigen O
|
||||
Urlaubs O
|
||||
für O
|
||||
eine O
|
||||
Stellungnahme O
|
||||
nicht O
|
||||
erreichbar O
|
||||
. O
|
||||
|
||||
Alternativ O
|
||||
sollten O
|
||||
sich O
|
||||
die O
|
||||
Restaurantbetreiber O
|
||||
aus O
|
||||
Sicht O
|
||||
der O
|
||||
Solingerin B-LOCderiv
|
||||
zu O
|
||||
längeren O
|
||||
Öffnungszeiten O
|
||||
verpflichten O
|
||||
, O
|
||||
um O
|
||||
wartende O
|
||||
Kunden O
|
||||
aufzunehmen O
|
||||
. O
|
||||
|
||||
Die O
|
||||
Deutsche B-ORG
|
||||
Flugsicherung I-ORG
|
||||
( O
|
||||
DFS B-ORG
|
||||
) O
|
||||
beschloss O
|
||||
ein O
|
||||
Flugverbot O
|
||||
für O
|
||||
alle O
|
||||
internationalen O
|
||||
Flughäfen O
|
||||
mit O
|
||||
Ausnahme O
|
||||
der O
|
||||
beiden O
|
||||
Berliner B-LOCderiv
|
||||
Flughäfen O
|
||||
bis O
|
||||
2.00 O
|
||||
Uhr O
|
||||
nachts O
|
||||
. O
|
||||
|
||||
New O
|
||||
Small O
|
||||
Family O
|
||||
mit O
|
||||
E-Motor O
|
||||
: O
|
||||
Studie O
|
||||
E-Up O
|
||||
! O
|
||||
|
||||
Eine O
|
||||
Schwachstelle O
|
||||
war O
|
||||
beispielsweise O
|
||||
der O
|
||||
Spiegelkasten O
|
||||
. O
|
||||
|
||||
Denn O
|
||||
durch O
|
||||
den O
|
||||
Einsatz O
|
||||
moderner O
|
||||
Fahrzeugtechnik O
|
||||
( O
|
||||
Dieseltriebwagen O
|
||||
) O
|
||||
und O
|
||||
schalldämmender O
|
||||
Fenster O
|
||||
entsteht O
|
||||
keine O
|
||||
Einschränkung O
|
||||
der O
|
||||
Wohnqualität O
|
||||
. O
|
||||
7
tests/fixtures/tests_samples/MRPC/dev.tsv
vendored
Normal file
7
tests/fixtures/tests_samples/MRPC/dev.tsv
vendored
Normal file
@@ -0,0 +1,7 @@
|
||||
Quality #1 ID #2 ID #1 String #2 String
|
||||
1 1355540 1355592 He said the foodservice pie business doesn 't fit the company 's long-term growth strategy . " The foodservice pie business does not fit our long-term growth strategy .
|
||||
0 2029631 2029565 Magnarelli said Racicot hated the Iraqi regime and looked forward to using his long years of training in the war . His wife said he was " 100 percent behind George Bush " and looked forward to using his years of training in the war .
|
||||
0 487993 487952 The dollar was at 116.92 yen against the yen , flat on the session , and at 1.2891 against the Swiss franc , also flat . The dollar was at 116.78 yen JPY = , virtually flat on the session , and at 1.2871 against the Swiss franc CHF = , down 0.1 percent .
|
||||
1 1989515 1989458 The AFL-CIO is waiting until October to decide if it will endorse a candidate . The AFL-CIO announced Wednesday that it will decide in October whether to endorse a candidate before the primaries .
|
||||
0 1783137 1782659 No dates have been set for the civil or the criminal trial . No dates have been set for the criminal or civil cases , but Shanley has pleaded not guilty .
|
||||
1 3039165 3039036 Wal-Mart said it would check all of its million-plus domestic workers to ensure they were legally employed . It has also said it would review all of its domestic employees more than 1 million to ensure they have legal status .
|
||||
|
Can't render this file because it contains an unexpected character in line 3 and column 155.
|
7
tests/fixtures/tests_samples/MRPC/train.tsv
vendored
Normal file
7
tests/fixtures/tests_samples/MRPC/train.tsv
vendored
Normal file
@@ -0,0 +1,7 @@
|
||||
Quality #1 ID #2 ID #1 String #2 String
|
||||
1 1355540 1355592 He said the foodservice pie business doesn 't fit the company 's long-term growth strategy . " The foodservice pie business does not fit our long-term growth strategy .
|
||||
0 2029631 2029565 Magnarelli said Racicot hated the Iraqi regime and looked forward to using his long years of training in the war . His wife said he was " 100 percent behind George Bush " and looked forward to using his years of training in the war .
|
||||
0 487993 487952 The dollar was at 116.92 yen against the yen , flat on the session , and at 1.2891 against the Swiss franc , also flat . The dollar was at 116.78 yen JPY = , virtually flat on the session , and at 1.2871 against the Swiss franc CHF = , down 0.1 percent .
|
||||
1 1989515 1989458 The AFL-CIO is waiting until October to decide if it will endorse a candidate . The AFL-CIO announced Wednesday that it will decide in October whether to endorse a candidate before the primaries .
|
||||
0 1783137 1782659 No dates have been set for the civil or the criminal trial . No dates have been set for the criminal or civil cases , but Shanley has pleaded not guilty .
|
||||
1 3039165 3039036 Wal-Mart said it would check all of its million-plus domestic workers to ensure they were legally employed . It has also said it would review all of its domestic employees more than 1 million to ensure they have legal status .
|
||||
|
Can't render this file because it contains an unexpected character in line 3 and column 155.
|
140
tests/fixtures/tests_samples/SQUAD/dev-v2.0.json
vendored
Normal file
140
tests/fixtures/tests_samples/SQUAD/dev-v2.0.json
vendored
Normal file
@@ -0,0 +1,140 @@
|
||||
{
|
||||
"version": "v2.0",
|
||||
"data": [{
|
||||
"title": "Normans",
|
||||
"paragraphs": [{
|
||||
"qas": [{
|
||||
"question": "In what country is Normandy located?",
|
||||
"id": "56ddde6b9a695914005b9628",
|
||||
"answers": [{
|
||||
"text": "France",
|
||||
"answer_start": 159
|
||||
}],
|
||||
"is_impossible": false
|
||||
}, {
|
||||
"question": "When were the Normans in Normandy?",
|
||||
"id": "56ddde6b9a695914005b9629",
|
||||
"answers": [{
|
||||
"text": "10th and 11th centuries",
|
||||
"answer_start": 94
|
||||
}],
|
||||
"is_impossible": false
|
||||
}, {
|
||||
"question": "From which countries did the Norse originate?",
|
||||
"id": "56ddde6b9a695914005b962a",
|
||||
"answers": [{
|
||||
"text": "Denmark, Iceland and Norway",
|
||||
"answer_start": 256
|
||||
}],
|
||||
"is_impossible": false
|
||||
}, {
|
||||
"plausible_answers": [{
|
||||
"text": "Rollo",
|
||||
"answer_start": 308
|
||||
}],
|
||||
"question": "Who did King Charles III swear fealty to?",
|
||||
"id": "5ad39d53604f3c001a3fe8d3",
|
||||
"answers": [],
|
||||
"is_impossible": true
|
||||
}, {
|
||||
"plausible_answers": [{
|
||||
"text": "10th century",
|
||||
"answer_start": 671
|
||||
}],
|
||||
"question": "When did the Frankish identity emerge?",
|
||||
"id": "5ad39d53604f3c001a3fe8d4",
|
||||
"answers": [],
|
||||
"is_impossible": true
|
||||
}],
|
||||
"context": "The Normans (Norman: Nourmands; French: Normands; Latin: Normanni) were the people who in the 10th and 11th centuries gave their name to Normandy, a region in France. They were descended from Norse (\"Norman\" comes from \"Norseman\") raiders and pirates from Denmark, Iceland and Norway who, under their leader Rollo, agreed to swear fealty to King Charles III of West Francia. Through generations of assimilation and mixing with the native Frankish and Roman-Gaulish populations, their descendants would gradually merge with the Carolingian-based cultures of West Francia. The distinct cultural and ethnic identity of the Normans emerged initially in the first half of the 10th century, and it continued to evolve over the succeeding centuries."
|
||||
}, {
|
||||
"qas": [{
|
||||
"question": "Who was the duke in the battle of Hastings?",
|
||||
"id": "56dddf4066d3e219004dad5f",
|
||||
"answers": [{
|
||||
"text": "William the Conqueror",
|
||||
"answer_start": 1022
|
||||
}],
|
||||
"is_impossible": false
|
||||
}, {
|
||||
"plausible_answers": [{
|
||||
"text": "Antioch",
|
||||
"answer_start": 1295
|
||||
}],
|
||||
"question": "What principality did William the conquerer found?",
|
||||
"id": "5ad3a266604f3c001a3fea2b",
|
||||
"answers": [],
|
||||
"is_impossible": true
|
||||
}],
|
||||
"context": "The Norman dynasty had a major political, cultural and military impact on medieval Europe and even the Near East. The Normans were famed for their martial spirit and eventually for their Christian piety, becoming exponents of the Catholic orthodoxy into which they assimilated. They adopted the Gallo-Romance language of the Frankish land they settled, their dialect becoming known as Norman, Normaund or Norman French, an important literary language. The Duchy of Normandy, which they formed by treaty with the French crown, was a great fief of medieval France, and under Richard I of Normandy was forged into a cohesive and formidable principality in feudal tenure. The Normans are noted both for their culture, such as their unique Romanesque architecture and musical traditions, and for their significant military accomplishments and innovations. Norman adventurers founded the Kingdom of Sicily under Roger II after conquering southern Italy on the Saracens and Byzantines, and an expedition on behalf of their duke, William the Conqueror, led to the Norman conquest of England at the Battle of Hastings in 1066. Norman cultural and military influence spread from these new European centres to the Crusader states of the Near East, where their prince Bohemond I founded the Principality of Antioch in the Levant, to Scotland and Wales in Great Britain, to Ireland, and to the coasts of north Africa and the Canary Islands."
|
||||
}]
|
||||
}, {
|
||||
"title": "Computational_complexity_theory",
|
||||
"paragraphs": [{
|
||||
"qas": [{
|
||||
"question": "What branch of theoretical computer science deals with broadly classifying computational problems by difficulty and class of relationship?",
|
||||
"id": "56e16182e3433e1400422e28",
|
||||
"answers": [{
|
||||
"text": "Computational complexity theory",
|
||||
"answer_start": 0
|
||||
}],
|
||||
"is_impossible": false
|
||||
}, {
|
||||
"plausible_answers": [{
|
||||
"text": "algorithm",
|
||||
"answer_start": 472
|
||||
}],
|
||||
"question": "What is a manual application of mathematical steps?",
|
||||
"id": "5ad5316b5b96ef001a10ab76",
|
||||
"answers": [],
|
||||
"is_impossible": true
|
||||
}],
|
||||
"context": "Computational complexity theory is a branch of the theory of computation in theoretical computer science that focuses on classifying computational problems according to their inherent difficulty, and relating those classes to each other. A computational problem is understood to be a task that is in principle amenable to being solved by a computer, which is equivalent to stating that the problem may be solved by mechanical application of mathematical steps, such as an algorithm."
|
||||
}, {
|
||||
"qas": [{
|
||||
"question": "What measure of a computational problem broadly defines the inherent difficulty of the solution?",
|
||||
"id": "56e16839cd28a01900c67887",
|
||||
"answers": [{
|
||||
"text": "if its solution requires significant resources",
|
||||
"answer_start": 46
|
||||
}],
|
||||
"is_impossible": false
|
||||
}, {
|
||||
"question": "What method is used to intuitively assess or quantify the amount of resources required to solve a computational problem?",
|
||||
"id": "56e16839cd28a01900c67888",
|
||||
"answers": [{
|
||||
"text": "mathematical models of computation",
|
||||
"answer_start": 176
|
||||
}],
|
||||
"is_impossible": false
|
||||
}, {
|
||||
"question": "What are two basic primary resources used to guage complexity?",
|
||||
"id": "56e16839cd28a01900c67889",
|
||||
"answers": [{
|
||||
"text": "time and storage",
|
||||
"answer_start": 305
|
||||
}],
|
||||
"is_impossible": false
|
||||
}, {
|
||||
"plausible_answers": [{
|
||||
"text": "the number of gates in a circuit",
|
||||
"answer_start": 436
|
||||
}],
|
||||
"question": "What unit is measured to determine circuit simplicity?",
|
||||
"id": "5ad532575b96ef001a10ab7f",
|
||||
"answers": [],
|
||||
"is_impossible": true
|
||||
}, {
|
||||
"plausible_answers": [{
|
||||
"text": "the number of processors",
|
||||
"answer_start": 502
|
||||
}],
|
||||
"question": "What number is used in perpendicular computing?",
|
||||
"id": "5ad532575b96ef001a10ab80",
|
||||
"answers": [],
|
||||
"is_impossible": true
|
||||
}],
|
||||
"context": "A problem is regarded as inherently difficult if its solution requires significant resources, whatever the algorithm used. The theory formalizes this intuition, by introducing mathematical models of computation to study these problems and quantifying the amount of resources needed to solve them, such as time and storage. Other complexity measures are also used, such as the amount of communication (used in communication complexity), the number of gates in a circuit (used in circuit complexity) and the number of processors (used in parallel computing). One of the roles of computational complexity theory is to determine the practical limits on what computers can and cannot do."
|
||||
}]
|
||||
}]
|
||||
}
|
||||
140
tests/fixtures/tests_samples/SQUAD/train-v2.0.json
vendored
Normal file
140
tests/fixtures/tests_samples/SQUAD/train-v2.0.json
vendored
Normal file
@@ -0,0 +1,140 @@
|
||||
{
|
||||
"version": "v2.0",
|
||||
"data": [{
|
||||
"title": "Normans",
|
||||
"paragraphs": [{
|
||||
"qas": [{
|
||||
"question": "In what country is Normandy located?",
|
||||
"id": "56ddde6b9a695914005b9628",
|
||||
"answers": [{
|
||||
"text": "France",
|
||||
"answer_start": 159
|
||||
}],
|
||||
"is_impossible": false
|
||||
}, {
|
||||
"question": "When were the Normans in Normandy?",
|
||||
"id": "56ddde6b9a695914005b9629",
|
||||
"answers": [{
|
||||
"text": "10th and 11th centuries",
|
||||
"answer_start": 94
|
||||
}],
|
||||
"is_impossible": false
|
||||
}, {
|
||||
"question": "From which countries did the Norse originate?",
|
||||
"id": "56ddde6b9a695914005b962a",
|
||||
"answers": [{
|
||||
"text": "Denmark, Iceland and Norway",
|
||||
"answer_start": 256
|
||||
}],
|
||||
"is_impossible": false
|
||||
}, {
|
||||
"plausible_answers": [{
|
||||
"text": "Rollo",
|
||||
"answer_start": 308
|
||||
}],
|
||||
"question": "Who did King Charles III swear fealty to?",
|
||||
"id": "5ad39d53604f3c001a3fe8d3",
|
||||
"answers": [],
|
||||
"is_impossible": true
|
||||
}, {
|
||||
"plausible_answers": [{
|
||||
"text": "10th century",
|
||||
"answer_start": 671
|
||||
}],
|
||||
"question": "When did the Frankish identity emerge?",
|
||||
"id": "5ad39d53604f3c001a3fe8d4",
|
||||
"answers": [],
|
||||
"is_impossible": true
|
||||
}],
|
||||
"context": "The Normans (Norman: Nourmands; French: Normands; Latin: Normanni) were the people who in the 10th and 11th centuries gave their name to Normandy, a region in France. They were descended from Norse (\"Norman\" comes from \"Norseman\") raiders and pirates from Denmark, Iceland and Norway who, under their leader Rollo, agreed to swear fealty to King Charles III of West Francia. Through generations of assimilation and mixing with the native Frankish and Roman-Gaulish populations, their descendants would gradually merge with the Carolingian-based cultures of West Francia. The distinct cultural and ethnic identity of the Normans emerged initially in the first half of the 10th century, and it continued to evolve over the succeeding centuries."
|
||||
}, {
|
||||
"qas": [{
|
||||
"question": "Who was the duke in the battle of Hastings?",
|
||||
"id": "56dddf4066d3e219004dad5f",
|
||||
"answers": [{
|
||||
"text": "William the Conqueror",
|
||||
"answer_start": 1022
|
||||
}],
|
||||
"is_impossible": false
|
||||
}, {
|
||||
"plausible_answers": [{
|
||||
"text": "Antioch",
|
||||
"answer_start": 1295
|
||||
}],
|
||||
"question": "What principality did William the conquerer found?",
|
||||
"id": "5ad3a266604f3c001a3fea2b",
|
||||
"answers": [],
|
||||
"is_impossible": true
|
||||
}],
|
||||
"context": "The Norman dynasty had a major political, cultural and military impact on medieval Europe and even the Near East. The Normans were famed for their martial spirit and eventually for their Christian piety, becoming exponents of the Catholic orthodoxy into which they assimilated. They adopted the Gallo-Romance language of the Frankish land they settled, their dialect becoming known as Norman, Normaund or Norman French, an important literary language. The Duchy of Normandy, which they formed by treaty with the French crown, was a great fief of medieval France, and under Richard I of Normandy was forged into a cohesive and formidable principality in feudal tenure. The Normans are noted both for their culture, such as their unique Romanesque architecture and musical traditions, and for their significant military accomplishments and innovations. Norman adventurers founded the Kingdom of Sicily under Roger II after conquering southern Italy on the Saracens and Byzantines, and an expedition on behalf of their duke, William the Conqueror, led to the Norman conquest of England at the Battle of Hastings in 1066. Norman cultural and military influence spread from these new European centres to the Crusader states of the Near East, where their prince Bohemond I founded the Principality of Antioch in the Levant, to Scotland and Wales in Great Britain, to Ireland, and to the coasts of north Africa and the Canary Islands."
|
||||
}]
|
||||
}, {
|
||||
"title": "Computational_complexity_theory",
|
||||
"paragraphs": [{
|
||||
"qas": [{
|
||||
"question": "What branch of theoretical computer science deals with broadly classifying computational problems by difficulty and class of relationship?",
|
||||
"id": "56e16182e3433e1400422e28",
|
||||
"answers": [{
|
||||
"text": "Computational complexity theory",
|
||||
"answer_start": 0
|
||||
}],
|
||||
"is_impossible": false
|
||||
}, {
|
||||
"plausible_answers": [{
|
||||
"text": "algorithm",
|
||||
"answer_start": 472
|
||||
}],
|
||||
"question": "What is a manual application of mathematical steps?",
|
||||
"id": "5ad5316b5b96ef001a10ab76",
|
||||
"answers": [],
|
||||
"is_impossible": true
|
||||
}],
|
||||
"context": "Computational complexity theory is a branch of the theory of computation in theoretical computer science that focuses on classifying computational problems according to their inherent difficulty, and relating those classes to each other. A computational problem is understood to be a task that is in principle amenable to being solved by a computer, which is equivalent to stating that the problem may be solved by mechanical application of mathematical steps, such as an algorithm."
|
||||
}, {
|
||||
"qas": [{
|
||||
"question": "What measure of a computational problem broadly defines the inherent difficulty of the solution?",
|
||||
"id": "56e16839cd28a01900c67887",
|
||||
"answers": [{
|
||||
"text": "if its solution requires significant resources",
|
||||
"answer_start": 46
|
||||
}],
|
||||
"is_impossible": false
|
||||
}, {
|
||||
"question": "What method is used to intuitively assess or quantify the amount of resources required to solve a computational problem?",
|
||||
"id": "56e16839cd28a01900c67888",
|
||||
"answers": [{
|
||||
"text": "mathematical models of computation",
|
||||
"answer_start": 176
|
||||
}],
|
||||
"is_impossible": false
|
||||
}, {
|
||||
"question": "What are two basic primary resources used to guage complexity?",
|
||||
"id": "56e16839cd28a01900c67889",
|
||||
"answers": [{
|
||||
"text": "time and storage",
|
||||
"answer_start": 305
|
||||
}],
|
||||
"is_impossible": false
|
||||
}, {
|
||||
"plausible_answers": [{
|
||||
"text": "the number of gates in a circuit",
|
||||
"answer_start": 436
|
||||
}],
|
||||
"question": "What unit is measured to determine circuit simplicity?",
|
||||
"id": "5ad532575b96ef001a10ab7f",
|
||||
"answers": [],
|
||||
"is_impossible": true
|
||||
}, {
|
||||
"plausible_answers": [{
|
||||
"text": "the number of processors",
|
||||
"answer_start": 502
|
||||
}],
|
||||
"question": "What number is used in perpendicular computing?",
|
||||
"id": "5ad532575b96ef001a10ab80",
|
||||
"answers": [],
|
||||
"is_impossible": true
|
||||
}],
|
||||
"context": "A problem is regarded as inherently difficult if its solution requires significant resources, whatever the algorithm used. The theory formalizes this intuition, by introducing mathematical models of computation to study these problems and quantifying the amount of resources needed to solve them, such as time and storage. Other complexity measures are also used, such as the amount of communication (used in communication complexity), the number of gates in a circuit (used in circuit complexity) and the number of processors (used in parallel computing). One of the roles of computational complexity theory is to determine the practical limits on what computers can and cannot do."
|
||||
}]
|
||||
}]
|
||||
}
|
||||
10
tests/fixtures/tests_samples/STS-B/dev.tsv
vendored
Normal file
10
tests/fixtures/tests_samples/STS-B/dev.tsv
vendored
Normal file
@@ -0,0 +1,10 @@
|
||||
index genre filename year old_index source1 source2 sentence1 sentence2 score
|
||||
0 main-captions MSRvid 2012test 0000 none none A man with a hard hat is dancing. A man wearing a hard hat is dancing. 5.000
|
||||
1 main-captions MSRvid 2012test 0002 none none A young child is riding a horse. A child is riding a horse. 4.750
|
||||
2 main-captions MSRvid 2012test 0003 none none A man is feeding a mouse to a snake. The man is feeding a mouse to the snake. 5.000
|
||||
3 main-captions MSRvid 2012test 0007 none none A woman is playing the guitar. A man is playing guitar. 2.400
|
||||
4 main-captions MSRvid 2012test 0008 none none A woman is playing the flute. A man is playing a flute. 2.750
|
||||
5 main-captions MSRvid 2012test 0010 none none A woman is cutting an onion. A man is cutting onions. 2.615
|
||||
6 main-captions MSRvid 2012test 0015 none none A man is erasing a chalk board. The man is erasing the chalk board. 5.000
|
||||
7 main-captions MSRvid 2012test 0023 none none A woman is carrying a boy. A woman is carrying her baby. 2.333
|
||||
8 main-captions MSRvid 2012test 0027 none none Three men are playing guitars. Three men are on stage playing guitars. 3.750
|
||||
|
10
tests/fixtures/tests_samples/STS-B/train.tsv
vendored
Normal file
10
tests/fixtures/tests_samples/STS-B/train.tsv
vendored
Normal file
@@ -0,0 +1,10 @@
|
||||
index genre filename year old_index source1 source2 sentence1 sentence2 score
|
||||
0 main-captions MSRvid 2012test 0001 none none A plane is taking off. An air plane is taking off. 5.000
|
||||
1 main-captions MSRvid 2012test 0004 none none A man is playing a large flute. A man is playing a flute. 3.800
|
||||
2 main-captions MSRvid 2012test 0005 none none A man is spreading shreded cheese on a pizza. A man is spreading shredded cheese on an uncooked pizza. 3.800
|
||||
3 main-captions MSRvid 2012test 0006 none none Three men are playing chess. Two men are playing chess. 2.600
|
||||
4 main-captions MSRvid 2012test 0009 none none A man is playing the cello. A man seated is playing the cello. 4.250
|
||||
5 main-captions MSRvid 2012test 0011 none none Some men are fighting. Two men are fighting. 4.250
|
||||
6 main-captions MSRvid 2012test 0012 none none A man is smoking. A man is skating. 0.500
|
||||
7 main-captions MSRvid 2012test 0013 none none The man is playing the piano. The man is playing the guitar. 1.600
|
||||
8 main-captions MSRvid 2012test 0014 none none A man is playing on a guitar and singing. A woman is playing an acoustic guitar and singing. 2.200
|
||||
|
@@ -28,7 +28,7 @@ class DataCollatorIntegrationTest(unittest.TestCase):
|
||||
MODEL_ID = "bert-base-cased-finetuned-mrpc"
|
||||
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
|
||||
data_args = GlueDataTrainingArguments(
|
||||
task_name="mrpc", data_dir="./examples/tests_samples/MRPC", overwrite_cache=True
|
||||
task_name="mrpc", data_dir="./tests/fixtures/tests_samples/MRPC", overwrite_cache=True
|
||||
)
|
||||
dataset = GlueDataset(data_args, tokenizer=tokenizer, evaluate=True)
|
||||
data_collator = DefaultDataCollator()
|
||||
@@ -39,7 +39,7 @@ class DataCollatorIntegrationTest(unittest.TestCase):
|
||||
MODEL_ID = "distilroberta-base"
|
||||
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
|
||||
data_args = GlueDataTrainingArguments(
|
||||
task_name="sts-b", data_dir="./examples/tests_samples/STS-B", overwrite_cache=True
|
||||
task_name="sts-b", data_dir="./tests/fixtures/tests_samples/STS-B", overwrite_cache=True
|
||||
)
|
||||
dataset = GlueDataset(data_args, tokenizer=tokenizer, evaluate=True)
|
||||
data_collator = DefaultDataCollator()
|
||||
@@ -91,7 +91,7 @@ class TrainerIntegrationTest(unittest.TestCase):
|
||||
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
|
||||
model = AutoModelForSequenceClassification.from_pretrained(MODEL_ID)
|
||||
data_args = GlueDataTrainingArguments(
|
||||
task_name="mrpc", data_dir="./examples/tests_samples/MRPC", overwrite_cache=True
|
||||
task_name="mrpc", data_dir="./tests/fixtures/tests_samples/MRPC", overwrite_cache=True
|
||||
)
|
||||
eval_dataset = GlueDataset(data_args, tokenizer=tokenizer, evaluate=True)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user