Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Adds test data and code to regenerate it #299

Draft
wants to merge 1 commit into
base: master
Choose a base branch
from
Draft
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 4 additions & 0 deletions tests/testdata/Makefile
Original file line number Diff line number Diff line change
@@ -0,0 +1,4 @@
# Sub-directories that each carry their own Makefile for one test dataset.
SUBDIRS := copy delete ice_g2p identity reverse tur_inflection upper

# The directory names exist on disk, so they must be declared phony or make
# would consider them up to date and never descend into them.
.PHONY: all $(SUBDIRS)

# Default goal: build the datasets in every sub-directory.
all: $(SUBDIRS)

# One target per sub-directory instead of a shell loop: a failing sub-make
# now fails the whole build (the loop only reported the last exit status),
# and `make -j` can process the sub-directories in parallel.
$(SUBDIRS):
	$(MAKE) -C $@
2 changes: 2 additions & 0 deletions tests/testdata/README.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
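This directory contains test data for tests involving actual
sequence-to-sequence training. To regenerate the data, run `make -j` from
this directory. Make skips any target file it considers up to date, so use
`make -B -j` to force a full rebuild.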
8 changes: 8 additions & 0 deletions tests/testdata/copy/Makefile
Original file line number Diff line number Diff line change
@@ -0,0 +1,8 @@
# bash is required for `set -o pipefail` in the recipe below.
SHELL := /bin/bash

# Generator script invoked by the recipe, and the dataset files it produces.
GENERATE := ../generate.py
SPLITS := train.tsv dev.tsv test.tsv

.PHONY: all
# Remove a half-written split if its recipe fails, so it never looks current.
.DELETE_ON_ERROR:

all: $(SPLITS)

# Each output line is "<string> TAB <string><string>": the generated string
# followed by that string written twice.
# The pipeline replaces the former fixed-name scratch files in /tmp, which
# were left behind on failure and shared between concurrent builds.
# `pipefail` makes a generator failure fail the recipe.
# NOTE(review): every split uses the same seed, so the three files come out
# identical; confirm whether that is intended.
$(SPLITS): %.tsv: $(GENERATE)
	set -o pipefail; \
	$< --vocabulary 16 --length 5 --seed 1951 --size 100 \
	| awk '{ print $$0 "\t" $$0 $$0 }' > $@
100 changes: 100 additions & 0 deletions tests/testdata/copy/dev.tsv
Original file line number Diff line number Diff line change
@@ -0,0 +1,100 @@
eplnjcdd eplnjcddeplnjcdd
p pp
ibejfod ibejfodibejfod
pab pabpab
dlfcgbk dlfcgbkdlfcgbk
olfop olfopolfop
gcfohaobgcf gcfohaobgcfgcfohaobgcf
ejnpc ejnpcejnpc
mo momo
pifg pifgpifg
cjefakb cjefakbcjefakb
o oo
pjcjlek pjcjlekpjcjlek
hehdgc hehdgchehdgc
mmhf mmhfmmhf
nih nihnih
l ll
hgahdmme hgahdmmehgahdmme
llhekbhgg llhekbhggllhekbhgg
fjmcif fjmciffjmcif
kpkji kpkjikpkji
dlef dlefdlef
naljdol naljdolnaljdol
dapf dapfdapf
ae aeae
pikn piknpikn
kdnkma kdnkmakdnkma
jmoe jmoejmoe
hkcd hkcdhkcd
bae baebae
npdchffilp npdchffilpnpdchffilp
feci fecifeci
cfhm cfhmcfhm
eb ebeb
ej ejej
kha khakha
fhhen fhhenfhhen
clobjl clobjlclobjl
bdcnnfk bdcnnfkbdcnnfk
apjnmed apjnmedapjnmed
epopgd epopgdepopgd
eoa eoaeoa
mak makmak
ilg ilgilg
odnfeap odnfeapodnfeap
jebn jebnjebn
mo momo
ijiele ijieleijiele
efolbe efolbeefolbe
hjfmp hjfmphjfmp
g gg
ohog ohogohog
lmggl lmggllmggl
ncbkj ncbkjncbkj
bk bkbk
odkcf odkcfodkcf
ojnoi ojnoiojnoi
eeaf eeafeeaf
iljalco iljalcoiljalco
cbod cbodcbod
fjh fjhfjh
cfkmlfe cfkmlfecfkmlfe
bljo bljobljo
gdejbbjh gdejbbjhgdejbbjh
opofbihg opofbihgopofbihg
koj kojkoj
mn mnmn
ne nene
hkkjk hkkjkhkkjk
bjlifgeo bjlifgeobjlifgeo
blb blbblb
neeb neebneeb
dogb dogbdogb
llenp llenpllenp
acia aciaacia
cceg ccegcceg
ipbfghh ipbfghhipbfghh
icbmm icbmmicbmm
jiakjo jiakjojiakjo
ndaek ndaekndaek
minelhf minelhfminelhf
fmcbh fmcbhfmcbh
icmp icmpicmp
oigkcacd oigkcacdoigkcacd
efn efnefn
jednkp jednkpjednkp
eajcb eajcbeajcb
calemkd calemkdcalemkd
hokdk hokdkhokdk
ahb ahbahb
biikpho biikphobiikpho
lbjdide lbjdidelbjdide
kjlob kjlobkjlob
jhhd jhhdjhhd
aiffmono aiffmonoaiffmono
gfnpe gfnpegfnpe
bjbbkj bjbbkjbjbbkj
jabie jabiejabie
jmlokf jmlokfjmlokf
hmjb hmjbhmjb
100 changes: 100 additions & 0 deletions tests/testdata/copy/test.tsv
Original file line number Diff line number Diff line change
@@ -0,0 +1,100 @@
eplnjcdd eplnjcddeplnjcdd
p pp
ibejfod ibejfodibejfod
pab pabpab
dlfcgbk dlfcgbkdlfcgbk
olfop olfopolfop
gcfohaobgcf gcfohaobgcfgcfohaobgcf
ejnpc ejnpcejnpc
mo momo
pifg pifgpifg
cjefakb cjefakbcjefakb
o oo
pjcjlek pjcjlekpjcjlek
hehdgc hehdgchehdgc
mmhf mmhfmmhf
nih nihnih
l ll
hgahdmme hgahdmmehgahdmme
llhekbhgg llhekbhggllhekbhgg
fjmcif fjmciffjmcif
kpkji kpkjikpkji
dlef dlefdlef
naljdol naljdolnaljdol
dapf dapfdapf
ae aeae
pikn piknpikn
kdnkma kdnkmakdnkma
jmoe jmoejmoe
hkcd hkcdhkcd
bae baebae
npdchffilp npdchffilpnpdchffilp
feci fecifeci
cfhm cfhmcfhm
eb ebeb
ej ejej
kha khakha
fhhen fhhenfhhen
clobjl clobjlclobjl
bdcnnfk bdcnnfkbdcnnfk
apjnmed apjnmedapjnmed
epopgd epopgdepopgd
eoa eoaeoa
mak makmak
ilg ilgilg
odnfeap odnfeapodnfeap
jebn jebnjebn
mo momo
ijiele ijieleijiele
efolbe efolbeefolbe
hjfmp hjfmphjfmp
g gg
ohog ohogohog
lmggl lmggllmggl
ncbkj ncbkjncbkj
bk bkbk
odkcf odkcfodkcf
ojnoi ojnoiojnoi
eeaf eeafeeaf
iljalco iljalcoiljalco
cbod cbodcbod
fjh fjhfjh
cfkmlfe cfkmlfecfkmlfe
bljo bljobljo
gdejbbjh gdejbbjhgdejbbjh
opofbihg opofbihgopofbihg
koj kojkoj
mn mnmn
ne nene
hkkjk hkkjkhkkjk
bjlifgeo bjlifgeobjlifgeo
blb blbblb
neeb neebneeb
dogb dogbdogb
llenp llenpllenp
acia aciaacia
cceg ccegcceg
ipbfghh ipbfghhipbfghh
icbmm icbmmicbmm
jiakjo jiakjojiakjo
ndaek ndaekndaek
minelhf minelhfminelhf
fmcbh fmcbhfmcbh
icmp icmpicmp
oigkcacd oigkcacdoigkcacd
efn efnefn
jednkp jednkpjednkp
eajcb eajcbeajcb
calemkd calemkdcalemkd
hokdk hokdkhokdk
ahb ahbahb
biikpho biikphobiikpho
lbjdide lbjdidelbjdide
kjlob kjlobkjlob
jhhd jhhdjhhd
aiffmono aiffmonoaiffmono
gfnpe gfnpegfnpe
bjbbkj bjbbkjbjbbkj
jabie jabiejabie
jmlokf jmlokfjmlokf
hmjb hmjbhmjb
100 changes: 100 additions & 0 deletions tests/testdata/copy/train.tsv
Original file line number Diff line number Diff line change
@@ -0,0 +1,100 @@
eplnjcdd eplnjcddeplnjcdd
p pp
ibejfod ibejfodibejfod
pab pabpab
dlfcgbk dlfcgbkdlfcgbk
olfop olfopolfop
gcfohaobgcf gcfohaobgcfgcfohaobgcf
ejnpc ejnpcejnpc
mo momo
pifg pifgpifg
cjefakb cjefakbcjefakb
o oo
pjcjlek pjcjlekpjcjlek
hehdgc hehdgchehdgc
mmhf mmhfmmhf
nih nihnih
l ll
hgahdmme hgahdmmehgahdmme
llhekbhgg llhekbhggllhekbhgg
fjmcif fjmciffjmcif
kpkji kpkjikpkji
dlef dlefdlef
naljdol naljdolnaljdol
dapf dapfdapf
ae aeae
pikn piknpikn
kdnkma kdnkmakdnkma
jmoe jmoejmoe
hkcd hkcdhkcd
bae baebae
npdchffilp npdchffilpnpdchffilp
feci fecifeci
cfhm cfhmcfhm
eb ebeb
ej ejej
kha khakha
fhhen fhhenfhhen
clobjl clobjlclobjl
bdcnnfk bdcnnfkbdcnnfk
apjnmed apjnmedapjnmed
epopgd epopgdepopgd
eoa eoaeoa
mak makmak
ilg ilgilg
odnfeap odnfeapodnfeap
jebn jebnjebn
mo momo
ijiele ijieleijiele
efolbe efolbeefolbe
hjfmp hjfmphjfmp
g gg
ohog ohogohog
lmggl lmggllmggl
ncbkj ncbkjncbkj
bk bkbk
odkcf odkcfodkcf
ojnoi ojnoiojnoi
eeaf eeafeeaf
iljalco iljalcoiljalco
cbod cbodcbod
fjh fjhfjh
cfkmlfe cfkmlfecfkmlfe
bljo bljobljo
gdejbbjh gdejbbjhgdejbbjh
opofbihg opofbihgopofbihg
koj kojkoj
mn mnmn
ne nene
hkkjk hkkjkhkkjk
bjlifgeo bjlifgeobjlifgeo
blb blbblb
neeb neebneeb
dogb dogbdogb
llenp llenpllenp
acia aciaacia
cceg ccegcceg
ipbfghh ipbfghhipbfghh
icbmm icbmmicbmm
jiakjo jiakjojiakjo
ndaek ndaekndaek
minelhf minelhfminelhf
fmcbh fmcbhfmcbh
icmp icmpicmp
oigkcacd oigkcacdoigkcacd
efn efnefn
jednkp jednkpjednkp
eajcb eajcbeajcb
calemkd calemkdcalemkd
hokdk hokdkhokdk
ahb ahbahb
biikpho biikphobiikpho
lbjdide lbjdidelbjdide
kjlob kjlobkjlob
jhhd jhhdjhhd
aiffmono aiffmonoaiffmono
gfnpe gfnpegfnpe
bjbbkj bjbbkjbjbbkj
jabie jabiejabie
jmlokf jmlokfjmlokf
hmjb hmjbhmjb
9 changes: 9 additions & 0 deletions tests/testdata/delete/Makefile
Original file line number Diff line number Diff line change
@@ -0,0 +1,9 @@
# bash is required for `set -o pipefail` in the recipe below.
SHELL := /bin/bash

# Generator script invoked by the recipe, and the dataset files it produces.
GENERATE := ../generate.py
SPLITS := train.tsv dev.tsv test.tsv

.PHONY: all
# Remove a half-written split if its recipe fails, so it never looks current.
.DELETE_ON_ERROR:

all: $(SPLITS)

# Each output line is "<string> TAB": the generated string in the first
# column and an empty second column (pasting against /dev/null).
# The generator feeds `paste` through a pipe rather than a process
# substitution, whose exit status bash ignores; with `pipefail` a generator
# failure now fails the recipe instead of leaving an empty file behind.
$(SPLITS): %.tsv: $(GENERATE)
	set -o pipefail; \
	$< --vocabulary 16 --length 5 --seed 1953 --size 100 \
	| paste - /dev/null > $@
Loading