updated elg recipes

This commit is contained in:
Joerg Tiedemann 2022-03-11 21:04:00 +02:00
parent 84a9bf4eab
commit cc3be228a6
4 changed files with 2253 additions and 1568 deletions

File diff suppressed because it is too large Load Diff

View File

@ -256,6 +256,34 @@ ces-eng/latest/wikisource.aa.ces-eng.ces.gz
ces-eng/latest/wikisource.aa.ces-eng.eng.gz
ces-eng/latest/wikisource.ab.ces-eng.ces.gz
ces-eng/latest/wikisource.ab.ces-eng.eng.gz
ces-ukr/latest/wikibooks.aa.ces-ukr.ces.gz
ces-ukr/latest/wikibooks.aa.ces-ukr.ukr.gz
ces-ukr/latest/wikinews.aa.ces-ukr.ces.gz
ces-ukr/latest/wikinews.aa.ces-ukr.ukr.gz
ces-ukr/latest/wikipedia.aa.ces-ukr.ces.gz
ces-ukr/latest/wikipedia.aa.ces-ukr.ukr.gz
ces-ukr/latest/wikipedia.ab.ces-ukr.ces.gz
ces-ukr/latest/wikipedia.ab.ces-ukr.ukr.gz
ces-ukr/latest/wikipedia.ac.ces-ukr.ces.gz
ces-ukr/latest/wikipedia.ac.ces-ukr.ukr.gz
ces-ukr/latest/wikipedia.ad.ces-ukr.ces.gz
ces-ukr/latest/wikipedia.ad.ces-ukr.ukr.gz
ces-ukr/latest/wikipedia.ae.ces-ukr.ces.gz
ces-ukr/latest/wikipedia.ae.ces-ukr.ukr.gz
ces-ukr/latest/wikipedia.af.ces-ukr.ces.gz
ces-ukr/latest/wikipedia.af.ces-ukr.ukr.gz
ces-ukr/latest/wikipedia.ag.ces-ukr.ces.gz
ces-ukr/latest/wikipedia.ag.ces-ukr.ukr.gz
ces-ukr/latest/wikipedia.ah.ces-ukr.ces.gz
ces-ukr/latest/wikipedia.ah.ces-ukr.ukr.gz
ces-ukr/latest/wikipedia.ai.ces-ukr.ces.gz
ces-ukr/latest/wikipedia.ai.ces-ukr.ukr.gz
ces-ukr/latest/wikiquote.aa.ces-ukr.ces.gz
ces-ukr/latest/wikiquote.aa.ces-ukr.ukr.gz
ces-ukr/latest/wikisource.aa.ces-ukr.ces.gz
ces-ukr/latest/wikisource.aa.ces-ukr.ukr.gz
ces-ukr/latest/wikisource.ab.ces-ukr.ces.gz
ces-ukr/latest/wikisource.ab.ces-ukr.ukr.gz
cha-eng/latest/wiki.aa.cha-eng.cha.gz
cha-eng/latest/wiki.aa.cha-eng.eng.gz
che-eng/latest/wiki.aa.che-eng.che.gz
@ -2550,6 +2578,22 @@ ron-eng/latest/wikiquote.aa.ron-eng.eng.gz
ron-eng/latest/wikiquote.aa.ron-eng.ron.gz
ron-eng/latest/wikisource.aa.ron-eng.eng.gz
ron-eng/latest/wikisource.aa.ron-eng.ron.gz
ron-ukr/latest/wikibooks.aa.ron-ukr.ron.gz
ron-ukr/latest/wikibooks.aa.ron-ukr.ukr.gz
ron-ukr/latest/wikinews.aa.ron-ukr.ron.gz
ron-ukr/latest/wikinews.aa.ron-ukr.ukr.gz
ron-ukr/latest/wikipedia.aa.ron-ukr.ron.gz
ron-ukr/latest/wikipedia.aa.ron-ukr.ukr.gz
ron-ukr/latest/wikipedia.ab.ron-ukr.ron.gz
ron-ukr/latest/wikipedia.ab.ron-ukr.ukr.gz
ron-ukr/latest/wikipedia.ac.ron-ukr.ron.gz
ron-ukr/latest/wikipedia.ac.ron-ukr.ukr.gz
ron-ukr/latest/wikipedia.ad.ron-ukr.ron.gz
ron-ukr/latest/wikipedia.ad.ron-ukr.ukr.gz
ron-ukr/latest/wikiquote.aa.ron-ukr.ron.gz
ron-ukr/latest/wikiquote.aa.ron-ukr.ukr.gz
ron-ukr/latest/wikisource.aa.ron-ukr.ron.gz
ron-ukr/latest/wikisource.aa.ron-ukr.ukr.gz
rue-eng/latest/wiki.aa.rue-eng.eng.gz
rue-eng/latest/wiki.aa.rue-eng.rue.gz
run-eng/latest/wiki.aa.run-eng.eng.gz
@ -2722,6 +2766,18 @@ sin-eng/latest/wiki.aa.sin-eng.eng.gz
sin-eng/latest/wiki.aa.sin-eng.sin.gz
sin-eng/latest/wikibooks.aa.sin-eng.eng.gz
sin-eng/latest/wikibooks.aa.sin-eng.sin.gz
slk-ukr/latest/wikibooks.aa.slk-ukr.slk.gz
slk-ukr/latest/wikibooks.aa.slk-ukr.ukr.gz
slk-ukr/latest/wikipedia.aa.slk-ukr.slk.gz
slk-ukr/latest/wikipedia.aa.slk-ukr.ukr.gz
slk-ukr/latest/wikipedia.ab.slk-ukr.slk.gz
slk-ukr/latest/wikipedia.ab.slk-ukr.ukr.gz
slk-ukr/latest/wikipedia.ac.slk-ukr.slk.gz
slk-ukr/latest/wikipedia.ac.slk-ukr.ukr.gz
slk-ukr/latest/wikiquote.aa.slk-ukr.slk.gz
slk-ukr/latest/wikiquote.aa.slk-ukr.ukr.gz
slk-ukr/latest/wikisource.aa.slk-ukr.slk.gz
slk-ukr/latest/wikisource.aa.slk-ukr.ukr.gz
slv-eng/latest/wiki.aa.slv-eng.eng.gz
slv-eng/latest/wiki.aa.slv-eng.slv.gz
slv-eng/latest/wiki.ab.slv-eng.eng.gz
@ -3042,6 +3098,120 @@ udm-eng/latest/wiki.aa.udm-eng.eng.gz
udm-eng/latest/wiki.aa.udm-eng.udm.gz
uig-eng/latest/wiki.aa.uig-eng.eng.gz
uig-eng/latest/wiki.aa.uig-eng.uig.gz
ukr-ces/latest/wikibooks.aa.ukr-ces.ces.gz
ukr-ces/latest/wikibooks.aa.ukr-ces.ukr.gz
ukr-ces/latest/wikinews.aa.ukr-ces.ces.gz
ukr-ces/latest/wikinews.aa.ukr-ces.ukr.gz
ukr-ces/latest/wikipedia.aa.ukr-ces.ces.gz
ukr-ces/latest/wikipedia.aa.ukr-ces.ukr.gz
ukr-ces/latest/wikipedia.ab.ukr-ces.ces.gz
ukr-ces/latest/wikipedia.ab.ukr-ces.ukr.gz
ukr-ces/latest/wikipedia.ac.ukr-ces.ces.gz
ukr-ces/latest/wikipedia.ac.ukr-ces.ukr.gz
ukr-ces/latest/wikipedia.ad.ukr-ces.ces.gz
ukr-ces/latest/wikipedia.ad.ukr-ces.ukr.gz
ukr-ces/latest/wikipedia.ae.ukr-ces.ces.gz
ukr-ces/latest/wikipedia.ae.ukr-ces.ukr.gz
ukr-ces/latest/wikipedia.af.ukr-ces.ces.gz
ukr-ces/latest/wikipedia.af.ukr-ces.ukr.gz
ukr-ces/latest/wikipedia.ag.ukr-ces.ces.gz
ukr-ces/latest/wikipedia.ag.ukr-ces.ukr.gz
ukr-ces/latest/wikipedia.ah.ukr-ces.ces.gz
ukr-ces/latest/wikipedia.ah.ukr-ces.ukr.gz
ukr-ces/latest/wikipedia.ai.ukr-ces.ces.gz
ukr-ces/latest/wikipedia.ai.ukr-ces.ukr.gz
ukr-ces/latest/wikipedia.aj.ukr-ces.ces.gz
ukr-ces/latest/wikipedia.aj.ukr-ces.ukr.gz
ukr-ces/latest/wikipedia.ak.ukr-ces.ces.gz
ukr-ces/latest/wikipedia.ak.ukr-ces.ukr.gz
ukr-ces/latest/wikipedia.al.ukr-ces.ces.gz
ukr-ces/latest/wikipedia.al.ukr-ces.ukr.gz
ukr-ces/latest/wikipedia.am.ukr-ces.ces.gz
ukr-ces/latest/wikipedia.am.ukr-ces.ukr.gz
ukr-ces/latest/wikipedia.an.ukr-ces.ces.gz
ukr-ces/latest/wikipedia.an.ukr-ces.ukr.gz
ukr-ces/latest/wikipedia.ao.ukr-ces.ces.gz
ukr-ces/latest/wikipedia.ao.ukr-ces.ukr.gz
ukr-ces/latest/wikiquote.aa.ukr-ces.ces.gz
ukr-ces/latest/wikiquote.aa.ukr-ces.ukr.gz
ukr-ces/latest/wikisource.aa.ukr-ces.ces.gz
ukr-ces/latest/wikisource.aa.ukr-ces.ukr.gz
ukr-dan/latest/wikibooks.aa.ukr-dan.dan.gz
ukr-dan/latest/wikibooks.aa.ukr-dan.ukr.gz
ukr-dan/latest/wikinews.aa.ukr-dan.dan.gz
ukr-dan/latest/wikinews.aa.ukr-dan.ukr.gz
ukr-dan/latest/wikipedia.aa.ukr-dan.dan.gz
ukr-dan/latest/wikipedia.aa.ukr-dan.ukr.gz
ukr-dan/latest/wikipedia.ab.ukr-dan.dan.gz
ukr-dan/latest/wikipedia.ab.ukr-dan.ukr.gz
ukr-dan/latest/wikipedia.ac.ukr-dan.dan.gz
ukr-dan/latest/wikipedia.ac.ukr-dan.ukr.gz
ukr-dan/latest/wikipedia.ad.ukr-dan.dan.gz
ukr-dan/latest/wikipedia.ad.ukr-dan.ukr.gz
ukr-dan/latest/wikipedia.ae.ukr-dan.dan.gz
ukr-dan/latest/wikipedia.ae.ukr-dan.ukr.gz
ukr-dan/latest/wikipedia.af.ukr-dan.dan.gz
ukr-dan/latest/wikipedia.af.ukr-dan.ukr.gz
ukr-dan/latest/wikipedia.ag.ukr-dan.dan.gz
ukr-dan/latest/wikipedia.ag.ukr-dan.ukr.gz
ukr-dan/latest/wikipedia.ah.ukr-dan.dan.gz
ukr-dan/latest/wikipedia.ah.ukr-dan.ukr.gz
ukr-dan/latest/wikipedia.ai.ukr-dan.dan.gz
ukr-dan/latest/wikipedia.ai.ukr-dan.ukr.gz
ukr-dan/latest/wikipedia.aj.ukr-dan.dan.gz
ukr-dan/latest/wikipedia.aj.ukr-dan.ukr.gz
ukr-dan/latest/wikipedia.ak.ukr-dan.dan.gz
ukr-dan/latest/wikipedia.ak.ukr-dan.ukr.gz
ukr-dan/latest/wikipedia.al.ukr-dan.dan.gz
ukr-dan/latest/wikipedia.al.ukr-dan.ukr.gz
ukr-dan/latest/wikipedia.am.ukr-dan.dan.gz
ukr-dan/latest/wikipedia.am.ukr-dan.ukr.gz
ukr-dan/latest/wikipedia.an.ukr-dan.dan.gz
ukr-dan/latest/wikipedia.an.ukr-dan.ukr.gz
ukr-dan/latest/wikipedia.ao.ukr-dan.dan.gz
ukr-dan/latest/wikipedia.ao.ukr-dan.ukr.gz
ukr-dan/latest/wikiquote.aa.ukr-dan.dan.gz
ukr-dan/latest/wikiquote.aa.ukr-dan.ukr.gz
ukr-dan/latest/wikisource.aa.ukr-dan.dan.gz
ukr-dan/latest/wikisource.aa.ukr-dan.ukr.gz
ukr-deu/latest/wikibooks.aa.ukr-deu.deu.gz
ukr-deu/latest/wikibooks.aa.ukr-deu.ukr.gz
ukr-deu/latest/wikinews.aa.ukr-deu.deu.gz
ukr-deu/latest/wikinews.aa.ukr-deu.ukr.gz
ukr-deu/latest/wikipedia.aa.ukr-deu.deu.gz
ukr-deu/latest/wikipedia.aa.ukr-deu.ukr.gz
ukr-deu/latest/wikipedia.ab.ukr-deu.deu.gz
ukr-deu/latest/wikipedia.ab.ukr-deu.ukr.gz
ukr-deu/latest/wikipedia.ac.ukr-deu.deu.gz
ukr-deu/latest/wikipedia.ac.ukr-deu.ukr.gz
ukr-deu/latest/wikipedia.ad.ukr-deu.deu.gz
ukr-deu/latest/wikipedia.ad.ukr-deu.ukr.gz
ukr-deu/latest/wikipedia.ae.ukr-deu.deu.gz
ukr-deu/latest/wikipedia.ae.ukr-deu.ukr.gz
ukr-deu/latest/wikipedia.af.ukr-deu.deu.gz
ukr-deu/latest/wikipedia.af.ukr-deu.ukr.gz
ukr-deu/latest/wikipedia.ag.ukr-deu.deu.gz
ukr-deu/latest/wikipedia.ag.ukr-deu.ukr.gz
ukr-deu/latest/wikipedia.ah.ukr-deu.deu.gz
ukr-deu/latest/wikipedia.ah.ukr-deu.ukr.gz
ukr-deu/latest/wikipedia.ai.ukr-deu.deu.gz
ukr-deu/latest/wikipedia.ai.ukr-deu.ukr.gz
ukr-deu/latest/wikipedia.aj.ukr-deu.deu.gz
ukr-deu/latest/wikipedia.aj.ukr-deu.ukr.gz
ukr-deu/latest/wikipedia.ak.ukr-deu.deu.gz
ukr-deu/latest/wikipedia.ak.ukr-deu.ukr.gz
ukr-deu/latest/wikipedia.al.ukr-deu.deu.gz
ukr-deu/latest/wikipedia.al.ukr-deu.ukr.gz
ukr-deu/latest/wikipedia.am.ukr-deu.deu.gz
ukr-deu/latest/wikipedia.am.ukr-deu.ukr.gz
ukr-deu/latest/wikipedia.an.ukr-deu.deu.gz
ukr-deu/latest/wikipedia.an.ukr-deu.ukr.gz
ukr-deu/latest/wikipedia.ao.ukr-deu.deu.gz
ukr-deu/latest/wikipedia.ao.ukr-deu.ukr.gz
ukr-deu/latest/wikiquote.aa.ukr-deu.deu.gz
ukr-deu/latest/wikiquote.aa.ukr-deu.ukr.gz
ukr-deu/latest/wikisource.aa.ukr-deu.deu.gz
ukr-deu/latest/wikisource.aa.ukr-deu.ukr.gz
ukr-eng/latest/wiki.aa.ukr-eng.eng.gz
ukr-eng/latest/wiki.aa.ukr-eng.ukr.gz
ukr-eng/latest/wiki.ab.ukr-eng.eng.gz
@ -3082,6 +3252,196 @@ ukr-eng/latest/wikiquote.aa.ukr-eng.eng.gz
ukr-eng/latest/wikiquote.aa.ukr-eng.ukr.gz
ukr-eng/latest/wikisource.aa.ukr-eng.eng.gz
ukr-eng/latest/wikisource.aa.ukr-eng.ukr.gz
ukr-hun/latest/wikibooks.aa.ukr-hun.hun.gz
ukr-hun/latest/wikibooks.aa.ukr-hun.ukr.gz
ukr-hun/latest/wikinews.aa.ukr-hun.hun.gz
ukr-hun/latest/wikinews.aa.ukr-hun.ukr.gz
ukr-hun/latest/wikipedia.aa.ukr-hun.hun.gz
ukr-hun/latest/wikipedia.aa.ukr-hun.ukr.gz
ukr-hun/latest/wikipedia.ab.ukr-hun.hun.gz
ukr-hun/latest/wikipedia.ab.ukr-hun.ukr.gz
ukr-hun/latest/wikipedia.ac.ukr-hun.hun.gz
ukr-hun/latest/wikipedia.ac.ukr-hun.ukr.gz
ukr-hun/latest/wikipedia.ad.ukr-hun.hun.gz
ukr-hun/latest/wikipedia.ad.ukr-hun.ukr.gz
ukr-hun/latest/wikipedia.ae.ukr-hun.hun.gz
ukr-hun/latest/wikipedia.ae.ukr-hun.ukr.gz
ukr-hun/latest/wikipedia.af.ukr-hun.hun.gz
ukr-hun/latest/wikipedia.af.ukr-hun.ukr.gz
ukr-hun/latest/wikipedia.ag.ukr-hun.hun.gz
ukr-hun/latest/wikipedia.ag.ukr-hun.ukr.gz
ukr-hun/latest/wikipedia.ah.ukr-hun.hun.gz
ukr-hun/latest/wikipedia.ah.ukr-hun.ukr.gz
ukr-hun/latest/wikipedia.ai.ukr-hun.hun.gz
ukr-hun/latest/wikipedia.ai.ukr-hun.ukr.gz
ukr-hun/latest/wikipedia.aj.ukr-hun.hun.gz
ukr-hun/latest/wikipedia.aj.ukr-hun.ukr.gz
ukr-hun/latest/wikipedia.ak.ukr-hun.hun.gz
ukr-hun/latest/wikipedia.ak.ukr-hun.ukr.gz
ukr-hun/latest/wikipedia.al.ukr-hun.hun.gz
ukr-hun/latest/wikipedia.al.ukr-hun.ukr.gz
ukr-hun/latest/wikipedia.am.ukr-hun.hun.gz
ukr-hun/latest/wikipedia.am.ukr-hun.ukr.gz
ukr-hun/latest/wikipedia.an.ukr-hun.hun.gz
ukr-hun/latest/wikipedia.an.ukr-hun.ukr.gz
ukr-hun/latest/wikipedia.ao.ukr-hun.hun.gz
ukr-hun/latest/wikipedia.ao.ukr-hun.ukr.gz
ukr-hun/latest/wikiquote.aa.ukr-hun.hun.gz
ukr-hun/latest/wikiquote.aa.ukr-hun.ukr.gz
ukr-hun/latest/wikisource.aa.ukr-hun.hun.gz
ukr-hun/latest/wikisource.aa.ukr-hun.ukr.gz
ukr-pol/latest/wikibooks.aa.ukr-pol.pol.gz
ukr-pol/latest/wikibooks.aa.ukr-pol.ukr.gz
ukr-pol/latest/wikinews.aa.ukr-pol.pol.gz
ukr-pol/latest/wikinews.aa.ukr-pol.ukr.gz
ukr-pol/latest/wikipedia.aa.ukr-pol.pol.gz
ukr-pol/latest/wikipedia.aa.ukr-pol.ukr.gz
ukr-pol/latest/wikipedia.ab.ukr-pol.pol.gz
ukr-pol/latest/wikipedia.ab.ukr-pol.ukr.gz
ukr-pol/latest/wikipedia.ac.ukr-pol.pol.gz
ukr-pol/latest/wikipedia.ac.ukr-pol.ukr.gz
ukr-pol/latest/wikipedia.ad.ukr-pol.pol.gz
ukr-pol/latest/wikipedia.ad.ukr-pol.ukr.gz
ukr-pol/latest/wikipedia.ae.ukr-pol.pol.gz
ukr-pol/latest/wikipedia.ae.ukr-pol.ukr.gz
ukr-pol/latest/wikipedia.af.ukr-pol.pol.gz
ukr-pol/latest/wikipedia.af.ukr-pol.ukr.gz
ukr-pol/latest/wikipedia.ag.ukr-pol.pol.gz
ukr-pol/latest/wikipedia.ag.ukr-pol.ukr.gz
ukr-pol/latest/wikipedia.ah.ukr-pol.pol.gz
ukr-pol/latest/wikipedia.ah.ukr-pol.ukr.gz
ukr-pol/latest/wikipedia.ai.ukr-pol.pol.gz
ukr-pol/latest/wikipedia.ai.ukr-pol.ukr.gz
ukr-pol/latest/wikipedia.aj.ukr-pol.pol.gz
ukr-pol/latest/wikipedia.aj.ukr-pol.ukr.gz
ukr-pol/latest/wikipedia.ak.ukr-pol.pol.gz
ukr-pol/latest/wikipedia.ak.ukr-pol.ukr.gz
ukr-pol/latest/wikipedia.al.ukr-pol.pol.gz
ukr-pol/latest/wikipedia.al.ukr-pol.ukr.gz
ukr-pol/latest/wikipedia.am.ukr-pol.pol.gz
ukr-pol/latest/wikipedia.am.ukr-pol.ukr.gz
ukr-pol/latest/wikipedia.an.ukr-pol.pol.gz
ukr-pol/latest/wikipedia.an.ukr-pol.ukr.gz
ukr-pol/latest/wikipedia.ao.ukr-pol.pol.gz
ukr-pol/latest/wikipedia.ao.ukr-pol.ukr.gz
ukr-pol/latest/wikiquote.aa.ukr-pol.pol.gz
ukr-pol/latest/wikiquote.aa.ukr-pol.ukr.gz
ukr-pol/latest/wikisource.aa.ukr-pol.pol.gz
ukr-pol/latest/wikisource.aa.ukr-pol.ukr.gz
ukr-ron/latest/wikibooks.aa.ukr-ron.ron.gz
ukr-ron/latest/wikibooks.aa.ukr-ron.ukr.gz
ukr-ron/latest/wikinews.aa.ukr-ron.ron.gz
ukr-ron/latest/wikinews.aa.ukr-ron.ukr.gz
ukr-ron/latest/wikipedia.aa.ukr-ron.ron.gz
ukr-ron/latest/wikipedia.aa.ukr-ron.ukr.gz
ukr-ron/latest/wikipedia.ab.ukr-ron.ron.gz
ukr-ron/latest/wikipedia.ab.ukr-ron.ukr.gz
ukr-ron/latest/wikipedia.ac.ukr-ron.ron.gz
ukr-ron/latest/wikipedia.ac.ukr-ron.ukr.gz
ukr-ron/latest/wikipedia.ad.ukr-ron.ron.gz
ukr-ron/latest/wikipedia.ad.ukr-ron.ukr.gz
ukr-ron/latest/wikipedia.ae.ukr-ron.ron.gz
ukr-ron/latest/wikipedia.ae.ukr-ron.ukr.gz
ukr-ron/latest/wikipedia.af.ukr-ron.ron.gz
ukr-ron/latest/wikipedia.af.ukr-ron.ukr.gz
ukr-ron/latest/wikipedia.ag.ukr-ron.ron.gz
ukr-ron/latest/wikipedia.ag.ukr-ron.ukr.gz
ukr-ron/latest/wikipedia.ah.ukr-ron.ron.gz
ukr-ron/latest/wikipedia.ah.ukr-ron.ukr.gz
ukr-ron/latest/wikipedia.ai.ukr-ron.ron.gz
ukr-ron/latest/wikipedia.ai.ukr-ron.ukr.gz
ukr-ron/latest/wikipedia.aj.ukr-ron.ron.gz
ukr-ron/latest/wikipedia.aj.ukr-ron.ukr.gz
ukr-ron/latest/wikipedia.ak.ukr-ron.ron.gz
ukr-ron/latest/wikipedia.ak.ukr-ron.ukr.gz
ukr-ron/latest/wikipedia.al.ukr-ron.ron.gz
ukr-ron/latest/wikipedia.al.ukr-ron.ukr.gz
ukr-ron/latest/wikipedia.am.ukr-ron.ron.gz
ukr-ron/latest/wikipedia.am.ukr-ron.ukr.gz
ukr-ron/latest/wikipedia.an.ukr-ron.ron.gz
ukr-ron/latest/wikipedia.an.ukr-ron.ukr.gz
ukr-ron/latest/wikipedia.ao.ukr-ron.ron.gz
ukr-ron/latest/wikipedia.ao.ukr-ron.ukr.gz
ukr-ron/latest/wikiquote.aa.ukr-ron.ron.gz
ukr-ron/latest/wikiquote.aa.ukr-ron.ukr.gz
ukr-ron/latest/wikisource.aa.ukr-ron.ron.gz
ukr-ron/latest/wikisource.aa.ukr-ron.ukr.gz
ukr-slk/latest/wikibooks.aa.ukr-slk.slk.gz
ukr-slk/latest/wikibooks.aa.ukr-slk.ukr.gz
ukr-slk/latest/wikinews.aa.ukr-slk.slk.gz
ukr-slk/latest/wikinews.aa.ukr-slk.ukr.gz
ukr-slk/latest/wikipedia.aa.ukr-slk.slk.gz
ukr-slk/latest/wikipedia.aa.ukr-slk.ukr.gz
ukr-slk/latest/wikipedia.ab.ukr-slk.slk.gz
ukr-slk/latest/wikipedia.ab.ukr-slk.ukr.gz
ukr-slk/latest/wikipedia.ac.ukr-slk.slk.gz
ukr-slk/latest/wikipedia.ac.ukr-slk.ukr.gz
ukr-slk/latest/wikipedia.ad.ukr-slk.slk.gz
ukr-slk/latest/wikipedia.ad.ukr-slk.ukr.gz
ukr-slk/latest/wikipedia.ae.ukr-slk.slk.gz
ukr-slk/latest/wikipedia.ae.ukr-slk.ukr.gz
ukr-slk/latest/wikipedia.af.ukr-slk.slk.gz
ukr-slk/latest/wikipedia.af.ukr-slk.ukr.gz
ukr-slk/latest/wikipedia.ag.ukr-slk.slk.gz
ukr-slk/latest/wikipedia.ag.ukr-slk.ukr.gz
ukr-slk/latest/wikipedia.ah.ukr-slk.slk.gz
ukr-slk/latest/wikipedia.ah.ukr-slk.ukr.gz
ukr-slk/latest/wikipedia.ai.ukr-slk.slk.gz
ukr-slk/latest/wikipedia.ai.ukr-slk.ukr.gz
ukr-slk/latest/wikipedia.aj.ukr-slk.slk.gz
ukr-slk/latest/wikipedia.aj.ukr-slk.ukr.gz
ukr-slk/latest/wikipedia.ak.ukr-slk.slk.gz
ukr-slk/latest/wikipedia.ak.ukr-slk.ukr.gz
ukr-slk/latest/wikipedia.al.ukr-slk.slk.gz
ukr-slk/latest/wikipedia.al.ukr-slk.ukr.gz
ukr-slk/latest/wikipedia.am.ukr-slk.slk.gz
ukr-slk/latest/wikipedia.am.ukr-slk.ukr.gz
ukr-slk/latest/wikipedia.an.ukr-slk.slk.gz
ukr-slk/latest/wikipedia.an.ukr-slk.ukr.gz
ukr-slk/latest/wikipedia.ao.ukr-slk.slk.gz
ukr-slk/latest/wikipedia.ao.ukr-slk.ukr.gz
ukr-slk/latest/wikiquote.aa.ukr-slk.slk.gz
ukr-slk/latest/wikiquote.aa.ukr-slk.ukr.gz
ukr-slk/latest/wikisource.aa.ukr-slk.slk.gz
ukr-slk/latest/wikisource.aa.ukr-slk.ukr.gz
ukr-swe/latest/wikibooks.aa.ukr-swe.swe.gz
ukr-swe/latest/wikibooks.aa.ukr-swe.ukr.gz
ukr-swe/latest/wikinews.aa.ukr-swe.swe.gz
ukr-swe/latest/wikinews.aa.ukr-swe.ukr.gz
ukr-swe/latest/wikipedia.aa.ukr-swe.swe.gz
ukr-swe/latest/wikipedia.aa.ukr-swe.ukr.gz
ukr-swe/latest/wikipedia.ab.ukr-swe.swe.gz
ukr-swe/latest/wikipedia.ab.ukr-swe.ukr.gz
ukr-swe/latest/wikipedia.ac.ukr-swe.swe.gz
ukr-swe/latest/wikipedia.ac.ukr-swe.ukr.gz
ukr-swe/latest/wikipedia.ad.ukr-swe.swe.gz
ukr-swe/latest/wikipedia.ad.ukr-swe.ukr.gz
ukr-swe/latest/wikipedia.ae.ukr-swe.swe.gz
ukr-swe/latest/wikipedia.ae.ukr-swe.ukr.gz
ukr-swe/latest/wikipedia.af.ukr-swe.swe.gz
ukr-swe/latest/wikipedia.af.ukr-swe.ukr.gz
ukr-swe/latest/wikipedia.ag.ukr-swe.swe.gz
ukr-swe/latest/wikipedia.ag.ukr-swe.ukr.gz
ukr-swe/latest/wikipedia.ah.ukr-swe.swe.gz
ukr-swe/latest/wikipedia.ah.ukr-swe.ukr.gz
ukr-swe/latest/wikipedia.ai.ukr-swe.swe.gz
ukr-swe/latest/wikipedia.ai.ukr-swe.ukr.gz
ukr-swe/latest/wikipedia.aj.ukr-swe.swe.gz
ukr-swe/latest/wikipedia.aj.ukr-swe.ukr.gz
ukr-swe/latest/wikipedia.ak.ukr-swe.swe.gz
ukr-swe/latest/wikipedia.ak.ukr-swe.ukr.gz
ukr-swe/latest/wikipedia.al.ukr-swe.swe.gz
ukr-swe/latest/wikipedia.al.ukr-swe.ukr.gz
ukr-swe/latest/wikipedia.am.ukr-swe.swe.gz
ukr-swe/latest/wikipedia.am.ukr-swe.ukr.gz
ukr-swe/latest/wikipedia.an.ukr-swe.swe.gz
ukr-swe/latest/wikipedia.an.ukr-swe.ukr.gz
ukr-swe/latest/wikipedia.ao.ukr-swe.swe.gz
ukr-swe/latest/wikipedia.ao.ukr-swe.ukr.gz
ukr-swe/latest/wikiquote.aa.ukr-swe.swe.gz
ukr-swe/latest/wikiquote.aa.ukr-swe.ukr.gz
ukr-swe/latest/wikisource.aa.ukr-swe.swe.gz
ukr-swe/latest/wikisource.aa.ukr-swe.ukr.gz
urd-eng/latest/wiki.aa.urd-eng.eng.gz
urd-eng/latest/wiki.aa.urd-eng.urd.gz
urd-eng/latest/wikibooks.aa.urd-eng.eng.gz

View File

@ -65,6 +65,16 @@ engukr-quantize-student:
make SRCLANGS=eng TRGLANGS=ukr test-quantized-tiny11-student
## special thing: student models with pivot-based data (does that work?)
## Train one tiny11 student model per target language with Ukrainian as the
## source language, using STUDENT_DATA=pft-nopar. Each language is handled by
## its own sub-make; the loop does not stop when one of them fails.
elg-ukr-students:
	for trg in bul dan deu fin hun nob ron swe slk tur; do \
	  $(MAKE) STUDENT_DATA=pft-nopar SRCLANGS=ukr TRGLANGS=$$trg train-tiny11-student; \
	done
## Run the train-tiny11-student goal for ukr->deu and ukr->hun with
## STUDENT_DATA=ftmono-pft-nopar (one sub-make per target language).
elg-ukr-students-test:
	$(MAKE) SRCLANGS=ukr TRGLANGS=deu STUDENT_DATA=ftmono-pft-nopar train-tiny11-student
	$(MAKE) SRCLANGS=ukr TRGLANGS=hun STUDENT_DATA=ftmono-pft-nopar train-tiny11-student
elg-eval:
${MAKE} elg-eval-tfbig
@ -97,12 +107,23 @@ elg-eval-multi:
done
## Evaluate the transformer-big models of every listed language-group pair.
## For each pair <p> three goals are run in separate sub-makes:
##   tatoeba-<p>-eval-bt, tatoeba-<p>-multieval-bt, tatoeba-<p>-eval-testsets-bt
##
## The recipe must contain exactly one loop header: a second `for p in ...; do`
## line in front of it would open a nested loop that is never closed by a
## matching `done`, and the shell would reject the whole command.
elg-eval-zle:
	for p in zle2zle zlw2zle zle2fin zle2zlw zls2zlw zlw2zls; do \
	  ${MAKE} MODELTYPE=transformer-big tatoeba-$${p}-eval-bt; \
	  ${MAKE} MODELTYPE=transformer-big tatoeba-$${p}-multieval-bt; \
	  ${MAKE} MODELTYPE=transformer-big tatoeba-$${p}-eval-testsets-bt; \
	done
## Evaluate the transformer-big models between zle and each of
## deu, fra, spa, por and ita, in both directions.
## Per language the order is: zle2<l> first, then <l>2zle; within each
## direction the goals eval, multieval and eval-testsets run in that order.
elg-eval-big2zle:
	for l in deu fra spa por ita; do \
	  for pair in zle2$$l $${l}2zle; do \
	    for goal in eval multieval eval-testsets; do \
	      $(MAKE) MODELTYPE=transformer-big tatoeba-$$pair-$$goal; \
	    done; \
	  done; \
	done
elg-pivot-eval:
for l in dan swe fin deu ron tur; do \
if [ -e work/$$l-ukr ]; then \
@ -143,6 +164,19 @@ elg-dist-pivot-tmp:
${MAKE} SRCLANGS="ces slk" TRGLANGS=ukr dist-pbt-tatoeba
${MAKE} TRGLANGS="ces slk" SRCLANGS=ukr dist-pft-tatoeba
## Evaluate the transformer-big pivot models between gmq and zle:
## the -pbt goals for gmq2zle and the -pft goals for zle2gmq,
## each as plain eval and as multieval.
elg-eval-pivot-tmp:
	$(MAKE) MODELTYPE=transformer-big tatoeba-gmq2zle-eval-pbt
	$(MAKE) MODELTYPE=transformer-big tatoeba-gmq2zle-multieval-pbt
	$(MAKE) MODELTYPE=transformer-big tatoeba-zle2gmq-eval-pft
	$(MAKE) MODELTYPE=transformer-big tatoeba-zle2gmq-multieval-pft
## currently disabled: the corresponding evaluation for ces/slk <-> ukr
# ${MAKE} SRCLANGS="ces slk" TRGLANGS=ukr eval-pbt-tatoeba
# ${MAKE} SRCLANGS="ces slk" TRGLANGS=ukr tatoeba-multilingual-eval-pbt
# ${MAKE} TRGLANGS="ces slk" SRCLANGS=ukr eval-pft-tatoeba
# ${MAKE} TRGLANGS="ces slk" SRCLANGS=ukr tatoeba-multilingual-eval-pft
elg-gmq2zle-pivot:
${MAKE} MODELTYPE=transformer-big CPUJOB_HPC_MEM=32g tatoeba-gmq2zle-trainjob-pbt
@ -174,6 +208,8 @@ elg-ukr2fin:
${MAKE} tatoeba-ukr2fin-trainjob-pbt-pft
## Run the train-job goals for both directions of the deu/ukr pair:
## deu2ukr with the -pbt variant, ukr2deu with the -pft variant.
elg-deu2ukr:
	$(MAKE) tatoeba-deu2ukr-trainjob-pbt
	$(MAKE) tatoeba-ukr2deu-trainjob-pft

View File

@ -182,7 +182,7 @@ ALLWIKIS_TRG = ${patsubst %,${OUTPUT_DIR}/%.${PART}_${MODELNAME}.${LANGPAIR}.${T
## keep translated text on disk even if the translation process crashes
## (applies to the single-part, all-parts and all-wikis target files)
.PRECIOUS: $(WIKI_TRG) $(ALLWIKIPARTS_TRG) $(ALLWIKIS_TRG)
ifdef LOCAL_SCRATCH
@ -286,12 +286,19 @@ released-data.txt: .
swift list ${BT_CONTAINER} | grep -v README.md | grep -v '.txt' > $@
swift upload ${BT_CONTAINER} $@
TODAY := $(shell date +%F)
## Refresh the size table of the released data stored in ${BT_CONTAINER}.
##
## Steps:
##  1. download the current table and keep it as a dated copy ($@.${TODAY})
##  2. drop the last line of that copy (the line appended in step 5 of the
##     previous run) and keep only lines containing a lowercase letter
##  3. collect fresh output of the check-latest-all goal
##  4. merge old and new lines, keep those starting with a digit 1-9 and
##     sort them by the second column
##  5. append the sum of the first column as the final line
##  6. upload the new table and the dated copy, then remove all scratch files
##
## Notes:
##  - the table is not pre-computed before the download; the download would
##    overwrite it anyway, so doing so only wastes a check-latest-all run
##  - the grep pattern is quoted so the shell cannot expand [a-z] against a
##    one-letter file name in the working directory
##  - $@.tmp is needed because awk must not read from and append to $@ at once
released-data-size.txt: .
	swift download ${BT_CONTAINER} $@
	mv $@ $@.${TODAY}
	head -n-1 $@.${TODAY} | grep '[a-z]' > $@.old
	${MAKE} check-latest-all > $@.new
	cat $@.old $@.new | grep '^[1-9]' | sort -k2,2 > $@
	awk '{ sum += $$1 } END { print sum }' $@ > $@.tmp
	cat $@.tmp >> $@
	swift upload ${BT_CONTAINER} $@
	swift upload ${BT_CONTAINER} $@.${TODAY}
	rm -f $@.tmp $@.${TODAY} $@.new $@.old
# download released data
@ -333,20 +340,37 @@ prepare-allwikis: ${LANGPAIR}/${MODELNAME}/decoder.yml ${ALLWIKIS_TXT}
## Build ${WIKI_LATEST_README} and ${WIKI_LATEST_TRG}; afterwards, if
## ${WIKI_LATEST_SRC} is not empty, build it as well in a separate sub-make.
.PHONY: translate
translate: $(WIKI_LATEST_README) $(WIKI_LATEST_TRG)
ifneq ($(WIKI_LATEST_SRC),)
	$(MAKE) $(WIKI_LATEST_SRC)
endif
## translate every part: build all files in ${ALLWIKIPARTS_LATEST_TRG} and,
## if ${ALLWIKIPARTS_LATEST_SRC} is not empty, build those files afterwards
## in a separate sub-make
.PHONY: translate-all-parts
translate-all-parts: $(ALLWIKIPARTS_LATEST_TRG)
ifneq ($(ALLWIKIPARTS_LATEST_SRC),)
	$(MAKE) $(ALLWIKIPARTS_LATEST_SRC)
endif
## translate all wikis and all parts:
## run the translate-all-parts goal once per entry of ${WIKISOURCES},
## passing the entry to the sub-make as WIKISOURCE.
## The loop body calls only `translate-all-parts` (with hyphen, as declared
## in this file) and always sets WIKISOURCE; a call without it would not
## select the wiki of the current iteration.
.PHONY: translate-all
translate-all:
	for s in ${WIKISOURCES}; do \
	  ${MAKE} WIKISOURCE=$$s translate-all-parts; \
	done
## create all source language files:
## recipe-less goal that only requires every file in ${ALLWIKIPARTS_LATEST_SRC}
.PHONY: latest-all-source-parts
latest-all-source-parts: $(ALLWIKIPARTS_LATEST_SRC)
## run latest-all-source-parts once per entry of ${WIKISOURCES},
## handing the entry to the sub-make as WIKISOURCE
.PHONY: latest-all-sources
latest-all-sources:
	for wiki in $(WIKISOURCES); do \
	  $(MAKE) WIKISOURCE=$$wiki latest-all-source-parts; \
	done
## create jobs for translating all parts
## (only start the job if the file does not exist yet)
.PHONY: translate-all-parts-jobs
@ -478,7 +502,8 @@ ${WIKI_DIR}/${SRC}/.done:
${OUTPUT_DIR}/%.${PART}_${MODELNAME}.${LANGPAIR}.${SRC}.spm.gz: ${WIKI_DIR}/${SRC}/%.${PART}.gz
# ${OUTPUT_DIR}/%.${PART}_${MODELNAME}.${LANGPAIR}.${SRC}.spm.gz: ${WIKI_DIR}/${SRC}/%.${PART}.gz
${OUTPUT_DIR}/%_${MODELNAME}.${LANGPAIR}.${SRC}.spm.gz: ${WIKI_DIR}/${SRC}/%.gz
ifneq (${MODELZIP},)
mkdir -p ${dir $@}
${MAKE} ${LANGPAIR}/${MODELNAME}/decoder.yml
@ -494,7 +519,8 @@ endif
## merge SentencePiece segments in the source text
## (Why? because we filter out some data from the original wiki text, see above)
${WIKI_SRC}: ${WIKI_PRE}
# ${WIKI_SRC}: ${WIKI_PRE}
${OUTPUT_DIR}/${WIKISOURCE}.%.${LANGPAIR}.${SRC}.gz: ${OUTPUT_DIR}/${WIKISOURCE}.%.${LANGPAIR}.${SRC}.spm.gz
ifneq (${MODELZIP},)
mkdir -p ${dir $@}
${GZCAT} $< |\
@ -511,11 +537,13 @@ endif
## --> this allows multiple translation iterations
## without duplicating the data we want to use in MT training
## Source side: this recipe-less header only declares ${WIKI_SRC} as a
## prerequisite of ${WIKI_LATEST_SRC}.
## NOTE(review): the commented-out line below is an exact copy of it; one of
## the two looks like a leftover — confirm which form is intended.
${WIKI_LATEST_SRC}: ${WIKI_SRC}
# ${WIKI_LATEST_SRC}: ${WIKI_SRC}
## Pattern rule for the source side: the file in latest/ has the same name as
## its prerequisite minus the `_${MODELNAME}` part; the recipe creates the
## target directory and copies the prerequisite to the target unchanged.
${OUTPUT_DIR}/latest/${WIKISOURCE}.%.${LANGPAIR}.${SRC}.gz: ${OUTPUT_DIR}/${WIKISOURCE}.%_${MODELNAME}.${LANGPAIR}.${SRC}.gz
mkdir -p ${dir $@}
cp $< $@
## Target side: same structure as above, with ${TRG} in place of ${SRC}.
## NOTE(review): again an active recipe-less header followed by its
## commented-out copy — confirm which one should stay.
${WIKI_LATEST_TRG}: ${WIKI_TRG}
# ${WIKI_LATEST_TRG}: ${WIKI_TRG}
## Pattern rule for the target side: create the target directory, then copy
## the model-specific translation to the model-independent name in latest/.
${OUTPUT_DIR}/latest/${WIKISOURCE}.%.${LANGPAIR}.${TRG}.gz: ${OUTPUT_DIR}/${WIKISOURCE}.%_${MODELNAME}.${LANGPAIR}.${TRG}.gz
mkdir -p ${dir $@}
cp $< $@
@ -534,7 +562,6 @@ ifneq (${MODELZIP},)
-i ${PWD}/$< \
-c decoder.yml \
-d ${MARIAN_GPUS} \
--quiet-translation \
${MARIAN_DECODER_FLAGS} |\
sed 's/ //g;s/▁/ /g' | sed 's/^ *//;s/ *$$//' |\
gzip -c > ${PWD}/$@