FintoAI-data-YKL / dvc.lock
juhoinkinen's picture
Upload folder using huggingface_hub
0179b9a verified
raw
history blame
18.2 kB
schema: '2.0'
stages:
loadvoc-fi:
cmd: annif loadvoc ykl-omikuji-parabel-fi corpora/ykl-classes.tsv
deps:
- path: corpora/ykl-classes.tsv
md5: b2f29070ccedefda72994b8db324e371
size: 187637
- path: venv-installed
md5: 2e6baa8289dac9e06cb525999eb39a70
size: 42
outs:
- path: data/vocabs/ykl-fi
md5: 680732b8de9b5108536ccea40462734e.dir
size: 764449
nfiles: 3
train-omikuji-parabel-fi:
cmd: annif train ykl-omikuji-parabel-fi -j 8 corpora/kirjaesittelyt2021/kvesit-ykl-fin-train.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-fin-train.tsv
md5: ffa2c09b76a8a5370dbe71540da8c0ff
size: 38164190
- path: data/vocabs/ykl
md5: 3b9896e0ea6b1a4fa9820f015831fd93.dir
size: 6503819
nfiles: 3
- path: venv-installed
md5: 2e6baa8289dac9e06cb525999eb39a70
size: 42
params:
projects.toml:
ykl-omikuji-parabel-fi:
name: YKL Omikuji Parabel Finnish
language: fi
backend: omikuji
analyzer: voikko(fi)
vocab: ykl
ngram: 1
min_df: 1
outs:
- path: data/projects/ykl-omikuji-parabel-fi
md5: e506a5b142c024d089a449b9ab99da7c.dir
size: 119198246
nfiles: 6
eval-omikuji-parabel-fi:
cmd: annif eval ykl-omikuji-parabel-fi -j 8 -m Precision@1 -m NDCG --metrics-file
reports/test-omikuji-parabel-fi.json corpora/kirjaesittelyt2021/kvesit-ykl-fin-test.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-fin-test.tsv
md5: e4497d02e1c12d30de314f25ac5c5a8e
size: 3289456
- path: data/projects/ykl-omikuji-parabel-fi
md5: e506a5b142c024d089a449b9ab99da7c.dir
size: 119198246
nfiles: 6
- path: venv-installed
md5: 2e6baa8289dac9e06cb525999eb39a70
size: 42
outs:
- path: reports/test-omikuji-parabel-fi.json
md5: e0079ca11936a9627c9ee5b4a23e4c48
size: 100
install:
cmd: python3 -m venv venv && . venv/bin/activate && pip install -U pip wheel setuptools
&& pip install -r requirements.txt && cp requirements.txt venv-installed
deps:
- path: requirements.txt
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
outs:
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
train-omikuji-bonsai-fi:
cmd: annif train ykl-omikuji-bonsai-fi -j 8 corpora/kirjaesittelyt2021/kvesit-ykl-fin-train.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-fin-train.tsv
md5: ffa2c09b76a8a5370dbe71540da8c0ff
size: 38164190
- path: data/vocabs/ykl
md5: 3b9896e0ea6b1a4fa9820f015831fd93.dir
size: 6503819
nfiles: 3
- path: venv-installed
md5: 2e6baa8289dac9e06cb525999eb39a70
size: 42
params:
projects.toml:
ykl-omikuji-bonsai-fi:
name: YKL Omikuji Bonsai Finnish
language: fi
backend: omikuji
cluster_balanced: 'False'
cluster_k: 100
max_depth: 3
analyzer: voikko(fi)
vocab: ykl
ngram: 1
min_df: 1
outs:
- path: data/projects/ykl-omikuji-bonsai-fi
md5: 1166661a5b68a9c155a57d40592d11eb.dir
size: 114643724
nfiles: 6
eval-omikuji-bonsai-fi:
cmd: annif eval ykl-omikuji-bonsai-fi -j 8 -m Precision@1 -m NDCG --metrics-file
reports/test-omikuji-bonsai-fi.json corpora/kirjaesittelyt2021/kvesit-ykl-fin-test.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-fin-test.tsv
md5: e4497d02e1c12d30de314f25ac5c5a8e
size: 3289456
- path: data/projects/ykl-omikuji-bonsai-fi
md5: 1166661a5b68a9c155a57d40592d11eb.dir
size: 114643724
nfiles: 6
- path: venv-installed
md5: 2e6baa8289dac9e06cb525999eb39a70
size: 42
outs:
- path: reports/test-omikuji-bonsai-fi.json
md5: da9fafaa27f186fff29cb24b505c2fa2
size: 100
load-vocab:
cmd: annif load-vocab ykl corpora/ykl-skos.ttl
deps:
- path: corpora/ykl-skos.ttl
md5: fea11c863134c9e8379ea52e0f31e28a
size: 3901929
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
outs:
- path: data/vocabs/ykl
hash: md5
md5: 083422d4d504723b2eb4fc4ee8805a99.dir
size: 6503179
nfiles: 3
train-omikuji-bonsai@0:
cmd: annif train ykl-omikuji-bonsai-fi -j 8 corpora/kirjaesittelyt2021/kvesit-ykl-fin-train.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-fin-train.tsv
md5: cc52c6a5c21d799aad3fb73a889cd90e
size: 36684502
- path: data/vocabs/ykl
hash: md5
md5: 083422d4d504723b2eb4fc4ee8805a99.dir
size: 6503179
nfiles: 3
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
params:
projects.toml:
ykl-omikuji-bonsai-fi:
name: YKL Omikuji Bonsai Finnish
language: fi
backend: omikuji
cluster_balanced: 'False'
cluster_k: 100
max_depth: 3
analyzer: voikko(fi)
vocab: ykl
ngram: 1
min_df: 1
access: hidden
outs:
- path: data/projects/ykl-omikuji-bonsai-fi
hash: md5
md5: 9bdaf3071b9fe0d13f72e1b2d6873bfb.dir
size: 110266624
nfiles: 6
eval-omikuji-bonsai@0:
cmd: annif eval ykl-omikuji-bonsai-fi -j 8 -m Precision@1 -m NDCG --metrics-file
reports/test-omikuji-bonsai-fi.json --results-file reports/test-omikuji-bonsai-fi.csv
corpora/kirjaesittelyt2021/kvesit-ykl-fin-test.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-fin-test.tsv
md5: 9f8d094ae71ec68c5d40dde46d991e1f
size: 4534782
- path: data/projects/ykl-omikuji-bonsai-fi
hash: md5
md5: 9bdaf3071b9fe0d13f72e1b2d6873bfb.dir
size: 110266624
nfiles: 6
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
outs:
- path: reports/test-omikuji-bonsai-fi.csv
hash: md5
md5: 3c536124365595cea86fa741f9c355cb
size: 237892
- path: reports/test-omikuji-bonsai-fi.json
hash: md5
md5: 24f9c18652995a673cb765edf417b2c8
size: 100
train-omikuji-bonsai@1:
cmd: annif train ykl-omikuji-bonsai-sv -j 8 corpora/kirjaesittelyt2021/kvesit-ykl-swe-train.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-swe-train.tsv
md5: fa74f039e20594e212d2429eb3e74c13
size: 2367569
- path: data/vocabs/ykl
hash: md5
md5: 083422d4d504723b2eb4fc4ee8805a99.dir
size: 6503179
nfiles: 3
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
params:
projects.toml:
ykl-omikuji-bonsai-sv:
name: YKL Omikuji Bonsai Swedish
language: sv
backend: omikuji
cluster_balanced: 'False'
cluster_k: 100
max_depth: 3
analyzer: snowball(swedish)
vocab: ykl
ngram: 1
min_df: 1
access: hidden
outs:
- path: data/projects/ykl-omikuji-bonsai-sv
hash: md5
md5: e589e2a60b5f7cdcc5e67c7443b4c87a.dir
size: 8507130
nfiles: 6
train-omikuji-bonsai@2:
cmd: annif train ykl-omikuji-bonsai-en -j 8 corpora/kirjaesittelyt2021/kvesit-ykl-eng-train.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-eng-train.tsv
md5: 87548d6f8f9a8185dc870e8112668c87
size: 1730632
- path: data/vocabs/ykl
hash: md5
md5: 083422d4d504723b2eb4fc4ee8805a99.dir
size: 6503179
nfiles: 3
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
params:
projects.toml:
ykl-omikuji-bonsai-en:
name: YKL Omikuji Bonsai English
language: en
backend: omikuji
cluster_balanced: 'False'
cluster_k: 100
max_depth: 3
analyzer: snowball(english)
vocab: ykl
ngram: 1
min_df: 1
access: hidden
outs:
- path: data/projects/ykl-omikuji-bonsai-en
hash: md5
md5: 0bce7445a6e1df060f800ec5516959c1.dir
size: 5332560
nfiles: 6
eval-omikuji-bonsai@2:
cmd: annif eval ykl-omikuji-bonsai-en -j 8 -m Precision@1 -m NDCG --metrics-file
reports/test-omikuji-bonsai-en.json --results-file reports/test-omikuji-bonsai-en.csv
corpora/kirjaesittelyt2021/kvesit-ykl-eng-test.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-eng-test.tsv
md5: bc7f924d84a20e9ab91e2600fd2415ec
size: 210866
- path: data/projects/ykl-omikuji-bonsai-en
hash: md5
md5: 0bce7445a6e1df060f800ec5516959c1.dir
size: 5332560
nfiles: 6
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
outs:
- path: reports/test-omikuji-bonsai-en.csv
hash: md5
md5: e4734c53c0225ad899a06926e8b7e0d1
size: 212494
- path: reports/test-omikuji-bonsai-en.json
hash: md5
md5: 6f0029dd304ac0fc94b7817aa9ea3462
size: 100
train-omikuji-parabel@0:
cmd: annif train ykl-omikuji-parabel-fi -j 8 corpora/kirjaesittelyt2021/kvesit-ykl-fin-train.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-fin-train.tsv
md5: cc52c6a5c21d799aad3fb73a889cd90e
size: 36684502
- path: data/vocabs/ykl
hash: md5
md5: 083422d4d504723b2eb4fc4ee8805a99.dir
size: 6503179
nfiles: 3
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
params:
projects.toml:
ykl-omikuji-parabel-fi:
name: YKL Omikuji Parabel Finnish
language: fi
backend: omikuji
analyzer: voikko(fi)
vocab: ykl
ngram: 1
min_df: 1
access: hidden
outs:
- path: data/projects/ykl-omikuji-parabel-fi
hash: md5
md5: 44ab11d0b3e729a0dcd3b88fdadb7567.dir
size: 114032199
nfiles: 6
eval-omikuji-parabel@0:
cmd: annif eval ykl-omikuji-parabel-fi -j 8 -m Precision@1 -m NDCG --metrics-file
reports/test-omikuji-parabel-fi.json --results-file reports/test-omikuji-parabel-fi.csv
corpora/kirjaesittelyt2021/kvesit-ykl-fin-test.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-fin-test.tsv
md5: 9f8d094ae71ec68c5d40dde46d991e1f
size: 4534782
- path: data/projects/ykl-omikuji-parabel-fi
hash: md5
md5: 44ab11d0b3e729a0dcd3b88fdadb7567.dir
size: 114032199
nfiles: 6
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
outs:
- path: reports/test-omikuji-parabel-fi.csv
hash: md5
md5: 6ef001dff735a3b3a64082c02721736c
size: 236720
- path: reports/test-omikuji-parabel-fi.json
hash: md5
md5: 1a7877d85e63ee67dc0c77f8b5c25ba2
size: 97
train-omikuji-parabel@1:
cmd: annif train ykl-omikuji-parabel-sv -j 8 corpora/kirjaesittelyt2021/kvesit-ykl-swe-train.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-swe-train.tsv
md5: fa74f039e20594e212d2429eb3e74c13
size: 2367569
- path: data/vocabs/ykl
hash: md5
md5: 083422d4d504723b2eb4fc4ee8805a99.dir
size: 6503179
nfiles: 3
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
params:
projects.toml:
ykl-omikuji-parabel-sv:
name: YKL Omikuji Parabel Swedish
language: sv
backend: omikuji
analyzer: snowball(swedish)
vocab: ykl
ngram: 1
min_df: 1
access: hidden
outs:
- path: data/projects/ykl-omikuji-parabel-sv
hash: md5
md5: ce70c5681d39ac52e3b2a9fc2efa7f4a.dir
size: 8635331
nfiles: 6
eval-omikuji-parabel@1:
cmd: annif eval ykl-omikuji-parabel-sv -j 8 -m Precision@1 -m NDCG --metrics-file
reports/test-omikuji-parabel-sv.json --results-file reports/test-omikuji-parabel-sv.csv
corpora/kirjaesittelyt2021/kvesit-ykl-swe-test.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-swe-test.tsv
md5: a9177ace2f0d1dffa6a424fccdf04b37
size: 287821
- path: data/projects/ykl-omikuji-parabel-sv
hash: md5
md5: ce70c5681d39ac52e3b2a9fc2efa7f4a.dir
size: 8635331
nfiles: 6
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
outs:
- path: reports/test-omikuji-parabel-sv.csv
hash: md5
md5: a9b65c5400c421b4ce9f1f7e44dffccd
size: 214164
- path: reports/test-omikuji-parabel-sv.json
hash: md5
md5: 7f68b59b4db8a3a6116e8ec105913678
size: 87
train-omikuji-parabel@2:
cmd: annif train ykl-omikuji-parabel-en -j 8 corpora/kirjaesittelyt2021/kvesit-ykl-eng-train.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-eng-train.tsv
md5: 87548d6f8f9a8185dc870e8112668c87
size: 1730632
- path: data/vocabs/ykl
hash: md5
md5: 083422d4d504723b2eb4fc4ee8805a99.dir
size: 6503179
nfiles: 3
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
params:
projects.toml:
ykl-omikuji-parabel-en:
name: YKL Omikuji Parabel English
language: en
backend: omikuji
analyzer: snowball(english)
vocab: ykl
ngram: 1
min_df: 1
access: hidden
outs:
- path: data/projects/ykl-omikuji-parabel-en
hash: md5
md5: f1d1a08423ae130c839f3db15bc9ddf3.dir
size: 5326770
nfiles: 6
eval-omikuji-parabel@2:
cmd: annif eval ykl-omikuji-parabel-en -j 8 -m Precision@1 -m NDCG --metrics-file
reports/test-omikuji-parabel-en.json --results-file reports/test-omikuji-parabel-en.csv
corpora/kirjaesittelyt2021/kvesit-ykl-eng-test.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-eng-test.tsv
md5: bc7f924d84a20e9ab91e2600fd2415ec
size: 210866
- path: data/projects/ykl-omikuji-parabel-en
hash: md5
md5: f1d1a08423ae130c839f3db15bc9ddf3.dir
size: 5326770
nfiles: 6
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
outs:
- path: reports/test-omikuji-parabel-en.csv
hash: md5
md5: c856d122742783f93908ed93bf2357fc
size: 212459
- path: reports/test-omikuji-parabel-en.json
hash: md5
md5: 1a00cc0b691c5a04e71f5f29896af3a2
size: 100
eval-omikuji-bonsai@1:
cmd: annif eval ykl-omikuji-bonsai-sv -j 8 -m Precision@1 -m NDCG --metrics-file
reports/test-omikuji-bonsai-sv.json --results-file reports/test-omikuji-bonsai-sv.csv
corpora/kirjaesittelyt2021/kvesit-ykl-swe-test.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-swe-test.tsv
md5: a9177ace2f0d1dffa6a424fccdf04b37
size: 287821
- path: data/projects/ykl-omikuji-bonsai-sv
hash: md5
md5: e589e2a60b5f7cdcc5e67c7443b4c87a.dir
size: 8507130
nfiles: 6
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
outs:
- path: reports/test-omikuji-bonsai-sv.csv
hash: md5
md5: 9a6cd19c12e6d7da7f0021735d81c62a
size: 214103
- path: reports/test-omikuji-bonsai-sv.json
hash: md5
md5: 95ea663acf56c7fbd27d43f755758610
size: 87
eval-ensemble@0:
cmd: annif eval ykl-fi -j 8 -m Precision@1 -m NDCG --metrics-file reports/test-fi.json
--results-file reports/test-fi.csv corpora/kirjaesittelyt2021/kvesit-ykl-fin-test.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-fin-test.tsv
hash: md5
md5: 9f8d094ae71ec68c5d40dde46d991e1f
size: 4534782
- path: data/projects/ykl-fi
hash: md5
md5: d751713988987e9331980363e24189ce.dir
size: 0
nfiles: 0
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
outs:
- path: reports/test-fi.csv
hash: md5
md5: 38c9f688aaf641cc166db2dc72da3ef1
size: 237209
- path: reports/test-fi.json
hash: md5
md5: 47cfa99502a3ab3f5a1852b8708cccf9
size: 100
eval-ensemble@1:
cmd: annif eval ykl-sv -j 8 -m Precision@1 -m NDCG --metrics-file reports/test-sv.json
--results-file reports/test-sv.csv corpora/kirjaesittelyt2021/kvesit-ykl-swe-test.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-swe-test.tsv
hash: md5
md5: a9177ace2f0d1dffa6a424fccdf04b37
size: 287821
- path: data/projects/ykl-sv
hash: md5
md5: d751713988987e9331980363e24189ce.dir
size: 0
nfiles: 0
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
outs:
- path: reports/test-sv.csv
hash: md5
md5: 2fff6f3bc20fddd861bf040622e28166
size: 214271
- path: reports/test-sv.json
hash: md5
md5: 4f76e748ac704e7b47d74c2c459cacaf
size: 87
eval-ensemble@2:
cmd: annif eval ykl-en -j 8 -m Precision@1 -m NDCG --metrics-file reports/test-en.json
--results-file reports/test-en.csv corpora/kirjaesittelyt2021/kvesit-ykl-eng-test.tsv
deps:
- path: corpora/kirjaesittelyt2021/kvesit-ykl-eng-test.tsv
hash: md5
md5: bc7f924d84a20e9ab91e2600fd2415ec
size: 210866
- path: data/projects/ykl-en
hash: md5
md5: d751713988987e9331980363e24189ce.dir
size: 0
nfiles: 0
- path: venv-installed
hash: md5
md5: f85f21b68735b126c2241fbff83fd0ef
size: 41
outs:
- path: reports/test-en.csv
hash: md5
md5: eea5b22824d23cb90267eb969a613300
size: 212565
- path: reports/test-en.json
hash: md5
md5: 8d41a89395974efbf8ae06880f94d3c4
size: 100