run-title: tashkeela-d2 | |
debug: false | |
paths: | |
base: ./dataset/ashaar | |
save: ./models | |
load: tashkeela-d2.pt | |
resume: ./models/Tashkeela-D2/tashkeela-d2.pt | |
constants: ./dataset/helpers/constants | |
word-embs: vocab.vec | |
test: test | |
loader: | |
wembs-limit: -1 | |
num-workers: 0 | |
train: | |
epochs: 1000 | |
batch-size: 32 | |
char-embed-dim: 32 | |
resume: false | |
resume-lr: false | |
max-word-len: 13 | |
max-sent-len: 10 | |
rnn-cell: lstm | |
sent-lstm-layers: 2 | |
word-lstm-layers: 2 | |
sent-lstm-units: 256 | |
word-lstm-units: 512 | |
decoder-units: 256 | |
sent-dropout: 0.2 | |
diac-dropout: 0 | |
final-dropout: 0.2 | |
sent-mask-zero: false | |
lr-factor: 0.5 | |
lr-patience: 1 | |
lr-min: 1.e-7 | |
lr-init: 0.002 | |
weight-decay: 0 | |
vertical-dropout: 0.25 | |
recurrent-dropout: 0.25 | |
stopping-delta: 1.e-7 | |
stopping-patience: 3 | |
predictor: | |
batch-size: 75 | |
stride: 2 | |
window: 20 | |
gt-signal-prob: 0 | |
seed-idx: 0 | |
sentence-break: | |
stride: 2 | |
window: 10 | |
min-window: 1 | |
export-map: false | |
files: | |
- train/train.txt | |
- val/val.txt | |
delimeters: | |
- ، | |
- ؛ | |
- ',' | |
- ; | |
- « | |
- » | |
- '{' | |
- '}' | |
- '(' | |
- ')' | |
- '[' | |
- ']' | |
- '.' | |
- '*' | |
- '-' | |
- ':' | |
- '?' | |
- '!' | |
- ؟ | |
segment: | |
stride: 2 | |
window: 10 | |
min-window: 1 | |
export-map: false | |
files: | |
- train/train.txt | |
- val/val.txt | |
delimeters: | |
- ، | |
- ؛ | |
- ',' | |
- ; | |
- « | |
- » | |
- '{' | |
- '}' | |
- '(' | |
- ')' | |
- '[' | |
- ']' | |
- '.' | |
- '*' | |
- '-' | |
- ':' | |
- '?' | |
- '!' | |
- ؟ |