# Training configuration for a small dependency-parsing pipeline.
# Path shown in the diff header: tests/training/dep_parser_config.yml
#
# `${ name }` values point at other sections of this file by key and are
# resolved by the config loader, not by YAML itself.
#
# NOTE(review): the indentation below was reconstructed from a flattened
# diff view (every row had lost its leading whitespace). Nesting follows the
# `${ ... }` references and the blank-line stanza breaks — confirm against
# the repository copy before relying on it.

# 🤖 PIPELINE DEFINITION
nlp:
  "@core": pipeline

  lang: fr

  components:
    parser:
      '@factory': eds.biaffine_dep_parser
      hidden_size: 64
      decoding_mode: greedy
      # Written as 0.0 (same value as `0.`) so the float is unambiguous.
      dropout_p: 0.0
      use_attrs: ['pos_']

      embedding:
        '@factory': eds.transformer
        model: hf-internal-testing/tiny-bert
        window: 512
        stride: 256

# 📈 SCORERS
scorer:
  speed: false
  dep:
    '@metrics': "eds.dep_parsing"

# 🎛️ OPTIMIZER
optimizer:
  optim: adamw
  module: ${ nlp }
  total_steps: ${ train.max_steps }
  groups:
    # The key is a pattern; ".*" presumably selects every parameter — confirm
    # against the optimizer's documentation.
    ".*":
      # Explicit mantissa dot: YAML 1.1 loaders (e.g. PyYAML) read a bare
      # `1e-3` as the string "1e-3" rather than a float.
      lr: 1.0e-3

# 📚 DATA
train_data:
  data:
    "@readers": conll
    path: ./rhapsodie_sample.conllu
  shuffle: dataset
  batch_size: 1 docs
  pipe_names: [ "parser" ]

# Validation reads the same sample file as training.
val_data:
  "@readers": conll
  path: ./rhapsodie_sample.conllu

# 🚀 TRAIN SCRIPT OPTIONS
train:
  nlp: ${ nlp }
  train_data: ${ train_data }
  val_data: ${ val_data }
  max_steps: 20
  validation_interval: 10
  max_grad_norm: 5.0
  scorer: ${ scorer }
  num_workers: 0
  optimizer: ${ optimizer }
  grad_dev_policy: "clip_mean"
  log_weight_grads: true