koptelovmax committed on
Commit
3bf0a5e
•
1 Parent(s): e56df02

Model update

Browse files
README.md CHANGED
@@ -1,5 +1,5 @@
1
  ---
2
- title: Test2
3
  emoji: 😻
4
  colorFrom: indigo
5
  colorTo: blue
 
1
  ---
2
+ title: AMRdemo
3
  emoji: 😻
4
  colorFrom: indigo
5
  colorTo: blue
model_stog/amrlib_meta.json CHANGED
@@ -5,6 +5,6 @@
5
  "inference_module":".parse_xfm.inference",
6
  "inference_class":"Inference",
7
  "model_fn":"pytorch_model.bin",
8
- "base_model":"facebook/bart-large",
9
  "kwargs":{}
10
  }
 
5
  "inference_module":".parse_xfm.inference",
6
  "inference_class":"Inference",
7
  "model_fn":"pytorch_model.bin",
8
+ "base_model":"facebook/bart-base",
9
  "kwargs":{}
10
  }
model_stog/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "facebook/bart-large",
3
  "activation_dropout": 0.1,
4
  "activation_function": "gelu",
5
  "add_bias_logits": false,
@@ -11,18 +11,18 @@
11
  "bos_token_id": 0,
12
  "classif_dropout": 0.1,
13
  "classifier_dropout": 0.0,
14
- "d_model": 1024,
15
- "decoder_attention_heads": 16,
16
- "decoder_ffn_dim": 4096,
17
  "decoder_layerdrop": 0.0,
18
- "decoder_layers": 12,
19
  "decoder_start_token_id": 2,
20
  "dropout": 0.1,
21
  "early_stopping": true,
22
- "encoder_attention_heads": 16,
23
- "encoder_ffn_dim": 4096,
24
  "encoder_layerdrop": 0.0,
25
- "encoder_layers": 12,
26
  "eos_token_id": 2,
27
  "forced_eos_token_id": 2,
28
  "gradient_checkpointing": false,
@@ -41,8 +41,9 @@
41
  "max_position_embeddings": 1024,
42
  "model_type": "bart",
43
  "normalize_before": false,
 
44
  "num_beams": 4,
45
- "num_hidden_layers": 12,
46
  "pad_token_id": 1,
47
  "scale_embedding": false,
48
  "task_specific_params": {
@@ -57,7 +58,7 @@
57
  "max_out_len": 1024,
58
  "max_train_graph_len": 512,
59
  "max_train_sent_len": 100,
60
- "model_name_or_path": "facebook/bart-large",
61
  "save_at_end": false,
62
  "save_tokenizer": false,
63
  "train_fn": "train.txt.nowiki"
 
1
  {
2
+ "_name_or_path": "facebook/bart-base",
3
  "activation_dropout": 0.1,
4
  "activation_function": "gelu",
5
  "add_bias_logits": false,
 
11
  "bos_token_id": 0,
12
  "classif_dropout": 0.1,
13
  "classifier_dropout": 0.0,
14
+ "d_model": 768,
15
+ "decoder_attention_heads": 12,
16
+ "decoder_ffn_dim": 3072,
17
  "decoder_layerdrop": 0.0,
18
+ "decoder_layers": 6,
19
  "decoder_start_token_id": 2,
20
  "dropout": 0.1,
21
  "early_stopping": true,
22
+ "encoder_attention_heads": 12,
23
+ "encoder_ffn_dim": 3072,
24
  "encoder_layerdrop": 0.0,
25
+ "encoder_layers": 6,
26
  "eos_token_id": 2,
27
  "forced_eos_token_id": 2,
28
  "gradient_checkpointing": false,
 
41
  "max_position_embeddings": 1024,
42
  "model_type": "bart",
43
  "normalize_before": false,
44
+ "normalize_embedding": true,
45
  "num_beams": 4,
46
+ "num_hidden_layers": 6,
47
  "pad_token_id": 1,
48
  "scale_embedding": false,
49
  "task_specific_params": {
 
58
  "max_out_len": 1024,
59
  "max_train_graph_len": 512,
60
  "max_train_sent_len": 100,
61
+ "model_name_or_path": "facebook/bart-base",
62
  "save_at_end": false,
63
  "save_tokenizer": false,
64
  "train_fn": "train.txt.nowiki"
model_stog/{model_parse_xfm_bart_large.json → model_parse_xfm_bart_base.json} RENAMED
@@ -1,6 +1,6 @@
1
  { "gen_args" :
2
  {
3
- "model_name_or_path" : "facebook/bart-large",
4
  "corpus_dir" : "data/tdata_xfm/",
5
  "train_fn" : "train.txt.nowiki",
6
  "eval_fn" : "dev.txt.nowiki",
@@ -31,12 +31,12 @@
31
  "save_total_limit" : 1,
32
  "logging_steps" : 300,
33
  "num_train_epochs" : 16,
34
- "per_device_train_batch_size" : 8,
35
- "gradient_accumulation_steps" : 4,
36
  "weight_decay" : 0.004,
37
  "learning_rate" : 5e-5,
38
  "max_grad_norm" : 1.0,
39
- "warmup_steps" : 5200,
40
  "seed" : 42
41
  }
42
  }
 
1
  { "gen_args" :
2
  {
3
+ "model_name_or_path" : "facebook/bart-base",
4
  "corpus_dir" : "data/tdata_xfm/",
5
  "train_fn" : "train.txt.nowiki",
6
  "eval_fn" : "dev.txt.nowiki",
 
31
  "save_total_limit" : 1,
32
  "logging_steps" : 300,
33
  "num_train_epochs" : 16,
34
+ "per_device_train_batch_size" : 16,
35
+ "gradient_accumulation_steps" : 1,
36
  "weight_decay" : 0.004,
37
  "learning_rate" : 5e-5,
38
  "max_grad_norm" : 1.0,
39
+ "warmup_steps" : 3467,
40
  "seed" : 42
41
  }
42
  }
model_stog/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9bdcde696e63224ba56853469689d2e22e64c324eedee6e48348e806eedd45b
3
- size 1625557313
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:281b14c587df85226e182dd220535f5eb5e1a4a499836bc6cfe812f5e0adc5e0
3
+ size 557979193