Upload 6 files

Browse files

the first submission

Files changed (6) hide show

config.json +32 -0
config.yaml +52 -0
pytorch_model.bin +3 -0
special_tokens_map.json +6 -0
tokenizer.json +0 -0
tokenizer_config.json +202 -0

config.json ADDED Viewed

	@@ -0,0 +1,32 @@

+{
+  "align_long_axis": false,
+  "architectures": [
+    "NougatModel"
+  ],
+  "decoder_layer": 6,
+  "embed_dim": 128,
+  "encoder_layer": [
+    2,
+    2,
+    14,
+    2
+  ],
+  "hidden_dimension": 1024,
+  "input_size": [
+    896,
+    672
+  ],
+  "max_length": 4096,
+  "max_position_embeddings": 4096,
+  "model_type": "nougat",
+  "num_heads": [
+    4,
+    8,
+    16,
+    32
+  ],
+  "patch_size": 4,
+  "torch_dtype": "float32",
+  "transformers_version": "4.34.1",
+  "window_size": 7
+}

config.yaml ADDED Viewed

	@@ -0,0 +1,52 @@

+resume_from_checkpoint_path: None
+result_path: 'result'
+model_path: None
+dataset_paths:
+  - '/root/autodl-tmp/Nougat-Data/train.jsonl'
+tokenizer: './config/tokenizer.json'
+exp_name: 'nougat-middle'
+train_batch_sizes:
+  - 1
+num_workers: 4
+val_batch_sizes:
+  - 1
+val_batches: 1
+input_size:
+  - 896
+  - 672
+max_length: 4096
+max_position_embeddings: 4096
+accumulate_grad_batches: 3
+window_size: 7
+patch_size: 4
+embed_dim: 128
+hidden_dimension: 1024
+num_heads:
+  - 4
+  - 8
+  - 16
+  - 32
+encoder_layer:
+  - 2
+  - 2
+  - 14
+  - 2
+decoder_layer: 6
+align_long_axis: False
+num_nodes: 1
+seed: 25
+lr: 5e-05
+min_lr: 7.5e-06
+lr_step: 16
+gamma: 0.9996
+warmup_steps: 250
+num_training_samples_per_epoch: 10000
+max_epochs: 30
+max_steps: -1
+val_check_interval: None
+check_val_every_n_epoch: 1
+gradient_clip_val: 0.5
+verbose: False
+debug: False
+job: None
+exp_version: '20240206_132202'

pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:94d5d26420db2b4b1bb6690ee35bc181c87a3a35cc078f897c76b9108a7af009
+size 934321433

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "bos_token": "<s>",
+  "eos_token": "</s>",
+  "pad_token": "<pad>",
+  "unk_token": "<unk>"
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,202 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "4": {
+      "content": "[START_REF]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "5": {
+      "content": "[END_REF]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "6": {
+      "content": "[IMAGE]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "7": {
+      "content": "<fragments>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "8": {
+      "content": "</fragments>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "9": {
+      "content": "<work>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "10": {
+      "content": "</work>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "11": {
+      "content": "[START_SUP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "12": {
+      "content": "[END_SUP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "13": {
+      "content": "[START_SUB]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "14": {
+      "content": "[END_SUB]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "15": {
+      "content": "[START_DNA]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "16": {
+      "content": "[END_DNA]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "17": {
+      "content": "[START_AMINO]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "18": {
+      "content": "[END_AMINO]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "19": {
+      "content": "[START_SMILES]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "20": {
+      "content": "[END_SMILES]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "21": {
+      "content": "[START_I_SMILES]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "22": {
+      "content": "[END_I_SMILES]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": true,
+  "eos_token": "</s>",
+  "max_length": 4096,
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_to_multiple_of": null,
+  "pad_token": "<pad>",
+  "pad_token_type_id": 0,
+  "padding_side": "right",
+  "stride": 0,
+  "tokenizer_class": "PreTrainedTokenizerFast",
+  "truncation_side": "right",
+  "truncation_strategy": "longest_first",
+  "unk_token": "<unk>"
+}