VictorChew committed on
Commit
20fa540
·
verified ·
1 Parent(s): 903be5e

Upload folder using huggingface_hub

Browse files
README.md CHANGED
@@ -26,6 +26,7 @@ Table is an effective way to represent structured data in scientific publication
26
 
27
  ## Changelog
28
  Tips: The current version of StructEqTable can process table images from scientific documents such as arXiv and Sci-Hub papers. Times New Roman and Songti (宋体) are the main fonts used in the table images; other fonts may decrease the accuracy of the model's output.
 
29
  - [2024/8/08] 🔥 We have released the TensorRT-accelerated version, which takes only about 1 second for most images on an A100 GPU. Please follow the tutorial to install the environment and compile the model weights.
30
  - [2024/7/30] We have released the first version of StructEqTable.
31
 
 
26
 
27
  ## Changelog
28
  Tips: The current version of StructEqTable can process table images from scientific documents such as arXiv and Sci-Hub papers. Times New Roman and Songti (宋体) are the main fonts used in the table images; other fonts may decrease the accuracy of the model's output.
29
+ - **[2024/8/22] 🔥 We have released our [latest model](https://huggingface.co/U4R/StructTable-base/tree/v0.2), fine-tuned on the DocGenome dataset. This version features improved inference speed and robustness, achieved through data augmentation and a reduced number of image tokens.**
30
  - [2024/8/08] 🔥 We have released the TensorRT-accelerated version, which takes only about 1 second for most images on an A100 GPU. Please follow the tutorial to install the environment and compile the model weights.
31
  - [2024/7/30] We have released the first version of StructEqTable.
32
 
config.json CHANGED
@@ -20,7 +20,7 @@
20
  },
21
  "tie_word_embeddings": false,
22
  "torch_dtype": "float32",
23
- "transformers_version": "4.37.2",
24
  "use_cache": false,
25
  "vision_config": {
26
  "attention_dropout": 0.2,
 
20
  },
21
  "tie_word_embeddings": false,
22
  "torch_dtype": "float32",
23
+ "transformers_version": "4.39.1",
24
  "use_cache": false,
25
  "vision_config": {
26
  "attention_dropout": 0.2,
generation_config.json CHANGED
@@ -3,6 +3,6 @@
3
  "decoder_start_token_id": 0,
4
  "eos_token_id": 1,
5
  "pad_token_id": 0,
6
- "transformers_version": "4.37.2",
7
  "use_cache": false
8
  }
 
3
  "decoder_start_token_id": 0,
4
  "eos_token_id": 1,
5
  "pad_token_id": 0,
6
+ "transformers_version": "4.39.1",
7
  "use_cache": false
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:66baeb5e3b8e13f7e30cdf998c6724af7a97e8a2a3c78ece70666b6e2af278ce
3
  size 1294046176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85661216f7547cba62312829bff47755d12907ea49ebb49dad65ade6ebf64706
3
  size 1294046176
preprocessor_config.json CHANGED
@@ -3,7 +3,7 @@
3
  "do_normalize": true,
4
  "image_processor_type": "Pix2StructImageProcessor",
5
  "is_vqa": false,
6
- "max_patches": 4096,
7
  "patch_size": {
8
  "height": 16,
9
  "width": 16
 
3
  "do_normalize": true,
4
  "image_processor_type": "Pix2StructImageProcessor",
5
  "is_vqa": false,
6
+ "max_patches": 2048,
7
  "patch_size": {
8
  "height": 16,
9
  "width": 16