VictorChew
committed on
Upload folder using huggingface_hub
Browse files- README.md +1 -0
- config.json +1 -1
- generation_config.json +1 -1
- model.safetensors +1 -1
- preprocessor_config.json +1 -1
README.md
CHANGED
@@ -26,6 +26,7 @@ Table is an effective way to represent structured data in scientific publication
|
|
26 |
|
27 |
## Changelog
|
28 |
Tips: The current version of StructEqTable can process table images from scientific documents such as arXiv and Sci-Hub papers. Times New Roman and Songti (宋体) are the main fonts used in the table images; other fonts may decrease the accuracy of the model's output.
|
|
|
29 |
- [2024/8/08] 🔥 We have released the TensorRT accelerated version, which only takes about 1 second for most images on GPU A100. Please follow the tutorial to install the environment and compile the model weights.
|
30 |
- [2024/7/30] We have released the first version of StructEqTable.
|
31 |
|
|
|
26 |
|
27 |
## Changelog
|
28 |
Tips: The current version of StructEqTable can process table images from scientific documents such as arXiv and Sci-Hub papers. Times New Roman and Songti (宋体) are the main fonts used in the table images; other fonts may decrease the accuracy of the model's output.
|
29 |
+
- **[2024/8/22] 🔥 We have released our [latest model](https://huggingface.co/U4R/StructTable-base/tree/v0.2), fine-tuned on the DocGenome dataset. This version features improved inference speed and robustness, achieved through data augmentation and a reduced number of image tokens.**
|
30 |
- [2024/8/08] 🔥 We have released the TensorRT accelerated version, which only takes about 1 second for most images on GPU A100. Please follow the tutorial to install the environment and compile the model weights.
|
31 |
- [2024/7/30] We have released the first version of StructEqTable.
|
32 |
|
config.json
CHANGED
@@ -20,7 +20,7 @@
|
|
20 |
},
|
21 |
"tie_word_embeddings": false,
|
22 |
"torch_dtype": "float32",
|
23 |
-
"transformers_version": "4.
|
24 |
"use_cache": false,
|
25 |
"vision_config": {
|
26 |
"attention_dropout": 0.2,
|
|
|
20 |
},
|
21 |
"tie_word_embeddings": false,
|
22 |
"torch_dtype": "float32",
|
23 |
+
"transformers_version": "4.39.1",
|
24 |
"use_cache": false,
|
25 |
"vision_config": {
|
26 |
"attention_dropout": 0.2,
|
generation_config.json
CHANGED
@@ -3,6 +3,6 @@
|
|
3 |
"decoder_start_token_id": 0,
|
4 |
"eos_token_id": 1,
|
5 |
"pad_token_id": 0,
|
6 |
-
"transformers_version": "4.
|
7 |
"use_cache": false
|
8 |
}
|
|
|
3 |
"decoder_start_token_id": 0,
|
4 |
"eos_token_id": 1,
|
5 |
"pad_token_id": 0,
|
6 |
+
"transformers_version": "4.39.1",
|
7 |
"use_cache": false
|
8 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1294046176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85661216f7547cba62312829bff47755d12907ea49ebb49dad65ade6ebf64706
|
3 |
size 1294046176
|
preprocessor_config.json
CHANGED
@@ -3,7 +3,7 @@
|
|
3 |
"do_normalize": true,
|
4 |
"image_processor_type": "Pix2StructImageProcessor",
|
5 |
"is_vqa": false,
|
6 |
-
"max_patches":
|
7 |
"patch_size": {
|
8 |
"height": 16,
|
9 |
"width": 16
|
|
|
3 |
"do_normalize": true,
|
4 |
"image_processor_type": "Pix2StructImageProcessor",
|
5 |
"is_vqa": false,
|
6 |
+
"max_patches": 2048,
|
7 |
"patch_size": {
|
8 |
"height": 16,
|
9 |
"width": 16
|