Training in progress, step 50

Browse files

Files changed (5) hide show

README.md +2 -5
config.json +4 -76
model.safetensors +1 -1
runs/Dec31_21-38-49_228ad310bd3c/events.out.tfevents.1704058742.228ad310bd3c.23033.0 +3 -0
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -6,9 +6,6 @@ tags:
 model-index:
 - name: git-base-instagram-cap
   results: []
-pipeline_tag: image-to-text
-language:
-- en
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -16,7 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
 # git-base-instagram-cap
-This model is a fine-tuned version of [microsoft/git-base](https://huggingface.co/microsoft/git-base) on an [Instagram Caption](https://huggingface.co/datasets/mrSoul7766/instagram_post_captions) dataset.
 It achieves the following results on the evaluation set:
 - Loss: 0.1859
 - Wer Score: 1.0566
@@ -73,4 +70,4 @@ The following hyperparameters were used during training:
 - Transformers 4.37.0.dev0
 - Pytorch 2.1.0+cu121
 - Datasets 2.16.1
-- Tokenizers 0.15.0

 model-index:
 - name: git-base-instagram-cap
   results: []
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 # git-base-instagram-cap
+This model is a fine-tuned version of [microsoft/git-base](https://huggingface.co/microsoft/git-base) on an unknown dataset.
 It achieves the following results on the evaluation set:
 - Loss: 0.1859
 - Wer Score: 1.0566
 - Transformers 4.37.0.dev0
 - Pytorch 2.1.0+cu121
 - Datasets 2.16.1
+- Tokenizers 0.15.0

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_commit_hash": null,
   "architectures": [
     "GitForCausalLM"
   ],
@@ -22,85 +22,13 @@
   "position_embedding_type": "absolute",
   "tie_word_embeddings": false,
   "torch_dtype": "float32",
-  "transformers_version": null,
   "use_cache": true,
   "vision_config": {
-    "_name_or_path": "",
-    "add_cross_attention": false,
-    "architectures": null,
-    "attention_dropout": 0.0,
-    "bad_words_ids": null,
-    "begin_suppress_tokens": null,
-    "bos_token_id": null,
-    "chunk_size_feed_forward": 0,
-    "cross_attention_hidden_size": null,
-    "decoder_start_token_id": null,
-    "diversity_penalty": 0.0,
-    "do_sample": false,
     "dropout": 0.0,
-    "early_stopping": false,
-    "encoder_no_repeat_ngram_size": 0,
-    "eos_token_id": null,
-    "exponential_decay_length_penalty": null,
-    "finetuning_task": null,
-    "forced_bos_token_id": null,
-    "forced_eos_token_id": null,
-    "hidden_act": "quick_gelu",
-    "hidden_size": 768,
-    "id2label": {
-      "0": "LABEL_0",
-      "1": "LABEL_1"
-    },
-    "image_size": 224,
     "initializer_factor": 1.0,
-    "initializer_range": 0.02,
-    "intermediate_size": 3072,
-    "is_decoder": false,
-    "is_encoder_decoder": false,
-    "label2id": {
-      "LABEL_0": 0,
-      "LABEL_1": 1
-    },
-    "layer_norm_eps": 1e-05,
-    "length_penalty": 1.0,
-    "max_length": 20,
-    "min_length": 0,
     "model_type": "git_vision_model",
-    "no_repeat_ngram_size": 0,
-    "num_attention_heads": 12,
-    "num_beam_groups": 1,
-    "num_beams": 1,
-    "num_channels": 3,
-    "num_hidden_layers": 12,
-    "num_return_sequences": 1,
-    "output_attentions": false,
-    "output_hidden_states": false,
-    "output_scores": false,
-    "pad_token_id": null,
-    "patch_size": 16,
-    "prefix": null,
-    "problem_type": null,
-    "projection_dim": 512,
-    "pruned_heads": {},
-    "remove_invalid_values": false,
-    "repetition_penalty": 1.0,
-    "return_dict": true,
-    "return_dict_in_generate": false,
-    "sep_token_id": null,
-    "suppress_tokens": null,
-    "task_specific_params": null,
-    "temperature": 1.0,
-    "tf_legacy_loss": false,
-    "tie_encoder_decoder": false,
-    "tie_word_embeddings": true,
-    "tokenizer_class": null,
-    "top_k": 50,
-    "top_p": 1.0,
-    "torch_dtype": null,
-    "torchscript": false,
-    "transformers_version": "4.26.0.dev0",
-    "typical_p": 1.0,
-    "use_bfloat16": false
   },
   "vocab_size": 30522
-}

 {
+  "_name_or_path": "microsoft/git-base",
   "architectures": [
     "GitForCausalLM"
   ],
   "position_embedding_type": "absolute",
   "tie_word_embeddings": false,
   "torch_dtype": "float32",
+  "transformers_version": "4.37.0.dev0",
   "use_cache": true,
   "vision_config": {
     "dropout": 0.0,
     "initializer_factor": 1.0,
     "model_type": "git_vision_model",
+    "projection_dim": 512
   },
   "vocab_size": 30522
+}

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aceb1e9825e815ed1713c24e84c47aeeea0bccaf7bbf9abd96a7aa0308cfad19
 size 706516040

 version https://git-lfs.github.com/spec/v1
+oid sha256:d3de9541afdadfa55c1d95b83b44a0da0bacac2af4d40e3f5a08a412e83032d8
 size 706516040

runs/Dec31_21-38-49_228ad310bd3c/events.out.tfevents.1704058742.228ad310bd3c.23033.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1f306798b8794cc1e192fa3d6ef291ab67fef4cecf50362b17170f0e29a59dd2
+size 5071

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:120b38f7735acecb7ca416b0fe4332cc4d824231c6e5b5a066da025f8c62799d
 size 4728

 version https://git-lfs.github.com/spec/v1
+oid sha256:481560160e79d73d54389c0f78ef5b1dee3b592a93860c3af9d61d8ba74eb06a
 size 4728