Training in progress, step 500
Browse files- README.md +204 -0
- adapter_config.json +17 -0
- adapter_model.safetensors +3 -0
- config.json +24 -0
- model.safetensors +3 -0
- runs/Feb14_18-00-58_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1707901259.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.3167.0 +3 -0
- runs/Feb14_18-03-40_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1707901421.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.3167.1 +3 -0
- runs/Feb14_18-10-21_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1707901822.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.3422.0 +3 -0
- runs/Feb14_19-12-57_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1707905578.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.3724.0 +3 -0
- runs/Jan09_15-27-10_pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk/events.out.tfevents.1704781632.pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk.2426.0 +3 -0
- runs/Jan09_16-37-00_pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk/events.out.tfevents.1704785821.pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk.2426.1 +3 -0
- runs/Jan09_17-16-55_pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk/events.out.tfevents.1704788217.pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk.2822.0 +3 -0
- runs/Jan09_17-22-16_pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk/events.out.tfevents.1704788538.pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk.3022.0 +3 -0
- runs/Jan09_17-27-05_pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk/events.out.tfevents.1704788826.pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk.3022.1 +3 -0
- runs/Jan09_17-30-31_pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk/events.out.tfevents.1704789032.pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk.3022.2 +3 -0
- runs/Jan09_17-40-53_pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk/events.out.tfevents.1704789653.pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk.3022.3 +3 -0
- runs/Jan10_15-55-18_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704869719.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.837.2 +3 -0
- runs/Jan10_17-45-04_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704876305.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1381.0 +3 -0
- runs/Jan11_09-59-48_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704934788.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.0 +3 -0
- runs/Jan11_13-19-21_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704946761.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.1 +3 -0
- runs/Jan11_13-20-25_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704946826.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.2 +3 -0
- runs/Jan11_13-28-32_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947312.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.3 +3 -0
- runs/Jan11_13-34-05_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947646.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.4 +3 -0
- runs/Jan11_13-35-03_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947703.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.5 +3 -0
- runs/Jan11_13-36-00_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947760.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1955.0 +3 -0
- runs/Jan11_13-37-48_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947869.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.2149.0 +3 -0
- runs/Jan11_13-38-52_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947932.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.2358.0 +3 -0
- runs/Jan11_13-41-46_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704948107.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.2568.0 +3 -0
- runs/Jan11_13-44-53_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704948294.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.2568.1 +3 -0
- runs/Jan11_15-03-48_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704953028.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.3026.0 +3 -0
- runs/Jan11_15-30-37_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704954638.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.3221.0 +3 -0
- runs/Jan12_10-00-40_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1705021240.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.4178.0 +3 -0
- runs/Jan12_11-30-11_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1705026611.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.4552.0 +3 -0
- runs/Jan18_16-29-38_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1705562979.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.17530.0 +3 -0
- special_tokens_map.json +7 -0
- tokenizer.json +0 -0
- tokenizer_config.json +55 -0
- training_args.bin +3 -0
- vocab.txt +0 -0
README.md
ADDED
@@ -0,0 +1,204 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: peft
|
3 |
+
base_model: distilbert-base-uncased
|
4 |
+
---
|
5 |
+
|
6 |
+
# Model Card for Model ID
|
7 |
+
|
8 |
+
<!-- Provide a quick summary of what the model is/does. -->
|
9 |
+
|
10 |
+
|
11 |
+
|
12 |
+
## Model Details
|
13 |
+
|
14 |
+
### Model Description
|
15 |
+
|
16 |
+
<!-- Provide a longer summary of what this model is. -->
|
17 |
+
|
18 |
+
|
19 |
+
|
20 |
+
- **Developed by:** [More Information Needed]
|
21 |
+
- **Funded by [optional]:** [More Information Needed]
|
22 |
+
- **Shared by [optional]:** [More Information Needed]
|
23 |
+
- **Model type:** [More Information Needed]
|
24 |
+
- **Language(s) (NLP):** [More Information Needed]
|
25 |
+
- **License:** [More Information Needed]
|
26 |
+
- **Finetuned from model [optional]:** [More Information Needed]
|
27 |
+
|
28 |
+
### Model Sources [optional]
|
29 |
+
|
30 |
+
<!-- Provide the basic links for the model. -->
|
31 |
+
|
32 |
+
- **Repository:** [More Information Needed]
|
33 |
+
- **Paper [optional]:** [More Information Needed]
|
34 |
+
- **Demo [optional]:** [More Information Needed]
|
35 |
+
|
36 |
+
## Uses
|
37 |
+
|
38 |
+
<!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
|
39 |
+
|
40 |
+
### Direct Use
|
41 |
+
|
42 |
+
<!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
|
43 |
+
|
44 |
+
[More Information Needed]
|
45 |
+
|
46 |
+
### Downstream Use [optional]
|
47 |
+
|
48 |
+
<!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
|
49 |
+
|
50 |
+
[More Information Needed]
|
51 |
+
|
52 |
+
### Out-of-Scope Use
|
53 |
+
|
54 |
+
<!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
|
55 |
+
|
56 |
+
[More Information Needed]
|
57 |
+
|
58 |
+
## Bias, Risks, and Limitations
|
59 |
+
|
60 |
+
<!-- This section is meant to convey both technical and sociotechnical limitations. -->
|
61 |
+
|
62 |
+
[More Information Needed]
|
63 |
+
|
64 |
+
### Recommendations
|
65 |
+
|
66 |
+
<!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
|
67 |
+
|
68 |
+
Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
|
69 |
+
|
70 |
+
## How to Get Started with the Model
|
71 |
+
|
72 |
+
Use the code below to get started with the model.
|
73 |
+
|
74 |
+
[More Information Needed]
|
75 |
+
|
76 |
+
## Training Details
|
77 |
+
|
78 |
+
### Training Data
|
79 |
+
|
80 |
+
<!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
|
81 |
+
|
82 |
+
[More Information Needed]
|
83 |
+
|
84 |
+
### Training Procedure
|
85 |
+
|
86 |
+
<!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
|
87 |
+
|
88 |
+
#### Preprocessing [optional]
|
89 |
+
|
90 |
+
[More Information Needed]
|
91 |
+
|
92 |
+
|
93 |
+
#### Training Hyperparameters
|
94 |
+
|
95 |
+
- **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
|
96 |
+
|
97 |
+
#### Speeds, Sizes, Times [optional]
|
98 |
+
|
99 |
+
<!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
|
100 |
+
|
101 |
+
[More Information Needed]
|
102 |
+
|
103 |
+
## Evaluation
|
104 |
+
|
105 |
+
<!-- This section describes the evaluation protocols and provides the results. -->
|
106 |
+
|
107 |
+
### Testing Data, Factors & Metrics
|
108 |
+
|
109 |
+
#### Testing Data
|
110 |
+
|
111 |
+
<!-- This should link to a Dataset Card if possible. -->
|
112 |
+
|
113 |
+
[More Information Needed]
|
114 |
+
|
115 |
+
#### Factors
|
116 |
+
|
117 |
+
<!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
|
118 |
+
|
119 |
+
[More Information Needed]
|
120 |
+
|
121 |
+
#### Metrics
|
122 |
+
|
123 |
+
<!-- These are the evaluation metrics being used, ideally with a description of why. -->
|
124 |
+
|
125 |
+
[More Information Needed]
|
126 |
+
|
127 |
+
### Results
|
128 |
+
|
129 |
+
[More Information Needed]
|
130 |
+
|
131 |
+
#### Summary
|
132 |
+
|
133 |
+
|
134 |
+
|
135 |
+
## Model Examination [optional]
|
136 |
+
|
137 |
+
<!-- Relevant interpretability work for the model goes here -->
|
138 |
+
|
139 |
+
[More Information Needed]
|
140 |
+
|
141 |
+
## Environmental Impact
|
142 |
+
|
143 |
+
<!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
|
144 |
+
|
145 |
+
Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
|
146 |
+
|
147 |
+
- **Hardware Type:** [More Information Needed]
|
148 |
+
- **Hours used:** [More Information Needed]
|
149 |
+
- **Cloud Provider:** [More Information Needed]
|
150 |
+
- **Compute Region:** [More Information Needed]
|
151 |
+
- **Carbon Emitted:** [More Information Needed]
|
152 |
+
|
153 |
+
## Technical Specifications [optional]
|
154 |
+
|
155 |
+
### Model Architecture and Objective
|
156 |
+
|
157 |
+
[More Information Needed]
|
158 |
+
|
159 |
+
### Compute Infrastructure
|
160 |
+
|
161 |
+
[More Information Needed]
|
162 |
+
|
163 |
+
#### Hardware
|
164 |
+
|
165 |
+
[More Information Needed]
|
166 |
+
|
167 |
+
#### Software
|
168 |
+
|
169 |
+
[More Information Needed]
|
170 |
+
|
171 |
+
## Citation [optional]
|
172 |
+
|
173 |
+
<!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
|
174 |
+
|
175 |
+
**BibTeX:**
|
176 |
+
|
177 |
+
[More Information Needed]
|
178 |
+
|
179 |
+
**APA:**
|
180 |
+
|
181 |
+
[More Information Needed]
|
182 |
+
|
183 |
+
## Glossary [optional]
|
184 |
+
|
185 |
+
<!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
|
186 |
+
|
187 |
+
[More Information Needed]
|
188 |
+
|
189 |
+
## More Information [optional]
|
190 |
+
|
191 |
+
[More Information Needed]
|
192 |
+
|
193 |
+
## Model Card Authors [optional]
|
194 |
+
|
195 |
+
[More Information Needed]
|
196 |
+
|
197 |
+
## Model Card Contact
|
198 |
+
|
199 |
+
[More Information Needed]
|
200 |
+
|
201 |
+
|
202 |
+
### Framework versions
|
203 |
+
|
204 |
+
- PEFT 0.7.1
|
adapter_config.json
ADDED
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"auto_mapping": null,
|
3 |
+
"base_model_name_or_path": "bert-base-cased",
|
4 |
+
"encoder_dropout": 0.0,
|
5 |
+
"encoder_hidden_size": 128,
|
6 |
+
"encoder_num_layers": 2,
|
7 |
+
"encoder_reparameterization_type": "MLP",
|
8 |
+
"inference_mode": true,
|
9 |
+
"num_attention_heads": 12,
|
10 |
+
"num_layers": 12,
|
11 |
+
"num_transformer_submodules": 1,
|
12 |
+
"num_virtual_tokens": 20,
|
13 |
+
"peft_type": "P_TUNING",
|
14 |
+
"revision": null,
|
15 |
+
"task_type": "QUESTION_ANS",
|
16 |
+
"token_dim": 768
|
17 |
+
}
|
adapter_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6e4f94867219f0b28d341681356ed5f61d8a5f723eccccafeea96040f613fd1
|
3 |
+
size 67880
|
config.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "distilbert-base-uncased",
|
3 |
+
"activation": "gelu",
|
4 |
+
"architectures": [
|
5 |
+
"DistilBertForQuestionAnswering"
|
6 |
+
],
|
7 |
+
"attention_dropout": 0.1,
|
8 |
+
"dim": 768,
|
9 |
+
"dropout": 0.1,
|
10 |
+
"hidden_dim": 3072,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"max_position_embeddings": 512,
|
13 |
+
"model_type": "distilbert",
|
14 |
+
"n_heads": 12,
|
15 |
+
"n_layers": 6,
|
16 |
+
"pad_token_id": 0,
|
17 |
+
"qa_dropout": 0.1,
|
18 |
+
"seq_classif_dropout": 0.2,
|
19 |
+
"sinusoidal_pos_embds": false,
|
20 |
+
"tie_weights_": true,
|
21 |
+
"torch_dtype": "float32",
|
22 |
+
"transformers_version": "4.36.2",
|
23 |
+
"vocab_size": 30522
|
24 |
+
}
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37a3e4ac06598d45d176952702706b9f2e4ad9e4ec9839bb811939e384ad7163
|
3 |
+
size 265470032
|
runs/Feb14_18-00-58_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1707901259.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.3167.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3bf3a7431fcc3b6993025d39a17dc0e30f31658ff9513a32b9e3b440550018d
|
3 |
+
size 4336
|
runs/Feb14_18-03-40_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1707901421.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.3167.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:922d45e5bd097140d37e4e7c43fba00250e6fa1667fb97edf54f23dfd6614a1a
|
3 |
+
size 4714
|
runs/Feb14_18-10-21_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1707901822.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.3422.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eca04d7087a2b853dc69cdcbd5b2e2f1ae49b7862eb3efaf73c7762bbe0febc8
|
3 |
+
size 17241
|
runs/Feb14_19-12-57_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1707905578.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.3724.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5caeff75477d869e4fc0be13b34ed681674cd05c999815fcea2f6151154b8e6
|
3 |
+
size 4714
|
runs/Jan09_15-27-10_pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk/events.out.tfevents.1704781632.pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk.2426.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b499a4aef668bef5800f8b13b43b06690e4368c8956154cf3ce82572c0f70cf
|
3 |
+
size 5550
|
runs/Jan09_16-37-00_pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk/events.out.tfevents.1704785821.pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk.2426.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa3e0b749a3506315bec53fe822a2e3262cfabd6de9be3a4dc72700a09c1a34b
|
3 |
+
size 5550
|
runs/Jan09_17-16-55_pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk/events.out.tfevents.1704788217.pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk.2822.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e98dd0ac300c79c7b474998be9e92b3bf10fbb351218898146e6f9bb7823632
|
3 |
+
size 4925
|
runs/Jan09_17-22-16_pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk/events.out.tfevents.1704788538.pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk.3022.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93ae9662b8612287e17b86d7db1704930f03af980146a58922e6cca4fa2b1675
|
3 |
+
size 5550
|
runs/Jan09_17-27-05_pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk/events.out.tfevents.1704788826.pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk.3022.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2bba49b2dc2b5aab21c55da573ac6ef7007bf16f02eeeeaa2d97b5a4c850f16d
|
3 |
+
size 5550
|
runs/Jan09_17-30-31_pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk/events.out.tfevents.1704789032.pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk.3022.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1ae656332369a81e86d1666676573d90bb42a7cfaf214dc517b1452177f444b
|
3 |
+
size 5550
|
runs/Jan09_17-40-53_pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk/events.out.tfevents.1704789653.pjt20230003-aer2024010004-dp-6f7b5c9687-mrddk.3022.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f834054bb7fdb20ded14caed04daed051e72e5ac3c628ffd2de3fb5bf212445
|
3 |
+
size 5550
|
runs/Jan10_15-55-18_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704869719.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.837.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4d4766be92dc9683365f005c8b141650ec5429eb470d4cda2819d496f1571a1
|
3 |
+
size 10553
|
runs/Jan10_17-45-04_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704876305.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1381.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32df4ac45c04fc21f7280729c75481145440357113acb619709ed02bbea91c9d
|
3 |
+
size 10553
|
runs/Jan11_09-59-48_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704934788.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b87e578bd8956e50c86cabeecdae0a1d3dd6f9ac21c475a9815cc7a0f3bfdc1
|
3 |
+
size 10553
|
runs/Jan11_13-19-21_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704946761.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9fa68026b467cf86770c837dce71ed54962c2d57fbfdd7dbb860ecad2d2e466
|
3 |
+
size 4336
|
runs/Jan11_13-20-25_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704946826.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3894724e7d1e6f81b80216e9ea7d41b5c96e8f368b070bc0a153f2fcab065516
|
3 |
+
size 4336
|
runs/Jan11_13-28-32_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947312.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5dcd1748ebc9fe6a240163d6f3073bf9a8989bb99cd8d9c2474dbee96199162b
|
3 |
+
size 4451
|
runs/Jan11_13-34-05_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947646.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec37afa3cadd4617afd374fc0c318fdc93b520cda418bfc13e4d24bd3f5322ea
|
3 |
+
size 4451
|
runs/Jan11_13-35-03_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947703.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1686.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4f6ae78394d1ef195724ff3f5e05a7509a87233dfa37517f461bbbaa970f490
|
3 |
+
size 4451
|
runs/Jan11_13-36-00_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947760.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.1955.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f22f604782250294343a87c28cbf08175caecb01f0b0c4d989ffccfd98cecc89
|
3 |
+
size 4451
|
runs/Jan11_13-37-48_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947869.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.2149.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f101e590874dbf4d4f6168929c84cbc423c4d1555d345be6adfdc68528e0b00
|
3 |
+
size 4451
|
runs/Jan11_13-38-52_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704947932.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.2358.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:844c7bdb93b2323cad9699f35f409d015ae406343a4c30515dd1852c41c669b6
|
3 |
+
size 4336
|
runs/Jan11_13-41-46_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704948107.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.2568.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bbc07022defd3ea68538326ad52650956172d055d237346cc402c3eed7bdd27
|
3 |
+
size 4336
|
runs/Jan11_13-44-53_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704948294.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.2568.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2eb49be0f60726800914f29e557339a67c904b52b6290ca4bc4588c3e2e175b
|
3 |
+
size 10553
|
runs/Jan11_15-03-48_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704953028.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.3026.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9dd7a4bdd359a536703973e2ec17b5d03fc6e89a724286625af46fe152b8954
|
3 |
+
size 4336
|
runs/Jan11_15-30-37_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1704954638.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.3221.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b489f53a85b75314a7ad1a9a6171cee5ccf702fd39ea5de422b6b87fa75d447
|
3 |
+
size 5830
|
runs/Jan12_10-00-40_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1705021240.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.4178.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05e6db3ee543c39b604e0334358457e6d72d0964e5c79a0f0e5748c2eea2a0c8
|
3 |
+
size 10558
|
runs/Jan12_11-30-11_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1705026611.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.4552.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a1e1f1a8ede88d2ed18fb1d17f2ca24b31b378f641616db0bc7f56fcd182d8e
|
3 |
+
size 10558
|
runs/Jan18_16-29-38_pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8/events.out.tfevents.1705562979.pjt20230003-aer2024010004-dp-5d9c8bc8b6-8b5n8.17530.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab8ff82179dc49eb29e3b948bfaf7ed472ddc3d670aafb21ec42f01c0b282ffe
|
3 |
+
size 10558
|
special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"cls_token": "[CLS]",
|
3 |
+
"mask_token": "[MASK]",
|
4 |
+
"pad_token": "[PAD]",
|
5 |
+
"sep_token": "[SEP]",
|
6 |
+
"unk_token": "[UNK]"
|
7 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"added_tokens_decoder": {
|
3 |
+
"0": {
|
4 |
+
"content": "[PAD]",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false,
|
9 |
+
"special": true
|
10 |
+
},
|
11 |
+
"100": {
|
12 |
+
"content": "[UNK]",
|
13 |
+
"lstrip": false,
|
14 |
+
"normalized": false,
|
15 |
+
"rstrip": false,
|
16 |
+
"single_word": false,
|
17 |
+
"special": true
|
18 |
+
},
|
19 |
+
"101": {
|
20 |
+
"content": "[CLS]",
|
21 |
+
"lstrip": false,
|
22 |
+
"normalized": false,
|
23 |
+
"rstrip": false,
|
24 |
+
"single_word": false,
|
25 |
+
"special": true
|
26 |
+
},
|
27 |
+
"102": {
|
28 |
+
"content": "[SEP]",
|
29 |
+
"lstrip": false,
|
30 |
+
"normalized": false,
|
31 |
+
"rstrip": false,
|
32 |
+
"single_word": false,
|
33 |
+
"special": true
|
34 |
+
},
|
35 |
+
"103": {
|
36 |
+
"content": "[MASK]",
|
37 |
+
"lstrip": false,
|
38 |
+
"normalized": false,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false,
|
41 |
+
"special": true
|
42 |
+
}
|
43 |
+
},
|
44 |
+
"clean_up_tokenization_spaces": true,
|
45 |
+
"cls_token": "[CLS]",
|
46 |
+
"do_lower_case": false,
|
47 |
+
"mask_token": "[MASK]",
|
48 |
+
"model_max_length": 512,
|
49 |
+
"pad_token": "[PAD]",
|
50 |
+
"sep_token": "[SEP]",
|
51 |
+
"strip_accents": null,
|
52 |
+
"tokenize_chinese_chars": true,
|
53 |
+
"tokenizer_class": "BertTokenizer",
|
54 |
+
"unk_token": "[UNK]"
|
55 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea102f66790e739e3b6975bb83aad447c4b6d3c0bf6a7247e4d6eb698c7aea84
|
3 |
+
size 4283
|
vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|