procne committed on
Commit
1cf22b5
·
1 Parent(s): b5423c5

Training in progress, step 500

Browse files
config.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilgpt2",
3
+ "_num_labels": 1,
4
+ "activation_function": "gelu_new",
5
+ "architectures": [
6
+ "GPT2LMHeadModel"
7
+ ],
8
+ "attn_pdrop": 0.1,
9
+ "bos_token_id": 50256,
10
+ "embd_pdrop": 0.1,
11
+ "eos_token_id": 50256,
12
+ "id2label": {
13
+ "0": "LABEL_0"
14
+ },
15
+ "initializer_range": 0.02,
16
+ "label2id": {
17
+ "LABEL_0": 0
18
+ },
19
+ "layer_norm_epsilon": 1e-05,
20
+ "model_type": "gpt2",
21
+ "n_ctx": 1024,
22
+ "n_embd": 768,
23
+ "n_head": 12,
24
+ "n_inner": null,
25
+ "n_layer": 6,
26
+ "n_positions": 1024,
27
+ "reorder_and_upcast_attn": false,
28
+ "resid_pdrop": 0.1,
29
+ "scale_attn_by_inverse_layer_idx": false,
30
+ "scale_attn_weights": true,
31
+ "summary_activation": null,
32
+ "summary_first_dropout": 0.1,
33
+ "summary_proj_to_labels": true,
34
+ "summary_type": "cls_index",
35
+ "summary_use_proj": true,
36
+ "task_specific_params": {
37
+ "text-generation": {
38
+ "do_sample": true,
39
+ "max_length": 50
40
+ }
41
+ },
42
+ "torch_dtype": "float32",
43
+ "transformers_version": "4.36.1",
44
+ "use_cache": true,
45
+ "vocab_size": 50257
46
+ }
emissions.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ timestamp,project_name,run_id,duration,emissions,emissions_rate,cpu_power,gpu_power,ram_power,cpu_energy,gpu_energy,ram_energy,energy_consumed,country_name,country_iso_code,region,cloud_provider,cloud_region,os,python_version,codecarbon_version,cpu_count,cpu_model,gpu_count,gpu_model,longitude,latitude,ram_total_size,tracking_mode,on_cloud,pue
2
+ 2023-12-26T23:59:38,codecarbon,19dfeae0-e8c5-408e-a43c-9cd14853b3af,89.27425599098206,0.0017050477526745,1.9098985858215876e-05,42.5,296.966,2.868726253509521,0.0010539124945799,0.0071814051923436,7.108294170151245e-05,0.0083064006286251,United States,USA,california,,,Linux-5.15.133.1-microsoft-standard-WSL2-x86_64-with-glibc2.35,3.10.12,2.2.3,24,12th Gen Intel(R) Core(TM) i9-12900K,1,1 x NVIDIA GeForce RTX 3080,-121.487,38.6645,7.649936676025391,machine,N,1.0
3
+ 2023-12-27T00:06:24,codecarbon,c47b5a74-bc90-4c7d-b323-5a3fff8d73d1,88.75363397598267,0.00170033727477682,1.9157945411417663e-05,42.5,297.6,2.8687262535095215,0.0010477749794721605,0.007164999425998463,7.067841039727701e-05,0.0082834528158679,United States,USA,california,,,Linux-5.15.133.1-microsoft-standard-WSL2-x86_64-with-glibc2.35,3.10.12,2.2.3,24,12th Gen Intel(R) Core(TM) i9-12900K,1,1 x NVIDIA GeForce RTX 3080,-121.487,38.6645,7.649936676025391,machine,N,1.0
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50bcbe9a92114ea558080e3c7826d169e2ce83eca607d2f1518482fcf049c231
3
+ size 327657928
runs/Dec26_23-58-03_Mythril/events.out.tfevents.1703663888.Mythril.27641.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a05959a59c969e452fae48a608b6a853ab7cfab5e3ce7a89c785fdb9bc3efc7
3
+ size 6021
runs/Dec26_23-58-03_Mythril/events.out.tfevents.1703664170.Mythril.27641.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3b273deeab7ebc6f01c38f5ad1c5c6bbcaff08784f16455d0c968299c1933cc
3
+ size 359
runs/Dec27_00-04-50_Mythril/events.out.tfevents.1703664296.Mythril.644.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb1df4511d95cca80200a706ed6382959700582c98af03419e2adc8aae19f50a
3
+ size 5125
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ea52d0583410b620c28a293502da096ffc06b6b70f9458ed3892d1f6163b391
3
+ size 4728