Spaces:

distributed
/

model_convergence

Sleeping

kmfoda committed on Oct 4, 2024

Commit

3e82d9d

1 Parent(s): d1c9a3c

Update current results

Files changed (3)

app.py CHANGED Viewed

@@ -58,7 +58,7 @@ with demo:
         dropdown_1 = gr.Dropdown(choices = models, value = models[0])
         button_1 = gr.Button("Submit")
     with gr.Row():
-        chart = gr.LinePlot(df, "Step", "Loss", color="Test", x_lim = (0, 3000))
     button_1.click(return_results, dropdown_1, chart)

         dropdown_1 = gr.Dropdown(choices = models, value = models[0])
         button_1 = gr.Button("Submit")
     with gr.Row():
+        chart = gr.LinePlot(df, "Step", "Loss", color="Test", x_lim = (0, max(df['Step'])))
     button_1.click(return_results, dropdown_1, chart)

evaluate.py CHANGED Viewed

@@ -10,7 +10,7 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
 device = "cuda"
 test_indices_length = 1000
-models = ["distributed/optimized-gpt2-250m", "distributed/optimized-gpt2-250m-v0.1.1", "distributed/gpt2-94m"]
 if os.path.exists("results.json"):
     with open('results.json', 'r') as file:
@@ -28,7 +28,7 @@ for model_name in models:
     refs = list_repo_refs(model_name, repo_type="model")
     global_epoch = max([int(tag.name) for tag in refs.tags]) if refs.tags else None
-    for epoch in range(0,global_epoch, 5):
         if str(epoch) in results[model_name]['main-net'].keys():
             continue

 device = "cuda"
 test_indices_length = 1000
+models = ["distributed/optimized-gpt2-250m", "distributed/optimized-gpt2-250m-v0.1.3", "distributed/optimized-gpt2-250m-v0.1.1", "distributed/gpt2-94m"]
 if os.path.exists("results.json"):
     with open('results.json', 'r') as file:
     refs = list_repo_refs(model_name, repo_type="model")
     global_epoch = max([int(tag.name) for tag in refs.tags]) if refs.tags else None
+    for epoch in range(0,global_epoch, 1):
         if str(epoch) in results[model_name]['main-net'].keys():
             continue

results.json CHANGED Viewed

@@ -1,6 +1,55 @@
 {
     "distributed/optimized-gpt2-250m": {
-        "main-net": {},
         "baseline": {
             "0": [
                 10.95511245727539

 {
     "distributed/optimized-gpt2-250m": {
+        "main-net": {
+            "0": [
+                10.996320237222296
+            ],
+            "1": [
+                10.96618640299416
+            ],
+            "2": [
+                10.90651673192917
+            ],
+            "3": [
+                10.81940748757928
+            ],
+            "4": [
+                10.712032748685024
+            ],
+            "5": [
+                10.591520558323776
+            ],
+            "6": [
+                10.446569502482404
+            ],
+            "7": [
+                10.32113439958174
+            ],
+            "8": [
+                10.1767857876407
+            ],
+            "9": [
+                10.047991905456934
+            ],
+            "10": [
+                9.923473688189903
+            ],
+            "11": [
+                9.804602791635613
+            ],
+            "12": [
+                9.697358704748607
+            ],
+            "13": [
+                9.610764950228923
+            ],
+            "14": [
+                9.533995848289777
+            ],
+            "15": [
+                9.494339939102112
+            ]
+        },
         "baseline": {
             "0": [
                 10.95511245727539