loodvanniekerkginkgo commited on
Commit
21f87d6
·
1 Parent(s): 6921c9e

Text edits and added heldout sequences

Browse files
about.py CHANGED
@@ -1,4 +1,4 @@
1
- ABOUT_TEXT = """
2
  ## About this challenge
3
 
4
  We're inviting the ML/bio community to predict developability properties for 244 antibodies from the [GDPa1 dataset](https://huggingface.co/datasets/ginkgo-datapoints/GDPa1).
@@ -8,12 +8,26 @@ We're inviting the ML/bio community to predict developability properties for 244
8
  Antibodies have to be manufacturable, stable in high concentrations, and have low off-target effects.
9
  Properties such as these can often hinder the progression of an antibody to the clinic, and are collectively referred to as 'developability'.
10
  Here we show 5 of these properties and invite the community to submit and develop better predictors, which will be tested out on a heldout private set to assess model generalization.
 
 
 
 
 
 
 
 
 
 
 
 
 
11
 
12
  **How to submit?**
13
 
14
- 1. Download the [GDPa1 dataset](https://huggingface.co/datasets/ginkgo-datapoints/GDPa1)
15
- 2. Make predictions for all the antibody sequences for your property of interest.
16
- 3. Submit a CSV file containing the `"antibody_name"` column and a column from GDPa1 matching the property name you are predicting (e.g. `"antibody_name,Titer"` if you are predicting Titer).
 
17
  There is an example submission file on the "✉️ Submit" tab.
18
 
19
  For the cross-validation metrics (if training only on the GDPa1 dataset), use the `"hierarchical_cluster_IgG_isotype_stratified_fold"` column to split the dataset into folds and make predictions for each of the folds.
@@ -30,13 +44,10 @@ For the heldout private set, we will calculate these results privately at the en
30
 
31
  We'd like to add some more existing models to the leaderboard. Some examples of models we'd like to add:
32
  - ESM embeddings + ridge regression
33
- - Absolute folding stability models
34
  - AbLEF
35
 
36
  If you would like to collaborate with others, start a discussion on the "Community" tab at the top of this page.
37
-
38
- ### FAQs
39
-
40
  """
41
  # Note(Lood): Let's track these FAQs in the main Google Doc and have that remain the source of truth.
42
  FAQS = {
 
1
+ ABOUT_INTRO = """
2
  ## About this challenge
3
 
4
  We're inviting the ML/bio community to predict developability properties for 244 antibodies from the [GDPa1 dataset](https://huggingface.co/datasets/ginkgo-datapoints/GDPa1).
 
8
  Antibodies have to be manufacturable, stable in high concentrations, and have low off-target effects.
9
  Properties such as these can often hinder the progression of an antibody to the clinic, and are collectively referred to as 'developability'.
10
  Here we show 5 of these properties and invite the community to submit and develop better predictors, which will be tested out on a heldout private set to assess model generalization.
11
+ """
12
+
13
+ ABOUT_TEXT = """
14
+
15
+ **How to participate?**
16
+
17
+ There are two tracks to the competition:
18
+ - Track 1: If you already have a developability model, you can submit your predictions for the GDPa1 dataset.
19
+ - Track 2: If you don't have a model, train one using cross-validaiton on the GDPa1 dataset and submit your predictions under the "Cross-validation" option.
20
+ This will provide you with a more accurate estimate of your model's performance on the private test set.
21
+
22
+ Finally, submit your predictions on the heldout private test set. This will not appear on the leaderboard, and will be used to determine the winners at the close of the competition.
23
+ There may be some points during the competition where we will release current results on the private test set.
24
 
25
  **How to submit?**
26
 
27
+ 1. Create a Hugging Face account if you don't have one yet (this is used to track unique submissions).
28
+ 2. Download the [GDPa1 dataset](https://huggingface.co/datasets/ginkgo-datapoints/GDPa1)
29
+ 3. Make predictions for all the antibody sequences for your property of interest.
30
+ 4. Submit a CSV file containing the `"antibody_name"` column and a column from GDPa1 matching the property name you are predicting (e.g. `"antibody_name,Titer"` if you are predicting Titer).
31
  There is an example submission file on the "✉️ Submit" tab.
32
 
33
  For the cross-validation metrics (if training only on the GDPa1 dataset), use the `"hierarchical_cluster_IgG_isotype_stratified_fold"` column to split the dataset into folds and make predictions for each of the folds.
 
44
 
45
  We'd like to add some more existing models to the leaderboard. Some examples of models we'd like to add:
46
  - ESM embeddings + ridge regression
47
+ - Absolute folding stability models (for Thermostability)
48
  - AbLEF
49
 
50
  If you would like to collaborate with others, start a discussion on the "Community" tab at the top of this page.
 
 
 
51
  """
52
  # Note(Lood): Let's track these FAQs in the main Google Doc and have that remain the source of truth.
53
  FAQS = {
app.py CHANGED
@@ -12,7 +12,7 @@ from constants import (
12
  EXAMPLE_FILE_DICT,
13
  LEADERBOARD_DISPLAY_COLUMNS,
14
  )
15
- from about import ABOUT_TEXT, FAQS
16
  from submit import make_submission
17
 
18
  def format_leaderboard_table(df_results: pd.DataFrame, assay: str | None = None):
@@ -80,7 +80,10 @@ with gr.Blocks() as demo:
80
  show_download_button=False,
81
  width="50vw", # 50% of the "viewport width"
82
  )
 
 
83
  gr.Markdown(ABOUT_TEXT)
 
84
  for i, (question, answer) in enumerate(FAQS.items()):
85
  # Would love to make questions bold but accordion doesn't support it
86
  question = f"{i+1}. {question}"
@@ -215,6 +218,7 @@ with gr.Blocks() as demo:
215
  """
216
  <div style="text-align: center; font-size: 14px; color: gray; margin-top: 2em;">
217
  📬 For questions or feedback, contact <a href="mailto:[email protected]">[email protected]</a> or visit the Community tab at the top of this page.
 
218
  </div>
219
  """,
220
  elem_id="contact-footer",
 
12
  EXAMPLE_FILE_DICT,
13
  LEADERBOARD_DISPLAY_COLUMNS,
14
  )
15
+ from about import ABOUT_INTRO, ABOUT_TEXT, FAQS
16
  from submit import make_submission
17
 
18
  def format_leaderboard_table(df_results: pd.DataFrame, assay: str | None = None):
 
80
  show_download_button=False,
81
  width="50vw", # 50% of the "viewport width"
82
  )
83
+ gr.Markdown(ABOUT_INTRO)
84
+ gr.Image(value="./assets/prediction_explainer.png", show_label=False, show_download_button=False, width="50vw")
85
  gr.Markdown(ABOUT_TEXT)
86
+ gr.Markdown("### FAQs")
87
  for i, (question, answer) in enumerate(FAQS.items()):
88
  # Would love to make questions bold but accordion doesn't support it
89
  question = f"{i+1}. {question}"
 
218
  """
219
  <div style="text-align: center; font-size: 14px; color: gray; margin-top: 2em;">
220
  📬 For questions or feedback, contact <a href="mailto:[email protected]">[email protected]</a> or visit the Community tab at the top of this page.
221
+ Visit the <a href="https://datapoints.ginkgo.bio/ai-competitions/2025-abdev-competition">Competition Registration page</a> to sign up for updates and to register a team.
222
  </div>
223
  """,
224
  elem_id="contact-footer",
constants.py CHANGED
@@ -41,12 +41,14 @@ CV_COLUMN = "hierarchical_cluster_IgG_isotype_stratified_fold"
41
  EXAMPLE_FILE_DICT = {
42
  "GDPa1": "data/example-predictions.csv",
43
  "GDPa1_cross_validation": "data/example-predictions-cv.csv",
 
44
  }
45
  ANTIBODY_NAMES_DICT = {
46
  "GDPa1": pd.read_csv(EXAMPLE_FILE_DICT["GDPa1"])["antibody_name"].tolist(),
47
  "GDPa1_cross_validation": pd.read_csv(EXAMPLE_FILE_DICT["GDPa1_cross_validation"])[
48
  "antibody_name"
49
  ].tolist(),
 
50
  }
51
 
52
  # Huggingface API
 
41
  EXAMPLE_FILE_DICT = {
42
  "GDPa1": "data/example-predictions.csv",
43
  "GDPa1_cross_validation": "data/example-predictions-cv.csv",
44
+ "heldout_test": "data/example-predictions-heldout.csv",
45
  }
46
  ANTIBODY_NAMES_DICT = {
47
  "GDPa1": pd.read_csv(EXAMPLE_FILE_DICT["GDPa1"])["antibody_name"].tolist(),
48
  "GDPa1_cross_validation": pd.read_csv(EXAMPLE_FILE_DICT["GDPa1_cross_validation"])[
49
  "antibody_name"
50
  ].tolist(),
51
+ "heldout_test": pd.read_csv(EXAMPLE_FILE_DICT["heldout_test"])["antibody_name"].tolist(), # TODO add a test for this validation
52
  }
53
 
54
  # Huggingface API
data/metrics_all.csv DELETED
@@ -1,26 +0,0 @@
1
- assay,model,spearman,spearman_cross_val,top_10_recall,top_10_recall_cross_val
2
- HIC,Aggrescan3D - aggrescan_average_score,0.422834774225429,,0.3333333333333333,
3
- AC-SINS_pH7.4,TAP - linear regression,0.4019194824087021,0.3401456689218918,0.375,0.2799999999999999
4
- HIC,TAP - linear regression,0.3622075317102941,0.2222991438172065,0.4166666666666667,0.43
5
- AC-SINS_pH7.4,TAP - PNC,0.358762795727933,,0.2916666666666667,
6
- HIC,Aggrescan3D - aggrescan_90_score,0.3585224061081473,,0.2083333333333333,
7
- PR_CHO,Saprot_VH - solubility_probability,0.3365516014806938,,0.0833333333333333,
8
- AC-SINS_pH7.4,TAP - SFvCSP,0.3203773185543964,,0.2083333333333333,
9
- HIC,Aggrescan3D - aggrescan_max_score,0.3044160918625593,,0.2083333333333333,
10
- PR_CHO,TAP - linear regression,0.260631929274264,0.1560705020744792,0.8333333333333334,0.47
11
- HIC,TAP - SFvCSP,0.2450651623577951,,0.2083333333333333,
12
- PR_CHO,TAP - SFvCSP,0.2381972244142228,,0.0,
13
- Tm2,Saprot_VH - stability_score,0.1924791603648384,,0.1666666666666666,
14
- HIC,TAP - CDR Length,0.1923458958277369,,0.0833333333333333,
15
- Titer,AntiFold,0.1878766623808878,,0.0833333333333333,
16
- HIC,DeepViscosity,0.18059398754127,,0.0416666666666666,
17
- AC-SINS_pH7.4,TAP - PPC,0.1691412287169806,,0.0833333333333333,
18
- Titer,TAP - linear regression,0.1682403605307924,0.1129210260701206,0.3333333333333333,0.38
19
- PR_CHO,TAP - PNC,0.151234196032203,,0.0416666666666666,
20
- AC-SINS_pH7.4,TAP - CDR Length,0.1501689804134715,,0.0,
21
- Titer,TAP - PPC,0.1423756688786398,,0.0833333333333333,
22
- PR_CHO,Aggrescan3D - aggrescan_max_score,0.1406309504998865,,0.0833333333333333,
23
- Tm2,AntiFold,0.1218057192943458,,0.125,
24
- HIC,hic_model_name,0.1144051722170351,0.1511895582680471,0.1666666666666666,0.05
25
- Tm2,TAP - linear regression,0.0844935706523633,-0.1153965363405958,0.6666666666666666,0.64
26
- HIC,Aggrescan3D - aggrescan_cdrh3_average_score,0.0747719620306879,,0.25,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
data/metrics_all_including_low_spearman.csv DELETED
@@ -1,157 +0,0 @@
1
- feature,assay,spearman,model,spearman_abs
2
- SFvCSP - tap,HAC,0.6788395883949475,tap,0.6788395883949475
3
- PPC - tap,HAC,0.4820800038128454,tap,0.4820800038128454
4
- aggrescan_average_score,HIC,0.3717330854283424,Aggrescan3D,0.3717330854283424
5
- SFvCSP - tap,PR_Ova,0.3706710402488808,tap,0.3706710402488808
6
- Viscosity - deep-viscosity,HAC,-0.3683390278828955,DeepViscosity,0.3683390278828955
7
- aggrescan_average_score,SMAC,0.3643128778304258,Aggrescan3D,0.3643128778304258
8
- PNC - tap,AC-SINS_pH7.4,-0.358762795727933,tap,0.358762795727933
9
- aggrescan_90_score,HIC,0.3572823382390205,Aggrescan3D,0.3572823382390205
10
- solubility_probability - saprot,PR_CHO,0.3365516014806938,saprot,0.3365516014806938
11
- PNC - tap,HAC,-0.3206575607459202,tap,0.3206575607459202
12
- SFvCSP - tap,AC-SINS_pH7.4,0.3203773185543964,tap,0.3203773185543964
13
- PNC - tap,PR_Ova,-0.2932051856162034,tap,0.2932051856162034
14
- aggrescan_90_score,SMAC,0.2852401926417188,Aggrescan3D,0.2852401926417188
15
- aggrescan_max_score,SMAC,0.2720151775798609,Aggrescan3D,0.2720151775798609
16
- aggrescan_max_score,HIC,0.2579163714894611,Aggrescan3D,0.2579163714894611
17
- stability_score - saprot,HAC,0.2482190338151043,saprot,0.2482190338151043
18
- SFvCSP - tap,HIC,-0.2450651623577951,tap,0.2450651623577951
19
- aggrescan_max_score,PR_CHO,-0.24241781163854,Aggrescan3D,0.24241781163854
20
- SFvCSP - tap,PR_CHO,0.2381972244142228,tap,0.2381972244142228
21
- PNC - tap,AC-SINS_pH6.0,-0.2185768523842327,tap,0.2185768523842327
22
- PPC - tap,PR_Ova,0.205520359496246,tap,0.205520359496246
23
- aggrescan_max_score,PR_Ova,-0.1983067762197625,Aggrescan3D,0.1983067762197625
24
- stability_score - saprot,Tm2,-0.1924791603648384,saprot,0.1924791603648384
25
- CDR Length - tap,HIC,0.1923458958277369,tap,0.1923458958277369
26
- solubility_probability - saprot,PR_Ova,0.1859602281879885,saprot,0.1859602281879885
27
- PPC - tap,HIC,-0.1839687842860175,tap,0.1839687842860175
28
- aggrescan_cdrh3_average_score,Titer,0.1814699248452822,Aggrescan3D,0.1814699248452822
29
- Viscosity - deep-viscosity,HIC,0.18059398754127,DeepViscosity,0.18059398754127
30
- PPC - tap,SEC %Monomer,0.179898358348615,tap,0.179898358348615
31
- Viscosity - deep-viscosity,PR_Ova,-0.1792011299598071,DeepViscosity,0.1792011299598071
32
- aggrescan_cdrh3_average_score,Purity,-0.1774879106041495,Aggrescan3D,0.1774879106041495
33
- CDR Length - tap,SMAC,0.1753482083680697,tap,0.1753482083680697
34
- PPC - tap,Purity,-0.1743385504957838,tap,0.1743385504957838
35
- PPC - tap,Tm1,0.1717910377244919,tap,0.1717910377244919
36
- PPC - tap,AC-SINS_pH7.4,0.1691412287169806,tap,0.1691412287169806
37
- PNC - tap,SMAC,-0.1647616991330237,tap,0.1647616991330237
38
- SFvCSP - tap,AC-SINS_pH6.0,0.1631061026200202,tap,0.1631061026200202
39
- aggrescan_90_score,PR_Ova,-0.1630725493267146,Aggrescan3D,0.1630725493267146
40
- aggrescan_cdrh3_average_score,HAC,-0.1621653601888134,Aggrescan3D,0.1621653601888134
41
- aggrescan_90_score,PR_CHO,-0.1602601604994121,Aggrescan3D,0.1602601604994121
42
- PNC - tap,PR_CHO,-0.151234196032203,tap,0.151234196032203
43
- CDR Length - tap,AC-SINS_pH7.4,-0.1501689804134715,tap,0.1501689804134715
44
- stability_score - saprot,PR_CHO,0.1482133956646727,saprot,0.1482133956646727
45
- PPC - tap,AC-SINS_pH6.0,0.1448272149205899,tap,0.1448272149205899
46
- SFvCSP - tap,Tm1,0.1426983792732488,tap,0.1426983792732488
47
- PPC - tap,Titer,0.1423756688786398,tap,0.1423756688786398
48
- PNC - tap,SEC %Monomer,-0.1345634135302046,tap,0.1345634135302046
49
- aggrescan_average_score,HAC,-0.1311020701331903,Aggrescan3D,0.1311020701331903
50
- aggrescan_cdrh3_average_score,Tm2,-0.1295581308418123,Aggrescan3D,0.1295581308418123
51
- PSH - tap,HAC,0.1269358458430945,tap,0.1269358458430945
52
- aggrescan_cdrh3_average_score,AC-SINS_pH6.0,0.1241248052844776,Aggrescan3D,0.1241248052844776
53
- aggrescan_average_score,PR_Ova,-0.1225803596842919,Aggrescan3D,0.1225803596842919
54
- solubility_probability - saprot,Purity,0.120581879119953,saprot,0.120581879119953
55
- aggrescan_90_score,AC-SINS_pH6.0,-0.1156038989665139,Aggrescan3D,0.1156038989665139
56
- Viscosity - deep-viscosity,PR_CHO,-0.1125214482263828,DeepViscosity,0.1125214482263828
57
- aggrescan_cdrh3_average_score,HIC,0.1109333602778311,Aggrescan3D,0.1109333602778311
58
- PNC - tap,Tm1,-0.1094376940826625,tap,0.1094376940826625
59
- PNC - tap,Titer,-0.1043862069630446,tap,0.1043862069630446
60
- aggrescan_90_score,HAC,-0.1029367717205433,Aggrescan3D,0.1029367717205433
61
- PPC - tap,Tonset,0.1024480318260903,tap,0.1024480318260903
62
- aggrescan_average_score,Tm1,0.0984625979382824,Aggrescan3D,0.0984625979382824
63
- SFvCSP - tap,Purity,-0.0979379393217746,tap,0.0979379393217746
64
- solubility_probability - saprot,Tm2,-0.0978456145482691,saprot,0.0978456145482691
65
- SFvCSP - tap,SEC %Monomer,0.096650605592591,tap,0.096650605592591
66
- Viscosity - deep-viscosity,Tm2,0.093745084007507,DeepViscosity,0.093745084007507
67
- PNC - tap,Tonset,-0.0925140513893314,tap,0.0925140513893314
68
- aggrescan_90_score,Titer,-0.0888890152050186,Aggrescan3D,0.0888890152050186
69
- PPC - tap,PR_CHO,0.0885325199884014,tap,0.0885325199884014
70
- Viscosity - deep-viscosity,SMAC,0.0883647279655625,DeepViscosity,0.0883647279655625
71
- PPC - tap,SMAC,-0.0881450436285762,tap,0.0881450436285762
72
- SFvCSP - tap,Tonset,0.0869080829604942,tap,0.0869080829604942
73
- aggrescan_average_score,Purity,-0.0855300736249475,Aggrescan3D,0.0855300736249475
74
- PSH - tap,PR_Ova,0.0851843571887952,tap,0.0851843571887952
75
- solubility_probability - saprot,HAC,-0.0849192244020849,saprot,0.0849192244020849
76
- stability_score - saprot,PR_Ova,0.0844385315275266,saprot,0.0844385315275266
77
- aggrescan_average_score,PR_CHO,-0.082335263587056,Aggrescan3D,0.082335263587056
78
- CDR Length - tap,HAC,-0.0807572482895502,tap,0.0807572482895502
79
- Viscosity - deep-viscosity,AC-SINS_pH7.4,-0.0803879126171943,DeepViscosity,0.0803879126171943
80
- SFvCSP - tap,Titer,0.0797623802296775,tap,0.0797623802296775
81
- aggrescan_average_score,AC-SINS_pH7.4,0.078198839245547,Aggrescan3D,0.078198839245547
82
- aggrescan_max_score,Tonset,-0.0758666681469678,Aggrescan3D,0.0758666681469678
83
- stability_score - saprot,SMAC,-0.0752343621503858,saprot,0.0752343621503858
84
- stability_score - saprot,Tonset,-0.0738992116600914,saprot,0.0738992116600914
85
- stability_score - saprot,SEC %Monomer,-0.0733865038928551,saprot,0.0733865038928551
86
- CDR Length - tap,Tm2,-0.0729274519946903,tap,0.0729274519946903
87
- CDR Length - tap,SEC %Monomer,-0.0720782456119583,tap,0.0720782456119583
88
- stability_score - saprot,AC-SINS_pH7.4,0.0718305679545067,saprot,0.0718305679545067
89
- solubility_probability - saprot,Tonset,-0.0707794898935402,saprot,0.0707794898935402
90
- CDR Length - tap,Tonset,-0.0697571003932752,tap,0.0697571003932752
91
- solubility_probability - saprot,AC-SINS_pH6.0,0.0669921910968805,saprot,0.0669921910968805
92
- PSH - tap,SMAC,-0.0668504875953866,tap,0.0668504875953866
93
- CDR Length - tap,AC-SINS_pH6.0,-0.0662557372283483,tap,0.0662557372283483
94
- aggrescan_90_score,Purity,-0.0642609945737365,Aggrescan3D,0.0642609945737365
95
- CDR Length - tap,Purity,0.0640138427858363,tap,0.0640138427858363
96
- aggrescan_cdrh3_average_score,PR_CHO,-0.0639580648777149,Aggrescan3D,0.0639580648777149
97
- PSH - tap,Titer,-0.0638862853735791,tap,0.0638862853735791
98
- Viscosity - deep-viscosity,Titer,-0.0636053342823435,DeepViscosity,0.0636053342823435
99
- stability_score - saprot,HIC,-0.0625972585374469,saprot,0.0625972585374469
100
- stability_score - saprot,Titer,0.0607177541361877,saprot,0.0607177541361877
101
- aggrescan_average_score,Tonset,0.0532502341076833,Aggrescan3D,0.0532502341076833
102
- CDR Length - tap,PR_CHO,-0.0524556823713343,tap,0.0524556823713343
103
- aggrescan_90_score,AC-SINS_pH7.4,-0.0509589937861982,Aggrescan3D,0.0509589937861982
104
- PSH - tap,SEC %Monomer,-0.0487785361924088,tap,0.0487785361924088
105
- PNC - tap,Tm2,-0.0482259337861972,tap,0.0482259337861972
106
- SFvCSP - tap,SMAC,-0.0479604170867368,tap,0.0479604170867368
107
- CDR Length - tap,Tm1,0.0470910111346684,tap,0.0470910111346684
108
- PSH - tap,HIC,-0.0464732086283245,tap,0.0464732086283245
109
- aggrescan_cdrh3_average_score,SMAC,0.0462084030163925,Aggrescan3D,0.0462084030163925
110
- stability_score - saprot,Tm1,-0.0461587451740238,saprot,0.0461587451740238
111
- aggrescan_max_score,AC-SINS_pH6.0,-0.0422041355140005,Aggrescan3D,0.0422041355140005
112
- Viscosity - deep-viscosity,Tm1,0.0418758583153736,DeepViscosity,0.0418758583153736
113
- CDR Length - tap,Titer,-0.0415639454664855,tap,0.0415639454664855
114
- Viscosity - deep-viscosity,AC-SINS_pH6.0,-0.0391995375434282,DeepViscosity,0.0391995375434282
115
- aggrescan_max_score,SEC %Monomer,0.0384606168278266,Aggrescan3D,0.0384606168278266
116
- aggrescan_max_score,Purity,0.0377965473734412,Aggrescan3D,0.0377965473734412
117
- aggrescan_cdrh3_average_score,Tonset,-0.0371645511788307,Aggrescan3D,0.0371645511788307
118
- stability_score - saprot,AC-SINS_pH6.0,0.0363459090170338,saprot,0.0363459090170338
119
- PSH - tap,AC-SINS_pH7.4,-0.0360881689253704,tap,0.0360881689253704
120
- solubility_probability - saprot,Tm1,-0.0359790946528558,saprot,0.0359790946528558
121
- aggrescan_average_score,SEC %Monomer,0.0329005393127016,Aggrescan3D,0.0329005393127016
122
- solubility_probability - saprot,AC-SINS_pH7.4,0.0320374764320225,saprot,0.0320374764320225
123
- stability_score - saprot,Purity,0.0319067204658559,saprot,0.0319067204658559
124
- solubility_probability - saprot,HIC,0.0318219345388521,saprot,0.0318219345388521
125
- PSH - tap,Tm2,-0.0317350623491362,tap,0.0317350623491362
126
- aggrescan_average_score,Tm2,-0.0312770789755912,Aggrescan3D,0.0312770789755912
127
- aggrescan_cdrh3_average_score,AC-SINS_pH7.4,0.0305591682601827,Aggrescan3D,0.0305591682601827
128
- aggrescan_max_score,Tm1,-0.0301284126829971,Aggrescan3D,0.0301284126829971
129
- aggrescan_cdrh3_average_score,Tm1,-0.0293641493096082,Aggrescan3D,0.0293641493096082
130
- aggrescan_90_score,Tm1,0.0279545108349369,Aggrescan3D,0.0279545108349369
131
- aggrescan_average_score,AC-SINS_pH6.0,0.0271292409530908,Aggrescan3D,0.0271292409530908
132
- PSH - tap,Tonset,0.0258012823141481,tap,0.0258012823141481
133
- solubility_probability - saprot,SEC %Monomer,-0.0255220000167489,saprot,0.0255220000167489
134
- aggrescan_cdrh3_average_score,SEC %Monomer,-0.0242523887163972,Aggrescan3D,0.0242523887163972
135
- aggrescan_max_score,HAC,-0.0238463005336014,Aggrescan3D,0.0238463005336014
136
- Viscosity - deep-viscosity,SEC %Monomer,-0.0226036392916792,DeepViscosity,0.0226036392916792
137
- aggrescan_max_score,Titer,-0.0218947825112391,Aggrescan3D,0.0218947825112391
138
- PSH - tap,PR_CHO,0.0209381900169799,tap,0.0209381900169799
139
- aggrescan_max_score,Tm2,-0.0199308718790671,Aggrescan3D,0.0199308718790671
140
- PSH - tap,Purity,-0.0198292183035963,tap,0.0198292183035963
141
- CDR Length - tap,PR_Ova,-0.0191507855521124,tap,0.0191507855521124
142
- SFvCSP - tap,Tm2,-0.0179541460075494,tap,0.0179541460075494
143
- aggrescan_max_score,AC-SINS_pH7.4,0.0177424118352705,Aggrescan3D,0.0177424118352705
144
- Viscosity - deep-viscosity,Purity,-0.0164122333153846,DeepViscosity,0.0164122333153846
145
- PSH - tap,Tm1,0.0149070260126188,tap,0.0149070260126188
146
- PNC - tap,HIC,0.0102627218889135,tap,0.0102627218889135
147
- PPC - tap,Tm2,-0.0098872681569066,tap,0.0098872681569066
148
- PNC - tap,Purity,0.0096311210026764,tap,0.0096311210026764
149
- aggrescan_90_score,SEC %Monomer,-0.0069533060784548,Aggrescan3D,0.0069533060784548
150
- solubility_probability - saprot,Titer,-0.0068735643986468,saprot,0.0068735643986468
151
- aggrescan_cdrh3_average_score,PR_Ova,-0.0057045278689166,Aggrescan3D,0.0057045278689166
152
- Viscosity - deep-viscosity,Tonset,-0.0052886682383666,DeepViscosity,0.0052886682383666
153
- aggrescan_90_score,Tm2,0.0014898396535596,Aggrescan3D,0.0014898396535596
154
- aggrescan_90_score,Tonset,-0.0012258917323618,Aggrescan3D,0.0012258917323618
155
- solubility_probability - saprot,SMAC,-0.0008774163836285,saprot,0.0008774163836285
156
- aggrescan_average_score,Titer,-0.0003490541872287,Aggrescan3D,0.0003490541872287
157
- PSH - tap,AC-SINS_pH6.0,-6.566404038227427e-05,tap,6.566404038227427e-05
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
utils.py CHANGED
@@ -1,4 +1,3 @@
1
- from datetime import datetime, timezone, timedelta
2
  import pandas as pd
3
  from datasets import load_dataset
4
  import gradio as gr
@@ -13,9 +12,10 @@ def show_output_box(message):
13
 
14
 
15
  def fetch_hf_results():
16
- # Print current time in EST
17
- EST = timezone(timedelta(hours=-4))
18
- print(f"tmp: Fetching results from HF at {datetime.now(EST)}")
 
19
  # Should cache by default if not using force_redownload
20
  df = load_dataset(
21
  RESULTS_REPO, data_files="auto_submissions/metrics_all.csv",
 
 
1
  import pandas as pd
2
  from datasets import load_dataset
3
  import gradio as gr
 
12
 
13
 
14
  def fetch_hf_results():
15
+ # For debugging
16
+ # # Print current time in EST
17
+ # EST = timezone(timedelta(hours=-4))
18
+ # print(f"tmp: Fetching results from HF at {datetime.now(EST)}")
19
  # Should cache by default if not using force_redownload
20
  df = load_dataset(
21
  RESULTS_REPO, data_files="auto_submissions/metrics_all.csv",