Commit
·
21f87d6
1
Parent(s):
6921c9e
Text edits and added heldout sequences
Browse files- about.py +19 -8
- app.py +5 -1
- constants.py +2 -0
- data/metrics_all.csv +0 -26
- data/metrics_all_including_low_spearman.csv +0 -157
- utils.py +4 -4
about.py
CHANGED
@@ -1,4 +1,4 @@
|
|
1 |
-
|
2 |
## About this challenge
|
3 |
|
4 |
We're inviting the ML/bio community to predict developability properties for 244 antibodies from the [GDPa1 dataset](https://huggingface.co/datasets/ginkgo-datapoints/GDPa1).
|
@@ -8,12 +8,26 @@ We're inviting the ML/bio community to predict developability properties for 244
|
|
8 |
Antibodies have to be manufacturable, stable in high concentrations, and have low off-target effects.
|
9 |
Properties such as these can often hinder the progression of an antibody to the clinic, and are collectively referred to as 'developability'.
|
10 |
Here we show 5 of these properties and invite the community to submit and develop better predictors, which will be tested out on a heldout private set to assess model generalization.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
11 |
|
12 |
**How to submit?**
|
13 |
|
14 |
-
1.
|
15 |
-
2.
|
16 |
-
3.
|
|
|
17 |
There is an example submission file on the "✉️ Submit" tab.
|
18 |
|
19 |
For the cross-validation metrics (if training only on the GDPa1 dataset), use the `"hierarchical_cluster_IgG_isotype_stratified_fold"` column to split the dataset into folds and make predictions for each of the folds.
|
@@ -30,13 +44,10 @@ For the heldout private set, we will calculate these results privately at the en
|
|
30 |
|
31 |
We'd like to add some more existing models to the leaderboard. Some examples of models we'd like to add:
|
32 |
- ESM embeddings + ridge regression
|
33 |
-
- Absolute folding stability models
|
34 |
- AbLEF
|
35 |
|
36 |
If you would like to collaborate with others, start a discussion on the "Community" tab at the top of this page.
|
37 |
-
|
38 |
-
### FAQs
|
39 |
-
|
40 |
"""
|
41 |
# Note(Lood): Let's track these FAQs in the main Google Doc and have that remain the source of truth.
|
42 |
FAQS = {
|
|
|
1 |
+
ABOUT_INTRO = """
|
2 |
## About this challenge
|
3 |
|
4 |
We're inviting the ML/bio community to predict developability properties for 244 antibodies from the [GDPa1 dataset](https://huggingface.co/datasets/ginkgo-datapoints/GDPa1).
|
|
|
8 |
Antibodies have to be manufacturable, stable in high concentrations, and have low off-target effects.
|
9 |
Properties such as these can often hinder the progression of an antibody to the clinic, and are collectively referred to as 'developability'.
|
10 |
Here we show 5 of these properties and invite the community to submit and develop better predictors, which will be tested out on a heldout private set to assess model generalization.
|
11 |
+
"""
|
12 |
+
|
13 |
+
ABOUT_TEXT = """
|
14 |
+
|
15 |
+
**How to participate?**
|
16 |
+
|
17 |
+
There are two tracks to the competition:
|
18 |
+
- Track 1: If you already have a developability model, you can submit your predictions for the GDPa1 dataset.
|
19 |
+
- Track 2: If you don't have a model, train one using cross-validaiton on the GDPa1 dataset and submit your predictions under the "Cross-validation" option.
|
20 |
+
This will provide you with a more accurate estimate of your model's performance on the private test set.
|
21 |
+
|
22 |
+
Finally, submit your predictions on the heldout private test set. This will not appear on the leaderboard, and will be used to determine the winners at the close of the competition.
|
23 |
+
There may be some points during the competition where we will release current results on the private test set.
|
24 |
|
25 |
**How to submit?**
|
26 |
|
27 |
+
1. Create a Hugging Face account if you don't have one yet (this is used to track unique submissions).
|
28 |
+
2. Download the [GDPa1 dataset](https://huggingface.co/datasets/ginkgo-datapoints/GDPa1)
|
29 |
+
3. Make predictions for all the antibody sequences for your property of interest.
|
30 |
+
4. Submit a CSV file containing the `"antibody_name"` column and a column from GDPa1 matching the property name you are predicting (e.g. `"antibody_name,Titer"` if you are predicting Titer).
|
31 |
There is an example submission file on the "✉️ Submit" tab.
|
32 |
|
33 |
For the cross-validation metrics (if training only on the GDPa1 dataset), use the `"hierarchical_cluster_IgG_isotype_stratified_fold"` column to split the dataset into folds and make predictions for each of the folds.
|
|
|
44 |
|
45 |
We'd like to add some more existing models to the leaderboard. Some examples of models we'd like to add:
|
46 |
- ESM embeddings + ridge regression
|
47 |
+
- Absolute folding stability models (for Thermostability)
|
48 |
- AbLEF
|
49 |
|
50 |
If you would like to collaborate with others, start a discussion on the "Community" tab at the top of this page.
|
|
|
|
|
|
|
51 |
"""
|
52 |
# Note(Lood): Let's track these FAQs in the main Google Doc and have that remain the source of truth.
|
53 |
FAQS = {
|
app.py
CHANGED
@@ -12,7 +12,7 @@ from constants import (
|
|
12 |
EXAMPLE_FILE_DICT,
|
13 |
LEADERBOARD_DISPLAY_COLUMNS,
|
14 |
)
|
15 |
-
from about import ABOUT_TEXT, FAQS
|
16 |
from submit import make_submission
|
17 |
|
18 |
def format_leaderboard_table(df_results: pd.DataFrame, assay: str | None = None):
|
@@ -80,7 +80,10 @@ with gr.Blocks() as demo:
|
|
80 |
show_download_button=False,
|
81 |
width="50vw", # 50% of the "viewport width"
|
82 |
)
|
|
|
|
|
83 |
gr.Markdown(ABOUT_TEXT)
|
|
|
84 |
for i, (question, answer) in enumerate(FAQS.items()):
|
85 |
# Would love to make questions bold but accordion doesn't support it
|
86 |
question = f"{i+1}. {question}"
|
@@ -215,6 +218,7 @@ with gr.Blocks() as demo:
|
|
215 |
"""
|
216 |
<div style="text-align: center; font-size: 14px; color: gray; margin-top: 2em;">
|
217 |
📬 For questions or feedback, contact <a href="mailto:[email protected]">[email protected]</a> or visit the Community tab at the top of this page.
|
|
|
218 |
</div>
|
219 |
""",
|
220 |
elem_id="contact-footer",
|
|
|
12 |
EXAMPLE_FILE_DICT,
|
13 |
LEADERBOARD_DISPLAY_COLUMNS,
|
14 |
)
|
15 |
+
from about import ABOUT_INTRO, ABOUT_TEXT, FAQS
|
16 |
from submit import make_submission
|
17 |
|
18 |
def format_leaderboard_table(df_results: pd.DataFrame, assay: str | None = None):
|
|
|
80 |
show_download_button=False,
|
81 |
width="50vw", # 50% of the "viewport width"
|
82 |
)
|
83 |
+
gr.Markdown(ABOUT_INTRO)
|
84 |
+
gr.Image(value="./assets/prediction_explainer.png", show_label=False, show_download_button=False, width="50vw")
|
85 |
gr.Markdown(ABOUT_TEXT)
|
86 |
+
gr.Markdown("### FAQs")
|
87 |
for i, (question, answer) in enumerate(FAQS.items()):
|
88 |
# Would love to make questions bold but accordion doesn't support it
|
89 |
question = f"{i+1}. {question}"
|
|
|
218 |
"""
|
219 |
<div style="text-align: center; font-size: 14px; color: gray; margin-top: 2em;">
|
220 |
📬 For questions or feedback, contact <a href="mailto:[email protected]">[email protected]</a> or visit the Community tab at the top of this page.
|
221 |
+
Visit the <a href="https://datapoints.ginkgo.bio/ai-competitions/2025-abdev-competition">Competition Registration page</a> to sign up for updates and to register a team.
|
222 |
</div>
|
223 |
""",
|
224 |
elem_id="contact-footer",
|
constants.py
CHANGED
@@ -41,12 +41,14 @@ CV_COLUMN = "hierarchical_cluster_IgG_isotype_stratified_fold"
|
|
41 |
EXAMPLE_FILE_DICT = {
|
42 |
"GDPa1": "data/example-predictions.csv",
|
43 |
"GDPa1_cross_validation": "data/example-predictions-cv.csv",
|
|
|
44 |
}
|
45 |
ANTIBODY_NAMES_DICT = {
|
46 |
"GDPa1": pd.read_csv(EXAMPLE_FILE_DICT["GDPa1"])["antibody_name"].tolist(),
|
47 |
"GDPa1_cross_validation": pd.read_csv(EXAMPLE_FILE_DICT["GDPa1_cross_validation"])[
|
48 |
"antibody_name"
|
49 |
].tolist(),
|
|
|
50 |
}
|
51 |
|
52 |
# Huggingface API
|
|
|
41 |
EXAMPLE_FILE_DICT = {
|
42 |
"GDPa1": "data/example-predictions.csv",
|
43 |
"GDPa1_cross_validation": "data/example-predictions-cv.csv",
|
44 |
+
"heldout_test": "data/example-predictions-heldout.csv",
|
45 |
}
|
46 |
ANTIBODY_NAMES_DICT = {
|
47 |
"GDPa1": pd.read_csv(EXAMPLE_FILE_DICT["GDPa1"])["antibody_name"].tolist(),
|
48 |
"GDPa1_cross_validation": pd.read_csv(EXAMPLE_FILE_DICT["GDPa1_cross_validation"])[
|
49 |
"antibody_name"
|
50 |
].tolist(),
|
51 |
+
"heldout_test": pd.read_csv(EXAMPLE_FILE_DICT["heldout_test"])["antibody_name"].tolist(), # TODO add a test for this validation
|
52 |
}
|
53 |
|
54 |
# Huggingface API
|
data/metrics_all.csv
DELETED
@@ -1,26 +0,0 @@
|
|
1 |
-
assay,model,spearman,spearman_cross_val,top_10_recall,top_10_recall_cross_val
|
2 |
-
HIC,Aggrescan3D - aggrescan_average_score,0.422834774225429,,0.3333333333333333,
|
3 |
-
AC-SINS_pH7.4,TAP - linear regression,0.4019194824087021,0.3401456689218918,0.375,0.2799999999999999
|
4 |
-
HIC,TAP - linear regression,0.3622075317102941,0.2222991438172065,0.4166666666666667,0.43
|
5 |
-
AC-SINS_pH7.4,TAP - PNC,0.358762795727933,,0.2916666666666667,
|
6 |
-
HIC,Aggrescan3D - aggrescan_90_score,0.3585224061081473,,0.2083333333333333,
|
7 |
-
PR_CHO,Saprot_VH - solubility_probability,0.3365516014806938,,0.0833333333333333,
|
8 |
-
AC-SINS_pH7.4,TAP - SFvCSP,0.3203773185543964,,0.2083333333333333,
|
9 |
-
HIC,Aggrescan3D - aggrescan_max_score,0.3044160918625593,,0.2083333333333333,
|
10 |
-
PR_CHO,TAP - linear regression,0.260631929274264,0.1560705020744792,0.8333333333333334,0.47
|
11 |
-
HIC,TAP - SFvCSP,0.2450651623577951,,0.2083333333333333,
|
12 |
-
PR_CHO,TAP - SFvCSP,0.2381972244142228,,0.0,
|
13 |
-
Tm2,Saprot_VH - stability_score,0.1924791603648384,,0.1666666666666666,
|
14 |
-
HIC,TAP - CDR Length,0.1923458958277369,,0.0833333333333333,
|
15 |
-
Titer,AntiFold,0.1878766623808878,,0.0833333333333333,
|
16 |
-
HIC,DeepViscosity,0.18059398754127,,0.0416666666666666,
|
17 |
-
AC-SINS_pH7.4,TAP - PPC,0.1691412287169806,,0.0833333333333333,
|
18 |
-
Titer,TAP - linear regression,0.1682403605307924,0.1129210260701206,0.3333333333333333,0.38
|
19 |
-
PR_CHO,TAP - PNC,0.151234196032203,,0.0416666666666666,
|
20 |
-
AC-SINS_pH7.4,TAP - CDR Length,0.1501689804134715,,0.0,
|
21 |
-
Titer,TAP - PPC,0.1423756688786398,,0.0833333333333333,
|
22 |
-
PR_CHO,Aggrescan3D - aggrescan_max_score,0.1406309504998865,,0.0833333333333333,
|
23 |
-
Tm2,AntiFold,0.1218057192943458,,0.125,
|
24 |
-
HIC,hic_model_name,0.1144051722170351,0.1511895582680471,0.1666666666666666,0.05
|
25 |
-
Tm2,TAP - linear regression,0.0844935706523633,-0.1153965363405958,0.6666666666666666,0.64
|
26 |
-
HIC,Aggrescan3D - aggrescan_cdrh3_average_score,0.0747719620306879,,0.25,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
data/metrics_all_including_low_spearman.csv
DELETED
@@ -1,157 +0,0 @@
|
|
1 |
-
feature,assay,spearman,model,spearman_abs
|
2 |
-
SFvCSP - tap,HAC,0.6788395883949475,tap,0.6788395883949475
|
3 |
-
PPC - tap,HAC,0.4820800038128454,tap,0.4820800038128454
|
4 |
-
aggrescan_average_score,HIC,0.3717330854283424,Aggrescan3D,0.3717330854283424
|
5 |
-
SFvCSP - tap,PR_Ova,0.3706710402488808,tap,0.3706710402488808
|
6 |
-
Viscosity - deep-viscosity,HAC,-0.3683390278828955,DeepViscosity,0.3683390278828955
|
7 |
-
aggrescan_average_score,SMAC,0.3643128778304258,Aggrescan3D,0.3643128778304258
|
8 |
-
PNC - tap,AC-SINS_pH7.4,-0.358762795727933,tap,0.358762795727933
|
9 |
-
aggrescan_90_score,HIC,0.3572823382390205,Aggrescan3D,0.3572823382390205
|
10 |
-
solubility_probability - saprot,PR_CHO,0.3365516014806938,saprot,0.3365516014806938
|
11 |
-
PNC - tap,HAC,-0.3206575607459202,tap,0.3206575607459202
|
12 |
-
SFvCSP - tap,AC-SINS_pH7.4,0.3203773185543964,tap,0.3203773185543964
|
13 |
-
PNC - tap,PR_Ova,-0.2932051856162034,tap,0.2932051856162034
|
14 |
-
aggrescan_90_score,SMAC,0.2852401926417188,Aggrescan3D,0.2852401926417188
|
15 |
-
aggrescan_max_score,SMAC,0.2720151775798609,Aggrescan3D,0.2720151775798609
|
16 |
-
aggrescan_max_score,HIC,0.2579163714894611,Aggrescan3D,0.2579163714894611
|
17 |
-
stability_score - saprot,HAC,0.2482190338151043,saprot,0.2482190338151043
|
18 |
-
SFvCSP - tap,HIC,-0.2450651623577951,tap,0.2450651623577951
|
19 |
-
aggrescan_max_score,PR_CHO,-0.24241781163854,Aggrescan3D,0.24241781163854
|
20 |
-
SFvCSP - tap,PR_CHO,0.2381972244142228,tap,0.2381972244142228
|
21 |
-
PNC - tap,AC-SINS_pH6.0,-0.2185768523842327,tap,0.2185768523842327
|
22 |
-
PPC - tap,PR_Ova,0.205520359496246,tap,0.205520359496246
|
23 |
-
aggrescan_max_score,PR_Ova,-0.1983067762197625,Aggrescan3D,0.1983067762197625
|
24 |
-
stability_score - saprot,Tm2,-0.1924791603648384,saprot,0.1924791603648384
|
25 |
-
CDR Length - tap,HIC,0.1923458958277369,tap,0.1923458958277369
|
26 |
-
solubility_probability - saprot,PR_Ova,0.1859602281879885,saprot,0.1859602281879885
|
27 |
-
PPC - tap,HIC,-0.1839687842860175,tap,0.1839687842860175
|
28 |
-
aggrescan_cdrh3_average_score,Titer,0.1814699248452822,Aggrescan3D,0.1814699248452822
|
29 |
-
Viscosity - deep-viscosity,HIC,0.18059398754127,DeepViscosity,0.18059398754127
|
30 |
-
PPC - tap,SEC %Monomer,0.179898358348615,tap,0.179898358348615
|
31 |
-
Viscosity - deep-viscosity,PR_Ova,-0.1792011299598071,DeepViscosity,0.1792011299598071
|
32 |
-
aggrescan_cdrh3_average_score,Purity,-0.1774879106041495,Aggrescan3D,0.1774879106041495
|
33 |
-
CDR Length - tap,SMAC,0.1753482083680697,tap,0.1753482083680697
|
34 |
-
PPC - tap,Purity,-0.1743385504957838,tap,0.1743385504957838
|
35 |
-
PPC - tap,Tm1,0.1717910377244919,tap,0.1717910377244919
|
36 |
-
PPC - tap,AC-SINS_pH7.4,0.1691412287169806,tap,0.1691412287169806
|
37 |
-
PNC - tap,SMAC,-0.1647616991330237,tap,0.1647616991330237
|
38 |
-
SFvCSP - tap,AC-SINS_pH6.0,0.1631061026200202,tap,0.1631061026200202
|
39 |
-
aggrescan_90_score,PR_Ova,-0.1630725493267146,Aggrescan3D,0.1630725493267146
|
40 |
-
aggrescan_cdrh3_average_score,HAC,-0.1621653601888134,Aggrescan3D,0.1621653601888134
|
41 |
-
aggrescan_90_score,PR_CHO,-0.1602601604994121,Aggrescan3D,0.1602601604994121
|
42 |
-
PNC - tap,PR_CHO,-0.151234196032203,tap,0.151234196032203
|
43 |
-
CDR Length - tap,AC-SINS_pH7.4,-0.1501689804134715,tap,0.1501689804134715
|
44 |
-
stability_score - saprot,PR_CHO,0.1482133956646727,saprot,0.1482133956646727
|
45 |
-
PPC - tap,AC-SINS_pH6.0,0.1448272149205899,tap,0.1448272149205899
|
46 |
-
SFvCSP - tap,Tm1,0.1426983792732488,tap,0.1426983792732488
|
47 |
-
PPC - tap,Titer,0.1423756688786398,tap,0.1423756688786398
|
48 |
-
PNC - tap,SEC %Monomer,-0.1345634135302046,tap,0.1345634135302046
|
49 |
-
aggrescan_average_score,HAC,-0.1311020701331903,Aggrescan3D,0.1311020701331903
|
50 |
-
aggrescan_cdrh3_average_score,Tm2,-0.1295581308418123,Aggrescan3D,0.1295581308418123
|
51 |
-
PSH - tap,HAC,0.1269358458430945,tap,0.1269358458430945
|
52 |
-
aggrescan_cdrh3_average_score,AC-SINS_pH6.0,0.1241248052844776,Aggrescan3D,0.1241248052844776
|
53 |
-
aggrescan_average_score,PR_Ova,-0.1225803596842919,Aggrescan3D,0.1225803596842919
|
54 |
-
solubility_probability - saprot,Purity,0.120581879119953,saprot,0.120581879119953
|
55 |
-
aggrescan_90_score,AC-SINS_pH6.0,-0.1156038989665139,Aggrescan3D,0.1156038989665139
|
56 |
-
Viscosity - deep-viscosity,PR_CHO,-0.1125214482263828,DeepViscosity,0.1125214482263828
|
57 |
-
aggrescan_cdrh3_average_score,HIC,0.1109333602778311,Aggrescan3D,0.1109333602778311
|
58 |
-
PNC - tap,Tm1,-0.1094376940826625,tap,0.1094376940826625
|
59 |
-
PNC - tap,Titer,-0.1043862069630446,tap,0.1043862069630446
|
60 |
-
aggrescan_90_score,HAC,-0.1029367717205433,Aggrescan3D,0.1029367717205433
|
61 |
-
PPC - tap,Tonset,0.1024480318260903,tap,0.1024480318260903
|
62 |
-
aggrescan_average_score,Tm1,0.0984625979382824,Aggrescan3D,0.0984625979382824
|
63 |
-
SFvCSP - tap,Purity,-0.0979379393217746,tap,0.0979379393217746
|
64 |
-
solubility_probability - saprot,Tm2,-0.0978456145482691,saprot,0.0978456145482691
|
65 |
-
SFvCSP - tap,SEC %Monomer,0.096650605592591,tap,0.096650605592591
|
66 |
-
Viscosity - deep-viscosity,Tm2,0.093745084007507,DeepViscosity,0.093745084007507
|
67 |
-
PNC - tap,Tonset,-0.0925140513893314,tap,0.0925140513893314
|
68 |
-
aggrescan_90_score,Titer,-0.0888890152050186,Aggrescan3D,0.0888890152050186
|
69 |
-
PPC - tap,PR_CHO,0.0885325199884014,tap,0.0885325199884014
|
70 |
-
Viscosity - deep-viscosity,SMAC,0.0883647279655625,DeepViscosity,0.0883647279655625
|
71 |
-
PPC - tap,SMAC,-0.0881450436285762,tap,0.0881450436285762
|
72 |
-
SFvCSP - tap,Tonset,0.0869080829604942,tap,0.0869080829604942
|
73 |
-
aggrescan_average_score,Purity,-0.0855300736249475,Aggrescan3D,0.0855300736249475
|
74 |
-
PSH - tap,PR_Ova,0.0851843571887952,tap,0.0851843571887952
|
75 |
-
solubility_probability - saprot,HAC,-0.0849192244020849,saprot,0.0849192244020849
|
76 |
-
stability_score - saprot,PR_Ova,0.0844385315275266,saprot,0.0844385315275266
|
77 |
-
aggrescan_average_score,PR_CHO,-0.082335263587056,Aggrescan3D,0.082335263587056
|
78 |
-
CDR Length - tap,HAC,-0.0807572482895502,tap,0.0807572482895502
|
79 |
-
Viscosity - deep-viscosity,AC-SINS_pH7.4,-0.0803879126171943,DeepViscosity,0.0803879126171943
|
80 |
-
SFvCSP - tap,Titer,0.0797623802296775,tap,0.0797623802296775
|
81 |
-
aggrescan_average_score,AC-SINS_pH7.4,0.078198839245547,Aggrescan3D,0.078198839245547
|
82 |
-
aggrescan_max_score,Tonset,-0.0758666681469678,Aggrescan3D,0.0758666681469678
|
83 |
-
stability_score - saprot,SMAC,-0.0752343621503858,saprot,0.0752343621503858
|
84 |
-
stability_score - saprot,Tonset,-0.0738992116600914,saprot,0.0738992116600914
|
85 |
-
stability_score - saprot,SEC %Monomer,-0.0733865038928551,saprot,0.0733865038928551
|
86 |
-
CDR Length - tap,Tm2,-0.0729274519946903,tap,0.0729274519946903
|
87 |
-
CDR Length - tap,SEC %Monomer,-0.0720782456119583,tap,0.0720782456119583
|
88 |
-
stability_score - saprot,AC-SINS_pH7.4,0.0718305679545067,saprot,0.0718305679545067
|
89 |
-
solubility_probability - saprot,Tonset,-0.0707794898935402,saprot,0.0707794898935402
|
90 |
-
CDR Length - tap,Tonset,-0.0697571003932752,tap,0.0697571003932752
|
91 |
-
solubility_probability - saprot,AC-SINS_pH6.0,0.0669921910968805,saprot,0.0669921910968805
|
92 |
-
PSH - tap,SMAC,-0.0668504875953866,tap,0.0668504875953866
|
93 |
-
CDR Length - tap,AC-SINS_pH6.0,-0.0662557372283483,tap,0.0662557372283483
|
94 |
-
aggrescan_90_score,Purity,-0.0642609945737365,Aggrescan3D,0.0642609945737365
|
95 |
-
CDR Length - tap,Purity,0.0640138427858363,tap,0.0640138427858363
|
96 |
-
aggrescan_cdrh3_average_score,PR_CHO,-0.0639580648777149,Aggrescan3D,0.0639580648777149
|
97 |
-
PSH - tap,Titer,-0.0638862853735791,tap,0.0638862853735791
|
98 |
-
Viscosity - deep-viscosity,Titer,-0.0636053342823435,DeepViscosity,0.0636053342823435
|
99 |
-
stability_score - saprot,HIC,-0.0625972585374469,saprot,0.0625972585374469
|
100 |
-
stability_score - saprot,Titer,0.0607177541361877,saprot,0.0607177541361877
|
101 |
-
aggrescan_average_score,Tonset,0.0532502341076833,Aggrescan3D,0.0532502341076833
|
102 |
-
CDR Length - tap,PR_CHO,-0.0524556823713343,tap,0.0524556823713343
|
103 |
-
aggrescan_90_score,AC-SINS_pH7.4,-0.0509589937861982,Aggrescan3D,0.0509589937861982
|
104 |
-
PSH - tap,SEC %Monomer,-0.0487785361924088,tap,0.0487785361924088
|
105 |
-
PNC - tap,Tm2,-0.0482259337861972,tap,0.0482259337861972
|
106 |
-
SFvCSP - tap,SMAC,-0.0479604170867368,tap,0.0479604170867368
|
107 |
-
CDR Length - tap,Tm1,0.0470910111346684,tap,0.0470910111346684
|
108 |
-
PSH - tap,HIC,-0.0464732086283245,tap,0.0464732086283245
|
109 |
-
aggrescan_cdrh3_average_score,SMAC,0.0462084030163925,Aggrescan3D,0.0462084030163925
|
110 |
-
stability_score - saprot,Tm1,-0.0461587451740238,saprot,0.0461587451740238
|
111 |
-
aggrescan_max_score,AC-SINS_pH6.0,-0.0422041355140005,Aggrescan3D,0.0422041355140005
|
112 |
-
Viscosity - deep-viscosity,Tm1,0.0418758583153736,DeepViscosity,0.0418758583153736
|
113 |
-
CDR Length - tap,Titer,-0.0415639454664855,tap,0.0415639454664855
|
114 |
-
Viscosity - deep-viscosity,AC-SINS_pH6.0,-0.0391995375434282,DeepViscosity,0.0391995375434282
|
115 |
-
aggrescan_max_score,SEC %Monomer,0.0384606168278266,Aggrescan3D,0.0384606168278266
|
116 |
-
aggrescan_max_score,Purity,0.0377965473734412,Aggrescan3D,0.0377965473734412
|
117 |
-
aggrescan_cdrh3_average_score,Tonset,-0.0371645511788307,Aggrescan3D,0.0371645511788307
|
118 |
-
stability_score - saprot,AC-SINS_pH6.0,0.0363459090170338,saprot,0.0363459090170338
|
119 |
-
PSH - tap,AC-SINS_pH7.4,-0.0360881689253704,tap,0.0360881689253704
|
120 |
-
solubility_probability - saprot,Tm1,-0.0359790946528558,saprot,0.0359790946528558
|
121 |
-
aggrescan_average_score,SEC %Monomer,0.0329005393127016,Aggrescan3D,0.0329005393127016
|
122 |
-
solubility_probability - saprot,AC-SINS_pH7.4,0.0320374764320225,saprot,0.0320374764320225
|
123 |
-
stability_score - saprot,Purity,0.0319067204658559,saprot,0.0319067204658559
|
124 |
-
solubility_probability - saprot,HIC,0.0318219345388521,saprot,0.0318219345388521
|
125 |
-
PSH - tap,Tm2,-0.0317350623491362,tap,0.0317350623491362
|
126 |
-
aggrescan_average_score,Tm2,-0.0312770789755912,Aggrescan3D,0.0312770789755912
|
127 |
-
aggrescan_cdrh3_average_score,AC-SINS_pH7.4,0.0305591682601827,Aggrescan3D,0.0305591682601827
|
128 |
-
aggrescan_max_score,Tm1,-0.0301284126829971,Aggrescan3D,0.0301284126829971
|
129 |
-
aggrescan_cdrh3_average_score,Tm1,-0.0293641493096082,Aggrescan3D,0.0293641493096082
|
130 |
-
aggrescan_90_score,Tm1,0.0279545108349369,Aggrescan3D,0.0279545108349369
|
131 |
-
aggrescan_average_score,AC-SINS_pH6.0,0.0271292409530908,Aggrescan3D,0.0271292409530908
|
132 |
-
PSH - tap,Tonset,0.0258012823141481,tap,0.0258012823141481
|
133 |
-
solubility_probability - saprot,SEC %Monomer,-0.0255220000167489,saprot,0.0255220000167489
|
134 |
-
aggrescan_cdrh3_average_score,SEC %Monomer,-0.0242523887163972,Aggrescan3D,0.0242523887163972
|
135 |
-
aggrescan_max_score,HAC,-0.0238463005336014,Aggrescan3D,0.0238463005336014
|
136 |
-
Viscosity - deep-viscosity,SEC %Monomer,-0.0226036392916792,DeepViscosity,0.0226036392916792
|
137 |
-
aggrescan_max_score,Titer,-0.0218947825112391,Aggrescan3D,0.0218947825112391
|
138 |
-
PSH - tap,PR_CHO,0.0209381900169799,tap,0.0209381900169799
|
139 |
-
aggrescan_max_score,Tm2,-0.0199308718790671,Aggrescan3D,0.0199308718790671
|
140 |
-
PSH - tap,Purity,-0.0198292183035963,tap,0.0198292183035963
|
141 |
-
CDR Length - tap,PR_Ova,-0.0191507855521124,tap,0.0191507855521124
|
142 |
-
SFvCSP - tap,Tm2,-0.0179541460075494,tap,0.0179541460075494
|
143 |
-
aggrescan_max_score,AC-SINS_pH7.4,0.0177424118352705,Aggrescan3D,0.0177424118352705
|
144 |
-
Viscosity - deep-viscosity,Purity,-0.0164122333153846,DeepViscosity,0.0164122333153846
|
145 |
-
PSH - tap,Tm1,0.0149070260126188,tap,0.0149070260126188
|
146 |
-
PNC - tap,HIC,0.0102627218889135,tap,0.0102627218889135
|
147 |
-
PPC - tap,Tm2,-0.0098872681569066,tap,0.0098872681569066
|
148 |
-
PNC - tap,Purity,0.0096311210026764,tap,0.0096311210026764
|
149 |
-
aggrescan_90_score,SEC %Monomer,-0.0069533060784548,Aggrescan3D,0.0069533060784548
|
150 |
-
solubility_probability - saprot,Titer,-0.0068735643986468,saprot,0.0068735643986468
|
151 |
-
aggrescan_cdrh3_average_score,PR_Ova,-0.0057045278689166,Aggrescan3D,0.0057045278689166
|
152 |
-
Viscosity - deep-viscosity,Tonset,-0.0052886682383666,DeepViscosity,0.0052886682383666
|
153 |
-
aggrescan_90_score,Tm2,0.0014898396535596,Aggrescan3D,0.0014898396535596
|
154 |
-
aggrescan_90_score,Tonset,-0.0012258917323618,Aggrescan3D,0.0012258917323618
|
155 |
-
solubility_probability - saprot,SMAC,-0.0008774163836285,saprot,0.0008774163836285
|
156 |
-
aggrescan_average_score,Titer,-0.0003490541872287,Aggrescan3D,0.0003490541872287
|
157 |
-
PSH - tap,AC-SINS_pH6.0,-6.566404038227427e-05,tap,6.566404038227427e-05
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
utils.py
CHANGED
@@ -1,4 +1,3 @@
|
|
1 |
-
from datetime import datetime, timezone, timedelta
|
2 |
import pandas as pd
|
3 |
from datasets import load_dataset
|
4 |
import gradio as gr
|
@@ -13,9 +12,10 @@ def show_output_box(message):
|
|
13 |
|
14 |
|
15 |
def fetch_hf_results():
|
16 |
-
#
|
17 |
-
|
18 |
-
|
|
|
19 |
# Should cache by default if not using force_redownload
|
20 |
df = load_dataset(
|
21 |
RESULTS_REPO, data_files="auto_submissions/metrics_all.csv",
|
|
|
|
|
1 |
import pandas as pd
|
2 |
from datasets import load_dataset
|
3 |
import gradio as gr
|
|
|
12 |
|
13 |
|
14 |
def fetch_hf_results():
|
15 |
+
# For debugging
|
16 |
+
# # Print current time in EST
|
17 |
+
# EST = timezone(timedelta(hours=-4))
|
18 |
+
# print(f"tmp: Fetching results from HF at {datetime.now(EST)}")
|
19 |
# Should cache by default if not using force_redownload
|
20 |
df = load_dataset(
|
21 |
RESULTS_REPO, data_files="auto_submissions/metrics_all.csv",
|