zhouxiangxin1998 commited on
Commit
0ea619a
β€’
1 Parent(s): cc5c681

add label and head

Browse files
.gitignore CHANGED
@@ -11,3 +11,4 @@ eval-results/
11
  eval-queue-bk/
12
  eval-results-bk/
13
  logs/
 
 
11
  eval-queue-bk/
12
  eval-results-bk/
13
  logs/
14
+ read_csv.py
app.py CHANGED
@@ -3,7 +3,7 @@ import base64
3
  import gradio as gr
4
  import pandas as pd
5
  from apscheduler.schedulers.background import BackgroundScheduler
6
-
7
  from src.about import (
8
  CITATION_BUTTON_LABEL,
9
  CITATION_BUTTON_TEXT,
@@ -42,6 +42,13 @@ in-depth evaluation framework for protein foundation models, driving their devel
42
  ## [Paper](https://www.arxiv.org/pdf/2409.06744) | [Website](https://proteinbench.github.io/)
43
  """
44
 
 
 
 
 
 
 
 
45
  # ### Space initialisation
46
 
47
  demo = gr.Blocks(css=custom_css)
@@ -59,10 +66,12 @@ with demo:
59
  with gr.TabItem("πŸ† Inverse Folding Leaderboard", elem_id='inverse-folding-table', id=0,):
60
  with gr.Row():
61
  inverse_folding_csv = pd.read_csv('data/inverse_folding.csv')
 
62
  inverse_folding_table = gr.components.DataFrame(
63
- inverse_folding_csv,
64
  height=99999,
65
  interactive=False,
 
66
  datatype=['markdown'] + (len(inverse_folding_csv.columns)-1) * ['number'],
67
 
68
  )
@@ -70,73 +79,81 @@ with demo:
70
  with gr.Row():
71
  structure_design_csv = pd.read_csv('data/structure_design.csv')
72
  structure_design_table = gr.components.DataFrame(
73
- structure_design_csv,
74
  height=99999,
75
  interactive=False,
 
76
  datatype=['markdown'] + (len(structure_design_csv.columns)-1) * ['number'],
77
  )
78
  with gr.TabItem("πŸ† Sequence Design Leaderboard", elem_id='sequence-design-table', id=2,):
79
  with gr.Row():
80
- sequence_design_csv = pd.read_csv('data/sequence_design.csv'),
81
  sequence_design_table = gr.components.DataFrame(
82
- sequence_design_csv,
83
  height=99999,
84
  interactive=False,
 
85
  datatype=['markdown'] + (len(sequence_design_csv.columns)-1) * ['number'],
86
  )
87
  with gr.TabItem("πŸ† Sequence-Structure Co-Design Leaderboard", elem_id='co-design-table', id=3,):
88
  with gr.Row():
89
  co_design_csv = pd.read_csv('data/co_design.csv')
90
  co_design_table = gr.components.DataFrame(
91
- co_design_csv,
92
  height=99999,
93
  interactive=False,
 
94
  datatype=['markdown'] + (len(co_design_csv.columns)-1) * ['number'],
95
  )
96
  with gr.TabItem("πŸ† Motif Scaffolding Leaderboard", elem_id='motif-scaffolding-table', id=4,):
97
  with gr.Row():
98
  motif_scaffolding_csv = pd.read_csv('data/motif_scaffolding.csv')
99
  motif_scaffolding_table = gr.components.DataFrame(
100
- motif_scaffolding_csv,
101
  height=99999,
102
  interactive=False,
 
103
  datatype=['markdown'] + (len(motif_scaffolding_csv.columns)-1) * ['number'],
104
  )
105
  with gr.TabItem("πŸ† Antibody Design Leaderboard", elem_id='antibody-design-table', id=5,):
106
  with gr.Row():
107
  antibody_design_csv = pd.read_csv('data/antibody_design.csv')
108
  antibody_design_table = gr.components.DataFrame(
109
- antibody_design_csv,
110
  height=99999,
111
  interactive=False,
 
112
  datatype=['markdown'] + (len(antibody_design_csv.columns)-1) * ['number'],
113
  )
114
  with gr.TabItem("πŸ… Protein Folding Leaderboard", elem_id='protein-folding-table', id=6,):
115
  with gr.Row():
116
  protein_folding_csv = pd.read_csv('data/protein_folding.csv')
117
  protein_folding_table = gr.components.DataFrame(
118
- protein_folding_csv,
119
  height=99999,
120
  interactive=False,
 
121
  datatype=['markdown'] + (len(protein_folding_csv.columns)-1) * ['number'],
122
  )
123
  with gr.TabItem("πŸ… Multi-State Prediction Leaderboard", elem_id='multi-state-prediction-table', id=7,):
124
  with gr.Row():
125
  multi_state_prediction_csv = pd.read_csv('data/multi_state_prediction.csv')
126
  multi_state_prediction_table = gr.components.DataFrame(
127
- multi_state_prediction_csv,
128
  height=99999,
129
  interactive=False,
 
130
  datatype=['markdown'] + (len(multi_state_prediction_csv.columns)-1) * ['number'],
131
  )
132
  with gr.TabItem("πŸ… Conformation Prediction Leaderboard", elem_id='conformation-prediction-table', id=8,):
133
  with gr.Row():
134
- conformation_prediction = pd.read_csv('data/conformation_prediction.csv')
135
  conformation_prediction_table = gr.components.DataFrame(
136
- conformation_prediction,
137
  height=99999,
138
  interactive=False,
139
- datatype=['markdown'] + (len(conformation_prediction.columns)-1) * ['number'],
 
140
  )
141
 
142
 
 
3
  import gradio as gr
4
  import pandas as pd
5
  from apscheduler.schedulers.background import BackgroundScheduler
6
+ import numpy as np
7
  from src.about import (
8
  CITATION_BUTTON_LABEL,
9
  CITATION_BUTTON_TEXT,
 
42
  ## [Paper](https://www.arxiv.org/pdf/2409.06744) | [Website](https://proteinbench.github.io/)
43
  """
44
 
45
+ def convert_to_float(df):
46
+ columns = df.columns
47
+ for col in columns[1:]:
48
+ df[col] = df[col].astype('float')
49
+ return df
50
+
51
+
52
  # ### Space initialisation
53
 
54
  demo = gr.Blocks(css=custom_css)
 
66
  with gr.TabItem("πŸ† Inverse Folding Leaderboard", elem_id='inverse-folding-table', id=0,):
67
  with gr.Row():
68
  inverse_folding_csv = pd.read_csv('data/inverse_folding.csv')
69
+ print(convert_to_float(inverse_folding_csv))
70
  inverse_folding_table = gr.components.DataFrame(
71
+ value=convert_to_float(inverse_folding_csv).values,
72
  height=99999,
73
  interactive=False,
74
+ headers=inverse_folding_csv.columns.to_list(),
75
  datatype=['markdown'] + (len(inverse_folding_csv.columns)-1) * ['number'],
76
 
77
  )
 
79
  with gr.Row():
80
  structure_design_csv = pd.read_csv('data/structure_design.csv')
81
  structure_design_table = gr.components.DataFrame(
82
+ value=convert_to_float(structure_design_csv).values,
83
  height=99999,
84
  interactive=False,
85
+ headers=structure_design_csv.columns.to_list(),
86
  datatype=['markdown'] + (len(structure_design_csv.columns)-1) * ['number'],
87
  )
88
  with gr.TabItem("πŸ† Sequence Design Leaderboard", elem_id='sequence-design-table', id=2,):
89
  with gr.Row():
90
+ sequence_design_csv = pd.read_csv('data/sequence_design.csv')
91
  sequence_design_table = gr.components.DataFrame(
92
+ value=convert_to_float(sequence_design_csv).values,
93
  height=99999,
94
  interactive=False,
95
+ headers=sequence_design_csv.columns.to_list(),
96
  datatype=['markdown'] + (len(sequence_design_csv.columns)-1) * ['number'],
97
  )
98
  with gr.TabItem("πŸ† Sequence-Structure Co-Design Leaderboard", elem_id='co-design-table', id=3,):
99
  with gr.Row():
100
  co_design_csv = pd.read_csv('data/co_design.csv')
101
  co_design_table = gr.components.DataFrame(
102
+ value=convert_to_float(co_design_csv).values,
103
  height=99999,
104
  interactive=False,
105
+ headers=co_design_csv.columns.to_list(),
106
  datatype=['markdown'] + (len(co_design_csv.columns)-1) * ['number'],
107
  )
108
  with gr.TabItem("πŸ† Motif Scaffolding Leaderboard", elem_id='motif-scaffolding-table', id=4,):
109
  with gr.Row():
110
  motif_scaffolding_csv = pd.read_csv('data/motif_scaffolding.csv')
111
  motif_scaffolding_table = gr.components.DataFrame(
112
+ value=convert_to_float(motif_scaffolding_csv).values,
113
  height=99999,
114
  interactive=False,
115
+ headers=motif_scaffolding_csv.columns.to_list(),
116
  datatype=['markdown'] + (len(motif_scaffolding_csv.columns)-1) * ['number'],
117
  )
118
  with gr.TabItem("πŸ† Antibody Design Leaderboard", elem_id='antibody-design-table', id=5,):
119
  with gr.Row():
120
  antibody_design_csv = pd.read_csv('data/antibody_design.csv')
121
  antibody_design_table = gr.components.DataFrame(
122
+ value=convert_to_float(antibody_design_csv).values,
123
  height=99999,
124
  interactive=False,
125
+ headers=antibody_design_csv.columns.to_list(),
126
  datatype=['markdown'] + (len(antibody_design_csv.columns)-1) * ['number'],
127
  )
128
  with gr.TabItem("πŸ… Protein Folding Leaderboard", elem_id='protein-folding-table', id=6,):
129
  with gr.Row():
130
  protein_folding_csv = pd.read_csv('data/protein_folding.csv')
131
  protein_folding_table = gr.components.DataFrame(
132
+ value=convert_to_float(protein_folding_csv).values,
133
  height=99999,
134
  interactive=False,
135
+ headers=protein_folding_csv.columns.to_list(),
136
  datatype=['markdown'] + (len(protein_folding_csv.columns)-1) * ['number'],
137
  )
138
  with gr.TabItem("πŸ… Multi-State Prediction Leaderboard", elem_id='multi-state-prediction-table', id=7,):
139
  with gr.Row():
140
  multi_state_prediction_csv = pd.read_csv('data/multi_state_prediction.csv')
141
  multi_state_prediction_table = gr.components.DataFrame(
142
+ value=convert_to_float(multi_state_prediction_csv).values,
143
  height=99999,
144
  interactive=False,
145
+ headers=multi_state_prediction_csv.columns.to_list(),
146
  datatype=['markdown'] + (len(multi_state_prediction_csv.columns)-1) * ['number'],
147
  )
148
  with gr.TabItem("πŸ… Conformation Prediction Leaderboard", elem_id='conformation-prediction-table', id=8,):
149
  with gr.Row():
150
+ conformation_prediction_csv = pd.read_csv('data/conformation_prediction.csv')
151
  conformation_prediction_table = gr.components.DataFrame(
152
+ value=convert_to_float(conformation_prediction_csv).values,
153
  height=99999,
154
  interactive=False,
155
+ headers=conformation_prediction_csv.columns.to_list(),
156
+ datatype=['markdown'] + (len(conformation_prediction_csv.columns)-1) * ['number'],
157
  )
158
 
159
 
data/antibody_design.csv CHANGED
@@ -1,9 +1,9 @@
1
- Model,AAR ↑,RMSD ↓,TM-score ↑,Binding Energy ↓,SeqSim-outer ↓,SeqSim-inner ↑,PHR ↓,CN-score ↑,Clashes-inner ↓,Clashes-outer ↓,SeqNat ↑,Total Energy ↓,scRMSD ↓
2
- RAbD (natural),100.00%,0.00,1.00,-15.33,0.26,-,45.78%,50.19,0.07,0.00,-1.74,-16.76,1.77
3
- HERN,33.17%,9.86,0.16,1242.77,0.41,-,39.83%,0.04,0.04,3.25,-1.47,5408.74,9.89
4
- MEAN,33.47%,1.82,0.25,263.90,0.65,-,40.74%,1.33,11.65,0.29,-1.83,1077.32,2.77
5
- dyMEAN,40.95%,2.36,0.36,889.28,0.58,-,42.04%,1.49,9.15,0.47,-1.79,1642.65,2.11
6
- *dyMEAN-FixFR,40.05%,2.37,0.35,612.75,0.60,0.96,43.75%,1.14,8.88,0.48,-1.82,1239.29,2.48
7
- *DiffAb,35.04%,2.53,0.37,489.42,0.37,0.45,40.68%,2.02,1.84,0.19,-1.88,495.69,2.57
8
- *AbDPO,31.29%,2.79,0.35,116.06,0.38,0.60,69.69%,1.33,4.14,0.10,-1.99,270.12,2.79
9
- *AbDPO++,36.25%,2.48,0.35,223.73,0.39,0.54,44.51%,2.34,1.66,0.08,-1.78,338.14,2.50
 
1
+ Model,AAR ↑,RMSD ↓,TM-score ↑,Binding Energy ↓,SeqSim-outer ↓,SeqSim-inner ↑,PHR (%) ↓,CN-score ↑,Clashes-inner ↓,Clashes-outer ↓,SeqNat ↑,Total Energy ↓,scRMSD ↓
2
+ RAbD (natural),100.00,0.00,1.00,-15.33,0.26,NaN,45.78,50.19,0.07,0.00,-1.74,-16.76,1.77
3
+ HERN,33.17,9.86,0.16,1242.77,0.41,NaN,39.83,0.04,0.04,3.25,-1.47,5408.74,9.89
4
+ MEAN,33.47,1.82,0.25,263.90,0.65,NaN,40.74,1.33,11.65,0.29,-1.83,1077.32,2.77
5
+ dyMEAN,40.95,2.36,0.36,889.28,0.58,NaN,42.04,1.49,9.15,0.47,-1.79,1642.65,2.11
6
+ *dyMEAN-FixFR,40.05,2.37,0.35,612.75,0.60,0.96,43.75,1.14,8.88,0.48,-1.82,1239.29,2.48
7
+ *DiffAb,35.04,2.53,0.37,489.42,0.37,0.45,40.68,2.02,1.84,0.19,-1.88,495.69,2.57
8
+ *AbDPO,31.29,2.79,0.35,116.06,0.38,0.60,69.69,1.33,4.14,0.10,-1.99,270.12,2.79
9
+ *AbDPO++,36.25,2.48,0.35,223.73,0.39,0.54,44.51,2.34,1.66,0.08,-1.78,338.14,2.50
data/co_design.csv CHANGED
@@ -1,5 +1,5 @@
1
  Model,scTM (L=100) ↑,scRMSD (L=100) ↓,Max Clust. (L=100) ↑,Max TM (L=100) ↓,scTM (L=200) ↑,scRMSD (L=200) ↓,Max Clust. (L=200) ↑,Max TM (L=200) ↓,scTM (L=300) ↑,scRMSD (L=300) ↓,Max Clust. (L=300) ↑,Max TM (L=300) ↓,scTM (L=500) ↑,scRMSD (L=500) ↓,Max Clust. (L=500) ↑,Max TM (L=500) ↓
2
- Native PDBs,0.91,2.98,0.75,-,0.88,3.24,0.77,-,0.92,3.94,0.75,-,0.90,9.64,0.80,-
3
  ProteinGenerator,0.91,3.75,0.24,0.73,0.88,6.24,0.25,0.72,0.81,9.26,0.22,0.71,0.69,17.00,0.18,0.73
4
  ProtPardelle*,0.56,12.90,0.57,0.66,0.64,13.67,0.10,0.69,0.69,14.91,0.04,0.72,0.44,43.15,0.60,0.69
5
  Multiflow,0.96,1.10,0.33,0.71,0.95,1.61,0.42,0.71,0.96,2.14,0.58,0.71,0.95,2.71,0.62,0.71
 
1
  Model,scTM (L=100) ↑,scRMSD (L=100) ↓,Max Clust. (L=100) ↑,Max TM (L=100) ↓,scTM (L=200) ↑,scRMSD (L=200) ↓,Max Clust. (L=200) ↑,Max TM (L=200) ↓,scTM (L=300) ↑,scRMSD (L=300) ↓,Max Clust. (L=300) ↑,Max TM (L=300) ↓,scTM (L=500) ↑,scRMSD (L=500) ↓,Max Clust. (L=500) ↑,Max TM (L=500) ↓
2
+ Native PDBs,0.91,2.98,0.75,NaN,0.88,3.24,0.77,NaN,0.92,3.94,0.75,NaN,0.90,9.64,0.80,NaN
3
  ProteinGenerator,0.91,3.75,0.24,0.73,0.88,6.24,0.25,0.72,0.81,9.26,0.22,0.71,0.69,17.00,0.18,0.73
4
  ProtPardelle*,0.56,12.90,0.57,0.66,0.64,13.67,0.10,0.69,0.69,14.91,0.04,0.72,0.44,43.15,0.60,0.69
5
  Multiflow,0.96,1.10,0.33,0.71,0.95,1.61,0.42,0.71,0.96,2.14,0.58,0.71,0.95,2.71,0.62,0.71
data/conformation_prediction.csv CHANGED
@@ -1,14 +1,14 @@
1
  Model,Pairwise RMSD,*RMSF,Pearson r on Pairwise RMSD ↑,Pearson r on *Global RMSF ↑,Pearson r on *Per target RMSF ↑,*RMWD ↓,MD PCA W2 ↓,Joint PCA W2 ↓,PC sim > 0.5% ↑,Weak contacts J ↑,Transient contacts J ↑,*Exposed residue J ↑,*Exposed MI matrix ρ ↑,CA break % ↓,CA clash % ↓,PepBond break % ↓
2
  MD iid,2.76,1.63,0.96,0.97,0.99,0.71,0.76,0.70,93.9,0.90,0.80,0.93,0.56,0.0,0.1,3.4
3
  MD 2.5 ns,1.54,0.98,0.89,0.85,0.85,2.21,1.57,1.93,36.6,0.62,0.45,0.64,0.24,0.0,0.1,3.4
4
- EigenFold,5.96,-,-0.04,-,-,-,2.35,7.96,12.2,0.36,0.18,-,-,0.7,9.6,-
5
  MSA-depth256,0.84,0.53,0.25,0.34,0.59,3.63,1.83,2.90,29.3,0.30,0.28,0.33,0.06,0.0,0.2,5.9
6
  MSA-depth64,2.03,1.51,0.24,0.30,0.57,4.00,1.87,3.32,18.3,0.38,0.27,0.38,0.12,0.0,0.2,8.4
7
  MSA-depth32,5.71,7.96,0.07,0.17,0.53,6.12,2.50,5.67,17.1,0.39,0.24,0.36,0.15,0.0,0.5,13.0
8
- Str2Str-ODE (t=0.1),1.66,-,0.13,-,-,-,2.12,4.42,6.1,0.42,0.17,-,-,0.0,0.1,13.7
9
- Str2Str-ODE (t=0.3),3.15,-,0.12,-,-,-,2.23,4.75,9.8,0.41,0.17,-,-,0.0,0.1,14.8
10
- Str2Str-SDE (t=0.1),4.74,-,0.10,-,-,-,2.54,8.84,9.8,0.40,0.13,-,-,1.6,0.2,23.0
11
- Str2Str-SDE (t=0.3),7.54,-,0.00,-,-,-,3.29,12.28,7.3,0.35,0.13,-,-,1.5,0.2,21.4
12
  AlphaFlow-PDB,2.58,1.20,0.27,0.46,0.81,2.96,1.66,2.60,37.8,0.44,0.33,0.42,0.18,0.0,0.2,6.6
13
  AlphaFlow-MD,2.88,1.63,0.53,0.66,0.85,2.68,1.53,2.28,39.0,0.57,0.38,0.50,0.24,0.0,0.2,21.7
14
  ESMFlow-PDB,3.00,1.68,0.14,0.27,0.71,4.20,1.77,3.54,28.0,0.42,0.29,0.41,0.16,0.0,0.6,5.4
 
1
  Model,Pairwise RMSD,*RMSF,Pearson r on Pairwise RMSD ↑,Pearson r on *Global RMSF ↑,Pearson r on *Per target RMSF ↑,*RMWD ↓,MD PCA W2 ↓,Joint PCA W2 ↓,PC sim > 0.5% ↑,Weak contacts J ↑,Transient contacts J ↑,*Exposed residue J ↑,*Exposed MI matrix ρ ↑,CA break % ↓,CA clash % ↓,PepBond break % ↓
2
  MD iid,2.76,1.63,0.96,0.97,0.99,0.71,0.76,0.70,93.9,0.90,0.80,0.93,0.56,0.0,0.1,3.4
3
  MD 2.5 ns,1.54,0.98,0.89,0.85,0.85,2.21,1.57,1.93,36.6,0.62,0.45,0.64,0.24,0.0,0.1,3.4
4
+ EigenFold,5.96,NaN,-0.04,NaN,NaN,NaN,2.35,7.96,12.2,0.36,0.18,NaN,NaN,0.7,9.6,NaN
5
  MSA-depth256,0.84,0.53,0.25,0.34,0.59,3.63,1.83,2.90,29.3,0.30,0.28,0.33,0.06,0.0,0.2,5.9
6
  MSA-depth64,2.03,1.51,0.24,0.30,0.57,4.00,1.87,3.32,18.3,0.38,0.27,0.38,0.12,0.0,0.2,8.4
7
  MSA-depth32,5.71,7.96,0.07,0.17,0.53,6.12,2.50,5.67,17.1,0.39,0.24,0.36,0.15,0.0,0.5,13.0
8
+ Str2Str-ODE (t=0.1),1.66,NaN,0.13,NaN,NaN,NaN,2.12,4.42,6.1,0.42,0.17,NaN,NaN,0.0,0.1,13.7
9
+ Str2Str-ODE (t=0.3),3.15,NaN,0.12,NaN,NaN,NaN,2.23,4.75,9.8,0.41,0.17,NaN,NaN,0.0,0.1,14.8
10
+ Str2Str-SDE (t=0.1),4.74,NaN,0.10,NaN,NaN,NaN,2.54,8.84,9.8,0.40,0.13,NaN,NaN,1.6,0.2,23.0
11
+ Str2Str-SDE (t=0.3),7.54,NaN,0.00,NaN,NaN,NaN,3.29,12.28,7.3,0.35,0.13,NaN,NaN,1.5,0.2,21.4
12
  AlphaFlow-PDB,2.58,1.20,0.27,0.46,0.81,2.96,1.66,2.60,37.8,0.44,0.33,0.42,0.18,0.0,0.2,6.6
13
  AlphaFlow-MD,2.88,1.63,0.53,0.66,0.85,2.68,1.53,2.28,39.0,0.57,0.38,0.50,0.24,0.0,0.2,21.7
14
  ESMFlow-PDB,3.00,1.68,0.14,0.27,0.71,4.20,1.77,3.54,28.0,0.42,0.29,0.41,0.16,0.0,0.6,5.4
data/inverse_folding.csv CHANGED
@@ -1,5 +1,5 @@
1
  Model,CASP AAR ↑,CAMEO AAR ↑,scTM (L=100) ↑,pLDDT (L=100) ↑,scTM (L=200) ↑,pLDDT (L=200) ↑,scTM (L=300) ↑,pLDDT (L=300) ↑,scTM (L=400) ↑,pLDDT (L=400) ↑,scTM (L=500) ↑,pLDDT (L=500) ↑
2
  ProteinMPNN,0.450,0.468,0.962,94.14,0.945,89.34,0.962,90.28,0.875,83.76,0.568,67.09
3
- ESM-IF1,-,-,0.810,88.83,0.635,69.67,0.336,74.36,0.449,64.59,0.462,58.97
4
  LM-Design,0.516,0.570,0.834,78.45,0.373,58.41,0.481,69.86,0.565,59.87,0.397,56.35
5
- ESM3,-,-,0.942,86.60,0.486,60.69,0.632,70.78,0.564,62.63,0.452,59.37
 
1
  Model,CASP AAR ↑,CAMEO AAR ↑,scTM (L=100) ↑,pLDDT (L=100) ↑,scTM (L=200) ↑,pLDDT (L=200) ↑,scTM (L=300) ↑,pLDDT (L=300) ↑,scTM (L=400) ↑,pLDDT (L=400) ↑,scTM (L=500) ↑,pLDDT (L=500) ↑
2
  ProteinMPNN,0.450,0.468,0.962,94.14,0.945,89.34,0.962,90.28,0.875,83.76,0.568,67.09
3
+ ESM-IF1,NaN,NaN,0.810,88.83,0.635,69.67,0.336,74.36,0.449,64.59,0.462,58.97
4
  LM-Design,0.516,0.570,0.834,78.45,0.373,58.41,0.481,69.86,0.565,59.87,0.397,56.35
5
+ ESM3,NaN,NaN,0.942,86.60,0.486,60.69,0.632,70.78,0.564,62.63,0.452,59.37
data/multi_state_prediction.csv CHANGED
@@ -1,5 +1,5 @@
1
  Model,RMSDens N=10,RMSDens N=100,RMSDens N=500,RMSDens N=1000,RMSD Cluster 3 N=10,RMSD Cluster 3 N=100,RMSD Cluster 3 N=500,RMSD Cluster 3 N=1000,Pairwise RMSD,CA clash (%),CA break (%),PepBond break (%)
2
- EigenFold,1.56,1.50,1.47,1.46,2.54,2.48,2.46,2.46,0.85,1.4,4.3,-
3
  MSA-depth256,1.57,1.54,1.52,1.52,2.51,2.47,2.45,2.45,0.20,0.0,0.0,9.2
4
  MSA-depth64,1.60,1.54,1.51,1.50,2.48,2.40,2.35,2.33,0.55,0.0,0.0,7.9
5
  MSA-depth32,1.67,1.53,1.45,1.41,2.39,2.21,1.93,1.87,2.14,0.6,0.0,10.6
 
1
  Model,RMSDens N=10,RMSDens N=100,RMSDens N=500,RMSDens N=1000,RMSD Cluster 3 N=10,RMSD Cluster 3 N=100,RMSD Cluster 3 N=500,RMSD Cluster 3 N=1000,Pairwise RMSD,CA clash (%),CA break (%),PepBond break (%)
2
+ EigenFold,1.56,1.50,1.47,1.46,2.54,2.48,2.46,2.46,0.85,1.4,4.3,NaN
3
  MSA-depth256,1.57,1.54,1.52,1.52,2.51,2.47,2.45,2.45,0.20,0.0,0.0,9.2
4
  MSA-depth64,1.60,1.54,1.51,1.50,2.48,2.40,2.35,2.33,0.55,0.0,0.0,7.9
5
  MSA-depth32,1.67,1.53,1.45,1.41,2.39,2.21,1.93,1.87,2.14,0.6,0.0,10.6
data/protein_folding.csv CHANGED
@@ -3,4 +3,4 @@ AlphaFold2,0.871,3.21,0.860,0.900,0.3,0.0,4.8
3
  OpenFold,0.870,3.21,0.856,0.895,0.4,0.0,2.0
4
  RoseTTAFold2,0.859,3.52,0.845,0.888,0.3,0.2,5.5
5
  ESMFold,0.847,3.98,0.826,0.870,0.3,0.0,4.7
6
- EigenFold*,0.743,7.65,0.703,0.737,8.0,0.5,-
 
3
  OpenFold,0.870,3.21,0.856,0.895,0.4,0.0,2.0
4
  RoseTTAFold2,0.859,3.52,0.845,0.888,0.3,0.2,5.5
5
  ESMFold,0.847,3.98,0.826,0.870,0.3,0.0,4.7
6
+ EigenFold*,0.743,7.65,0.703,0.737,8.0,0.5,NaN
data/sequence_design.csv CHANGED
@@ -1,5 +1,5 @@
1
  Model,ppl (L=100) ↓,pLDDT (L=100) ↑,pairwise TM (L=100) ↓,Max Clust. (L=100) ↑,Max TM (L=100) ↓,ppl (L=200) ↓,pLDDT (L=200) ↑,pairwise TM (L=200) ↓,Max Clust. (L=200) ↑,Max TM (L=200) ↓,ppl (L=300) ↓,pLDDT (L=300) ↑,pairwise TM (L=300) ↓,Max Clust. (L=300) ↑,Max TM (L=300) ↓,ppl (L=500) ↓,pLDDT (L=500) ↑,pairwise TM (L=500) ↓,Max Clust. (L=500) ↑,Max TM (L=500) ↓
2
- Native Seqs,-,68.46,0.55,0.75,-,-,61.91,0.49,0.78,-,-,61.49,0.51,0.85,-,-,62.95,0.51,0.78,-
3
  Progen 2 (700M),8.28,64.00,0.42,0.94,0.64,5.68,69.91,0.40,0.91,0.69,6.25,65.69,0.42,0.93,0.66,4.27,61.45,0.32,0.95,0.68
4
  EvoDiff,16.89,50.20,0.43,0.98,0.69,17.28,50.66,0.36,1.00,0.71,17.13,45.14,0.31,1.00,0.68,16.51,43.14,0.31,1.00,0.69
5
  DPLM (650M),6.21,85.38,0.50,0.80,0.74,4.61,93.54,0.54,0.70,0.91,3.47,93.07,0.57,0.63,0.91,3.33,87.73,0.43,0.85,0.85
 
1
  Model,ppl (L=100) ↓,pLDDT (L=100) ↑,pairwise TM (L=100) ↓,Max Clust. (L=100) ↑,Max TM (L=100) ↓,ppl (L=200) ↓,pLDDT (L=200) ↑,pairwise TM (L=200) ↓,Max Clust. (L=200) ↑,Max TM (L=200) ↓,ppl (L=300) ↓,pLDDT (L=300) ↑,pairwise TM (L=300) ↓,Max Clust. (L=300) ↑,Max TM (L=300) ↓,ppl (L=500) ↓,pLDDT (L=500) ↑,pairwise TM (L=500) ↓,Max Clust. (L=500) ↑,Max TM (L=500) ↓
2
+ Native Seqs,NaN,68.46,0.55,0.75,NaN,NaN,61.91,0.49,0.78,NaN,NaN,61.49,0.51,0.85,NaN,NaN,62.95,0.51,0.78,NaN
3
  Progen 2 (700M),8.28,64.00,0.42,0.94,0.64,5.68,69.91,0.40,0.91,0.69,6.25,65.69,0.42,0.93,0.66,4.27,61.45,0.32,0.95,0.68
4
  EvoDiff,16.89,50.20,0.43,0.98,0.69,17.28,50.66,0.36,1.00,0.71,17.13,45.14,0.31,1.00,0.68,16.51,43.14,0.31,1.00,0.69
5
  DPLM (650M),6.21,85.38,0.50,0.80,0.74,4.61,93.54,0.54,0.70,0.91,3.47,93.07,0.57,0.63,0.91,3.33,87.73,0.43,0.85,0.85
data/structure_design.csv CHANGED
@@ -1,5 +1,5 @@
1
  Model,scTM (L=50) ↑,scRMSD (L=50) ↓,Max TM (L=50) ↓,pairwise TM (L=50) ↓,Max Clust. (L=50) ↑,scTM (L=100) ↑,scRMSD (L=100) ↓,Max TM (L=100) ↓,pairwise TM (L=100) ↓,Max Clust. (L=100) ↑,scTM (L=300) ↑,scRMSD (L=300) ↓,Max TM (L=300) ↓,pairwise TM (L=300) ↓,Max Clust. (L=300) ↑,scTM (L=500) ↑,scRMSD (L=500) ↓,Max TM (L=500) ↓,pairwise TM (L=500) ↓,Max Clust. (L=500) ↑
2
- Native PDBs,0.91,0.74,-,0.29,0.66,0.96,0.67,-,0.30,0.77,0.97,0.82,-,0.28,0.77,0.97,1.07,-,0.29,0.80
3
  RFdiffusion,0.95,0.45,0.65,0.58,0.67,0.98,0.48,0.76,0.41,0.32,0.96,1.03,0.64,0.36,0.65,0.79,5.60,0.62,0.33,0.89
4
  FrameFlow,0.91,0.58,0.75,0.68,0.39,0.94,0.70,0.72,0.55,0.49,0.92,1.95,0.65,0.43,0.88,0.61,7.92,0.61,0.40,0.92
5
  Chroma,0.85,1.05,0.59,0.29,0.48,0.89,1.27,0.70,0.35,0.59,0.87,2.47,0.66,0.36,0.67,0.72,6.71,0.60,0.29,0.99
 
1
  Model,scTM (L=50) ↑,scRMSD (L=50) ↓,Max TM (L=50) ↓,pairwise TM (L=50) ↓,Max Clust. (L=50) ↑,scTM (L=100) ↑,scRMSD (L=100) ↓,Max TM (L=100) ↓,pairwise TM (L=100) ↓,Max Clust. (L=100) ↑,scTM (L=300) ↑,scRMSD (L=300) ↓,Max TM (L=300) ↓,pairwise TM (L=300) ↓,Max Clust. (L=300) ↑,scTM (L=500) ↑,scRMSD (L=500) ↓,Max TM (L=500) ↓,pairwise TM (L=500) ↓,Max Clust. (L=500) ↑
2
+ Native PDBs,0.91,0.74,NaN,0.29,0.66,0.96,0.67,NaN,0.30,0.77,0.97,0.82,NaN,0.28,0.77,0.97,1.07,NaN,0.29,0.80
3
  RFdiffusion,0.95,0.45,0.65,0.58,0.67,0.98,0.48,0.76,0.41,0.32,0.96,1.03,0.64,0.36,0.65,0.79,5.60,0.62,0.33,0.89
4
  FrameFlow,0.91,0.58,0.75,0.68,0.39,0.94,0.70,0.72,0.55,0.49,0.92,1.95,0.65,0.43,0.88,0.61,7.92,0.61,0.40,0.92
5
  Chroma,0.85,1.05,0.59,0.29,0.48,0.89,1.27,0.70,0.35,0.59,0.87,2.47,0.66,0.36,0.67,0.72,6.71,0.60,0.29,0.99