zhiyuw committed on
Commit
ae5f882
·
verified ·
1 Parent(s): 36710de

Initial release: trained PLASMA heads (21 task x backbone variants) + model card

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. README.md +184 -0
  3. assets/visual_abstract.png +3 -0
  4. weights/active_site/ProstT5/config.json +11 -0
  5. weights/active_site/ProstT5/metadata.json +33 -0
  6. weights/active_site/ProstT5/model.safetensors +3 -0
  7. weights/active_site/ProtSSN/config.json +11 -0
  8. weights/active_site/ProtSSN/metadata.json +33 -0
  9. weights/active_site/ProtSSN/model.safetensors +3 -0
  10. weights/active_site/TM-Vec/config.json +11 -0
  11. weights/active_site/TM-Vec/metadata.json +33 -0
  12. weights/active_site/TM-Vec/model.safetensors +3 -0
  13. weights/active_site/ankh-base/config.json +11 -0
  14. weights/active_site/ankh-base/metadata.json +33 -0
  15. weights/active_site/ankh-base/model.safetensors +3 -0
  16. weights/active_site/esm2_t33_650M_UR50D/config.json +11 -0
  17. weights/active_site/esm2_t33_650M_UR50D/metadata.json +33 -0
  18. weights/active_site/esm2_t33_650M_UR50D/model.safetensors +3 -0
  19. weights/active_site/prot_bert/config.json +11 -0
  20. weights/active_site/prot_bert/metadata.json +33 -0
  21. weights/active_site/prot_bert/model.safetensors +3 -0
  22. weights/active_site/prot_t5_xl_half_uniref50-enc/config.json +11 -0
  23. weights/active_site/prot_t5_xl_half_uniref50-enc/metadata.json +33 -0
  24. weights/active_site/prot_t5_xl_half_uniref50-enc/model.safetensors +3 -0
  25. weights/binding_site/ProstT5/config.json +11 -0
  26. weights/binding_site/ProstT5/metadata.json +33 -0
  27. weights/binding_site/ProstT5/model.safetensors +3 -0
  28. weights/binding_site/ProtSSN/config.json +11 -0
  29. weights/binding_site/ProtSSN/metadata.json +33 -0
  30. weights/binding_site/ProtSSN/model.safetensors +3 -0
  31. weights/binding_site/TM-Vec/config.json +11 -0
  32. weights/binding_site/TM-Vec/metadata.json +33 -0
  33. weights/binding_site/TM-Vec/model.safetensors +3 -0
  34. weights/binding_site/ankh-base/config.json +11 -0
  35. weights/binding_site/ankh-base/metadata.json +33 -0
  36. weights/binding_site/ankh-base/model.safetensors +3 -0
  37. weights/binding_site/esm2_t33_650M_UR50D/config.json +11 -0
  38. weights/binding_site/esm2_t33_650M_UR50D/metadata.json +33 -0
  39. weights/binding_site/esm2_t33_650M_UR50D/model.safetensors +3 -0
  40. weights/binding_site/prot_bert/config.json +11 -0
  41. weights/binding_site/prot_bert/metadata.json +33 -0
  42. weights/binding_site/prot_bert/model.safetensors +3 -0
  43. weights/binding_site/prot_t5_xl_half_uniref50-enc/config.json +11 -0
  44. weights/binding_site/prot_t5_xl_half_uniref50-enc/metadata.json +33 -0
  45. weights/binding_site/prot_t5_xl_half_uniref50-enc/model.safetensors +3 -0
  46. weights/motif/ProstT5/config.json +11 -0
  47. weights/motif/ProstT5/metadata.json +33 -0
  48. weights/motif/ProstT5/model.safetensors +3 -0
  49. weights/motif/ProtSSN/config.json +11 -0
  50. weights/motif/ProtSSN/metadata.json +33 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ assets/visual_abstract.png filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,184 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: mit
3
+ library_name: plasma-protein-local-alignment
4
+ pipeline_tag: feature-extraction
5
+ tags:
6
+ - protein
7
+ - protein-language-model
8
+ - alignment
9
+ - optimal-transport
10
+ - sinkhorn
11
+ - bioinformatics
12
+ - biology
13
+ ---
14
+
15
+ # PLASMA: Pluggable Local Alignment via Sinkhorn MAtrix
16
+
17
+ [![arXiv](https://img.shields.io/badge/arXiv-2510.11752-b31b1b.svg)](https://arxiv.org/abs/2510.11752)
18
+ [![ICLR 2026](https://img.shields.io/badge/ICLR-2026-blue.svg)](https://arxiv.org/abs/2510.11752)
19
+ [![GitHub stars](https://img.shields.io/github/stars/ZW471/PLASMA-Protein-Local-Alignment?style=social)](https://github.com/ZW471/PLASMA-Protein-Local-Alignment)
20
+
21
+ ![Visual abstract](assets/visual_abstract.png)
22
+
23
+ **PLASMA** is a tiny, pluggable head that turns any frozen protein-language-model
24
+ (PLM) into a residue-level *local* aligner. It reformulates protein substructure
25
+ alignment as a regularised optimal transport problem and runs ~50× faster than
26
+ structure-based aligners (TM-Align, Foldseek) by operating on pre-computed
27
+ embeddings.
28
+
29
+ This repository hosts the trained **PLASMA** heads for every (task, backbone)
30
+ combination from the paper, plus instructions for the parameter-free
31
+ **PLASMA-PF** baseline (which has no learned weights). PLASMA was published at
32
+ **ICLR 2026**.
33
+
34
+ - **Paper:** <https://arxiv.org/abs/2510.11752> (ICLR 2026)
35
+ - **Code:** <https://github.com/ZW471/PLASMA-Protein-Local-Alignment>
36
+ - **License:** MIT
37
+
38
+ ## What's in this repo
39
+
40
+ Each variant lives in its own subfolder and is loaded by the `load_plasma`
41
+ helper from the GitHub package:
42
+
43
+ ```
44
+ weights/
45
+   active_site/
46
+     prot_bert/ # config.json + model.safetensors + metadata.json
47
+     ankh-base/
48
+     TM-Vec/
49
+     ProstT5/
50
+     prot_t5_xl_half_uniref50-enc/
51
+     esm2_t33_650M_UR50D/
52
+     ProtSSN/
53
+   binding_site/
54
+     ...
55
+   motif/
56
+     ...
57
+ ```
58
+
59
+ All heads share the same architecture: a small `LRL` non-linearity
60
+ (`LazyLinear → ReLU → Linear → LayerNorm`, hidden dim 512) followed by a
61
+ parameter-free Sinkhorn iteration (`temperature=0.1`, `n_iters=20`). The
62
+ checkpoint files are ~2.6–3.7 MB each, depending on the backbone.
63
+
64
+ ## Quickstart
65
+
66
+ Install the PLASMA package from source (the model class is shipped with the
67
+ GitHub repo):
68
+
69
+ ```bash
70
+ git clone https://github.com/ZW471/PLASMA-Protein-Local-Alignment
71
+ cd PLASMA-Protein-Local-Alignment
72
+ uv sync
73
+ ```
74
+
75
+ Then load any trained head with the high-level helper:
76
+
77
+ ```python
78
+ import torch
79
+ from alignment import load_plasma
80
+
81
+ model = load_plasma(task="active_site", backbone="prot_bert")
82
+ model.eval()
83
+
84
+ # Feed pre-computed AA-level embeddings from the matching backbone.
85
+ # H_q / H_c are residue-level embeddings; batch_q / batch_c assign each
86
+ # residue to a sample (use zeros if you only have one pair).
87
+ H_q = torch.randn(120, 1024) # query: 120 residues, ProtBERT dim
88
+ H_c = torch.randn(180, 1024) # candidate: 180 residues
89
+ batch_q = torch.zeros(120, dtype=torch.long)
90
+ batch_c = torch.zeros(180, dtype=torch.long)
91
+
92
+ with torch.no_grad():
93
+     alignment_matrix = model(H_q, H_c, batch_q, batch_c) # (120, 180)
94
+ ```
95
+
96
+ The output is a doubly-stochastic transport plan describing the residue-level
97
+ correspondence between the two substructures. To reduce it to a similarity
98
+ score, reuse `utils.alignment_score` from the GitHub repo (it applies the
99
+ diagonal convolution + threshold described in the paper).
100
+
101
+ ## PLASMA-PF (parameter-free)
102
+
103
+ PLASMA-PF is a hinge / Sinkhorn baseline with **no learned weights**. There is
104
+ nothing to download — just build it with the `load_plasma_pf` helper, which instantiates the same `Alignment` class:
105
+
106
+ ```python
107
+ from alignment import load_plasma_pf
108
+
109
+ model = load_plasma_pf() # Alignment(eta='hinge', omega='sinkhorn', ...)
110
+ ```
111
+
112
+ It accepts the same forward signature as the trained heads above.
113
+
114
+ ## Available variants & evaluation results
115
+
116
+ Numbers below are 3-seed averages (mean ± std) reported in the paper. The seven
117
+ backbone columns correspond to the seven subfolders under each task.
118
+
119
+ ### Interpolation (in-distribution test split)
120
+
121
+ | Task | Metric | Ankh | ESM-2 | ProstT5 | ProtBERT | ProtSSN | ProtT5 | TM-Vec |
122
+ | --- | --- | ---: | ---: | ---: | ---: | ---: | ---: | ---: |
123
+ | **Motif** | ROC-AUC | .925 ± .002 | .933 ± .005 | .954 ± .002 | .854 ± .003 | .922 ± .002 | **.972 ± .001** | .910 ± .003 |
124
+ | | F1-Max | .885 ± .002 | .877 ± .005 | .885 ± .003 | .784 ± .002 | .866 ± .002 | **.918 ± .003** | .853 ± .003 |
125
+ | | PR-AUC | .921 ± .002 | .931 ± .004 | .953 ± .003 | .872 ± .003 | .920 ± .002 | **.971 ± .002** | .914 ± .003 |
126
+ | | Label Match Score | .921 ± .004 | .890 ± .008 | .929 ± .001 | .746 ± .007 | .767 ± .008 | **.937 ± .001** | .792 ± .008 |
127
+ | **Binding Site** | ROC-AUC | **.995 ± .000** | .992 ± .000 | .993 ± .001 | .981 ± .001 | .992 ± .001 | .993 ± .000 | .980 ± .001 |
128
+ | | F1-Max | .987 ± .001 | .986 ± .001 | .983 ± .001 | .948 ± .002 | .982 ± .001 | **.988 ± .001** | .970 ± .001 |
129
+ | | PR-AUC | **.996 ± .001** | .994 ± .001 | .995 ± .001 | .985 ± .001 | .993 ± .001 | .995 ± .000 | .984 ± .001 |
130
+ | | Label Match Score | **.951 ± .002** | .950 ± .002 | **.951 ± .002** | .880 ± .008 | .872 ± .005 | **.951 ± .001** | .900 ± .004 |
131
+ | **Active Site** | ROC-AUC | **.994 ± .001** | .991 ± .001 | .993 ± .001 | .986 ± .001 | .992 ± .001 | **.994 ± .001** | .991 ± .001 |
132
+ | | F1-Max | **.989 ± .001** | .985 ± .001 | .987 ± .001 | .967 ± .001 | .987 ± .001 | .987 ± .001 | .982 ± .001 |
133
+ | | PR-AUC | **.994 ± .001** | .992 ± .001 | **.994 ± .001** | .988 ± .001 | **.994 ± .001** | **.994 ± .001** | .992 ± .001 |
134
+ | | Label Match Score | **.975 ± .001** | .969 ± .002 | **.975 ± .001** | .904 ± .003 | .885 ± .013 | .972 ± .001 | .938 ± .001 |
135
+
136
+ ### Extrapolation (held-out hard test split)
137
+
138
+ | Task | Metric | Ankh | ESM-2 | ProstT5 | ProtBERT | ProtSSN | ProtT5 | TM-Vec |
139
+ | --- | --- | ---: | ---: | ---: | ---: | ---: | ---: | ---: |
140
+ | **Motif** | ROC-AUC | .960 ± .011 | .972 ± .010 | **.975 ± .009** | .870 ± .030 | .949 ± .013 | .968 ± .012 | .954 ± .013 |
141
+ | | F1-Max | .915 ± .021 | **.931 ± .016** | .926 ± .020 | .799 ± .039 | .896 ± .023 | .922 ± .023 | .903 ± .026 |
142
+ | | PR-AUC | .948 ± .020 | **.970 ± .010** | .969 ± .016 | .873 ± .036 | .940 ± .020 | .962 ± .018 | .944 ± .022 |
143
+ | | Label Match Score | **.842 ± .025** | .786 ± .032 | .801 ± .022 | .541 ± .060 | .537 ± .025 | .738 ± .028 | .704 ± .020 |
144
+ | **Binding Site** | ROC-AUC | .995 ± .005 | **.999 ± .001** | .993 ± .005 | .951 ± .014 | **.999 ± .001** | **.999 ± .001** | .990 ± .008 |
145
+ | | F1-Max | .992 ± .005 | .991 ± .005 | .985 ± .009 | .896 ± .019 | .988 ± .006 | **.996 ± .003** | .983 ± .011 |
146
+ | | PR-AUC | .997 ± .003 | **.999 ± .001** | .995 ± .003 | .958 ± .012 | .998 ± .001 | **.999 ± .000** | .992 ± .006 |
147
+ | | Label Match Score | .894 ± .026 | .851 ± .031 | .891 ± .029 | .603 ± .041 | .753 ± .041 | **.902 ± .019** | .824 ± .031 |
148
+ | **Active Site** | ROC-AUC | .995 ± .002 | .996 ± .003 | .996 ± .003 | .980 ± .004 | .997 ± .001 | **.999 ± .000** | .995 ± .002 |
149
+ | | F1-Max | **.992 ± .002** | .986 ± .004 | .991 ± .004 | .950 ± .005 | .991 ± .003 | .991 ± .002 | .985 ± .003 |
150
+ | | PR-AUC | .995 ± .003 | .997 ± .002 | .997 ± .002 | .984 ± .003 | .998 ± .001 | **.999 ± .000** | .996 ± .002 |
151
+ | | Label Match Score | **.938 ± .014** | .882 ± .027 | .931 ± .026 | .697 ± .019 | .737 ± .011 | .893 ± .017 | .880 ± .023 |
152
+
153
+ Each subfolder also contains a `metadata.json` with the full hyperparameter
154
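+ config and that checkpoint's own `test_frequent` / `test_hard` metrics in machine-readable form (single-checkpoint values, so they can differ from the averaged numbers above).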
155
+
156
+ ## Training details
157
+
158
+ - **Architecture:** `Alignment(eta='lrl', omega='sinkhorn',
159
+ eta_kwargs={'hidden_dim': 512},
160
+ omega_kwargs={'temperature': 0.1, 'n_iters': 20})`.
161
+ - **Score head:** `K=10`, `threshold=0.5` (used by
162
+ `utils.alignment_score` to reduce the transport plan to a scalar).
163
+ - **Optimiser / loss:** Adam (`lr=1e-4`), `BCEWithLogitsLoss` on the alignment
164
+ score plus a label-match auxiliary loss (`target_loss_weight=1.0`).
165
+ - **Data:** the InterPro-derived motif / binding-site / active-site datasets
166
+ shipped under `data/raw/` in the GitHub repo, split into train / validation /
167
+ test / test-hard with `dataset_fraction=0.1` (default sweep) and
168
+ `dataset_fraction=1.0` (full sweep — checkpoints here are from the full
169
+ sweep).
170
+ - **Selection metric:** validation loss (early stopping, `patience=3`).
171
+
172
+ ## Citation
173
+
174
+ If you use these weights, please cite the PLASMA paper:
175
+
176
+ ```bibtex
177
+ @inproceedings{wang2026plasma,
178
+ title = {Fast and Interpretable Protein Substructure Alignment via Optimal Transport},
179
+ author = {Wang, Zhiyu and Zhou, Bingxin and Wang, Jing and Tan, Yang and Zhao, Weishu and Li{\`o}, Pietro and Hong, Liang},
180
+ booktitle = {International Conference on Learning Representations (ICLR)},
181
+ year = {2026},
182
+ url = {https://arxiv.org/abs/2510.11752},
183
+ }
184
+ ```
assets/visual_abstract.png ADDED

Git LFS Details

  • SHA256: a7b646e74de96e8c7126554fa52a2dcabc1c0e0a54fd95723c71f5a548023139
  • Pointer size: 132 Bytes
  • Size of remote file: 1.06 MB
weights/active_site/ProstT5/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eta": "lrl",
3
+ "eta_kwargs": {
4
+ "hidden_dim": 512
5
+ },
6
+ "omega": "sinkhorn",
7
+ "omega_kwargs": {
8
+ "n_iters": 20,
9
+ "temperature": 0.1
10
+ }
11
+ }
weights/active_site/ProstT5/metadata.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task": "active_site",
3
+ "backbone": "ProstT5",
4
+ "split": 0,
5
+ "eta_config": {
6
+ "type": "lrl",
7
+ "hidden_dim": 512
8
+ },
9
+ "omega_config": {
10
+ "type": "sinkhorn",
11
+ "temperature": 0.1,
12
+ "n_iters": 20
13
+ },
14
+ "score_config": {
15
+ "K": 10,
16
+ "threshold": 0.5
17
+ },
18
+ "metrics": {
19
+ "test_frequent": {
20
+ "rocauc": 0.992344856262207,
21
+ "f1_max": 0.9862671660424469,
22
+ "pr_auc": 0.9944091439247131,
23
+ "label_match_score": 0.9720931127164464
24
+ },
25
+ "test_hard": {
26
+ "rocauc": 0.9999887347221375,
27
+ "f1_max": 0.9987496874218554,
28
+ "pr_auc": 0.9999887943267822,
29
+ "label_match_score": 0.9361866737141609
30
+ }
31
+ },
32
+ "source_checkpoint": "sweeps/train/all/active_site/ProstT5/27/active_site_split0_best.pt"
33
+ }
weights/active_site/ProstT5/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e65cdc9a5beb16a5f25be6f4dbb788481d16acece4a83056ed59827bb21a938c
3
+ size 3154416
weights/active_site/ProtSSN/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eta": "lrl",
3
+ "eta_kwargs": {
4
+ "hidden_dim": 512
5
+ },
6
+ "omega": "sinkhorn",
7
+ "omega_kwargs": {
8
+ "n_iters": 20,
9
+ "temperature": 0.1
10
+ }
11
+ }
weights/active_site/ProtSSN/metadata.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task": "active_site",
3
+ "backbone": "ProtSSN",
4
+ "split": 0,
5
+ "eta_config": {
6
+ "type": "lrl",
7
+ "hidden_dim": 512
8
+ },
9
+ "omega_config": {
10
+ "type": "sinkhorn",
11
+ "temperature": 0.1,
12
+ "n_iters": 20
13
+ },
14
+ "score_config": {
15
+ "K": 10,
16
+ "threshold": 0.5
17
+ },
18
+ "metrics": {
19
+ "test_frequent": {
20
+ "rocauc": 0.9907435178756714,
21
+ "f1_max": 0.9846695149535059,
22
+ "pr_auc": 0.9934981465339661,
23
+ "label_match_score": 0.8660282360271119
24
+ },
25
+ "test_hard": {
26
+ "rocauc": 0.9999032616615295,
27
+ "f1_max": 0.9965,
28
+ "pr_auc": 0.9999053478240967,
29
+ "label_match_score": 0.7096276976610534
30
+ }
31
+ },
32
+ "source_checkpoint": "sweeps/train/all/active_site/ProtSSN/54/active_site_split0_best.pt"
33
+ }
weights/active_site/ProtSSN/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21388d6626e4faa3bc260f1f6439cd66dbc03710052aff49b2111e62a1444bdb
3
+ size 3678704
weights/active_site/TM-Vec/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eta": "lrl",
3
+ "eta_kwargs": {
4
+ "hidden_dim": 512
5
+ },
6
+ "omega": "sinkhorn",
7
+ "omega_kwargs": {
8
+ "n_iters": 20,
9
+ "temperature": 0.1
10
+ }
11
+ }
weights/active_site/TM-Vec/metadata.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task": "active_site",
3
+ "backbone": "TM-Vec",
4
+ "split": 0,
5
+ "eta_config": {
6
+ "type": "lrl",
7
+ "hidden_dim": 512
8
+ },
9
+ "omega_config": {
10
+ "type": "sinkhorn",
11
+ "temperature": 0.1,
12
+ "n_iters": 20
13
+ },
14
+ "score_config": {
15
+ "K": 10,
16
+ "threshold": 0.5
17
+ },
18
+ "metrics": {
19
+ "test_frequent": {
20
+ "rocauc": 0.9918658137321472,
21
+ "f1_max": 0.9819729594391587,
22
+ "pr_auc": 0.9937556982040405,
23
+ "label_match_score": 0.9401966694747831
24
+ },
25
+ "test_hard": {
26
+ "rocauc": 0.9987612366676331,
27
+ "f1_max": 0.9860865165696939,
28
+ "pr_auc": 0.9988466501235962,
29
+ "label_match_score": 0.854244963310197
30
+ }
31
+ },
32
+ "source_checkpoint": "sweeps/train/all/active_site/TM-Vec/18/active_site_split0_best.pt"
33
+ }
weights/active_site/TM-Vec/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dc025d05e15cd99328dfd341064756f01efa5ff8aa331e7622bf3657e9e4c6d
3
+ size 3154416
weights/active_site/ankh-base/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eta": "lrl",
3
+ "eta_kwargs": {
4
+ "hidden_dim": 512
5
+ },
6
+ "omega": "sinkhorn",
7
+ "omega_kwargs": {
8
+ "n_iters": 20,
9
+ "temperature": 0.1
10
+ }
11
+ }
weights/active_site/ankh-base/metadata.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task": "active_site",
3
+ "backbone": "ankh-base",
4
+ "split": 0,
5
+ "eta_config": {
6
+ "type": "lrl",
7
+ "hidden_dim": 512
8
+ },
9
+ "omega_config": {
10
+ "type": "sinkhorn",
11
+ "temperature": 0.1,
12
+ "n_iters": 20
13
+ },
14
+ "score_config": {
15
+ "K": 10,
16
+ "threshold": 0.5
17
+ },
18
+ "metrics": {
19
+ "test_frequent": {
20
+ "rocauc": 0.9938057661056519,
21
+ "f1_max": 0.9892041174993723,
22
+ "pr_auc": 0.9950824975967407,
23
+ "label_match_score": 0.9734372955750135
24
+ },
25
+ "test_hard": {
26
+ "rocauc": 0.9999867081642151,
27
+ "f1_max": 0.9987503124218945,
28
+ "pr_auc": 0.9999868869781494,
29
+ "label_match_score": 0.9452198707803406
30
+ }
31
+ },
32
+ "source_checkpoint": "sweeps/train/all/active_site/ankh-base/9/active_site_split0_best.pt"
33
+ }
weights/active_site/ankh-base/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acf83dac2b7ed05b521bb659492aa192914222424f96107cd64a6f3a467cd182
3
+ size 2630128
weights/active_site/esm2_t33_650M_UR50D/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eta": "lrl",
3
+ "eta_kwargs": {
4
+ "hidden_dim": 512
5
+ },
6
+ "omega": "sinkhorn",
7
+ "omega_kwargs": {
8
+ "n_iters": 20,
9
+ "temperature": 0.1
10
+ }
11
+ }
weights/active_site/esm2_t33_650M_UR50D/metadata.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task": "active_site",
3
+ "backbone": "esm2_t33_650M_UR50D",
4
+ "split": 0,
5
+ "eta_config": {
6
+ "type": "lrl",
7
+ "hidden_dim": 512
8
+ },
9
+ "omega_config": {
10
+ "type": "sinkhorn",
11
+ "temperature": 0.1,
12
+ "n_iters": 20
13
+ },
14
+ "score_config": {
15
+ "K": 10,
16
+ "threshold": 0.5
17
+ },
18
+ "metrics": {
19
+ "test_frequent": {
20
+ "rocauc": 0.9898462891578674,
21
+ "f1_max": 0.985478217325989,
22
+ "pr_auc": 0.9927905797958374,
23
+ "label_match_score": 0.966968783440344
24
+ },
25
+ "test_hard": {
26
+ "rocauc": 0.9998506903648376,
27
+ "f1_max": 0.9959939909864797,
28
+ "pr_auc": 0.9998576045036316,
29
+ "label_match_score": 0.8552783124974398
30
+ }
31
+ },
32
+ "source_checkpoint": "sweeps/train/all/active_site/esm2_t33_650M_UR50D/45/active_site_split0_best.pt"
33
+ }
weights/active_site/esm2_t33_650M_UR50D/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:543c89f2bcd6b30fbadc7acdbfef207ef285f73aa90ef48bff4db6b4b871b5f0
3
+ size 3678704
weights/active_site/prot_bert/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eta": "lrl",
3
+ "eta_kwargs": {
4
+ "hidden_dim": 512
5
+ },
6
+ "omega": "sinkhorn",
7
+ "omega_kwargs": {
8
+ "n_iters": 20,
9
+ "temperature": 0.1
10
+ }
11
+ }
weights/active_site/prot_bert/metadata.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task": "active_site",
3
+ "backbone": "prot_bert",
4
+ "split": 0,
5
+ "eta_config": {
6
+ "type": "lrl",
7
+ "hidden_dim": 512
8
+ },
9
+ "omega_config": {
10
+ "type": "sinkhorn",
11
+ "temperature": 0.1,
12
+ "n_iters": 20
13
+ },
14
+ "score_config": {
15
+ "K": 10,
16
+ "threshold": 0.5
17
+ },
18
+ "metrics": {
19
+ "test_frequent": {
20
+ "rocauc": 0.9855157732963562,
21
+ "f1_max": 0.9628886659979939,
22
+ "pr_auc": 0.9884096384048462,
23
+ "label_match_score": 0.910069686397606
24
+ },
25
+ "test_hard": {
26
+ "rocauc": 0.9875518083572388,
27
+ "f1_max": 0.9543965734441925,
28
+ "pr_auc": 0.9901764988899231,
29
+ "label_match_score": 0.6242303718695857
30
+ }
31
+ },
32
+ "source_checkpoint": "sweeps/train/all/active_site/prot_bert/0/active_site_split0_best.pt"
33
+ }
weights/active_site/prot_bert/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6192f5a73807ff7721cfda218a7d8e88b56772cd4476868ed9781e73305c343
3
+ size 3154416
weights/active_site/prot_t5_xl_half_uniref50-enc/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eta": "lrl",
3
+ "eta_kwargs": {
4
+ "hidden_dim": 512
5
+ },
6
+ "omega": "sinkhorn",
7
+ "omega_kwargs": {
8
+ "n_iters": 20,
9
+ "temperature": 0.1
10
+ }
11
+ }
weights/active_site/prot_t5_xl_half_uniref50-enc/metadata.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task": "active_site",
3
+ "backbone": "prot_t5_xl_half_uniref50-enc",
4
+ "split": 0,
5
+ "eta_config": {
6
+ "type": "lrl",
7
+ "hidden_dim": 512
8
+ },
9
+ "omega_config": {
10
+ "type": "sinkhorn",
11
+ "temperature": 0.1,
12
+ "n_iters": 20
13
+ },
14
+ "score_config": {
15
+ "K": 10,
16
+ "threshold": 0.5
17
+ },
18
+ "metrics": {
19
+ "test_frequent": {
20
+ "rocauc": 0.9920676946640015,
21
+ "f1_max": 0.984769038701623,
22
+ "pr_auc": 0.9936845302581787,
23
+ "label_match_score": 0.9688430294838205
24
+ },
25
+ "test_hard": {
26
+ "rocauc": 0.9998884797096252,
27
+ "f1_max": 0.9960059910134798,
28
+ "pr_auc": 0.999886691570282,
29
+ "label_match_score": 0.8415421822864932
30
+ }
31
+ },
32
+ "source_checkpoint": "sweeps/train/all/active_site/prot_t5_xl_half_uniref50-enc/36/active_site_split0_best.pt"
33
+ }
weights/active_site/prot_t5_xl_half_uniref50-enc/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4f629be09a89aee0e13bea4d420878e017e68415b386e70eb25114b2ed70d72
3
+ size 3154416
weights/binding_site/ProstT5/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eta": "lrl",
3
+ "eta_kwargs": {
4
+ "hidden_dim": 512
5
+ },
6
+ "omega": "sinkhorn",
7
+ "omega_kwargs": {
8
+ "n_iters": 20,
9
+ "temperature": 0.1
10
+ }
11
+ }
weights/binding_site/ProstT5/metadata.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task": "binding_site",
3
+ "backbone": "ProstT5",
4
+ "split": 0,
5
+ "eta_config": {
6
+ "type": "lrl",
7
+ "hidden_dim": 512
8
+ },
9
+ "omega_config": {
10
+ "type": "sinkhorn",
11
+ "temperature": 0.1,
12
+ "n_iters": 20
13
+ },
14
+ "score_config": {
15
+ "K": 10,
16
+ "threshold": 0.5
17
+ },
18
+ "metrics": {
19
+ "test_frequent": {
20
+ "rocauc": 0.9942386150360107,
21
+ "f1_max": 0.9826327712056381,
22
+ "pr_auc": 0.9957546591758728,
23
+ "label_match_score": 0.9467616829861532
24
+ },
25
+ "test_hard": {
26
+ "rocauc": 0.9979713559150696,
27
+ "f1_max": 0.9945945945945946,
28
+ "pr_auc": 0.9983985424041748,
29
+ "label_match_score": 0.9251244336550384
30
+ }
31
+ },
32
+ "source_checkpoint": "sweeps/train/all/binding_site/ProstT5/30/binding_site_split0_best.pt"
33
+ }
weights/binding_site/ProstT5/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0af354b1a2e012a204766eacbc66e708dc0978b23814d95e04dea87396f8724
3
+ size 3154416
weights/binding_site/ProtSSN/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eta": "lrl",
3
+ "eta_kwargs": {
4
+ "hidden_dim": 512
5
+ },
6
+ "omega": "sinkhorn",
7
+ "omega_kwargs": {
8
+ "n_iters": 20,
9
+ "temperature": 0.1
10
+ }
11
+ }
weights/binding_site/ProtSSN/metadata.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task": "binding_site",
3
+ "backbone": "ProtSSN",
4
+ "split": 0,
5
+ "eta_config": {
6
+ "type": "lrl",
7
+ "hidden_dim": 512
8
+ },
9
+ "omega_config": {
10
+ "type": "sinkhorn",
11
+ "temperature": 0.1,
12
+ "n_iters": 20
13
+ },
14
+ "score_config": {
15
+ "K": 10,
16
+ "threshold": 0.5
17
+ },
18
+ "metrics": {
19
+ "test_frequent": {
20
+ "rocauc": 0.9934399724006653,
21
+ "f1_max": 0.9803625377643505,
22
+ "pr_auc": 0.9950706362724304,
23
+ "label_match_score": 0.8582753864622367
24
+ },
25
+ "test_hard": {
26
+ "rocauc": 0.9999507665634155,
27
+ "f1_max": 0.9971223021582734,
28
+ "pr_auc": 0.9999310374259949,
29
+ "label_match_score": 0.785670741250131
30
+ }
31
+ },
32
+ "source_checkpoint": "sweeps/train/all/binding_site/ProtSSN/57/binding_site_split0_best.pt"
33
+ }
weights/binding_site/ProtSSN/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5600eb5599169bfbb0214c707e68a20e9377b1244f6e03d1a5b2a21f8879c9c1
3
+ size 3678704
weights/binding_site/TM-Vec/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eta": "lrl",
3
+ "eta_kwargs": {
4
+ "hidden_dim": 512
5
+ },
6
+ "omega": "sinkhorn",
7
+ "omega_kwargs": {
8
+ "n_iters": 20,
9
+ "temperature": 0.1
10
+ }
11
+ }
weights/binding_site/TM-Vec/metadata.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task": "binding_site",
3
+ "backbone": "TM-Vec",
4
+ "split": 0,
5
+ "eta_config": {
6
+ "type": "lrl",
7
+ "hidden_dim": 512
8
+ },
9
+ "omega_config": {
10
+ "type": "sinkhorn",
11
+ "temperature": 0.1,
12
+ "n_iters": 20
13
+ },
14
+ "score_config": {
15
+ "K": 10,
16
+ "threshold": 0.5
17
+ },
18
+ "metrics": {
19
+ "test_frequent": {
20
+ "rocauc": 0.9777182936668396,
21
+ "f1_max": 0.9658886894075404,
22
+ "pr_auc": 0.9825307726860046,
23
+ "label_match_score": 0.8937117450104289
24
+ },
25
+ "test_hard": {
26
+ "rocauc": 0.9969605207443237,
27
+ "f1_max": 0.9967567567567568,
28
+ "pr_auc": 0.997014045715332,
29
+ "label_match_score": 0.8630872951235824
30
+ }
31
+ },
32
+ "source_checkpoint": "sweeps/train/all/binding_site/TM-Vec/21/binding_site_split0_best.pt"
33
+ }
weights/binding_site/TM-Vec/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7c955e1c5e2b290f849037b2557a55ebcfc425b864e98a077646788c0bf0505
3
+ size 3154416
weights/binding_site/ankh-base/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eta": "lrl",
3
+ "eta_kwargs": {
4
+ "hidden_dim": 512
5
+ },
6
+ "omega": "sinkhorn",
7
+ "omega_kwargs": {
8
+ "n_iters": 20,
9
+ "temperature": 0.1
10
+ }
11
+ }
weights/binding_site/ankh-base/metadata.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task": "binding_site",
3
+ "backbone": "ankh-base",
4
+ "split": 0,
5
+ "eta_config": {
6
+ "type": "lrl",
7
+ "hidden_dim": 512
8
+ },
9
+ "omega_config": {
10
+ "type": "sinkhorn",
11
+ "temperature": 0.1,
12
+ "n_iters": 20
13
+ },
14
+ "score_config": {
15
+ "K": 10,
16
+ "threshold": 0.5
17
+ },
18
+ "metrics": {
19
+ "test_frequent": {
20
+ "rocauc": 0.9952087998390198,
21
+ "f1_max": 0.9896803423105965,
22
+ "pr_auc": 0.9964244365692139,
23
+ "label_match_score": 0.9444196989256388
24
+ },
25
+ "test_hard": {
26
+ "rocauc": 0.9999386072158813,
27
+ "f1_max": 0.9978432782171099,
28
+ "pr_auc": 0.9999148845672607,
29
+ "label_match_score": 0.938885366370608
30
+ }
31
+ },
32
+ "source_checkpoint": "sweeps/train/all/binding_site/ankh-base/12/binding_site_split0_best.pt"
33
+ }
weights/binding_site/ankh-base/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9eb81c0ada0185276791992bc1e66a558970a009b64e78ca7dbd664532a51d93
3
+ size 2630128
weights/binding_site/esm2_t33_650M_UR50D/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eta": "lrl",
3
+ "eta_kwargs": {
4
+ "hidden_dim": 512
5
+ },
6
+ "omega": "sinkhorn",
7
+ "omega_kwargs": {
8
+ "n_iters": 20,
9
+ "temperature": 0.1
10
+ }
11
+ }
weights/binding_site/esm2_t33_650M_UR50D/metadata.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task": "binding_site",
3
+ "backbone": "esm2_t33_650M_UR50D",
4
+ "split": 0,
5
+ "eta_config": {
6
+ "type": "lrl",
7
+ "hidden_dim": 512
8
+ },
9
+ "omega_config": {
10
+ "type": "sinkhorn",
11
+ "temperature": 0.1,
12
+ "n_iters": 20
13
+ },
14
+ "score_config": {
15
+ "K": 10,
16
+ "threshold": 0.5
17
+ },
18
+ "metrics": {
19
+ "test_frequent": {
20
+ "rocauc": 0.9934264421463013,
21
+ "f1_max": 0.9860865165696939,
22
+ "pr_auc": 0.9950663447380066,
23
+ "label_match_score": 0.949677944527228
24
+ },
25
+ "test_hard": {
26
+ "rocauc": 0.999835193157196,
27
+ "f1_max": 0.9935344827586207,
28
+ "pr_auc": 0.9997715950012207,
29
+ "label_match_score": 0.8993046989344214
30
+ }
31
+ },
32
+ "source_checkpoint": "sweeps/train/all/binding_site/esm2_t33_650M_UR50D/48/binding_site_split0_best.pt"
33
+ }
weights/binding_site/esm2_t33_650M_UR50D/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56f464b1d41e8922f75ae8e7a727a32cb7bcc086f95dec46d7f13213d61c014d
3
+ size 3678704
weights/binding_site/prot_bert/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eta": "lrl",
3
+ "eta_kwargs": {
4
+ "hidden_dim": 512
5
+ },
6
+ "omega": "sinkhorn",
7
+ "omega_kwargs": {
8
+ "n_iters": 20,
9
+ "temperature": 0.1
10
+ }
11
+ }
weights/binding_site/prot_bert/metadata.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task": "binding_site",
3
+ "backbone": "prot_bert",
4
+ "split": 0,
5
+ "eta_config": {
6
+ "type": "lrl",
7
+ "hidden_dim": 512
8
+ },
9
+ "omega_config": {
10
+ "type": "sinkhorn",
11
+ "temperature": 0.1,
12
+ "n_iters": 20
13
+ },
14
+ "score_config": {
15
+ "K": 10,
16
+ "threshold": 0.5
17
+ },
18
+ "metrics": {
19
+ "test_frequent": {
20
+ "rocauc": 0.9826457500457764,
21
+ "f1_max": 0.9522342064714946,
22
+ "pr_auc": 0.9867449402809143,
23
+ "label_match_score": 0.887023501667951
24
+ },
25
+ "test_hard": {
26
+ "rocauc": 0.9887794256210327,
27
+ "f1_max": 0.9510791366906475,
28
+ "pr_auc": 0.9874331951141357,
29
+ "label_match_score": 0.7587943521090054
30
+ }
31
+ },
32
+ "source_checkpoint": "sweeps/train/all/binding_site/prot_bert/3/binding_site_split0_best.pt"
33
+ }
weights/binding_site/prot_bert/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69692d6e35fd438bdcf63c710b130636da2e495f015568e8d38820d7d86e6c06
3
+ size 3154416
weights/binding_site/prot_t5_xl_half_uniref50-enc/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eta": "lrl",
3
+ "eta_kwargs": {
4
+ "hidden_dim": 512
5
+ },
6
+ "omega": "sinkhorn",
7
+ "omega_kwargs": {
8
+ "n_iters": 20,
9
+ "temperature": 0.1
10
+ }
11
+ }
weights/binding_site/prot_t5_xl_half_uniref50-enc/metadata.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task": "binding_site",
3
+ "backbone": "prot_t5_xl_half_uniref50-enc",
4
+ "split": 0,
5
+ "eta_config": {
6
+ "type": "lrl",
7
+ "hidden_dim": 512
8
+ },
9
+ "omega_config": {
10
+ "type": "sinkhorn",
11
+ "temperature": 0.1,
12
+ "n_iters": 20
13
+ },
14
+ "score_config": {
15
+ "K": 10,
16
+ "threshold": 0.5
17
+ },
18
+ "metrics": {
19
+ "test_frequent": {
20
+ "rocauc": 0.9949175715446472,
21
+ "f1_max": 0.991672975018925,
22
+ "pr_auc": 0.9963440895080566,
23
+ "label_match_score": 0.9517851873361006
24
+ },
25
+ "test_hard": {
26
+ "rocauc": 0.9999374151229858,
27
+ "f1_max": 0.9967590925459129,
28
+ "pr_auc": 0.9999114274978638,
29
+ "label_match_score": 0.8924064511657084
30
+ }
31
+ },
32
+ "source_checkpoint": "sweeps/train/all/binding_site/prot_t5_xl_half_uniref50-enc/39/binding_site_split0_best.pt"
33
+ }
weights/binding_site/prot_t5_xl_half_uniref50-enc/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70c7184ded2cb29cbfba1521c4fb651514231630d5db2875c441ef64f9fa80ac
3
+ size 3154416
weights/motif/ProstT5/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eta": "lrl",
3
+ "eta_kwargs": {
4
+ "hidden_dim": 512
5
+ },
6
+ "omega": "sinkhorn",
7
+ "omega_kwargs": {
8
+ "n_iters": 20,
9
+ "temperature": 0.1
10
+ }
11
+ }
weights/motif/ProstT5/metadata.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task": "motif",
3
+ "backbone": "ProstT5",
4
+ "split": 0,
5
+ "eta_config": {
6
+ "type": "lrl",
7
+ "hidden_dim": 512
8
+ },
9
+ "omega_config": {
10
+ "type": "sinkhorn",
11
+ "temperature": 0.1,
12
+ "n_iters": 20
13
+ },
14
+ "score_config": {
15
+ "K": 10,
16
+ "threshold": 0.5
17
+ },
18
+ "metrics": {
19
+ "test_frequent": {
20
+ "rocauc": 0.9485077261924744,
21
+ "f1_max": 0.8776619845944721,
22
+ "pr_auc": 0.9461915493011475,
23
+ "label_match_score": 0.9349878941312089
24
+ },
25
+ "test_hard": {
26
+ "rocauc": 0.9987444877624512,
27
+ "f1_max": 0.9784646567012921,
28
+ "pr_auc": 0.9987750053405762,
29
+ "label_match_score": 0.7881006840105947
30
+ }
31
+ },
32
+ "source_checkpoint": "sweeps/train/all/motif/ProstT5/33/motif_split0_best.pt"
33
+ }
weights/motif/ProstT5/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ff0edb123312a3832f686a28a1dc00996af04918c7bf83c333842a1bff11407
3
+ size 3154416
weights/motif/ProtSSN/config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eta": "lrl",
3
+ "eta_kwargs": {
4
+ "hidden_dim": 512
5
+ },
6
+ "omega": "sinkhorn",
7
+ "omega_kwargs": {
8
+ "n_iters": 20,
9
+ "temperature": 0.1
10
+ }
11
+ }
weights/motif/ProtSSN/metadata.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "task": "motif",
3
+ "backbone": "ProtSSN",
4
+ "split": 0,
5
+ "eta_config": {
6
+ "type": "lrl",
7
+ "hidden_dim": 512
8
+ },
9
+ "omega_config": {
10
+ "type": "sinkhorn",
11
+ "temperature": 0.1,
12
+ "n_iters": 20
13
+ },
14
+ "score_config": {
15
+ "K": 10,
16
+ "threshold": 0.5
17
+ },
18
+ "metrics": {
19
+ "test_frequent": {
20
+ "rocauc": 0.9163562655448914,
21
+ "f1_max": 0.8624229979466119,
22
+ "pr_auc": 0.913853108882904,
23
+ "label_match_score": 0.7653402222577776
24
+ },
25
+ "test_hard": {
26
+ "rocauc": 0.9953680038452148,
27
+ "f1_max": 0.9669315560112791,
28
+ "pr_auc": 0.9959331750869751,
29
+ "label_match_score": 0.5649718196333852
30
+ }
31
+ },
32
+ "source_checkpoint": "sweeps/train/all/motif/ProtSSN/60/motif_split0_best.pt"
33
+ }