Irwiny123 commited on
Commit
ef423c5
·
1 Parent(s): 4132f99

添加PepFlow模型初始代码

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitignore +180 -0
  2. LICENSE +21 -0
  3. README.md +106 -3
  4. configs/learn_angle.yaml +74 -0
  5. environment.yml +261 -0
  6. eval/align.py +17 -0
  7. eval/energy.py +94 -0
  8. eval/foldx.py +77 -0
  9. eval/geometry.py +127 -0
  10. eval/run_esmfold.py +73 -0
  11. eval/run_esmif.py +33 -0
  12. eval/run_mpnn.py +146 -0
  13. eval/run_rfdiffusion.py +75 -0
  14. eval/run_scwrl4.py +30 -0
  15. eval/utils.py +106 -0
  16. models_con/edge.py +112 -0
  17. models_con/flow_model.py +472 -0
  18. models_con/ga.py +127 -0
  19. models_con/inference.py +101 -0
  20. models_con/ipa_pytorch.py +687 -0
  21. models_con/node.py +105 -0
  22. models_con/pep_dataloader.py +212 -0
  23. models_con/sample.py +145 -0
  24. models_con/torsion.py +239 -0
  25. models_con/torus.py +34 -0
  26. models_con/utils.py +72 -0
  27. openfold/config.py +4 -0
  28. openfold/model/__init__.py +16 -0
  29. openfold/model/dropout.py +78 -0
  30. openfold/model/embedders.py +352 -0
  31. openfold/model/evoformer.py +630 -0
  32. openfold/model/heads.py +251 -0
  33. openfold/model/model.py +446 -0
  34. openfold/model/msa.py +392 -0
  35. openfold/model/outer_product_mean.py +129 -0
  36. openfold/model/pair_transition.py +99 -0
  37. openfold/model/primitives.py +587 -0
  38. openfold/model/structure_module.py +820 -0
  39. openfold/model/template.py +333 -0
  40. openfold/model/torchscript.py +215 -0
  41. openfold/model/triangular_attention.py +139 -0
  42. openfold/model/triangular_multiplicative_update.py +127 -0
  43. openfold/np/__init__.py +16 -0
  44. openfold/np/protein.py +438 -0
  45. openfold/np/relax/__init__.py +16 -0
  46. openfold/np/relax/amber_minimize.py +612 -0
  47. openfold/np/relax/cleanup.py +131 -0
  48. openfold/np/relax/relax.py +90 -0
  49. openfold/np/relax/utils.py +88 -0
  50. openfold/np/residue_constants.py +1310 -0
.gitignore ADDED
@@ -0,0 +1,180 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ logs/
2
+ lightning_logs/
3
+ wandb/
4
+ Data/
5
+ wandb*.json
6
+ **/*.ckpt
7
+ **/*.pth
8
+ **/*.json
9
+ .vscode/
10
+ **/*.pdb
11
+ ckpt/
12
+ *.code-workspace
13
+ outputs/
14
+ **/*.txt
15
+ **/lightning_logs/
16
+ **/inference_outputs/
17
+ .hydra
18
+ preprocessed/
19
+ misc/
20
+
21
+ # Byte-compiled / optimized / DLL files
22
+ __pycache__/
23
+ *.py[cod]
24
+ *$py.class
25
+
26
+ # C extensions
27
+ *.so
28
+
29
+ # Distribution / packaging
30
+ .Python
31
+ build/
32
+ develop-eggs/
33
+ dist/
34
+ downloads/
35
+ eggs/
36
+ .eggs/
37
+ lib/
38
+ lib64/
39
+ parts/
40
+ sdist/
41
+ var/
42
+ wheels/
43
+ share/python-wheels/
44
+ *.egg-info/
45
+ .installed.cfg
46
+ *.egg
47
+ MANIFEST
48
+
49
+ # PyInstaller
50
+ # Usually these files are written by a python script from a template
51
+ # before PyInstaller builds the exe, so as to inject date/other infos into it.
52
+ *.manifest
53
+ *.spec
54
+
55
+ # Installer logs
56
+ pip-log.txt
57
+ pip-delete-this-directory.txt
58
+
59
+ # Unit test / coverage reports
60
+ htmlcov/
61
+ .tox/
62
+ .nox/
63
+ .coverage
64
+ .coverage.*
65
+ .cache
66
+ nosetests.xml
67
+ coverage.xml
68
+ *.cover
69
+ *.py,cover
70
+ .hypothesis/
71
+ .pytest_cache/
72
+ cover/
73
+
74
+ # Translations
75
+ *.mo
76
+ *.pot
77
+
78
+ # Django stuff:
79
+ *.log
80
+ local_settings.py
81
+ db.sqlite3
82
+ db.sqlite3-journal
83
+
84
+ # Flask stuff:
85
+ instance/
86
+ .webassets-cache
87
+
88
+ # Scrapy stuff:
89
+ .scrapy
90
+
91
+ # Sphinx documentation
92
+ docs/_build/
93
+
94
+ # PyBuilder
95
+ .pybuilder/
96
+ target/
97
+
98
+ # Jupyter Notebook
99
+ .ipynb_checkpoints
100
+
101
+ # IPython
102
+ profile_default/
103
+ ipython_config.py
104
+
105
+ # pyenv
106
+ # For a library or package, you might want to ignore these files since the code is
107
+ # intended to run in multiple environments; otherwise, check them in:
108
+ # .python-version
109
+
110
+ # pipenv
111
+ # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
112
+ # However, in case of collaboration, if having platform-specific dependencies or dependencies
113
+ # having no cross-platform support, pipenv may install dependencies that don't work, or not
114
+ # install all needed dependencies.
115
+ #Pipfile.lock
116
+
117
+ # poetry
118
+ # Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
119
+ # This is especially recommended for binary packages to ensure reproducibility, and is more
120
+ # commonly ignored for libraries.
121
+ # https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
122
+ #poetry.lock
123
+
124
+ # pdm
125
+ # Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
126
+ #pdm.lock
127
+ # pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
128
+ # in version control.
129
+ # https://pdm.fming.dev/#use-with-ide
130
+ .pdm.toml
131
+
132
+ # PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
133
+ __pypackages__/
134
+
135
+ # Celery stuff
136
+ celerybeat-schedule
137
+ celerybeat.pid
138
+
139
+ # SageMath parsed files
140
+ *.sage.py
141
+
142
+ # Environments
143
+ .env
144
+ .venv
145
+ env/
146
+ venv/
147
+ ENV/
148
+ env.bak/
149
+ venv.bak/
150
+
151
+ # Spyder project settings
152
+ .spyderproject
153
+ .spyproject
154
+
155
+ # Rope project settings
156
+ .ropeproject
157
+
158
+ # mkdocs documentation
159
+ /site
160
+
161
+ # mypy
162
+ .mypy_cache/
163
+ .dmypy.json
164
+ dmypy.json
165
+
166
+ # Pyre type checker
167
+ .pyre/
168
+
169
+ # pytype static type analyzer
170
+ .pytype/
171
+
172
+ # Cython debug symbols
173
+ cython_debug/
174
+
175
+ # PyCharm
176
+ # JetBrains specific template is maintained in a separate JetBrains.gitignore that can
177
+ # be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
178
+ # and can be added to the global gitignore or merged into this file. For a more nuclear
179
+ # option (not recommended) you can uncomment the following to ignore the entire idea folder.
180
+ #.idea/
LICENSE ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ MIT License
2
+
3
+ Copyright (c) 2024 Cedlijh
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
README.md CHANGED
@@ -1,3 +1,106 @@
1
- ---
2
- license: mit
3
- ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # PepFlow: Full-Atom Peptide Design
2
+
3
+ ![alt text](teaser.png)
4
+
5
+
6
+ This repository contains the official implementation of 💡 Full-Atom Peptide Design based on Multi-modal Flow Matching (ICML 2024).
7
+
8
+ You can find our [paper](https://arxiv.org/abs/2406.00735) here. We also appreciate the inspiration from [diffab](https://github.com/luost26/diffab) and [frameflow](https://github.com/microsoft/protein-frame-flow).
9
+
10
+ If you have any questions, please contact lijiahanypc@pku.edu.cn or ced3ljhypc@gmail.com. Thank you! :)
11
+
12
+ ## Install
13
+
14
+
15
+ ### Environment
16
+
17
+ Please adjust the CUDA and torch versions to match your machine; we tested our code on CUDA >= 11.7. We also suggest using [micromamba](https://mamba.readthedocs.io/en/latest/installation/micromamba-installation.html) as a replacement for conda.
18
+
19
+ ```bash
20
+ conda env create -f environment.yml # or use micromamba instead of conda
21
+
22
+ conda activate flow
23
+
24
+ pip install torch-scatter -f https://data.pyg.org/whl/torch-2.0.0+cu117.html
25
+
26
+ pip install joblib lmdb easydict
27
+
28
+ ```
29
+
30
+ ### Clone Repo
31
+
32
+ ```bash
33
+ git clone https://github.com/Ced3-han/PepFlowww.git
34
+ ```
35
+
36
+ We suggest adding the code to the Python environment variable, or you can use setup tools.
37
+
38
+ ```bash
39
+ export PYTHONPATH=$(pwd):$PYTHONPATH
40
+ python setup.py develop
41
+ ```
42
+
43
+
44
+ ### Data and Weights Download
45
+
46
+ We provide data and pretrained model weights [here](https://drive.google.com/drive/folders/1bHaKDF3uCDPtfsihjZs0zmjwF6UU1uVl?usp=sharing).
47
+
48
+ + PepMerge_release.zip: 1.2GB
49
+ + PepMerge_lmdb.zip: 180MB
50
+ + model1.pt: 80MB
51
+ + model2.pt: 80MB
52
+
53
+ The ```PepMerge_release.zip``` contains filtered data of peptide-receptor pairs. For example, in the folder ```1a0n_A```, the ```P``` chain in the PDB file ```1a0n``` is the peptide. In this folder, we provide the FASTA and PDB files of the peptide and receptor. The postfix _merge means the peptide and receptor are in the same PDB file. We also extract the binding pocket of the receptor, where our model is trained to generate peptides based on the binding pocket. You can also download [PepBDB](http://huanglab.phys.hust.edu.cn/pepbdb/db/1cta_A/) and [QBioLip](https://yanglab.qd.sdu.edu.cn/Q-BioLiP/Download), and use ```playgrounds/gen_dataset.ipynb``` to reproduce the dataset.
54
+
55
+ The ```PepMerge_lmdb.zip``` contains several different splits of the dataset. We use ```mmseqs2``` to cluster complexes based on receptor sequence identity. See ```playgrounds/cluster.ipynb``` for details. The names.txt file contains the names of complexes in the test set. You can use ```models_con/pep_dataloader.py``` to load these datasets. We suggest putting these LMDBs in a single ```Data``` folder.
56
+
57
+ Besides, ```model1.pt``` and ```model2.pt``` are two checkpoints that you can load using ```models_con/flow_model.py``` together with the config file configs/learn_angle.yaml. We suggest using model1 for benchmark evaluation and model2 for real-world peptide design tasks, the latter is trained on a larger dataset.
58
+
59
+
60
+ ## Usage
61
+
62
+ We will add more user-friendly straightforward pipelines (generation and evaluation) later.
63
+
64
+ ### Inference and Generate
65
+
66
+ By default, we support sampling of generated peptides from our processed dataset. You can use ```models_con/sample.py``` to sample, and ```models_con/inference.py``` to reconstruct PDB files.
67
+
68
+ If you want to use your own data, you can organize your data (peptide and pocket) as we did in PepMerge_release and construct a dataset for sampling and reconstruction. You can also use ```models_con/pep_dataloader/preprocess_structure``` to parse a single data point.
69
+
70
+
71
+
72
+
73
+ ### Evaluation
74
+
75
+ Our evaluation involves many third-party packages, and we include some useful evaluation scripts in ```eval```. Please refer to our paper for details and download the corresponding packages for evaluation. Please use different python environments for these tools.
76
+
77
+
78
+
79
+ ### Train
80
+
81
+ You can use ```train.py``` for single-GPU training and ```train_ddp.py``` for multi-GPU training.
82
+
83
+
84
+ ## Future Work
85
+
86
+
87
+ Future improvements on peptide generation models may include chemical modifications, non-canonical amino acids, pretraining on larger datasets, language models, better sampling methods, etc. Stay tuned and feel free to contact us for collaboration and discussion!
88
+
89
+
90
+
91
+ ## Reference
92
+
93
+ ```bibtex
94
+ @InProceedings{pmlr-v235-li24o,
95
+ title={Full-Atom Peptide Design based on Multi-modal Flow Matching},
96
+ author={Li, Jiahan and Cheng, Chaoran and Wu, Zuofan and Guo, Ruihan and Luo, Shitong and Ren, Zhizhou and Peng, Jian and Ma, Jianzhu},
97
+ booktitle={Proceedings of the 41st International Conference on Machine Learning},
98
+ pages={27615--27640},
99
+ year={2024},
100
+ editor={Salakhutdinov, Ruslan and Kolter, Zico and Heller, Katherine and Weller, Adrian and Oliver, Nuria and Scarlett, Jonathan and Berkenkamp, Felix},
101
+ volume={235},
102
+ series={Proceedings of Machine Learning Research},
103
+ month={21--27 Jul},
104
+ publisher={PMLR},
105
+ }
106
+ ```
configs/learn_angle.yaml ADDED
@@ -0,0 +1,74 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ encoder:
3
+ node_embed_size: 128
4
+ edge_embed_size: 64
5
+ ipa:
6
+ c_s: 128 #${model.node_embed_size}
7
+ c_z: 64 #${model.edge_embed_size}
8
+ c_hidden: 128
9
+ no_heads: 8
10
+ no_qk_points: 8
11
+ no_v_points: 12
12
+ seq_tfmr_num_heads: 4
13
+ seq_tfmr_num_layers: 2
14
+ num_blocks: 6
15
+ stop_grad: False
16
+ interpolant:
17
+ min_t: 1.e-2
18
+ t_normalization_clip: 0.9
19
+ sample_sequence: True
20
+ sample_structure: True
21
+ rots:
22
+ train_schedule: linear
23
+ sample_schedule: exp
24
+ exp_rate: 10
25
+ trans:
26
+ train_schedule: linear
27
+ sample_schedule: linear
28
+ sigma: 1.0
29
+ seqs:
30
+ num_classes: 20
31
+ simplex_value: 5.0
32
+ sampling:
33
+ num_timesteps: 100
34
+ self_condition: False
35
+
36
+ train:
37
+ loss_weights:
38
+ trans_loss: 0.5 # 1.0 for dreamfold, 0.05 for yim
39
+ rot_loss: 0.5 # 1.0 for dreamfold, 0.5 for yim
40
+ bb_atom_loss: 0.25
41
+ seqs_loss: 1.0
42
+ angle_loss: 1.0
43
+ torsion_loss: 0.5
44
+ max_iters: 400000000
45
+ val_freq: 20000
46
+ batch_size: 32
47
+ accum_grad: 1
48
+ seed: 114514
49
+ max_grad_norm: 100.0
50
+ optimizer:
51
+ type: adam
52
+ lr: 5.e-4 #1.e-4
53
+ weight_decay: 0.0
54
+ beta1: 0.9
55
+ beta2: 0.999
56
+ scheduler:
57
+ type: plateau
58
+ factor: 0.8
59
+ patience: 10
60
+ min_lr: 5.e-6
61
+
62
+ dataset:
63
+ train:
64
+ type: peprec
65
+ structure_dir: /datapool/data2/home/jiahan/Data/PepMerge_new/
66
+ dataset_dir: /datapool/data2/home/jiahan/ResProj/PepDiff/frame-flow/Data/Fixed Data
67
+ name: pep_pocket_train
68
+ reset: False
69
+ val:
70
+ type: peprec
71
+ structure_dir: /datapool/data2/home/jiahan/Data/PepMerge_new/
72
+ dataset_dir: /datapool/data2/home/jiahan/ResProj/PepDiff/frame-flow/Data/Fixed Data
73
+ name: pep_pocket_test
74
+ reset: False
environment.yml ADDED
@@ -0,0 +1,261 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: flow
2
+ channels:
3
+ - conda-forge
4
+ - nvidia
5
+ - pytorch
6
+ dependencies:
7
+ - _libgcc_mutex==0.1=conda_forge
8
+ - _openmp_mutex==4.5=2_gnu
9
+ - anyio==3.7.1=pyhd8ed1ab_0
10
+ - argon2-cffi==21.3.0=pyhd8ed1ab_0
11
+ - argon2-cffi-bindings==21.2.0=py310h5764c6d_3
12
+ - arrow==1.2.3=pyhd8ed1ab_0
13
+ - asttokens==2.2.1=pyhd8ed1ab_0
14
+ - astunparse==1.6.3=pyhd8ed1ab_0
15
+ - async-lru==2.0.4=pyhd8ed1ab_0
16
+ - attrs==23.1.0=pyh71513ae_1
17
+ - babel==2.12.1=pyhd8ed1ab_1
18
+ - backcall==0.2.0=pyh9f0ad1d_0
19
+ - backports==1.0=pyhd8ed1ab_3
20
+ - backports.functools_lru_cache==1.6.5=pyhd8ed1ab_0
21
+ - beautifulsoup4==4.12.2=pyha770c72_0
22
+ - biopython==1.81=py310h1fa729e_0
23
+ - biotite==0.38.0
24
+ - bleach==6.0.0=pyhd8ed1ab_0
25
+ - blosc==1.21.4=h0f2a231_0
26
+ - brotli==1.0.9=h166bdaf_9
27
+ - brotli-bin==1.0.9=h166bdaf_9
28
+ - brotli-python==1.0.9=py310hd8f1fbe_9
29
+ - bzip2==1.0.8=h7f98852_4
30
+ - c-ares==1.19.1=hd590300_0
31
+ - c-blosc2==2.10.2=hb4ffafa_0
32
+ - ca-certificates==2023.7.22=hbcca054_0
33
+ - cached-property==1.5.2=hd8ed1ab_1
34
+ - cached_property==1.5.2=pyha770c72_1
35
+ - certifi==2023.7.22=pyhd8ed1ab_0
36
+ - cffi==1.15.1=py310h255011f_3
37
+ - charset-normalizer==3.2.0=pyhd8ed1ab_0
38
+ - comm==0.1.4=pyhd8ed1ab_0
39
+ - contourpy==1.1.0=py310hd41b1e2_0
40
+ - cuda==11.6.0=0
41
+ - cuda-cccl==11.6.55=hf6102b2_0
42
+ - cuda-command-line-tools==11.6.2=0
43
+ - cuda-compiler==11.6.2=0
44
+ - cuda-cudart==11.6.55=he381448_0
45
+ - cuda-cudart-dev==11.6.55=h42ad0f4_0
46
+ - cuda-cuobjdump==11.6.124=h2eeebcb_0
47
+ - cuda-cupti==11.6.124=h86345e5_0
48
+ - cuda-cuxxfilt==11.6.124=hecbf4f6_0
49
+ - cuda-driver-dev==11.6.55=0
50
+ - cuda-gdb==12.0.90=hd47b8d6_0
51
+ - cuda-libraries==11.6.2=0
52
+ - cuda-libraries-dev==11.6.0=0
53
+ - cuda-memcheck==11.8.86=0
54
+ - cuda-nsight==12.0.78=ha770c72_0
55
+ - cuda-nsight-compute==12.2.1=0
56
+ - cuda-nvcc==11.6.124=hbba6d2d_0
57
+ - cuda-nvdisasm==12.0.76=h59595ed_0
58
+ - cuda-nvml-dev==11.6.55=haa9ef22_0
59
+ - cuda-nvprof==12.0.90=h59595ed_0
60
+ - cuda-nvprune==11.6.124=he22ec0a_0
61
+ - cuda-nvrtc==11.6.124=h020bade_0
62
+ - cuda-nvrtc-dev==11.6.124=h249d397_0
63
+ - cuda-nvtx==11.6.124=h0630a44_0
64
+ - cuda-nvvp==12.0.90=h59595ed_0
65
+ - cuda-runtime==11.6.2=0
66
+ - cuda-samples==11.6.101=h8efea70_0
67
+ - cuda-sanitizer-api==12.0.90=h59595ed_0
68
+ - cuda-toolkit==11.6.0=0
69
+ - cuda-tools==11.6.0=0
70
+ - cuda-version==12.0=hffde075_2
71
+ - cuda-visual-tools==11.6.0=0
72
+ - cycler==0.11.0=pyhd8ed1ab_0
73
+ - debugpy==1.6.8=py310hc6cd4ac_0
74
+ - decorator==5.1.1=pyhd8ed1ab_0
75
+ - defusedxml==0.7.1=pyhd8ed1ab_0
76
+ - entrypoints==0.4=pyhd8ed1ab_0
77
+ - exceptiongroup==1.1.3=pyhd8ed1ab_0
78
+ - executing==1.2.0=pyhd8ed1ab_0
79
+ - flit-core==3.9.0=pyhd8ed1ab_0
80
+ - fonttools==4.42.0=py310h2372a71_0
81
+ - fqdn==1.5.1=pyhd8ed1ab_0
82
+ - freetype==2.12.1=hca18f0e_1
83
+ - gds-tools==1.5.0.59=hcb278e6_0
84
+ - gmp==6.2.1=h58526e2_0
85
+ - hdf5==1.14.1=nompi_h4f84152_100
86
+ - idna==3.4=pyhd8ed1ab_0
87
+ - importlib-metadata==6.8.0=pyha770c72_0
88
+ - importlib_metadata==6.8.0=hd8ed1ab_0
89
+ - importlib_resources==6.0.1=pyhd8ed1ab_0
90
+ - ipykernel==6.25.1=pyh71e2992_0
91
+ - ipython==8.14.0=pyh41d4057_0
92
+ - isoduration==20.11.0=pyhd8ed1ab_0
93
+ - jedi==0.19.0=pyhd8ed1ab_0
94
+ - jinja2==3.1.2=pyhd8ed1ab_1
95
+ - json5==0.9.14=pyhd8ed1ab_0
96
+ - jsonpointer==2.0=py_0
97
+ - jsonschema==4.19.0=pyhd8ed1ab_1
98
+ - jsonschema-specifications==2023.7.1=pyhd8ed1ab_0
99
+ - jsonschema-with-format-nongpl==4.19.0=pyhd8ed1ab_1
100
+ - jupyter-lsp==2.2.0=pyhd8ed1ab_0
101
+ - jupyter_client==8.3.0=pyhd8ed1ab_0
102
+ - jupyter_core==5.3.1=py310hff52083_0
103
+ - jupyter_events==0.7.0=pyhd8ed1ab_2
104
+ - jupyter_server==2.7.1=pyhd8ed1ab_0
105
+ - jupyter_server_terminals==0.4.4=pyhd8ed1ab_1
106
+ - jupyterlab==4.0.5=pyhd8ed1ab_0
107
+ - jupyterlab_pygments==0.2.2=pyhd8ed1ab_0
108
+ - jupyterlab_server==2.24.0=pyhd8ed1ab_0
109
+ - keyutils==1.6.1=h166bdaf_0
110
+ - kiwisolver==1.4.4=py310hbf28c38_1
111
+ - krb5==1.21.2=h659d440_0
112
+ - lcms2==2.15=haa2dc70_1
113
+ - ld_impl_linux-64==2.40=h41732ed_0
114
+ - lerc==4.0.0=h27087fc_0
115
+ - libaec==1.0.6=hcb278e6_1
116
+ - libblas==3.9.0=17_linux64_openblas
117
+ - libbrotlicommon==1.0.9=h166bdaf_9
118
+ - libbrotlidec==1.0.9=h166bdaf_9
119
+ - libbrotlienc==1.0.9=h166bdaf_9
120
+ - libcblas==3.9.0=17_linux64_openblas
121
+ - libcublas==12.0.1.189=hcb278e6_2
122
+ - libcublas-dev==12.0.1.189=hcb278e6_2
123
+ - libcufft==11.0.0.21=hcb278e6_1
124
+ - libcufft-dev==11.0.0.21=hcb278e6_1
125
+ - libcufile==1.5.0.59=hcb278e6_0
126
+ - libcufile-dev==1.5.0.59=hcb278e6_0
127
+ - libcurand==10.3.1.50=hcb278e6_0
128
+ - libcurand-dev==10.3.1.50=hcb278e6_0
129
+ - libcurl==8.2.1=hca28451_0
130
+ - libcusolver==11.4.2.57=hcb278e6_1
131
+ - libcusparse==12.0.0.76=hcb278e6_1
132
+ - libdeflate==1.18=h0b41bf4_0
133
+ - libedit==3.1.20191231=he28a2e2_2
134
+ - libev==4.33=h516909a_1
135
+ - libffi==3.4.2=h7f98852_5
136
+ - libgcc-ng==13.1.0=he5830b7_0
137
+ - libgfortran-ng==13.1.0=h69a702a_0
138
+ - libgfortran5==13.1.0=h15d22d2_0
139
+ - libgomp==13.1.0=he5830b7_0
140
+ - libjpeg-turbo==2.1.5.1=h0b41bf4_0
141
+ - liblapack==3.9.0=17_linux64_openblas
142
+ - libnghttp2==1.52.0=h61bc06f_0
143
+ - libnpp==12.0.0.30=h59595ed_0
144
+ - libnpp-dev==12.0.0.30=h59595ed_0
145
+ - libnsl==2.0.0=h7f98852_0
146
+ - libnuma==2.0.16=h0b41bf4_1
147
+ - libnvjitlink==12.0.76=hcb278e6_1
148
+ - libnvjpeg==12.0.0.28=hcb278e6_0
149
+ - libnvjpeg-dev==12.0.0.28=ha770c72_0
150
+ - libopenblas==0.3.23=pthreads_h80387f5_0
151
+ - libpng==1.6.39=h753d276_0
152
+ - libsodium==1.0.18=h36c2ea0_1
153
+ - libsqlite==3.42.0=h2797004_0
154
+ - libssh2==1.11.0=h0841786_0
155
+ - libstdcxx-ng==13.1.0=hfd8a6a1_0
156
+ - libtiff==4.5.1=h8b53f26_0
157
+ - libuuid==2.38.1=h0b41bf4_0
158
+ - libwebp-base==1.3.1=hd590300_0
159
+ - libxcb==1.15=h0b41bf4_0
160
+ - libzlib==1.2.13=hd590300_5
161
+ - lz4-c==1.9.4=hcb278e6_0
162
+ - lzo==2.10=h516909a_1000
163
+ - markupsafe==2.1.3=py310h2372a71_0
164
+ - matplotlib-base==3.7.2=py310hf38f957_0
165
+ - matplotlib-inline==0.1.6=pyhd8ed1ab_0
166
+ - mdtraj==1.9.9=py310h8e08b51_0
167
+ - mistune==3.0.1=pyhd8ed1ab_0
168
+ - munkres==1.1.4=pyh9f0ad1d_0
169
+ - nbclient==0.8.0=pyhd8ed1ab_0
170
+ - nbconvert-core==7.7.4=pyhd8ed1ab_0
171
+ - nbformat==5.9.2=pyhd8ed1ab_0
172
+ - ncurses==6.4=hcb278e6_0
173
+ - nest-asyncio==1.5.6=pyhd8ed1ab_0
174
+ - nomkl==1.0=h5ca1d4c_0
175
+ - notebook-shim==0.2.3=pyhd8ed1ab_0
176
+ - nsight-compute==2023.2.1.3=0
177
+ - numexpr==2.8.4=py310hd91493a_101
178
+ - numpy==1.25.2=py310ha4c1d20_0
179
+ - openjpeg==2.5.0=hfec8fc6_2
180
+ - openssl==3.1.2=hd590300_0
181
+ - overrides==7.4.0=pyhd8ed1ab_0
182
+ - packaging==23.1=pyhd8ed1ab_0
183
+ - pandas==2.0.3=py310h7cbd5c2_1
184
+ - pandocfilters==1.5.0=pyhd8ed1ab_0
185
+ - parso==0.8.3=pyhd8ed1ab_0
186
+ - patsy==0.5.3=pyhd8ed1ab_0
187
+ - pexpect==4.8.0=pyh1a96a4e_2
188
+ - pickleshare==0.7.5=py_1003
189
+ - pillow==10.0.0=py310h582fbeb_0
190
+ - pip
191
+ - pkgutil-resolve-name==1.3.10=pyhd8ed1ab_0
192
+ - platformdirs==3.10.0=pyhd8ed1ab_0
193
+ - pooch==1.7.0=pyha770c72_3
194
+ - prometheus_client==0.17.1=pyhd8ed1ab_0
195
+ - prompt-toolkit==3.0.39=pyha770c72_0
196
+ - prompt_toolkit==3.0.39=hd8ed1ab_0
197
+ - psutil==5.9.5=py310h1fa729e_0
198
+ - pthread-stubs==0.4=h36c2ea0_1001
199
+ - ptyprocess==0.7.0=pyhd3deb0d_0
200
+ - pure_eval==0.2.2=pyhd8ed1ab_0
201
+ - py-cpuinfo==9.0.0=pyhd8ed1ab_0
202
+ - pycparser==2.21=pyhd8ed1ab_0
203
+ - pygments==2.16.1=pyhd8ed1ab_0
204
+ - pyparsing==3.0.9=pyhd8ed1ab_0
205
+ - pysocks==1.7.1=pyha2e5f31_6
206
+ - pytables==3.8.0=py310ha028ce3_2
207
+ - python==3.10.12=hd12c33a_0_cpython
208
+ - python-dateutil==2.8.2=pyhd8ed1ab_0
209
+ - python-fastjsonschema==2.18.0=pyhd8ed1ab_0
210
+ - python-json-logger==2.0.7=pyhd8ed1ab_0
211
+ - python-tzdata==2023.3=pyhd8ed1ab_0
212
+ - python_abi==3.10=3_cp310
213
+ - pytorch-cuda==11.6=h867d48c_0
214
+ - pytz==2023.3=pyhd8ed1ab_0
215
+ - pyyaml==6.0=py310h5764c6d_5
216
+ - pyzmq==25.1.1=py310h5bbb5d0_0
217
+ - readline==8.2=h8228510_1
218
+ - referencing==0.30.2=pyhd8ed1ab_0
219
+ - requests==2.31.0=pyhd8ed1ab_0
220
+ - rfc3339-validator==0.1.4=pyhd8ed1ab_0
221
+ - rfc3986-validator==0.1.1=pyh9f0ad1d_0
222
+ - rpds-py==0.9.2=py310hcb5633a_0
223
+ - scipy==1.11.1=py310ha4c1d20_0
224
+ - seaborn==0.12.2=hd8ed1ab_0
225
+ - seaborn-base==0.12.2=pyhd8ed1ab_0
226
+ - send2trash==1.8.2=pyh41d4057_0
227
+ - setuptools==68.1.2=pyhd8ed1ab_0
228
+ - six==1.16.0=pyh6c4a22f_0
229
+ - snappy==1.1.10=h9fff704_0
230
+ - sniffio==1.3.0=pyhd8ed1ab_0
231
+ - soupsieve==2.3.2.post1=pyhd8ed1ab_0
232
+ - stack_data==0.6.2=pyhd8ed1ab_0
233
+ - statsmodels==0.14.0=py310h278f3c1_1
234
+ - terminado==0.17.1=pyh41d4057_0
235
+ - tinycss2==1.2.1=pyhd8ed1ab_0
236
+ - tk==8.6.12=h27826a3_0
237
+ - tomli==2.0.1=pyhd8ed1ab_0
238
+ - tornado==6.3.3=py310h2372a71_0
239
+ - traitlets==5.9.0=pyhd8ed1ab_0
240
+ - typing-extensions==4.7.1=hd8ed1ab_0
241
+ - typing_extensions==4.7.1=pyha770c72_0
242
+ - typing_utils==0.1.0=pyhd8ed1ab_0
243
+ - tzdata==2023c=h71feb2d_0
244
+ - unicodedata2==15.0.0=py310h5764c6d_0
245
+ - uri-template==1.3.0=pyhd8ed1ab_0
246
+ - urllib3==2.0.4=pyhd8ed1ab_0
247
+ - wcwidth==0.2.6=pyhd8ed1ab_0
248
+ - webcolors==1.13=pyhd8ed1ab_0
249
+ - webencodings==0.5.1=py_1
250
+ - websocket-client==1.6.1=pyhd8ed1ab_0
251
+ - wheel==0.41.1=pyhd8ed1ab_0
252
+ - xorg-libxau==1.0.11=hd590300_0
253
+ - xorg-libxdmcp==1.1.3=h7f98852_0
254
+ - xz==5.2.6=h166bdaf_0
255
+ - yaml==0.2.5=h7f98852_2
256
+ - zeromq==4.3.4=h9c3ff4c_1
257
+ - zipp==3.16.2=pyhd8ed1ab_0
258
+ - zlib==1.2.13=hd590300_5
259
+ - zlib-ng==2.0.7=h0b41bf4_0
260
+ - zstd==1.5.2=hfc55251_7
261
+
eval/align.py ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import subprocess
2
+ import re
3
+ from tqdm import tqdm
4
+ import os
5
+
6
+
7
+ RUNNER = '/datapool/data2/home/jiahan/Tool/TMalign-20180426/MMalign'
8
+
9
def align_pdb(pdb1, pdb2, pdb1_out):
    """Superpose pdb1 onto pdb2 with the MMalign binary, writing the aligned structure to pdb1_out."""
    command = [RUNNER, pdb1, pdb2, '-o', pdb1_out]
    subprocess.run(command, stdout=subprocess.PIPE)
11
+
12
def get_tm_score(pdb1, pdb2):
    """Run the external TMscore tool on two PDB files.

    Returns (rmsd, tm_score) parsed from TMscore's stdout.
    Raises AttributeError if either value is missing from the output.
    """
    completed = subprocess.run(['TMscore', pdb1, pdb2], stdout=subprocess.PIPE)
    report = completed.stdout.decode()
    tm_match = re.search(r"TM-score\s+=\s+(\d+\.\d+)", report)
    rmsd_match = re.search(r"RMSD of the common residues=\s+(\d+\.\d+)", report)
    return float(rmsd_match.group(1)), float(tm_match.group(1))
eval/energy.py ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import pyrosetta
2
+ from pyrosetta import init, pose_from_pdb, get_fa_scorefxn
3
+ from pyrosetta.rosetta.protocols.relax import FastRelax
4
+ from pyrosetta.rosetta.protocols.analysis import InterfaceAnalyzerMover
5
+ from pyrosetta.rosetta.core.pack.task import TaskFactory
6
+ from pyrosetta.rosetta.core.pack.task.operation import RestrictToRepacking
7
+ from pyrosetta.rosetta.protocols.minimization_packing import PackRotamersMover
8
+
9
+ import os
10
+ import pandas as pd
11
+ import subprocess
12
+ import numpy as np
13
+ import shutil
14
+ from tqdm import tqdm
15
+ import pickle
16
+
17
+ from joblib import delayed, Parallel
18
+ from utils import *
19
+
20
+ input_dir=".Tests"
21
+ output_dir="./Pack"
22
+
23
def get_chain_dic(input_pdb):
    """Map each chain id in the PDB file to its count of amino-acid residues that have a CA atom."""
    structure = PDBParser().get_structure("protein", input_pdb)
    counts = {}
    for model in structure:
        for chain in model:
            # Count only proper amino acids with at least an alpha carbon.
            n_res = sum(1 for res in chain if is_aa(res) and res.has_id('CA'))
            counts[chain.id] = n_res
    return counts
+
33
def get_rosetta_score_base(pdb_path, chain_id='A'):
    """Relax a complex with PyRosetta FastRelax and score stability and binding.

    Args:
        pdb_path: path to the complex PDB file.
        chain_id: peptide chain id; the interface is "<chain_id>_<all other chains>".

    Returns:
        dict with 'name' (the input path), 'stab' (mean total score over 5
        relax repeats) and 'bind' (mean interface dG_separated). On any
        failure both scores are the sentinel 999.0.
    """
    try:
        init()
        pose = pyrosetta.pose_from_pdb(pdb_path)
        chains = list(get_chain_dic(pdb_path).keys())
        chains.remove(chain_id)
        interface = f'{chain_id}_{"".join(chains)}'
        fast_relax = FastRelax()  # cannot be pickled, so built per call
        scorefxn = get_fa_scorefxn()
        fast_relax.set_scorefxn(scorefxn)
        mover = InterfaceAnalyzerMover(interface)
        mover.set_pack_separated(True)
        stabs, binds = [], []
        for _ in range(5):
            fast_relax.apply(pose)
            stabs.append(scorefxn(pose))
            mover.apply(pose)
            binds.append(pose.scores['dG_separated'])
        return {'name': pdb_path, 'stab': np.array(stabs).mean(), 'bind': np.array(binds).mean()}
    except Exception:
        # Best-effort scoring: was a bare `except:` that also swallowed
        # KeyboardInterrupt/SystemExit. Failures yield sentinel values.
        return {'name': pdb_path, 'stab': 999.0, 'bind': 999.0}
56
+
57
+
58
def get_rosetta_score(pdb_path, chain='A'):
    """Relax and score a complex assuming a fixed 'A_B' interface.

    Args:
        pdb_path: path to the complex PDB file (chains renumbered to A/B).
        chain: kept for interface compatibility; the interface string is
            hard-coded to 'A_B' here.

    Returns:
        [pdb_path, total_energy, dG_separated]; on any failure the
        sentinel [pdb_path, 999.0, 999.0].
    """
    try:
        init()
        pose = pyrosetta.pose_from_pdb(pdb_path)
        interface = 'A_B'
        fast_relax = FastRelax()  # cannot be pickled, so built per call
        scorefxn = get_fa_scorefxn()
        fast_relax.set_scorefxn(scorefxn)
        mover = InterfaceAnalyzerMover(interface)
        mover.set_pack_separated(True)
        fast_relax.apply(pose)
        energy = scorefxn(pose)
        mover.apply(pose)
        dg = pose.scores['dG_separated']
        return [pdb_path, energy, dg]
    except Exception:
        # Was a bare `except:`; narrowed so Ctrl-C still interrupts.
        return [pdb_path, 999.0, 999.0]
78
+
79
def pack_sc(name='1a1m_C', num_samples=10):
    """Repack side chains of a backbone-only structure with PyRosetta.

    Reads <input_dir>/<name>/pocket_merge_renum_bb.pdb and writes
    packed_{i}.pdb files into <output_dir>/<name>/rosetta (recreated from
    scratch each call). Returns None in all cases, including failure.
    """
    try:
        rosetta_dir = os.path.join(output_dir, name, 'rosetta')
        if os.path.exists(rosetta_dir):
            shutil.rmtree(rosetta_dir)
        os.makedirs(rosetta_dir, exist_ok=True)
        init()
        tf = TaskFactory()
        tf.push_back(RestrictToRepacking())  # only repack, don't change amino acid types
        packer = PackRotamersMover()
        packer.task_factory(tf)
        src_pdb = os.path.join(input_dir, name, 'pocket_merge_renum_bb.pdb')
        for i in range(num_samples):
            pose = pose_from_pdb(src_pdb)
            packer.apply(pose)
            pose.dump_pdb(os.path.join(rosetta_dir, f'packed_{i}.pdb'))
    except Exception:
        # Best-effort: skip structures that fail to pack (was a bare `except:`).
        return None
eval/foldx.py ADDED
@@ -0,0 +1,77 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import pandas as pd
2
+ import numpy as np
3
+ import pandas as pd
4
+ import torch
5
+ from joblib import Parallel, delayed
6
+ from tqdm import tqdm
7
+ import tempfile
8
+ import os
9
+ import shutil
10
+ import subprocess
11
+
12
+ from Bio.PDB import PDBParser
13
+
14
def fetch_stability_score(path):
    """Read a FoldX tab-separated stability file and return row 0, column 1."""
    table = pd.read_csv(path, sep='\t', header=None)
    return table.iloc[0, 1]
17
+
18
def fetch_binding_affinity(path):
    """Parse a FoldX AnalyseComplex .fxout summary.

    Returns the third-from-last tab-separated field on the file's last line
    as a float (the interaction energy column).
    """
    with open(path, 'r') as handle:
        lines = handle.readlines()
    last_line = lines[-1]
    return float(last_line.split("\t")[-3])
22
+
23
class FoldXSession(object):
    """Context manager owning a temporary working directory for one FoldX run."""

    def __init__(self):
        super().__init__()
        # Scratch directory; removed by cleanup() / context-manager exit.
        self.tmpdir = tempfile.TemporaryDirectory()
        self.pdb_names = []

    def cleanup(self):
        """Delete the scratch directory and drop the handle."""
        self.tmpdir.cleanup()
        self.tmpdir = None

    def __enter__(self):
        return self

    def __exit__(self, exc_type, exc_val, exc_tb):
        self.cleanup()

    @property
    def workdir(self):
        """Absolute path of the scratch directory."""
        return self.tmpdir.name

    def path(self, filename):
        """Absolute path of *filename* inside the scratch directory."""
        return os.path.join(self.workdir, filename)

    def preprocess_data(self, pdb_dir, pdb_name):
        """Copy pdb_name from pdb_dir into the scratch directory; return the new path."""
        destination = self.path(pdb_name)
        shutil.copy(os.path.join(pdb_dir, pdb_name), destination)
        return destination
49
+
50
def get_chain_names(pdb_dir, pdb_name):
    """Build FoldX's '<pep_chain>,<other chains>' chain string for a complex.

    The peptide chain id is the first character after the last underscore in
    the file name (e.g. '1a0n_P.pdb' -> 'P'); every other chain id found in
    the structure is appended after the comma.
    """
    pep_chain = pdb_name.split("_")[-1][0]
    structure = PDBParser().get_structure("name", os.path.join(pdb_dir, pdb_name))
    all_chain_ids = [chain.get_id() for model in structure for chain in model]
    others = [cid for cid in all_chain_ids if cid != pep_chain]
    return f"{pep_chain}," + "".join(others)
60
+
61
def process_one_file(pdb_dir, pdb_name):
    """Run FoldX AnalyseComplex on one PDB and return (name, binding_affinity).

    Returns (name, None) when FoldX fails or its summary file cannot be parsed.
    """
    chains = get_chain_names(pdb_dir, pdb_name)
    with FoldXSession() as session:
        # Defined up front so the except branch can inspect it safely; the
        # original crashed with UnboundLocalError when the failure happened
        # before fxout_path was assigned.
        fxout_path = None
        try:
            session.preprocess_data(pdb_dir, pdb_name)
            assert (os.path.exists(session.path(pdb_name)))
            subprocess.run(
                ['/datapool/data2/home/ruihan/bin/foldx',
                 '--command=' + 'AnalyseComplex',
                 '--pdb=' + pdb_name,
                 f'--analyseComplexChains={chains}'],
                cwd=session.workdir, stdout=None)
            fxout_path = session.path(f'Summary_{pdb_name.split(".")[0]}_AC.fxout')
            assert (os.path.exists(fxout_path))
            return (pdb_name.split('.')[0], fetch_binding_affinity(fxout_path))
        except Exception:
            print(f"Error in {pdb_name}")
            print(fxout_path is not None and os.path.exists(fxout_path))
            return (pdb_name.split('.')[0], None)
77
+
eval/geometry.py ADDED
@@ -0,0 +1,127 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from Bio.PDB import PDBParser, Superimposer, is_aa, Select, NeighborSearch
2
+ import tmtools
3
+ import os
4
+ import numpy as np
5
+ import mdtraj as md
6
+ from Bio.SeqUtils import seq1
7
+
8
+ import warnings
9
+ from Bio import BiopythonWarning, SeqIO
10
+
11
+ import difflib
12
+ import torch
13
+
14
+ # Ignore Biopython PDB construction warnings
15
+ warnings.filterwarnings('ignore', category=BiopythonWarning)
16
+
17
def get_chain_from_pdb(pdb_path, chain_id='A'):
    """Return the chain with `chain_id` from the first model of `pdb_path`, or None."""
    model = PDBParser().get_structure('X', pdb_path)[0]
    return next((chain for chain in model if chain.id == chain_id), None)
25
+
26
def diff_ratio(str1, str2):
    """Similarity ratio in [0, 1] between two strings (difflib.SequenceMatcher)."""
    return difflib.SequenceMatcher(None, str1, str2).ratio()
32
+
33
+ #######################################
34
+
35
+ #RMSD and Tm
36
+
37
+ #######################################
38
def align_chains(chain1, chain2):
    """Pair residues of two chains positionally.

    Keeps a pair only when chain1's residue is an amino acid with a CA atom;
    chain2's residue at the same index is kept unconditionally.
    """
    kept_pairs = [
        (r1, r2)
        for r1, r2 in zip(chain1.get_residues(), chain2.get_residues())
        if is_aa(r1) and r1.has_id('CA')  # at least have CA
    ]
    reslist1 = [pair[0] for pair in kept_pairs]
    reslist2 = [pair[1] for pair in kept_pairs]
    return reslist1, reslist2
46
+
47
def get_rmsd(chain1, chain2):
    """Return (unaligned CA RMSD, superimposed CA RMSD), or None if a chain is missing."""
    if chain1 is None or chain2 is None:
        return None
    ca1 = [atom for atom in chain1.get_atoms() if atom.name == 'CA']
    ca2 = [atom for atom in chain2.get_atoms() if atom.name == 'CA']
    coords1 = np.array([atom.get_coord() for atom in ca1])
    coords2 = np.array([atom.get_coord() for atom in ca2])
    # RMSD in the original coordinate frames (no superposition).
    rmsd_raw = np.sqrt(np.sum((coords1 - coords2) ** 2) / len(coords1))
    # RMSD after optimal superposition.
    sup = Superimposer()
    sup.set_atoms(ca1, ca2)
    return rmsd_raw, sup.rms
60
+
61
def get_tm(chain1, chain2):
    """TM-score between the CA traces of two chains, normalized by chain2's length."""
    coords1 = np.array([atom.get_coord() for atom in chain1.get_atoms() if atom.name == 'CA'])
    coords2 = np.array([atom.get_coord() for atom in chain2.get_atoms() if atom.name == 'CA'])
    # Sequences are irrelevant for the alignment here, so poly-Ala is passed.
    result = tmtools.tm_align(coords1, coords2, 'A' * len(coords1), 'A' * len(coords2))
    return result.tm_norm_chain2
69
+
70
def get_traj_chain(pdb, chain):
    """Load `pdb` with mdtraj and slice out only the atoms of the given chain id."""
    model = PDBParser().get_structure('X', pdb)[0]
    # mdtraj addresses chains by index; map Biopython chain ids to indices.
    chain_index = {c.id: i for i, c in enumerate(model)}[chain]
    traj = md.load(pdb)
    selected = traj.topology.select(f"chainid {chain_index}")
    return traj.atom_slice(selected)
78
+
79
def get_second_stru(pdb, chain):
    """Simplified DSSP secondary-structure labels for one chain of `pdb`.

    Delegates trajectory extraction to get_traj_chain (the body previously
    duplicated it line-for-line).
    """
    return md.compute_dssp(get_traj_chain(pdb, chain), simplified=True)
87
+
88
def get_ss(traj1, traj2):
    """Fraction of positions with identical simplified DSSP labels in two trajectories."""
    dssp_a = md.compute_dssp(traj1, simplified=True)
    dssp_b = md.compute_dssp(traj2, simplified=True)
    return (dssp_a == dssp_b).mean()
92
+
93
def get_bind_site(pdb, chain_id):
    """Residue numbers of receptor residues whose CA lies within 10 A of any peptide CA.

    The peptide is chain `chain_id`; every other chain is treated as receptor.
    """
    model = PDBParser().get_structure('X', pdb)[0]
    pep_cas = [atom for res in model[chain_id] for atom in res if atom.get_name() == 'CA']
    rec_cas = [
        atom
        for ch in model if ch.get_id() != chain_id
        for res in ch
        for atom in res if atom.get_name() == 'CA'
    ]
    searcher = NeighborSearch(rec_cas)
    hits = []
    for ca in pep_cas:
        hits.extend(searcher.search(ca.get_coord(), 10.0, level='R'))
    return {res.get_id()[1] for res in hits}
105
+
106
def get_bind_ratio(pdb1, pdb2, chain_id1, chain_id2):
    """Overlap of predicted vs reference binding sites (pdb2/chain_id2 is the reference)."""
    site1 = get_bind_site(pdb1, chain_id1)
    site2 = get_bind_site(pdb2, chain_id2)
    return len(site1 & site2) / (len(site2) + 1e-10)  # last one is gt
111
+
112
def get_dihedral(pdb,chain):
    """Unfinished stub: loads the single-chain trajectory; dihedral computation not implemented yet (returns None)."""
    traj = get_traj_chain(pdb,chain)
    #TODO: dihedral
115
+
116
def get_seq(pdb, chain_id):
    """One-letter sequence of `chain_id` in `pdb`.

    No is_aa filtering on purpose: intended for extracting sequences from
    generated PDBs.
    """
    chain = PDBParser().get_structure('X', pdb)[0][chain_id]
    three_letter = [residue.get_resname() for residue in chain]
    return seq1("".join(three_letter))
120
+
121
def get_mpnn_seqs(path):
    """Read a FASTA file; return each record's sequence as a list of characters."""
    return [list(str(record.seq)) for record in SeqIO.parse(path, "fasta")]
127
+
eval/run_esmfold.py ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import pandas as pd
3
+ import subprocess
4
+ import torch
5
+ import esm
6
+ import numpy as np
7
+ import shutil
8
+ from tqdm import tqdm
9
+
10
+ from joblib import delayed, Parallel
11
+
12
+ import warnings
13
+ from Bio import BiopythonWarning, SeqIO
14
+
15
+ from geometry import *
16
+
17
+ # Ignore Biopython PDB construction warnings
18
+ warnings.filterwarnings('ignore', category=BiopythonWarning)
19
+
20
# Directories of test complexes (inputs) and codesign outputs.
input_dir="./Data/Baselines_new/Tests"
output_dir="/datapool/data2/home/jiahan/ResProj/PepDiff/frame-flow/Data/Baselines_new/Codesign"

# Load ESMFold once at import time; the functions below reuse this global.
# NOTE(review): device is hard-coded to cuda:2 — confirm availability on the target host.
model = esm.pretrained.esmfold_v1()
model = model.eval().to('cuda:2')
25
+
26
def process_rf(name='1aze_B'):
    """ESMFold-refold the last MPNN sequence of each fasta in <name>/mpnns/seqs.

    Writes one PDB per fasta into <name>/rfs_refold. Uses the module-level
    ESMFold `model`.
    """
    # Was ".Data/Baselines_new/Codesign" — missing path separator
    # (the module-level directories use "./Data/...").
    output_dir = "./Data/Baselines_new/Codesign"
    struct_dir = os.path.join(output_dir, name, 'rfs_refold')
    seq_dir = os.path.join(output_dir, name, 'mpnns', 'seqs')
    os.makedirs(struct_dir, exist_ok=True)
    seqs = {}
    for seq_path in os.listdir(seq_dir):
        if seq_path.endswith('.fasta'):
            records = [str(r.seq) for r in SeqIO.parse(os.path.join(seq_dir, seq_path), "fasta")]
            seqs[seq_path.split('.')[0]] = records[-1]  # keep only the last record
    for seq_name, seq in seqs.items():
        with torch.no_grad():
            pdb_str = model.infer_pdb(seq)
        with open(os.path.join(struct_dir, seq_name + '.pdb'), 'w') as f:
            f.write(pdb_str)
44
+
45
def process_pg(name='1aze_B', chain_id='A'):
    """ESMFold-refold protein_generator designs for one target.

    Extracts the sequence of `chain_id` from each PDB in <name>/pgs and writes
    the refolded structures into <name>/pgs_refold.
    """
    # Was ".Data/Baselines_new/Codesign" — missing path separator
    # (the module-level directories use "./Data/...").
    output_dir = "./Data/Baselines_new/Codesign"
    struct_dir = os.path.join(output_dir, name, 'pgs_refold')
    seq_dir = os.path.join(output_dir, name, 'pgs')
    os.makedirs(struct_dir, exist_ok=True)
    seqs = {}
    for seq_path in os.listdir(seq_dir):
        if seq_path.endswith('.pdb'):
            seqs[seq_path.split('.')[0]] = get_seq(os.path.join(seq_dir, seq_path), chain_id)
    for seq_name, seq in seqs.items():
        with torch.no_grad():
            pdb_str = model.infer_pdb(seq)
        with open(os.path.join(struct_dir, seq_name + '.pdb'), 'w') as f:
            f.write(pdb_str)
60
+
61
def refold(name, chain_id, sub_dir):
    """ESMFold-refold every PDB under Models_new/Codesign/<sub_dir>/pdbs/<name>.

    Outputs go to the sibling pdbs_refold/<name> directory.
    """
    base = '/datapool/data2/home/jiahan/ResProj/PepDiff/frame-flow/Data/Models_new/Codesign'
    raw_dir = os.path.join(base, sub_dir, 'pdbs')
    refold_dir = os.path.join(base, sub_dir, 'pdbs_refold')
    os.makedirs(os.path.join(refold_dir, name), exist_ok=True)
    pdb_files = [p for p in os.listdir(os.path.join(raw_dir, name)) if p.endswith('.pdb')]
    seqs = {p.split('.')[0]: get_seq(os.path.join(raw_dir, name, p), chain_id) for p in pdb_files}
    for seq_name, seq in seqs.items():
        with torch.no_grad():
            folded = model.infer_pdb(seq)
        with open(os.path.join(refold_dir, name, seq_name + '.pdb'), 'w') as f:
            f.write(folded)
eval/run_esmif.py ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from utils import *
2
+
3
+ import os
4
+ import pandas as pd
5
+ import subprocess
6
+ import torch
7
+ import numpy as np
8
+ import shutil
9
+ from tqdm import tqdm
10
+
11
+ from joblib import delayed, Parallel
12
+
13
# NOTE(review): other eval scripts use "./Data/Baselines_new/Tests" — this path
# is missing the "Data/" component; confirm which is intended.
input_dir="./Baselines_new/Tests"
# output_dir="/datapool/data2/home/jiahan/Res Proj/PepDiff/frame-flow/Data/RF_samples"
output_dir="./Data/Baselines_new/Fixbb"

# ESM-IF sequence-sampling entry script.
RUNNER = "/datapool/data2/home/jiahan/Tool/esm/examples/inverse_folding/sample_sequences.py"
18
+
19
+
20
def process_one_item_esmif(name='1a1m_C', chains_to_design="A", num_samples=10, temperature=0.1):
    """Sample sequences with ESM-IF for one complex via its sampling script.

    Results are written to <output_dir>/<name>/esms/pocket_merge_renum.fasta.
    """
    dirname = os.path.join(output_dir, name, 'esms')
    # Idempotent creation replaces the previous exists-check + assert.
    os.makedirs(dirname, exist_ok=True)
    cmd = [
        "python", RUNNER, os.path.join(input_dir, name, 'pocket_merge_renum.pdb'),
        "--chain", chains_to_design, "--temperature", f"{temperature}", "--num-samples", f"{num_samples}",
        "--outpath", os.path.join(dirname, 'pocket_merge_renum.fasta'),
        "--multichain-backbone", "--nogpu"
    ]
    subprocess.run(cmd)
eval/run_mpnn.py ADDED
@@ -0,0 +1,146 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from utils import *
2
+ from geometry import *
3
+
4
+ import os
5
+ import pandas as pd
6
+ import subprocess
7
+ import torch
8
+ import numpy as np
9
+ import shutil
10
+ from tqdm import tqdm
11
+
12
+ from joblib import delayed, Parallel
13
+
14
+ from Bio.PDB import PDBParser, PDBIO, Select
15
+
16
+
17
+ HELPERS = "/datapool/data2/home/jiahan/Tool/ProteinMPNN/helper_scripts"
18
+ RUNNER = "/datapool/data2/home/jiahan/Tool/ProteinMPNN/protein_mpnn_run.py"
19
+
20
def get_chain_nums(pdb_path, chain_id):
    """Residue sequence numbers of one chain in a PDB file."""
    model = PDBParser().get_structure('X', pdb_path)[0]
    return [residue.get_id()[1] for residue in model[chain_id]]
25
+
26
def process_mpnn_bb(name='1aze_B',chains_to_design="A",num_samples=1):
    """Design sequences with ProteinMPNN for generated backbones of one target.

    Parses all PDBs under bb/pdbs/<name>, fixes everything except the residues
    of `chains_to_design` found in gt.pdb, and writes designed sequences to
    bb/seqs/<name>.
    """
    input_dir = './Data/Models_new/Codesign/bb/pdbs'
    output_dir = './Data/Models_new/Codesign/bb/seqs'
    if not os.path.exists(os.path.join(output_dir,name)):
        os.makedirs(os.path.join(output_dir,name))
    dirname = os.path.join(output_dir,name)
    # defined dirs: intermediate jsonl files produced by the MPNN helper scripts
    path_for_parsed_chains=os.path.join(dirname,'parsed_pdbs.jsonl')
    path_for_assigned_chains=os.path.join(dirname,'assigned_pdbs.jsonl')
    path_for_fixed_positions=os.path.join(dirname,'fixed_pdbs.jsonl')
    # Positions to design are taken from the ground-truth structure's numbering.
    residue_nums = get_chain_nums(os.path.join(input_dir,name,'gt.pdb'),chains_to_design)
    design_only_positions = " ".join(map(str,residue_nums)) #design only these residues; use flag --specify_non_fixed
    # print(path_for_assigned_chains)
    # print(design_only_positions)
    # Step 1: parse every PDB in the input directory into jsonl.
    subprocess.run([
        "python", os.path.join(HELPERS,"parse_multiple_chains.py"),
        "--input_path", os.path.join(input_dir,name),
        "--output_path", path_for_parsed_chains,
    ])
    # Step 2: mark which chains are designable.
    subprocess.run([
        "python", os.path.join(HELPERS,"assign_fixed_chains.py"),
        "--input_path", path_for_parsed_chains,
        "--output_path", path_for_assigned_chains,
        '--chain_list', chains_to_design,
    ])
    # Step 3: with --specify_non_fixed, the listed positions are the ONLY ones designed.
    subprocess.run([
        "python", os.path.join(HELPERS,"make_fixed_positions_dict.py"),
        "--input_path", path_for_parsed_chains,
        "--output_path", path_for_fixed_positions,
        '--chain_list', chains_to_design,
        '--position_list', design_only_positions,
        '--specify_non_fixed'
    ])
    # run mpnn
    # print('run mpnns')
    subprocess.run([
        "python", RUNNER,
        "--jsonl_path", path_for_parsed_chains,
        "--chain_id_jsonl", path_for_assigned_chains,
        "--fixed_positions_jsonl", path_for_fixed_positions,
        "--out_folder", dirname,
        "--num_seq_per_target", f"{num_samples}",
        "--sampling_temp", "0.1",
        "--seed", "37",
        "--batch_size","1",
        '--device','cuda:1'
    ])
73
+
74
def process_one_item_mpnn(name='1a1m_C',chains_to_design="A",num_samples=1):
    """Design peptide sequences with ProteinMPNN on RFdiffusion backbones.

    The peptide length is read from seq.fasta; positions 1..pep_len of
    `chains_to_design` are designed, everything else is kept fixed.
    Outputs go to <output_dir>/<name>/mpnns.
    """
    input_dir="./Data/Baselines_new/Tests"
    output_dir="./Data/Baselines_new/Codesign"
    if not os.path.exists(os.path.join(output_dir,name,'mpnns')):
        os.makedirs(os.path.join(output_dir,name,'mpnns'))
    # if not os.path.exists(os.path.join(output_dir,name,'pocket_merge_renum.pdb')):
    #     chain_dic = renumber_pdb(os.path.join(input_dir,name,'pocket_merge.pdb'),os.path.join(output_dir,name,'pocket_merge_renum.pdb'))
    dirname = os.path.join(output_dir,name,'mpnns')
    # defined dirs: intermediate jsonl files produced by the MPNN helper scripts
    path_for_parsed_chains=os.path.join(dirname,'parsed_pdbs.jsonl')
    path_for_assigned_chains=os.path.join(dirname,'assigned_pdbs.jsonl')
    path_for_fixed_positions=os.path.join(dirname,'fixed_pdbs.jsonl')
    # Peptide length = length of the second line (sequence) of seq.fasta.
    with open(os.path.join(input_dir,name,'seq.fasta'),'r') as f:
        pep_len = len(f.readlines()[1].strip())
    design_only_positions=" ".join(map(str,list(range(1,pep_len+1)))) #design only these residues; use flag --specify_non_fixed
    # print(design_only_positions)
    # parsed chains
    # print("parsing chains")
    # Step 1: parse the RFdiffusion backbone PDBs into jsonl.
    subprocess.run([
        "python", os.path.join(HELPERS,"parse_multiple_chains.py"),
        "--input_path", os.path.join('./Data/Baselines_new/Codesign',name,'rfs'),#os.path.join('/datapool/data2/home/jiahan/ResProj/PepDiff/frame-flow/Data/Baselines/Fixbb/',name),
        "--output_path", path_for_parsed_chains,
    ])
    # Step 2: mark which chains are designable.
    subprocess.run([
        "python", os.path.join(HELPERS,"assign_fixed_chains.py"),
        "--input_path", path_for_parsed_chains,
        "--output_path", path_for_assigned_chains,
        '--chain_list', chains_to_design,
    ])
    # Step 3: with --specify_non_fixed, the listed positions are the ONLY ones designed.
    subprocess.run([
        "python", os.path.join(HELPERS,"make_fixed_positions_dict.py"),
        "--input_path", path_for_parsed_chains,
        "--output_path", path_for_fixed_positions,
        '--chain_list', chains_to_design,
        '--position_list', design_only_positions,
        '--specify_non_fixed'
    ])
    # run mpnn
    # print('run mpnns')
    subprocess.run([
        "python", RUNNER,
        "--jsonl_path", path_for_parsed_chains,
        "--chain_id_jsonl", path_for_assigned_chains,
        "--fixed_positions_jsonl", path_for_fixed_positions,
        "--out_folder", dirname,
        "--num_seq_per_target", f"{num_samples}",
        "--sampling_temp", "0.1",
        "--seed", "37",
        "--batch_size","1",
        '--device','cuda:1'
    ])
125
+
126
+
127
def write_seq_to_pdb(seq_path, pdb_path, out_path, chain_id):
    """Overwrite residue names of `chain_id` in `pdb_path` with the last FASTA record of `seq_path`.

    Used to replace the GGGGG placeholder in RFdiffusion backbones with an
    MPNN-generated sequence before further processing.
    """
    aa_mapping = {"A": "ALA","C": "CYS","D": "ASP","E": "GLU","F": "PHE","G": "GLY","H": "HIS","I": "ILE","K": "LYS","L": "LEU","M": "MET","N": "ASN","P": "PRO","Q": "GLN","R": "ARG","S": "SER","T": "THR","V": "VAL","W": "TRP","Y": "TYR",
                  'X':'UNK'}
    records = [str(record.seq) for record in SeqIO.parse(seq_path, "fasta")]
    seq = records[-1]  # keep only the last record

    structure = PDBParser().get_structure("X", pdb_path)
    for chain in structure[0]:
        if chain.id == chain_id:  # the chain whose residues are renamed
            # zip truncates at the shorter of (residues, sequence),
            # matching the original "i < len(seq)" guard.
            for res, one_letter in zip(chain, seq):
                res.resname = aa_mapping[one_letter]
    io = PDBIO()
    io.set_structure(structure)
    io.save(out_path)
eval/run_rfdiffusion.py ADDED
@@ -0,0 +1,75 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from utils import *
2
+ from geometry import *
3
+
4
+ import os
5
+ import pandas as pd
6
+ import subprocess
7
+ import torch
8
+ import numpy as np
9
+ import shutil
10
+ from tqdm import tqdm
11
+
12
+ from joblib import delayed, Parallel
13
+
14
# Test complexes (inputs) and codesign outputs.
input_dir="./Data/Baselines_new/Tests"
# NOTE(review): ".Data/..." looks like a typo for "./Data/..." (cf. input_dir) — confirm.
output_dir=".Data/Baselines_new/Codesign"

# protein_generator inference entry point.
PROGEN="/datapool/data2/home/jiahan/Tool/protein_generator/inference.py"
18
+
19
def process_one_item_rf(name='1a1m_C', num_samples=10):
    """Generate peptide backbones with RFdiffusion for one pocket.

    Builds a contig string keeping each receptor chain fixed and appending a
    free peptide segment of the target length. Returns `name` on success,
    None on failure.
    """
    os.makedirs(os.path.join(output_dir, name, 'rfs'), exist_ok=True)
    chain_dic = get_chain_dic(os.path.join(input_dir, name, 'pocket_renum.pdb'))
    # Peptide length = length of the second line (sequence) of seq.fasta.
    with open(os.path.join(input_dir, name, 'seq.fasta'), 'r') as f:
        pep_len = len(f.readlines()[1].strip())
    # rfdiffusion contig syntax: "<chain>1-<len>/0" fixes a chain; the trailing
    # "<pep_len>-<pep_len>" is the newly generated peptide segment.
    contigs = [f'{chain}1-{chain_len}/0' for chain, chain_len in chain_dic.items()]
    contigs.append(f'{pep_len}-{pep_len}')
    contigs = " ".join(contigs)
    command = [
        "run_inference.py",
        f"inference.output_prefix='{os.path.join(output_dir, name, 'rfs', 'sample')}'",
        f"inference.input_pdb='{os.path.join(input_dir, name, 'pocket_renum.pdb')}'",
        f"contigmap.contigs=[{contigs}]",
        f"inference.num_designs={num_samples}",
    ]
    # print(command)
    try:
        subprocess.run(command, check=True, capture_output=True, text=True)
        return name
    except Exception:  # was a bare except; don't swallow KeyboardInterrupt/SystemExit
        return None
44
+
45
def process_one_item_pg(name='1a1m_C', num_samples=10):
    """Generate peptides with protein_generator for one pocket.

    Returns `name` on success, None on failure.
    """
    # Single idempotent call (was duplicated: once guarded, once with exist_ok).
    os.makedirs(os.path.join(output_dir, name, 'pgs'), exist_ok=True)
    chain_dic = get_chain_dic(os.path.join(input_dir, name, 'pocket_renum.pdb'))
    # Peptide length = length of the second line (sequence) of seq.fasta.
    with open(os.path.join(input_dir, name, 'seq.fasta'), 'r') as f:
        pep_len = len(f.readlines()[1].strip())
    # protein_generator settings: each fixed chain "<chain>1-<len>,0" plus a
    # free segment of the peptide length.
    contigs = [f'{chain}1-{chain_len},0' for chain, chain_len in chain_dic.items()]
    contigs.append(f'{pep_len}-{pep_len}')
    command = [
        "python", PROGEN,
        "--num_designs", f"{num_samples}",
        "--out", os.path.join(output_dir, name, 'pgs', 'sample'),
        "--pdb", os.path.join(input_dir, name, 'pocket_renum.pdb'),
        "--T", "25", # default setting
        "--save_best_plddt", # default setting
        "--contigs", *contigs,
    ]
    # print(command)
    try:
        subprocess.run(command, check=True, capture_output=True, text=True)
        return name
    except Exception:  # was a bare except; don't swallow KeyboardInterrupt/SystemExit
        return None
72
+
73
def process_one_item(name='1a1m_C', num_samples=10):
    """Run both protein_generator and RFdiffusion sampling for one target."""
    process_one_item_pg(name=name, num_samples=num_samples)
    process_one_item_rf(name=name, num_samples=num_samples)
eval/run_scwrl4.py ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from utils import *
2
+
3
+ import os
4
+ import pandas as pd
5
+ import subprocess
6
+ import numpy as np
7
+ import shutil
8
+ from tqdm import tqdm
9
+
10
+ from joblib import delayed, Parallel
11
+
12
# Test complexes (inputs) and side-chain packing outputs.
input_dir="./Data/Baselines_new/Tests"
output_dir="./Data/Baselines_new/Pack"

# Scwrl4 side-chain packing executable.
RUNNER = "/datapool/data2/home/jiahan/Tool/bin/Scwrl4"
16
+
17
def process_one_item_scwrl4(name='1a1m_C', num_samples=10):
    """Pack side chains with Scwrl4 `num_samples` times for one backbone-only complex.

    NOTE(review): Scwrl4 appears to be run with identical inputs each
    iteration — confirm whether repeated samples are intended to differ.
    """
    dirname = os.path.join(output_dir, name, 'scwrls')
    # Idempotent creation replaces the previous exists-check.
    os.makedirs(dirname, exist_ok=True)
    for i in range(num_samples):
        cmd = [
            RUNNER,
            '-i', os.path.join(input_dir, name, 'pocket_merge_renum_bb.pdb'),
            '-o', os.path.join(dirname, f'packed_{i}.pdb'),
        ]
        subprocess.run(cmd)
eval/utils.py ADDED
@@ -0,0 +1,106 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ import glob
3
+ import pandas as pd
4
+ import subprocess
5
+ from difflib import SequenceMatcher
6
+
7
+ from Bio import SeqIO
8
+ from Bio.PDB import PDBParser, PDBIO, Chain, Select, is_aa
9
+ from Bio.PDB.Polypeptide import PPBuilder
10
+
11
+ from Bio.PDB import PDBParser
12
+ from Bio.SeqUtils import seq1
13
+
14
+ # def parse_pdb_chains(pdb_file):
15
+ # parser = PDBParser()
16
+ # structure = parser.get_structure("protein", pdb_file)
17
+ # pp_builder = PPBuilder()
18
+
19
+ # sequences = {}
20
+ # for model in structure:
21
+ # for chain in model:
22
+ # chain_id = chain.get_id()
23
+ # sequence = "".join([str(pp.get_sequence()) for pp in pp_builder.build_peptides(chain)])
24
+ # print(len(sequence))
25
+ # sequences[chain_id] = sequence
26
+
27
+ # return sequences
28
+
29
def get_fasta_from_pdb(pdb_file):
    """Map chain id -> one-letter sequence for every chain in `pdb_file`."""
    structure = PDBParser().get_structure("pdb", pdb_file)
    return {
        chain.id: "".join(seq1(residue.get_resname()) for residue in chain.get_residues())
        for chain in structure.get_chains()
    }
41
+
42
def parse_fasta(file):
    """Parse a FASTA file; map record index -> list of '/'-separated sub-sequences."""
    with open(file, "r") as handle:
        return {
            idx: str(record.seq).split("/")
            for idx, record in enumerate(SeqIO.parse(handle, "fasta"))
        }
48
+
49
def renumber_pdb(input_pdb, output_pdb):
    """Renumber every chain's residues consecutively from 1 and write the result.

    Returns:
        dict: chain id -> residue count (hetero residues included).
    """
    parser = PDBParser()
    structure = parser.get_structure("protein", input_pdb)

    chain_dic = {}

    for model in structure:
        old_chains = []
        new_chains = []
        for chain in model: # this may include HETATM residues
            # Build a renumbered copy under a temporary "_renum" id so it
            # cannot collide with an existing chain id while both exist.
            new_chain_id = chain.id + "_renum"
            new_chain = Chain.Chain(new_chain_id)
            for i, residue in enumerate(chain):
                new_residue = residue.copy()
                new_residue_id = (residue.id[0], i + 1, residue.id[2])
                new_residue.id = new_residue_id
                new_chain.add(new_residue)
            old_chains.append(chain)
            new_chains.append(new_chain)
            chain_dic[chain.id] = len(list(chain))

        # Swap each original chain for its renumbered copy, restoring the id.
        for chain, new_chain in zip(old_chains, new_chains):
            model.detach_child(chain.id)
            new_chain.id = chain.id
            model.add(new_chain)

    io = PDBIO()
    io.set_structure(structure)
    io.save(output_pdb)

    return chain_dic
80
+
81
def get_chain_dic(input_pdb):
    """Map chain id -> number of amino-acid residues with a CA atom (all models)."""
    structure = PDBParser().get_structure("protein", input_pdb)
    chain_dic = {}
    for model in structure:
        for chain in model:
            chain_dic[chain.id] = sum(1 for res in chain if is_aa(res) and res.has_id('CA'))
    return chain_dic
92
+
93
+
94
def keep_backbone_atoms(input_file, output_file):
    """Write a copy of `input_file` keeping only backbone atoms (N, CA, C, O)."""

    class _BackboneOnly(Select):
        # PDBIO Select callback: keep an atom iff it is a backbone heavy atom.
        def accept_atom(self, atom):
            return atom.get_name() in ("N", "CA", "C", "O")

    structure = PDBParser().get_structure("protein", input_file)
    writer = PDBIO()
    writer.set_structure(structure)
    writer.save(output_file, _BackboneOnly())
models_con/edge.py ADDED
@@ -0,0 +1,112 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import torch
2
+ import torch.nn as nn
3
+ import torch.nn.functional as F
4
+
5
+
6
+ from pepflow.modules.common.geometry import angstrom_to_nm, pairwise_dihedrals
7
+ from pepflow.modules.common.layers import AngularEncoding
8
+ from pepflow.modules.protein.constants import BBHeavyAtom, AA
9
+
10
+
11
class EdgeEmbedder(nn.Module):
    """Pairwise (edge) feature embedder for residue pairs.

    Combines: amino-acid pair identity, clamped relative sequence position
    (same-chain only), Gaussian-encoded inter-atom distances with learned
    per-pair decay coefficients, and pairwise backbone dihedrals.
    """

    def __init__(self, feat_dim, max_num_atoms, max_aa_types=22, max_relpos=32, num_bins=16):
        super().__init__()
        self.max_num_atoms = max_num_atoms
        self.max_aa_types = max_aa_types
        self.max_relpos = max_relpos
        self.num_bins = num_bins
        # One embedding per ordered (aa_i, aa_j) pair.
        self.aa_pair_embed = nn.Embedding(self.max_aa_types*self.max_aa_types, feat_dim)
        # Sequence offset clamped to [-max_relpos, max_relpos] -> 2*max_relpos+1 bins.
        self.relpos_embed = nn.Embedding(2*max_relpos+1, feat_dim)

        # Learned Gaussian decay coefficient per (aa-pair, atom-pair); zero init
        # makes all distance features start at exp(0)=1 before training.
        self.aapair_to_distcoef = nn.Embedding(self.max_aa_types*self.max_aa_types, max_num_atoms*max_num_atoms)
        nn.init.zeros_(self.aapair_to_distcoef.weight)
        self.distance_embed = nn.Sequential(
            nn.Linear(max_num_atoms*max_num_atoms, feat_dim), nn.ReLU(),
            nn.Linear(feat_dim, feat_dim), nn.ReLU(),
        )

        self.dihedral_embed = AngularEncoding()
        feat_dihed_dim = self.dihedral_embed.get_out_dim(2) # Phi and Psi

        # Concatenation of aa-pair + relpos + distance + dihedral features.
        infeat_dim = feat_dim + feat_dim + feat_dim + feat_dihed_dim
        self.out_mlp = nn.Sequential(
            nn.Linear(infeat_dim, feat_dim), nn.ReLU(),
            nn.Linear(feat_dim, feat_dim), nn.ReLU(),
            nn.Linear(feat_dim, feat_dim),
        )

    def forward(self, aa, res_nb, chain_nb, pos_atoms, mask_atoms, structure_mask=None, sequence_mask=None):
        """
        Args:
            aa: (N, L).
            res_nb: (N, L).
            chain_nb: (N, L).
            pos_atoms: (N, L, A, 3)
            mask_atoms: (N, L, A)
            trans, sc_trans: (N,L,3)
            structure_mask: (N, L)
            sequence_mask: (N, L), mask out unknown amino acids to generate.

        Returns:
            (N, L, L, feat_dim)
        """
        N, L = aa.size()

        # Remove other atoms
        pos_atoms = pos_atoms[:, :, :self.max_num_atoms]
        mask_atoms = mask_atoms[:, :, :self.max_num_atoms]

        # A residue is valid iff its CA atom exists.
        mask_residue = mask_atoms[:, :, BBHeavyAtom.CA] # (N, L)
        mask_pair = mask_residue[:, :, None] * mask_residue[:, None, :]
        pair_structure_mask = structure_mask[:, :, None] * structure_mask[:, None, :] if structure_mask is not None else None

        # Pair identities
        if sequence_mask is not None:
            # Avoid data leakage at training time
            aa = torch.where(sequence_mask, aa, torch.full_like(aa, fill_value=AA.UNK))
        aa_pair = aa[:,:,None]*self.max_aa_types + aa[:,None,:] # (N, L, L)
        feat_aapair = self.aa_pair_embed(aa_pair)

        # Relative sequential positions (zeroed for cross-chain pairs)
        same_chain = (chain_nb[:, :, None] == chain_nb[:, None, :])
        relpos = torch.clamp(
            res_nb[:,:,None] - res_nb[:,None,:],
            min=-self.max_relpos, max=self.max_relpos,
        ) # (N, L, L)
        feat_relpos = self.relpos_embed(relpos + self.max_relpos) * same_chain[:,:,:,None]

        # Distances: all atom-pair distances, encoded as exp(-c * d^2) with a
        # learned per-(aa-pair, atom-pair) coefficient c >= 0 (softplus).
        d = angstrom_to_nm(torch.linalg.norm(
            pos_atoms[:,:,None,:,None] - pos_atoms[:,None,:,None,:],
            dim = -1, ord = 2,
        )).reshape(N, L, L, -1) # (N, L, L, A*A)
        c = F.softplus(self.aapair_to_distcoef(aa_pair))    # (N, L, L, A*A)
        d_gauss = torch.exp(-1 * c * d**2)
        mask_atom_pair = (mask_atoms[:,:,None,:,None] * mask_atoms[:,None,:,None,:]).reshape(N, L, L, -1)
        feat_dist = self.distance_embed(d_gauss * mask_atom_pair)
        if pair_structure_mask is not None:
            # Avoid data leakage at training time
            feat_dist = feat_dist * pair_structure_mask[:, :, :, None]

        # Orientations
        dihed = pairwise_dihedrals(pos_atoms) # (N, L, L, 2)
        feat_dihed = self.dihedral_embed(dihed)
        if pair_structure_mask is not None:
            # Avoid data leakage at training time
            feat_dihed = feat_dihed * pair_structure_mask[:, :, :, None]

        # # trans embed
        # dist_feats = calc_distogram(
        #     trans, min_bin=1e-3, max_bin=20.0, num_bins=self.num_bins)
        # if sc_trans == None:
        #     sc_trans = torch.zeros_like(trans)
        # sc_feats = calc_distogram(
        #     sc_trans, min_bin=1e-3, max_bin=20.0, num_bins=self.num_bins)

        # All features concatenated, mixed by the MLP, invalid pairs zeroed.
        feat_all = torch.cat([feat_aapair, feat_relpos, feat_dist, feat_dihed], dim=-1)
        feat_all = self.out_mlp(feat_all) # (N, L, L, F)
        feat_all = feat_all * mask_pair[:, :, :, None]

        return feat_all
models_con/flow_model.py ADDED
@@ -0,0 +1,472 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import numpy as np
2
+ import torch
3
+ import torch.nn as nn
4
+ import torch.nn.functional as F
5
+
6
+ import copy
7
+ import math
8
+ from tqdm.auto import tqdm
9
+ import functools
10
+ from torch.utils.data import DataLoader
11
+ import os
12
+ import argparse
13
+
14
+ import pandas as pd
15
+
16
+ from models_con.edge import EdgeEmbedder
17
+ from models_con.node import NodeEmbedder
18
+ from pepflow.modules.common.layers import sample_from, clampped_one_hot
19
+ from models_con.ga import GAEncoder
20
+ from pepflow.modules.protein.constants import AA, BBHeavyAtom, max_num_heavyatoms
21
+ from pepflow.modules.common.geometry import construct_3d_basis
22
+ from pepflow.utils.data import mask_select_data, find_longest_true_segment, PaddingCollate
23
+ from pepflow.utils.misc import seed_all
24
+ from pepflow.utils.train import sum_weighted_losses
25
+ from torch.nn.utils import clip_grad_norm_
26
+
27
+ from pepflow.modules.so3.dist import centered_gaussian,uniform_so3
28
+ from pepflow.modules.common.geometry import batch_align, align
29
+
30
+ from tqdm import tqdm
31
+
32
+ import wandb
33
+
34
+ from data import so3_utils
35
+ from data import all_atom
36
+
37
+ from models_con.pep_dataloader import PepDataset
38
+
39
+ from pepflow.utils.misc import load_config
40
+ from pepflow.utils.train import recursive_to
41
+ from easydict import EasyDict
42
+
43
+ from models_con.utils import process_dic
44
+ from models_con.torsion import get_torsion_angle, torsions_mask
45
+ import models_con.torus as torus
46
+
47
+ import gc
48
+
49
+ from copy import deepcopy
50
+ from pepflow.utils.data import PaddingCollate
51
+ collate_fn = PaddingCollate(eight=False)
52
+ from pepflow.utils.train import recursive_to
53
+
54
# Number of heavy atoms kept per residue for each structural resolution level.
resolution_to_num_atoms = {
    'backbone+CB': 5,            # backbone plus C-beta
    'full': max_num_heavyatoms   # all heavy atoms
}
58
+
59
+ class FlowModel(nn.Module):
60
    def __init__(self,cfg):
        """Build node/edge embedders and the GA encoder from `cfg`.

        Args:
            cfg: model config with `encoder` (embedding sizes, ipa settings)
                and `interpolant` (sampling flags, sequence-simplex settings)
                sections.
        """
        super().__init__()
        self._model_cfg = cfg.encoder
        self._interpolant_cfg = cfg.interpolant

        self.node_embedder = NodeEmbedder(cfg.encoder.node_embed_size,max_num_heavyatoms)
        self.edge_embedder = EdgeEmbedder(cfg.encoder.edge_embed_size,max_num_heavyatoms)
        self.ga_encoder = GAEncoder(cfg.encoder.ipa)

        # Which modalities are generated (vs taken as fixed context).
        self.sample_structure = self._interpolant_cfg.sample_structure
        self.sample_sequence = self._interpolant_cfg.sample_sequence

        # K: number of residue classes; k: magnitude of the +-k simplex encoding.
        self.K = self._interpolant_cfg.seqs.num_classes
        self.k = self._interpolant_cfg.seqs.simplex_value
74
+
75
    def encode(self, batch):
        """Extract ground-truth frames/angles/sequence and compute embeddings.

        Returns:
            rotmats_1: (N, L, 3, 3) backbone frames built from CA/C/N atoms.
            trans_1: (N, L, 3) CA positions.
            angles_1: torsion angles taken from the batch.
            seqs_1: (N, L) residue types.
            node_embed, edge_embed: embeddings computed on context only.
        """
        rotmats_1 = construct_3d_basis(batch['pos_heavyatom'][:, :, BBHeavyAtom.CA],batch['pos_heavyatom'][:, :, BBHeavyAtom.C],batch['pos_heavyatom'][:, :, BBHeavyAtom.N] )
        trans_1 = batch['pos_heavyatom'][:, :, BBHeavyAtom.CA]
        seqs_1 = batch['aa']

        # ignore psi
        # batch['torsion_angle'] = batch['torsion_angle'][:,:,1:]
        # batch['torsion_angle_mask'] = batch['torsion_angle_mask'][:,:,1:]
        angles_1 = batch['torsion_angle']

        # Context = residues that exist (CA present) and are NOT being generated;
        # when a modality is sampled, the embedders only see context for it,
        # which prevents leaking the generation targets.
        context_mask = torch.logical_and(batch['mask_heavyatom'][:, :, BBHeavyAtom.CA], ~batch['generate_mask'])
        structure_mask = context_mask if self.sample_structure else None
        sequence_mask = context_mask if self.sample_sequence else None
        node_embed = self.node_embedder(batch['aa'], batch['res_nb'], batch['chain_nb'], batch['pos_heavyatom'],
                                        batch['mask_heavyatom'], structure_mask=structure_mask, sequence_mask=sequence_mask)
        edge_embed = self.edge_embedder(batch['aa'], batch['res_nb'], batch['chain_nb'], batch['pos_heavyatom'],
                                        batch['mask_heavyatom'], structure_mask=structure_mask, sequence_mask=sequence_mask)

        return rotmats_1, trans_1, angles_1, seqs_1, node_embed, edge_embed
94
+
95
+ def zero_center_part(self,pos,gen_mask,res_mask):
96
+ """
97
+ move pos by center of gen_mask
98
+ pos: (B,N,3)
99
+ gen_mask, res_mask: (B,N)
100
+ """
101
+ center = torch.sum(pos * gen_mask[...,None], dim=1) / (torch.sum(gen_mask,dim=-1,keepdim=True) + 1e-8) # (B,N,3)*(B,N,1)->(B,3)/(B,1)->(B,3)
102
+ center = center.unsqueeze(1) # (B,1,3)
103
+ # center = 0. it seems not center didnt influence the result, but its good for training stabilty
104
+ pos = pos - center
105
+ pos = pos * res_mask[...,None]
106
+ return pos,center
107
+
108
+ def seq_to_simplex(self,seqs):
109
+ return clampped_one_hot(seqs, self.K).float() * self.k * 2 - self.k # (B,L,K)
110
+
111
+ def forward(self, batch):
112
+
113
+ num_batch, num_res = batch['aa'].shape
114
+ gen_mask,res_mask,angle_mask = batch['generate_mask'].long(),batch['res_mask'].long(),batch['torsion_angle_mask'].long()
115
+
116
+ #encode
117
+ rotmats_1, trans_1, angles_1, seqs_1, node_embed, edge_embed = self.encode(batch) # no generate mask
118
+
119
+ # prepare for denoise
120
+ trans_1_c,_ = self.zero_center_part(trans_1,gen_mask,res_mask)
121
+ trans_1_c = trans_1 # already centered when constructing dataset
122
+ seqs_1_simplex = self.seq_to_simplex(seqs_1)
123
+ seqs_1_prob = F.softmax(seqs_1_simplex,dim=-1)
124
+
125
+ with torch.no_grad():
126
+ t = torch.rand((num_batch,1), device=batch['aa'].device)
127
+ t = t*(1-2 * self._interpolant_cfg.t_normalization_clip) + self._interpolant_cfg.t_normalization_clip # avoid 0
128
+ if self.sample_structure:
129
+ # corrupt trans
130
+ trans_0 = torch.randn((num_batch,num_res,3), device=batch['aa'].device) * self._interpolant_cfg.trans.sigma # scale with sigma?
131
+ trans_0_c,_ = self.zero_center_part(trans_0,gen_mask,res_mask)
132
+ trans_t = (1-t[...,None])*trans_0_c + t[...,None]*trans_1_c
133
+ trans_t_c = torch.where(batch['generate_mask'][...,None],trans_t,trans_1_c)
134
+ # corrupt rotmats
135
+ rotmats_0 = uniform_so3(num_batch,num_res,device=batch['aa'].device)
136
+ rotmats_t = so3_utils.geodesic_t(t[..., None], rotmats_1, rotmats_0)
137
+ rotmats_t = torch.where(batch['generate_mask'][...,None,None],rotmats_t,rotmats_1)
138
+ # corrup angles
139
+ angles_0 = torus.tor_random_uniform(angles_1.shape, device=batch['aa'].device, dtype=angles_1.dtype) # (B,L,5)
140
+ angles_t = torus.tor_geodesic_t(t[..., None], angles_1, angles_0)
141
+ angles_t = torch.where(batch['generate_mask'][...,None],angles_t,angles_1)
142
+ else:
143
+ trans_t_c = trans_1_c.detach().clone()
144
+ rotmats_t = rotmats_1.detach().clone()
145
+ angles_t = angles_1.detach().clone()
146
+ if self.sample_sequence:
147
+ # corrupt seqs
148
+ seqs_0_simplex = self.k * torch.randn_like(seqs_1_simplex) # (B,L,K)
149
+ seqs_0_prob = F.softmax(seqs_0_simplex,dim=-1) # (B,L,K)
150
+ seqs_t_simplex = ((1 - t[..., None]) * seqs_0_simplex) + (t[..., None] * seqs_1_simplex) # (B,L,K)
151
+ seqs_t_simplex = torch.where(batch['generate_mask'][...,None],seqs_t_simplex,seqs_1_simplex)
152
+ seqs_t_prob = F.softmax(seqs_t_simplex,dim=-1) # (B,L,K)
153
+ seqs_t = sample_from(seqs_t_prob) # (B,L)
154
+ seqs_t = torch.where(batch['generate_mask'],seqs_t,seqs_1)
155
+ else:
156
+ seqs_t = seqs_1.detach().clone()
157
+ seqs_t_simplex = seqs_1_simplex.detach().clone()
158
+ seqs_t_prob = seqs_1_prob.detach().clone()
159
+
160
+ # denoise
161
+ pred_rotmats_1, pred_trans_1, pred_angles_1, pred_seqs_1_prob = self.ga_encoder(t, rotmats_t, trans_t_c, angles_t, seqs_t, node_embed, edge_embed, gen_mask, res_mask)
162
+ pred_seqs_1 = sample_from(F.softmax(pred_seqs_1_prob,dim=-1))
163
+ pred_seqs_1 = torch.where(batch['generate_mask'],pred_seqs_1,torch.clamp(seqs_1,0,19))
164
+ pred_trans_1_c,_ = self.zero_center_part(pred_trans_1,gen_mask,res_mask)
165
+ pred_trans_1_c = pred_trans_1 # implicitly enforce zero center in gen_mask, in this way, we dont need to move receptor when sampling
166
+
167
+ norm_scale = 1 / (1 - torch.min(t[...,None], torch.tensor(self._interpolant_cfg.t_normalization_clip))) # yim etal.trick, 1/1-t
168
+
169
+ # trans vf loss
170
+ trans_loss = torch.sum((pred_trans_1_c - trans_1_c)**2*gen_mask[...,None],dim=(-1,-2)) / (torch.sum(gen_mask,dim=-1) + 1e-8) # (B,)
171
+ trans_loss = torch.mean(trans_loss)
172
+
173
+ # rots vf loss
174
+ gt_rot_vf = so3_utils.calc_rot_vf(rotmats_t, rotmats_1)
175
+ pred_rot_vf = so3_utils.calc_rot_vf(rotmats_t, pred_rotmats_1)
176
+ rot_loss = torch.sum(((gt_rot_vf - pred_rot_vf) * norm_scale)**2*gen_mask[...,None],dim=(-1,-2)) / (torch.sum(gen_mask,dim=-1) + 1e-8) # (B,)
177
+ rot_loss = torch.mean(rot_loss)
178
+
179
+ # bb aux loss
180
+ gt_bb_atoms = all_atom.to_atom37(trans_1_c, rotmats_1)[:, :, :3]
181
+ pred_bb_atoms = all_atom.to_atom37(pred_trans_1_c, pred_rotmats_1)[:, :, :3]
182
+ # gt_bb_atoms = all_atom.to_bb_atoms(trans_1_c, rotmats_1, angles_1[:,:,0]) # N,CA,C,O,CB
183
+ # pred_bb_atoms = all_atom.to_bb_atoms(pred_trans_1_c, pred_rotmats_1, pred_angles_1[:,:,0])
184
+ # print(gt_bb_atoms.shape)
185
+ bb_atom_loss = torch.sum(
186
+ (gt_bb_atoms - pred_bb_atoms) ** 2 * gen_mask[..., None, None],
187
+ dim=(-1, -2, -3)
188
+ ) / (torch.sum(gen_mask,dim=-1) + 1e-8) # (B,)
189
+ bb_atom_loss = torch.mean(bb_atom_loss)
190
+ # bb_atom_loss = torch.mean(torch.where(t[:,0]>=0.75,bb_atom_loss,torch.zeros_like(bb_atom_loss))) # penalty for near gt point
191
+
192
+ # seqs vf loss
193
+ seqs_loss = F.cross_entropy(pred_seqs_1_prob.view(-1,pred_seqs_1_prob.shape[-1]),torch.clamp(seqs_1,0,19).view(-1), reduction='none').view(pred_seqs_1_prob.shape[:-1]) # (N,L), not softmax
194
+ seqs_loss = torch.sum(seqs_loss * gen_mask, dim=-1) / (torch.sum(gen_mask,dim=-1) + 1e-8)
195
+ seqs_loss = torch.mean(seqs_loss)
196
+
197
+ # we should not use angle mask, as you dont know aa type when generating
198
+ # angle_mask_loss = torch.cat([angle_mask,angle_mask],dim=-1) # (B,L,10)
199
+ # angle vf loss
200
+ angle_mask_loss = torsions_mask.to(batch['aa'].device)
201
+ angle_mask_loss = angle_mask_loss[pred_seqs_1.reshape(-1)].reshape(num_batch,num_res,-1) # (B,L,5)
202
+ angle_mask_loss = torch.cat([angle_mask_loss,angle_mask_loss],dim=-1) # (B,L,10)
203
+ angle_mask_loss = torch.logical_and(batch['generate_mask'][...,None].bool(),angle_mask_loss)
204
+ gt_angle_vf = torus.tor_logmap(angles_t, angles_1)
205
+ gt_angle_vf_vec = torch.cat([torch.sin(gt_angle_vf),torch.cos(gt_angle_vf)],dim=-1)
206
+ pred_angle_vf = torus.tor_logmap(angles_t, pred_angles_1)
207
+ pred_angle_vf_vec = torch.cat([torch.sin(pred_angle_vf),torch.cos(pred_angle_vf)],dim=-1)
208
+ # angle_loss = torch.sum(((gt_angle_vf_vec - pred_angle_vf_vec) * norm_scale)**2*gen_mask[...,None],dim=(-1,-2)) / ((torch.sum(gen_mask,dim=-1)) + 1e-8) # (B,)
209
+ angle_loss = torch.sum(((gt_angle_vf_vec - pred_angle_vf_vec) * norm_scale)**2*angle_mask_loss,dim=(-1,-2)) / (torch.sum(angle_mask_loss,dim=(-1,-2)) + 1e-8) # (B,)
210
+ angle_loss = torch.mean(angle_loss)
211
+
212
+
213
+ # angle aux loss
214
+ angles_1_vec = torch.cat([torch.sin(angles_1),torch.cos(angles_1)],dim=-1)
215
+ pred_angles_1_vec = torch.cat([torch.sin(pred_angles_1),torch.cos(pred_angles_1)],dim=-1)
216
+ # torsion_loss = torch.sum((pred_angles_1_vec - angles_1_vec)**2*gen_mask[...,None],dim=(-1,-2)) / (torch.sum(gen_mask,dim=-1) + 1e-8) # (B,)
217
+ torsion_loss = torch.sum((pred_angles_1_vec - angles_1_vec)**2*angle_mask_loss,dim=(-1,-2)) / (torch.sum(angle_mask_loss,dim=(-1,-2)) + 1e-8) # (B,)
218
+ torsion_loss = torch.mean(torsion_loss)
219
+
220
+ return {
221
+ "trans_loss": trans_loss,
222
+ 'rot_loss': rot_loss,
223
+ 'bb_atom_loss': bb_atom_loss,
224
+ 'seqs_loss': seqs_loss,
225
+ 'angle_loss': angle_loss,
226
+ 'torsion_loss': torsion_loss,
227
+ }
228
+
229
+ @torch.no_grad()
230
+ def sample(self, batch, num_steps = 100, sample_bb=True, sample_ang=True, sample_seq=True):
231
+
232
+ num_batch, num_res = batch['aa'].shape
233
+ gen_mask,res_mask = batch['generate_mask'],batch['res_mask']
234
+ K = self._interpolant_cfg.seqs.num_classes
235
+ k = self._interpolant_cfg.seqs.simplex_value
236
+ angle_mask_loss = torsions_mask.to(batch['aa'].device)
237
+
238
+ #encode
239
+ rotmats_1, trans_1, angles_1, seqs_1, node_embed, edge_embed = self.encode(batch)
240
+ # trans_1_c,center = self.zero_center_part(trans_1,gen_mask,res_mask)
241
+ trans_1_c = trans_1
242
+ seqs_1_simplex = self.seq_to_simplex(seqs_1)
243
+ seqs_1_prob = F.softmax(seqs_1_simplex,dim=-1)
244
+
245
+ # # # only sample bb, angle and seq with noise
246
+ # angles_1 = torch.where(batch['generate_mask'][...,None],angles_1,torus.tor_random_uniform(angles_1.shape, device=batch['aa'].device, dtype=angles_1.dtype))
247
+ # seqs_1 = torch.where(batch['generate_mask'],seqs_1,torch.randint_like(seqs_1,0,20))
248
+ # seqs_1_simplex = self.seq_to_simplex(seqs_1)
249
+ # seqs_1_prob = F.softmax(seqs_1_simplex,dim=-1)
250
+
251
+ #initial noise
252
+ if sample_bb:
253
+ rotmats_0 = uniform_so3(num_batch,num_res,device=batch['aa'].device)
254
+ rotmats_0 = torch.where(batch['generate_mask'][...,None,None],rotmats_0,rotmats_1)
255
+ trans_0 = torch.randn((num_batch,num_res,3), device=batch['aa'].device) # scale with sigma?
256
+ # move center and receptor
257
+ trans_0_c,center = self.zero_center_part(trans_0,gen_mask,res_mask)
258
+ trans_0_c = torch.where(batch['generate_mask'][...,None],trans_0_c,trans_1_c)
259
+ else:
260
+ rotmats_0 = rotmats_1.detach().clone()
261
+ trans_0_c = trans_1_c.detach().clone()
262
+ if sample_ang:
263
+ # angle noise
264
+ angles_0 = torus.tor_random_uniform(angles_1.shape, device=batch['aa'].device, dtype=angles_1.dtype) # (B,L,5)
265
+ angles_0 = torch.where(batch['generate_mask'][...,None],angles_0,angles_1)
266
+ else:
267
+ angles_0 = angles_1.detach().clone()
268
+ if sample_seq:
269
+ seqs_0_simplex = k * torch.randn((num_batch,num_res,K), device=batch['aa'].device)
270
+ seqs_0_prob = F.softmax(seqs_0_simplex,dim=-1)
271
+ seqs_0 = sample_from(seqs_0_prob)
272
+ seqs_0 = torch.where(batch['generate_mask'],seqs_0,seqs_1)
273
+ seqs_0_simplex = torch.where(batch['generate_mask'][...,None],seqs_0_simplex,seqs_1_simplex)
274
+ else:
275
+ seqs_0 = seqs_1.detach().clone()
276
+ seqs_0_prob = seqs_1_prob.detach().clone()
277
+ seqs_0_simplex = seqs_1_simplex.detach().clone()
278
+
279
+ # Set-up time
280
+ ts = torch.linspace(1.e-2, 1.0, num_steps)
281
+ t_1 = ts[0]
282
+ # prot_traj = [{'rotmats':rotmats_0,'trans':trans_0_c,'seqs':seqs_0,'seqs_simplex':seqs_0_simplex,'rotmats_1':rotmats_1,'trans_1':trans_1-center,'seqs_1':seqs_1}]
283
+ clean_traj = []
284
+ rotmats_t_1, trans_t_1_c, angles_t_1, seqs_t_1, seqs_t_1_simplex = rotmats_0, trans_0_c, angles_0, seqs_0, seqs_0_simplex
285
+
286
+ # denoise loop
287
+ for t_2 in ts[1:]:
288
+ t = torch.ones((num_batch, 1), device=batch['aa'].device) * t_1
289
+ # rots
290
+ pred_rotmats_1, pred_trans_1, pred_angles_1, pred_seqs_1_prob = self.ga_encoder(t, rotmats_t_1, trans_t_1_c, angles_t_1, seqs_t_1, node_embed, edge_embed, batch['generate_mask'].long(), batch['res_mask'].long())
291
+ pred_rotmats_1 = torch.where(batch['generate_mask'][...,None,None],pred_rotmats_1,rotmats_1)
292
+ # trans, move center
293
+ # pred_trans_1_c,center = self.zero_center_part(pred_trans_1,gen_mask,res_mask)
294
+ pred_trans_1_c = torch.where(batch['generate_mask'][...,None],pred_trans_1,trans_1_c) # move receptor also
295
+ # angles
296
+ pred_angles_1 = torch.where(batch['generate_mask'][...,None],pred_angles_1,angles_1)
297
+ # seqs
298
+ pred_seqs_1 = sample_from(F.softmax(pred_seqs_1_prob,dim=-1))
299
+ pred_seqs_1 = torch.where(batch['generate_mask'],pred_seqs_1,seqs_1)
300
+ pred_seqs_1_simplex = self.seq_to_simplex(pred_seqs_1)
301
+ # seq-angle
302
+ torsion_mask = angle_mask_loss[pred_seqs_1.reshape(-1)].reshape(num_batch,num_res,-1) # (B,L,5)
303
+ pred_angles_1 = torch.where(torsion_mask.bool(),pred_angles_1,torch.zeros_like(pred_angles_1))
304
+ if not sample_bb:
305
+ pred_trans_1_c = trans_1_c.detach().clone()
306
+ # _,center = self.zero_center_part(trans_1,gen_mask,res_mask)
307
+ pred_rotmats_1 = rotmats_1.detach().clone()
308
+ if not sample_ang:
309
+ pred_angles_1 = angles_1.detach().clone()
310
+ if not sample_seq:
311
+ pred_seqs_1 = seqs_1.detach().clone()
312
+ pred_seqs_1_simplex = seqs_1_simplex.detach().clone()
313
+ clean_traj.append({'rotmats':pred_rotmats_1.cpu(),'trans':pred_trans_1_c.cpu(),'angles':pred_angles_1.cpu(),'seqs':pred_seqs_1.cpu(),'seqs_simplex':pred_seqs_1_simplex.cpu(),
314
+ 'rotmats_1':rotmats_1.cpu(),'trans_1':trans_1_c.cpu(),'angles_1':angles_1.cpu(),'seqs_1':seqs_1.cpu()})
315
+ # reverse step, also only for gen mask region
316
+ d_t = (t_2-t_1) * torch.ones((num_batch, 1), device=batch['aa'].device)
317
+ # Euler step
318
+ trans_t_2 = trans_t_1_c + (pred_trans_1_c-trans_0_c)*d_t[...,None]
319
+ # trans_t_2_c,center = self.zero_center_part(trans_t_2,gen_mask,res_mask)
320
+ trans_t_2_c = torch.where(batch['generate_mask'][...,None],trans_t_2,trans_1_c) # move receptor also
321
+ # rotmats_t_2 = so3_utils.geodesic_t(d_t[...,None] / (1-t[...,None]), pred_rotmats_1, rotmats_t_1)
322
+ rotmats_t_2 = so3_utils.geodesic_t(d_t[...,None] * 10, pred_rotmats_1, rotmats_t_1)
323
+ rotmats_t_2 = torch.where(batch['generate_mask'][...,None,None],rotmats_t_2,rotmats_1)
324
+ # angles
325
+ angles_t_2 = torus.tor_geodesic_t(d_t[...,None],pred_angles_1, angles_t_1)
326
+ angles_t_2 = torch.where(batch['generate_mask'][...,None],angles_t_2,angles_1)
327
+ # seqs
328
+ seqs_t_2_simplex = seqs_t_1_simplex + (pred_seqs_1_simplex - seqs_0_simplex) * d_t[...,None]
329
+ seqs_t_2 = sample_from(F.softmax(seqs_t_2_simplex,dim=-1))
330
+ seqs_t_2 = torch.where(batch['generate_mask'],seqs_t_2,seqs_1)
331
+ # seq-angle
332
+ torsion_mask = angle_mask_loss[seqs_t_2.reshape(-1)].reshape(num_batch,num_res,-1) # (B,L,5)
333
+ angles_t_2 = torch.where(torsion_mask.bool(),angles_t_2,torch.zeros_like(angles_t_2))
334
+
335
+ if not sample_bb:
336
+ trans_t_2_c = trans_1_c.detach().clone()
337
+ rotmats_t_2 = rotmats_1.detach().clone()
338
+ if not sample_ang:
339
+ angles_t_2 = angles_1.detach().clone()
340
+ if not sample_seq:
341
+ seqs_t_2 = seqs_1.detach().clone()
342
+ rotmats_t_1, trans_t_1_c, angles_t_1, seqs_t_1, seqs_t_1_simplex = rotmats_t_2, trans_t_2_c, angles_t_2, seqs_t_2, seqs_t_2_simplex
343
+ t_1 = t_2
344
+
345
+ # final step
346
+ t_1 = ts[-1]
347
+ t = torch.ones((num_batch, 1), device=batch['aa'].device) * t_1
348
+ pred_rotmats_1, pred_trans_1, pred_angles_1, pred_seqs_1_prob = self.ga_encoder(t, rotmats_t_1, trans_t_1_c, angles_t_1, seqs_t_1, node_embed, edge_embed, batch['generate_mask'].long(), batch['res_mask'].long())
349
+ pred_rotmats_1 = torch.where(batch['generate_mask'][...,None,None],pred_rotmats_1,rotmats_1)
350
+ # move center
351
+ # pred_trans_1_c,center = self.zero_center_part(pred_trans_1,gen_mask,res_mask)
352
+ pred_trans_1_c = torch.where(batch['generate_mask'][...,None],pred_trans_1,trans_1_c) # move receptor also
353
+ # angles
354
+ pred_angles_1 = torch.where(batch['generate_mask'][...,None],pred_angles_1,angles_1)
355
+ # seqs
356
+ pred_seqs_1 = sample_from(F.softmax(pred_seqs_1_prob,dim=-1))
357
+ pred_seqs_1 = torch.where(batch['generate_mask'],pred_seqs_1,seqs_1)
358
+ pred_seqs_1_simplex = self.seq_to_simplex(pred_seqs_1)
359
+ # seq-angle
360
+ torsion_mask = angle_mask_loss[pred_seqs_1.reshape(-1)].reshape(num_batch,num_res,-1) # (B,L,5)
361
+ pred_angles_1 = torch.where(torsion_mask.bool(),pred_angles_1,torch.zeros_like(pred_angles_1))
362
+ if not sample_bb:
363
+ pred_trans_1_c = trans_1_c.detach().clone()
364
+ # _,center = self.zero_center_part(trans_1,gen_mask,res_mask)
365
+ pred_rotmats_1 = rotmats_1.detach().clone()
366
+ if not sample_ang:
367
+ pred_angles_1 = angles_1.detach().clone()
368
+ if not sample_seq:
369
+ pred_seqs_1 = seqs_1.detach().clone()
370
+ pred_seqs_1_simplex = seqs_1_simplex.detach().clone()
371
+ clean_traj.append({'rotmats':pred_rotmats_1.cpu(),'trans':pred_trans_1_c.cpu(),'angles':pred_angles_1.cpu(),'seqs':pred_seqs_1.cpu(),'seqs_simplex':pred_seqs_1_simplex.cpu(),
372
+ 'rotmats_1':rotmats_1.cpu(),'trans_1':trans_1_c.cpu(),'angles_1':angles_1.cpu(),'seqs_1':seqs_1.cpu()})
373
+
374
+ return clean_traj
375
+
376
+
377
+ # if __name__ == '__main__':
378
+ # prefix_dir = './pepflowww'
379
+ # # config,cfg_name = load_config("../configs/angle/learn_sc.yaml")
380
+ # config,cfg_name = load_config(os.path.join(prefix_dir,"configs/angle/learn_sc.yaml"))
381
+ # # print(config)
382
+ # device = 'cuda:0'
383
+ # dataset = PepDataset(structure_dir = config.dataset.val.structure_dir, dataset_dir = config.dataset.val.dataset_dir,
384
+ # name = config.dataset.val.name, transform=None, reset=config.dataset.val.reset)
385
+ # dataloader = DataLoader(dataset, batch_size=1, shuffle=False, collate_fn=PaddingCollate(eight=False), num_workers=4, pin_memory=True)
386
+ # ckpt = torch.load("./checkpoints/600000.pt", map_location=device)
387
+ # seed_all(114514)
388
+ # model = FlowModel(config.model).to(device)
389
+ # model.load_state_dict(process_dic(ckpt['model']))
390
+ # model.eval()
391
+
392
+ # # print(model)
393
+
394
+ # # print(dataset[0]['chain_id'])
395
+ # # print(dataset[0]['id'])
396
+ # # print(dataset[0]['resseq'])
397
+ # # print(dataset[0]['res_nb'])
398
+ # # print(dataset[0]['icode'])
399
+
400
+ # dic = {'id':[],'len':[],'tran':[],'aar':[],'rot':[],'trans_loss':[],'rot_loss':[]}
401
+
402
+ # # for batch in tqdm(dataloader):
403
+ # # batch = recursive_to(batch,device)
404
+ # for i in tqdm(range(len(dataset))):
405
+ # item = dataset[i]
406
+ # data_list = [deepcopy(item) for _ in range(16)]
407
+ # batch = recursive_to(collate_fn(data_list),device)
408
+ # loss_dic = model(batch)
409
+ # # traj_1 = model.sample(batch,num_steps=50,sample_bb=False,sample_ang=True,sample_seq=False)
410
+ # traj_1 = model.sample(batch,num_steps=50,sample_bb=True,sample_ang=True,sample_seq=True)
411
+ # ca_dist = torch.sqrt(torch.sum((traj_1[-1]['trans']-traj_1[-1]['trans_1'])**2*batch['generate_mask'][...,None].cpu().long()) / (torch.sum(batch['generate_mask']) + 1e-8).cpu()) # rmsd
412
+ # rot_dist = torch.sqrt(torch.sum((traj_1[-1]['rotmats']-traj_1[-1]['rotmats_1'])**2*batch['generate_mask'][...,None,None].long().cpu()) / (torch.sum(batch['generate_mask']) + 1e-8).cpu()) # rmsd
413
+ # aar = torch.sum((traj_1[-1]['seqs']==traj_1[-1]['seqs_1']) * batch['generate_mask'].long().cpu()) / (torch.sum(batch['generate_mask']).cpu() + 1e-8)
414
+
415
+
416
+ # print(loss_dic)
417
+ # print(f'tran:{ca_dist},rot:{rot_dist},aar:{aar},len:{batch["generate_mask"].sum().item()}')
418
+
419
+ # # free
420
+ # torch.cuda.empty_cache()
421
+ # gc.collect()
422
+
423
+ # # dic['tran'].append(ca_dist.item())
424
+ # # dic['rot'].append(rot_dist.item())
425
+ # dic['aar'].append(aar.item())
426
+ # dic['trans_loss'].append(loss_dic['trans_loss'].item())
427
+ # dic['rot_loss'].append(loss_dic['rot_loss'].item())
428
+ # dic['id'].append(batch['id'][0])
429
+ # dic['len'].append(batch['generate_mask'].sum().item())
430
+ # # # break
431
+
432
+ # # traj_1[-1]['batch'] = batch
433
+ # # torch.save(traj_1[-1],f'/datapool/data2/home/jiahan/ResProj/PepDiff/frame-flow/Data/Models_new/Pack_new/outputs/{batch["id"][0]}.pt')
434
+
435
+ # # print(dic)
436
+ # # dic = pd.DataFrame(dic)
437
+ # # dic.to_csv(f'/datapool/data2/home/jiahan/ResProj/PepDiff/frame-flow/Data/Models_new/Pack/outputs.csv',index=None)
438
+
439
+ # print(np.mean(dic['aar']))
440
+ # print(np.mean(dic['trans_loss']))
441
+
442
+ # if __name__ == '__main__':
443
+ # config,cfg_name = load_config("./configs/angle/learn_angle.yaml")
444
+ # seed_all(114514)
445
+ # device = 'cpu'
446
+ # dataset = PepDataset(structure_dir = config.dataset.train.structure_dir, dataset_dir = config.dataset.train.dataset_dir,
447
+ # name = config.dataset.train.name, transform=None, reset=config.dataset.train.reset)
448
+ # dataloader = DataLoader(dataset, batch_size=2, shuffle=False, collate_fn=PaddingCollate(), num_workers=4, pin_memory=True)
449
+ # model = FlowModel(config.model).to(device)
450
+ # optimizer = torch.optim.Adam(model.parameters(),lr=1.e-4)
451
+
452
+ # # ckpt = torch.load('./checkpoints/90000.pt',map_location=device)
453
+ # # model.load_state_dict(process_dic(ckpt['model']))
454
+ # # optimizer.load_state_dict(ckpt['optimizer'])
455
+
456
+
457
+ # # torch.autograd.set_detect_anomaly(True)
458
+ # for i,batch in tqdm(enumerate(dataloader)):
459
+ # batch = recursive_to(batch,device)
460
+ # loss_dict = model(batch)
461
+ # loss = sum_weighted_losses(loss_dict, config.train.loss_weights)
462
+ # # if torch.isnan(loss):
463
+ # # print(i)
464
+ # # print(batch['id'])
465
+
466
+ # loss.backward()
467
+ # orig_grad_norm = clip_grad_norm_(model.parameters(), config.train.max_grad_norm)
468
+
469
+ # print(f'{loss_dict},{loss},{orig_grad_norm}')
470
+
471
+ # optimizer.step()
472
+ # optimizer.zero_grad()
models_con/ga.py ADDED
@@ -0,0 +1,127 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import torch
2
+ from torch import nn
3
+
4
+ from models_con import ipa_pytorch as ipa_pytorch
5
+ from data import utils as du
6
+
7
+ from models_con.utils import get_index_embedding, get_time_embedding
8
+
9
+ from pepflow.modules.protein.constants import ANG_TO_NM_SCALE, NM_TO_ANG_SCALE
10
+ from pepflow.modules.common.layers import AngularEncoding
11
+
12
+ import math
13
+
14
+
15
class GAEncoder(nn.Module):
    """IPA-based denoising trunk.

    Mixes the current sequence, torsion angles and diffusion time into the
    node features, then runs `num_blocks` rounds of Invariant Point Attention
    + sequence transformer + backbone-frame updates, and finally decodes
    clean-state predictions for frames, angles and sequence logits.

    NOTE: the `trunk` ModuleDict keys (ipa_{b}, seq_tfmr_{b}, ...) are
    state_dict keys for released checkpoints — do not rename.
    """

    def __init__(self, ipa_conf):
        super().__init__()
        self._ipa_conf = ipa_conf

        # torsion-angle featurization and per-residue angle decoder (5 angles)
        self.angles_embedder = AngularEncoding(num_funcs=12) # 25*5=120, for competitive embedding size (NOTE(review): arithmetic in this comment looks off — verify get_out_dim)
        self.angle_net = nn.Sequential(
            nn.Linear(self._ipa_conf.c_s, self._ipa_conf.c_s),nn.ReLU(),
            nn.Linear(self._ipa_conf.c_s, self._ipa_conf.c_s),nn.ReLU(),
            nn.Linear(self._ipa_conf.c_s, 5)
            # nn.Linear(self._ipa_conf.c_s, 22)
        )

        # conditioning on the current (noisy) sequence, plus the 20-way decoder
        self.current_seq_embedder = nn.Embedding(22, self._ipa_conf.c_s)
        self.seq_net = nn.Sequential(
            nn.Linear(self._ipa_conf.c_s, self._ipa_conf.c_s),nn.ReLU(),
            nn.Linear(self._ipa_conf.c_s, self._ipa_conf.c_s),nn.ReLU(),
            nn.Linear(self._ipa_conf.c_s, 20)
            # nn.Linear(self._ipa_conf.c_s, 22)
        )

        # mixer: [node_embed | seq embed | time embed | angle embed] -> c_s
        self.res_feat_mixer = nn.Sequential(
            nn.Linear(3 * self._ipa_conf.c_s + self.angles_embedder.get_out_dim(in_dim=5), self._ipa_conf.c_s),
            nn.ReLU(),
            nn.Linear(self._ipa_conf.c_s, self._ipa_conf.c_s),
        )

        self.feat_dim = self._ipa_conf.c_s

        # Attention trunk
        self.trunk = nn.ModuleDict()
        for b in range(self._ipa_conf.num_blocks):
            self.trunk[f'ipa_{b}'] = ipa_pytorch.InvariantPointAttention(self._ipa_conf)
            self.trunk[f'ipa_ln_{b}'] = nn.LayerNorm(self._ipa_conf.c_s)
            tfmr_in = self._ipa_conf.c_s
            tfmr_layer = torch.nn.TransformerEncoderLayer(
                d_model=tfmr_in,
                nhead=self._ipa_conf.seq_tfmr_num_heads,
                dim_feedforward=tfmr_in,
                batch_first=True,
                dropout=0.0,
                norm_first=False
            )
            self.trunk[f'seq_tfmr_{b}'] = torch.nn.TransformerEncoder(
                tfmr_layer, self._ipa_conf.seq_tfmr_num_layers, enable_nested_tensor=False)
            self.trunk[f'post_tfmr_{b}'] = ipa_pytorch.Linear(
                tfmr_in, self._ipa_conf.c_s, init="final")
            self.trunk[f'node_transition_{b}'] = ipa_pytorch.StructureModuleTransition(
                c=self._ipa_conf.c_s)
            self.trunk[f'bb_update_{b}'] = ipa_pytorch.BackboneUpdate(
                self._ipa_conf.c_s, use_rot_updates=True)

            if b < self._ipa_conf.num_blocks-1:
                # No edge update on the last block.
                edge_in = self._ipa_conf.c_z
                self.trunk[f'edge_transition_{b}'] = ipa_pytorch.EdgeTransition(
                    node_embed_size=self._ipa_conf.c_s,
                    edge_embed_in=edge_in,
                    edge_embed_out=self._ipa_conf.c_z,
                )

    def embed_t(self, timesteps, mask):
        """Sinusoidal time embedding broadcast to every residue position.

        timesteps: (B, 1); mask: (B, L). Returns (B, L, feat_dim).
        """
        timestep_emb = get_time_embedding(
            timesteps[:, 0],
            self.feat_dim,
            max_positions=2056
        )[:, None, :].repeat(1, mask.shape[1], 1)
        return timestep_emb

    def forward(self, t, rotmats_t, trans_t, angles_t, seqs_t, node_embed, edge_embed, generate_mask, res_mask):
        """Predict clean frames, torsions and sequence logits from the noisy state.

        Returns (pred_rotmats1, pred_trans1, pred_angles1 in [0, 2pi),
        pred_seqs1_prob raw 20-way logits). `generate_mask` is accepted but
        unused here; masking is applied by the caller.
        """
        num_batch, num_res = seqs_t.shape

        # incorporate current sequence, timestep and angles into node features
        node_mask = res_mask
        edge_mask = node_mask[:, None] * node_mask[:, :, None]

        node_embed = self.res_feat_mixer(torch.cat([node_embed, self.current_seq_embedder(seqs_t), self.embed_t(t,node_mask), self.angles_embedder(angles_t).reshape(num_batch,num_res,-1)],dim=-1))
        node_embed = node_embed * node_mask[..., None]
        curr_rigids = du.create_rigid(rotmats_t, trans_t)
        for b in range(self._ipa_conf.num_blocks):
            ipa_embed = self.trunk[f'ipa_{b}'](
                node_embed,
                edge_embed,
                curr_rigids,
                node_mask)
            ipa_embed *= node_mask[..., None]
            node_embed = self.trunk[f'ipa_ln_{b}'](node_embed + ipa_embed)
            seq_tfmr_out = self.trunk[f'seq_tfmr_{b}'](
                node_embed, src_key_padding_mask=(1 - node_mask).bool())
            node_embed = node_embed + self.trunk[f'post_tfmr_{b}'](seq_tfmr_out)
            node_embed = self.trunk[f'node_transition_{b}'](node_embed)
            node_embed = node_embed * node_mask[..., None]
            # compose the predicted per-block frame update onto current rigids
            rigid_update = self.trunk[f'bb_update_{b}'](
                node_embed * node_mask[..., None])
            curr_rigids = curr_rigids.compose_q_update_vec(
                rigid_update, node_mask[..., None])

            if b < self._ipa_conf.num_blocks-1:
                edge_embed = self.trunk[f'edge_transition_{b}'](
                    node_embed, edge_embed)
                edge_embed *= edge_mask[..., None]

        # curr_rigids = self.rigids_nm_to_ang(curr_rigids)
        pred_trans1 = curr_rigids.get_trans()
        pred_rotmats1 = curr_rigids.get_rots().get_rot_mats()
        pred_seqs1_prob = self.seq_net(node_embed)
        pred_angles1 = self.angle_net(node_embed)
        pred_angles1 = pred_angles1 % (2*math.pi) # inductive bias to bound between (0,2pi)

        return pred_rotmats1, pred_trans1, pred_angles1, pred_seqs1_prob
models_con/inference.py ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import numpy as np
2
+ import torch
3
+ import torch.nn as nn
4
+ import torch.nn.functional as F
5
+ from torch.utils.data import DataLoader
6
+
7
+ import copy
8
+ import math
9
+ from tqdm.auto import tqdm
10
+ import functools
11
+ import os
12
+ import argparse
13
+ import pandas as pd
14
+ from copy import deepcopy
15
+
16
+ from models_con.pep_dataloader import PepDataset
17
+
18
+ from pepflow.utils.misc import load_config
19
+ from pepflow.utils.train import recursive_to
20
+
21
+ from pepflow.modules.common.geometry import reconstruct_backbone, reconstruct_backbone_partially, align, batch_align
22
+ from pepflow.modules.protein.writers import save_pdb
23
+
24
+ from pepflow.utils.data import PaddingCollate
25
+
26
+ from models_con.utils import process_dic
27
+
28
+ import gc
29
+
30
+ from models_con.flow_model import FlowModel
31
+
32
+ from pepflow.utils.misc import seed_all
33
+
34
+ from models_con.torsion import full_atom_reconstruction, get_heavyatom_mask
35
+
36
+ collate_fn = PaddingCollate(eight=False)
37
+
38
+ import argparse
39
+
40
+
41
if __name__ == '__main__':
    # Inference/evaluation script: for every validation complex, sample
    # `num_samples` designs, report CA-RMSD / rotation distance / sequence
    # recovery on the generated region, save the final denoised state per
    # complex, and dump a summary CSV.

    def _str2bool(v):
        """Parse a boolean CLI value; plain `type=bool` maps 'False' to True."""
        if isinstance(v, bool):
            return v
        return str(v).strip().lower() in ('1', 'true', 't', 'yes', 'y')

    args = argparse.ArgumentParser()
    args.add_argument('--config', type=str)
    args.add_argument('--device', type=str)
    args.add_argument('--ckpt', type=str)
    args.add_argument('--output', type=str)
    args.add_argument('--num_steps', type=int, default=200)
    # Registered exactly once: the original registered --num_samples three
    # times, which makes argparse raise ArgumentError before parsing anything.
    args.add_argument('--num_samples', type=int, default=64)
    # _str2bool keeps `--sample_bb True/False` working as intended.
    args.add_argument('--sample_bb', type=_str2bool, default=True)
    args.add_argument('--sample_ang', type=_str2bool, default=True)
    args.add_argument('--sample_seq', type=_str2bool, default=True)
    parser = args.parse_args()

    config,cfg_name = load_config(parser.config)
    device = parser.device
    dataset = PepDataset(structure_dir = config.dataset.val.structure_dir, dataset_dir = config.dataset.val.dataset_dir,
                         name = config.dataset.val.name, transform=None, reset=config.dataset.val.reset)
    dataloader = DataLoader(dataset, batch_size=1, shuffle=False, collate_fn=PaddingCollate(eight=False), num_workers=4, pin_memory=True)
    ckpt = torch.load(parser.ckpt, map_location=device)

    seed_all(114514)
    model = FlowModel(config.model).to(device)
    model.load_state_dict(process_dic(ckpt['model']))
    model.eval()

    # Ensure the per-item output directory exists before the loop writes to it.
    os.makedirs(os.path.join(parser.output, 'outputs'), exist_ok=True)

    dic = {'id':[],'len':[],'tran':[],'aar':[],'rot':[],'trans_loss':[],'rot_loss':[]}

    for i in tqdm(range(len(dataset))):
        item = dataset[i]
        # Batch `num_samples` copies of the same complex to sample in parallel.
        data_list = [deepcopy(item) for _ in range(parser.num_samples)]
        batch = recursive_to(collate_fn(data_list),device)
        # Evaluation only: sample() is already @torch.no_grad, but forward()
        # is not — disable autograd to avoid building a throwaway graph.
        with torch.no_grad():
            loss_dic = model(batch)
        traj_1 = model.sample(batch,num_steps=parser.num_steps,sample_bb=parser.sample_bb,sample_ang=parser.sample_ang,sample_seq=parser.sample_seq)
        # Metrics over the generated region of the final denoised state:
        # CA RMSD, rotation-matrix Frobenius distance, amino-acid recovery.
        ca_dist = torch.sqrt(torch.sum((traj_1[-1]['trans']-traj_1[-1]['trans_1'])**2*batch['generate_mask'][...,None].cpu().long()) / (torch.sum(batch['generate_mask']) + 1e-8).cpu()) # rmsd
        rot_dist = torch.sqrt(torch.sum((traj_1[-1]['rotmats']-traj_1[-1]['rotmats_1'])**2*batch['generate_mask'][...,None,None].long().cpu()) / (torch.sum(batch['generate_mask']) + 1e-8).cpu()) # rmsd
        aar = torch.sum((traj_1[-1]['seqs']==traj_1[-1]['seqs_1']) * batch['generate_mask'].long().cpu()) / (torch.sum(batch['generate_mask']).cpu() + 1e-8)

        print(loss_dic)
        print(f'tran:{ca_dist},rot:{rot_dist},aar:{aar},len:{batch["generate_mask"].sum().item()}')

        # free GPU memory between complexes
        torch.cuda.empty_cache()
        gc.collect()

        dic['tran'].append(ca_dist.item())
        dic['rot'].append(rot_dist.item())
        dic['aar'].append(aar.item())
        dic['trans_loss'].append(loss_dic['trans_loss'].item())
        dic['rot_loss'].append(loss_dic['rot_loss'].item())
        dic['id'].append(batch['id'][0])
        dic['len'].append(batch['generate_mask'].sum().item())

        # Persist the final denoised state (plus its input batch) per complex.
        traj_1[-1]['batch'] = batch
        torch.save(traj_1[-1],f'{parser.output}/outputs/{batch["id"][0]}.pt')

    dic = pd.DataFrame(dic)
    dic.to_csv(f'{parser.output}/outputs.csv',index=None)
models_con/ipa_pytorch.py ADDED
@@ -0,0 +1,687 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ """Modified code of Openfold's IPA."""
17
+
18
+ import numpy as np
19
+ import torch
20
+ import math
21
+ from scipy.stats import truncnorm
22
+ import torch.nn as nn
23
+ from typing import Optional, Callable, List, Sequence
24
+ from openfold.utils.rigid_utils import Rigid
25
+ from data import all_atom
26
+
27
+
28
def permute_final_dims(tensor: torch.Tensor, inds: List[int]):
    """Permute the trailing ``len(inds)`` dimensions of ``tensor`` per ``inds``,
    leaving all leading (batch-like) dimensions untouched."""
    n_trailing = len(inds)
    leading = list(range(tensor.dim() - n_trailing))
    trailing = [i - n_trailing for i in inds]
    return tensor.permute(leading + trailing)
32
+
33
+
34
def flatten_final_dims(t: torch.Tensor, no_dims: int):
    """Collapse the last ``no_dims`` dimensions of ``t`` into a single one."""
    lead_shape = t.shape[:-no_dims]
    return t.reshape(*lead_shape, -1)
36
+
37
+
38
+ def ipa_point_weights_init_(weights):
39
+ with torch.no_grad():
40
+ softplus_inverse_1 = 0.541324854612918
41
+ weights.fill_(softplus_inverse_1)
42
+
43
+ def _prod(nums):
44
+ out = 1
45
+ for n in nums:
46
+ out = out * n
47
+ return out
48
+
49
+
50
+ def _calculate_fan(linear_weight_shape, fan="fan_in"):
51
+ fan_out, fan_in = linear_weight_shape
52
+
53
+ if fan == "fan_in":
54
+ f = fan_in
55
+ elif fan == "fan_out":
56
+ f = fan_out
57
+ elif fan == "fan_avg":
58
+ f = (fan_in + fan_out) / 2
59
+ else:
60
+ raise ValueError("Invalid fan option")
61
+
62
+ return f
63
+
64
def trunc_normal_init_(weights, scale=1.0, fan="fan_in"):
    """Fan-scaled truncated-normal init (clipped at +/-2 sigma), in place.

    The raw truncnorm std is divided out so the drawn samples have the
    target std sqrt(scale / fan) exactly.
    """
    shape = weights.shape
    eff_scale = scale / max(1, _calculate_fan(shape, fan))
    lo, hi = -2, 2
    std = math.sqrt(eff_scale) / truncnorm.std(a=lo, b=hi, loc=0, scale=1)
    samples = truncnorm.rvs(a=lo, b=hi, loc=0, scale=std, size=_prod(shape))
    reshaped = np.reshape(samples, shape)
    with torch.no_grad():
        weights.copy_(torch.tensor(reshaped, device=weights.device))
76
+
77
+
78
def lecun_normal_init_(weights):
    # LeCun: truncated normal with variance 1/fan_in.
    trunc_normal_init_(weights, scale=1.0)


def he_normal_init_(weights):
    # He/Kaiming: variance 2/fan_in, suited to ReLU activations.
    trunc_normal_init_(weights, scale=2.0)


def glorot_uniform_init_(weights):
    # Glorot/Xavier uniform (fan-average) initialization.
    nn.init.xavier_uniform_(weights, gain=1)


def final_init_(weights):
    # Zero init for "final" projection layers so residual blocks start as identity.
    with torch.no_grad():
        weights.fill_(0.0)


def gating_init_(weights):
    # Zero weights for gating layers; the bias is set to 1 by the caller (Linear).
    with torch.no_grad():
        weights.fill_(0.0)


def normal_init_(weights):
    # Kaiming-normal with "linear" nonlinearity, i.e. std = 1/sqrt(fan_in).
    torch.nn.init.kaiming_normal_(weights, nonlinearity="linear")
102
+
103
+
104
def compute_angles(ca_pos, pts):
    """Angles between inter-residue C-alpha vectors and IPA point offsets.

    Args:
        ca_pos: C-alpha coordinates; assumed (batch, num_res, 3) from the
            indexing below — TODO confirm against callers.
        pts: per-head IPA points, (batch, num_res, num_heads, num_pts, 3).
    Returns:
        (batch, num_res, num_res, num_heads, num_pts) angles computed by
        all_atom.calculate_neighbor_angles on flattened vector pairs.
    """
    batch_size, num_res, num_heads, num_pts, _ = pts.shape
    # +1e-10 avoids an exactly-zero vector on the i == j diagonal.
    calpha_vecs = (ca_pos[:, :, None, :] - ca_pos[:, None, :, :]) + 1e-10
    calpha_vecs = torch.tile(calpha_vecs[:, :, :, None, None, :], (1, 1, 1, num_heads, num_pts, 1))
    # Offsets of every point from the query residue's C-alpha, broadcast over j.
    ipa_pts = pts[:, :, None, :, :, :] - torch.tile(ca_pos[:, :, None, None, None, :], (1, 1, num_res, num_heads, num_pts, 1))
    phi_angles = all_atom.calculate_neighbor_angles(
        calpha_vecs.reshape(-1, 3),
        ipa_pts.reshape(-1, 3)
    ).reshape(batch_size, num_res, num_res, num_heads, num_pts)
    return phi_angles
114
+
115
+
116
class Linear(nn.Linear):
    """
    torch.nn.Linear with selectable AlphaFold-style initializers.

    The `init` string picks one of the schemes from supplement section
    1.11.4 (plus a few found in the official code); `init_fn`, when given,
    overrides `init` entirely.
    """

    def __init__(
        self,
        in_dim: int,
        out_dim: int,
        bias: bool = True,
        init: str = "default",
        init_fn: Optional[Callable[[torch.Tensor, torch.Tensor], None]] = None,
    ):
        """
        Args:
            in_dim: Final dimension of layer inputs.
            out_dim: Final dimension of layer outputs.
            bias: Whether to learn an additive bias. Initialized to zero,
                except for the "gating" scheme which sets it to one.
            init: One of:
                "default" — LeCun fan-in truncated normal
                "relu"    — He truncated normal
                "glorot"  — fan-average Glorot uniform
                "gating"  — weights 0, bias 1
                "normal"  — normal with std 1/sqrt(fan_in)
                "final"   — weights 0, bias 0
            init_fn: Custom initializer taking (weight, bias); overrides
                `init` when not None.
        """
        super().__init__(in_dim, out_dim, bias=bias)

        if bias:
            with torch.no_grad():
                self.bias.fill_(0)

        if init_fn is not None:
            init_fn(self.weight, self.bias)
        elif init == "default":
            lecun_normal_init_(self.weight)
        elif init == "relu":
            he_normal_init_(self.weight)
        elif init == "glorot":
            glorot_uniform_init_(self.weight)
        elif init == "gating":
            gating_init_(self.weight)
            if bias:
                with torch.no_grad():
                    self.bias.fill_(1.0)
        elif init == "normal":
            normal_init_(self.weight)
        elif init == "final":
            final_init_(self.weight)
        else:
            raise ValueError("Invalid init string.")
182
+
183
+
184
class StructureModuleTransition(nn.Module):
    """Residual two-hidden-layer MLP transition with a final LayerNorm,
    as used in the AF2 structure module."""

    def __init__(self, c):
        super().__init__()
        self.c = c
        # Attribute names preserved for checkpoint compatibility.
        self.linear_1 = Linear(self.c, self.c, init="relu")
        self.linear_2 = Linear(self.c, self.c, init="relu")
        self.linear_3 = Linear(self.c, self.c, init="final")
        self.relu = nn.ReLU()
        self.ln = nn.LayerNorm(self.c)

    def forward(self, s):
        residual = s
        hidden = self.relu(self.linear_1(s))
        hidden = self.relu(self.linear_2(hidden))
        out = self.linear_3(hidden) + residual
        return self.ln(out)
207
+
208
+
209
class EdgeTransition(nn.Module):
    """Update edge features from the pair of endpoint node embeddings.

    Each edge (i, j) is concatenated with down-projected node features of
    residues i and j, passed through a residual MLP trunk, projected to
    `edge_embed_out` and layer-normalized.
    """

    def __init__(
        self,
        *,
        node_embed_size,
        edge_embed_in,
        edge_embed_out,
        num_layers=2,
        node_dilation=2
    ):
        super().__init__()
        bias_embed_size = node_embed_size // node_dilation
        self.initial_embed = Linear(
            node_embed_size, bias_embed_size, init="relu")
        hidden_size = bias_embed_size * 2 + edge_embed_in
        layers = []
        for _ in range(num_layers):
            layers.append(Linear(hidden_size, hidden_size, init="relu"))
            layers.append(nn.ReLU())
        self.trunk = nn.Sequential(*layers)
        self.final_layer = Linear(hidden_size, edge_embed_out, init="final")
        self.layer_norm = nn.LayerNorm(edge_embed_out)

    def forward(self, node_embed, edge_embed):
        node_embed = self.initial_embed(node_embed)
        batch_size, num_res, _ = node_embed.shape
        # Broadcast node features to every (i, j) pair and concatenate.
        row = node_embed[:, :, None, :].expand(-1, -1, num_res, -1)
        col = node_embed[:, None, :, :].expand(-1, num_res, -1, -1)
        edge_bias = torch.cat([row, col], dim=-1)
        flat = torch.cat([edge_embed, edge_bias], dim=-1).reshape(
            batch_size * num_res ** 2, -1)
        flat = self.final_layer(self.trunk(flat) + flat)
        flat = self.layer_norm(flat)
        return flat.reshape(batch_size, num_res, num_res, -1)
249
+
250
+
251
class InvariantPointAttention(nn.Module):
    """
    Implements Algorithm 22 (Invariant Point Attention).

    Attends jointly over scalar features, pair features, and 3-D points
    expressed in per-residue rigid frames; the output is invariant to
    global rotations/translations because points are mapped back into
    local frames before being consumed.
    """
    def __init__(
        self,
        ipa_conf,
        inf: float = 1e5,
        eps: float = 1e-8,
    ):
        """
        Args:
            ipa_conf: config providing
                c_s: single representation channel dimension
                c_z: pair representation channel dimension
                c_hidden: hidden channel dimension
                no_heads: number of attention heads
                no_qk_points: number of query/key points to generate
                no_v_points: number of value points to generate
            inf: large value used to mask attention logits.
            eps: numerical epsilon for the point-norm sqrt.
        """
        super(InvariantPointAttention, self).__init__()
        self._ipa_conf = ipa_conf

        self.c_s = ipa_conf.c_s
        self.c_z = ipa_conf.c_z
        self.c_hidden = ipa_conf.c_hidden
        self.no_heads = ipa_conf.no_heads
        self.no_qk_points = ipa_conf.no_qk_points
        self.no_v_points = ipa_conf.no_v_points
        self.inf = inf
        self.eps = eps

        # These linear layers differ from their specifications in the
        # supplement. There, they lack bias and use Glorot initialization.
        # Here as in the official source, they have bias and use the default
        # Lecun initialization.
        hc = self.c_hidden * self.no_heads
        self.linear_q = Linear(self.c_s, hc)
        self.linear_kv = Linear(self.c_s, 2 * hc)

        hpq = self.no_heads * self.no_qk_points * 3
        self.linear_q_points = Linear(self.c_s, hpq)

        hpkv = self.no_heads * (self.no_qk_points + self.no_v_points) * 3
        self.linear_kv_points = Linear(self.c_s, hpkv)

        self.linear_b = Linear(self.c_z, self.no_heads)
        # Down-projection of pair features mixed into the output (c_z // 4).
        self.down_z = Linear(self.c_z, self.c_z // 4)

        # Learned per-head weights on the point-attention term; initialized
        # so softplus(head_weights) == 1.
        self.head_weights = nn.Parameter(torch.zeros((ipa_conf.no_heads)))
        ipa_point_weights_init_(self.head_weights)

        # scalar out + point coords (3) + point norms (1) + pair features.
        concat_out_dim = (
            self.c_z // 4 + self.c_hidden + self.no_v_points * 4
        )
        self.linear_out = Linear(self.no_heads * concat_out_dim, self.c_s, init="final")

        self.softmax = nn.Softmax(dim=-1)
        self.softplus = nn.Softplus()

    def forward(
        self,
        s: torch.Tensor,
        z: Optional[torch.Tensor],
        r: Rigid,
        mask: torch.Tensor,
        _offload_inference: bool = False,
        _z_reference_list: Optional[Sequence[torch.Tensor]] = None,
    ) -> torch.Tensor:
        """
        Args:
            s:
                [*, N_res, C_s] single representation
            z:
                [*, N_res, N_res, C_z] pair representation
            r:
                [*, N_res] transformation object (per-residue rigid frames)
            mask:
                [*, N_res] mask
            _offload_inference:
                if True, the pair tensor is moved to CPU between uses
                (memory saving during inference); z is then taken from
                _z_reference_list.
        Returns:
            [*, N_res, C_s] single representation update
        """
        if _offload_inference:
            z = _z_reference_list
        else:
            z = [z]

        #######################################
        # Generate scalar and point activations
        #######################################
        # [*, N_res, H * C_hidden]
        q = self.linear_q(s)
        kv = self.linear_kv(s)

        # [*, N_res, H, C_hidden]
        q = q.view(q.shape[:-1] + (self.no_heads, -1))

        # [*, N_res, H, 2 * C_hidden]
        kv = kv.view(kv.shape[:-1] + (self.no_heads, -1))

        # [*, N_res, H, C_hidden]
        k, v = torch.split(kv, self.c_hidden, dim=-1)

        # [*, N_res, H * P_q * 3]
        q_pts = self.linear_q_points(s)

        # This is kind of clunky, but it's how the original does it
        # [*, N_res, H * P_q, 3]
        q_pts = torch.split(q_pts, q_pts.shape[-1] // 3, dim=-1)
        q_pts = torch.stack(q_pts, dim=-1)
        # Map the predicted points into the global frame.
        q_pts = r[..., None].apply(q_pts)

        # [*, N_res, H, P_q, 3]
        q_pts = q_pts.view(
            q_pts.shape[:-2] + (self.no_heads, self.no_qk_points, 3)
        )

        # [*, N_res, H * (P_q + P_v) * 3]
        kv_pts = self.linear_kv_points(s)

        # [*, N_res, H * (P_q + P_v), 3]
        kv_pts = torch.split(kv_pts, kv_pts.shape[-1] // 3, dim=-1)
        kv_pts = torch.stack(kv_pts, dim=-1)
        kv_pts = r[..., None].apply(kv_pts)

        # [*, N_res, H, (P_q + P_v), 3]
        kv_pts = kv_pts.view(kv_pts.shape[:-2] + (self.no_heads, -1, 3))

        # [*, N_res, H, P_q/P_v, 3]
        k_pts, v_pts = torch.split(
            kv_pts, [self.no_qk_points, self.no_v_points], dim=-2
        )

        ##########################
        # Compute attention scores
        ##########################
        # [*, N_res, N_res, H]
        b = self.linear_b(z[0])

        if(_offload_inference):
            z[0] = z[0].cpu()

        # [*, H, N_res, N_res]
        a = torch.matmul(
            permute_final_dims(q, (1, 0, 2)),  # [*, H, N_res, C_hidden]
            permute_final_dims(k, (1, 2, 0)),  # [*, H, C_hidden, N_res]
        )
        # 1/3 factors: scalar, pair-bias, and point terms each contribute
        # a third of the total logit variance (Algorithm 22).
        a *= math.sqrt(1.0 / (3 * self.c_hidden))
        a += (math.sqrt(1.0 / 3) * permute_final_dims(b, (2, 0, 1)))

        # [*, N_res, N_res, H, P_q, 3]
        pt_displacement = q_pts.unsqueeze(-4) - k_pts.unsqueeze(-5)
        pt_att = pt_displacement ** 2

        # [*, N_res, N_res, H, P_q]
        pt_att = sum(torch.unbind(pt_att, dim=-1))
        head_weights = self.softplus(self.head_weights).view(
            *((1,) * len(pt_att.shape[:-2]) + (-1, 1))
        )
        head_weights = head_weights * math.sqrt(
            1.0 / (3 * (self.no_qk_points * 9.0 / 2))
        )
        pt_att = pt_att * head_weights

        # [*, N_res, N_res, H]
        pt_att = torch.sum(pt_att, dim=-1) * (-0.5)
        # [*, N_res, N_res] -- 0 where both residues valid, -inf otherwise.
        square_mask = mask.unsqueeze(-1) * mask.unsqueeze(-2)
        square_mask = self.inf * (square_mask - 1)

        # [*, H, N_res, N_res]
        pt_att = permute_final_dims(pt_att, (2, 0, 1))

        a = a + pt_att
        a = a + square_mask.unsqueeze(-3)
        a = self.softmax(a)

        ################
        # Compute output
        ################
        # [*, N_res, H, C_hidden]
        o = torch.matmul(
            a, v.transpose(-2, -3)
        ).transpose(-2, -3)

        # [*, N_res, H * C_hidden]
        o = flatten_final_dims(o, 2)

        # [*, H, 3, N_res, P_v]
        o_pt = torch.sum(
            (
                a[..., None, :, :, None]
                * permute_final_dims(v_pts, (1, 3, 0, 2))[..., None, :, :]
            ),
            dim=-2,
        )

        # [*, N_res, H, P_v, 3] -- back into the local frame of each residue.
        o_pt = permute_final_dims(o_pt, (2, 0, 3, 1))
        o_pt = r[..., None, None].invert_apply(o_pt)

        # [*, N_res, H * P_v]
        o_pt_dists = torch.sqrt(torch.sum(o_pt ** 2, dim=-1) + self.eps)
        o_pt_norm_feats = flatten_final_dims(
            o_pt_dists, 2)

        # [*, N_res, H * P_v, 3]
        o_pt = o_pt.reshape(*o_pt.shape[:-3], -1, 3)

        if(_offload_inference):
            z[0] = z[0].to(o_pt.device)

        # [*, N_res, H, C_z // 4]
        pair_z = self.down_z(z[0])
        o_pair = torch.matmul(a.transpose(-2, -3), pair_z)

        # [*, N_res, H * C_z // 4]
        o_pair = flatten_final_dims(o_pair, 2)

        o_feats = [o, *torch.unbind(o_pt, dim=-1), o_pt_norm_feats, o_pair]

        # [*, N_res, C_s]
        s = self.linear_out(
            torch.cat(
                o_feats, dim=-1
            )
        )

        return s
485
+
486
+
487
class TorsionAngles(nn.Module):
    """Predict torsion angles as sin/cos pairs, returning both the raw and
    the unit-normalized vectors."""

    def __init__(self, c, num_torsions, eps=1e-8):
        super().__init__()
        self.c = c
        self.eps = eps
        self.num_torsions = num_torsions

        self.linear_1 = Linear(self.c, self.c, init="relu")
        self.linear_2 = Linear(self.c, self.c, init="relu")
        # Unused in forward; kept so published checkpoints still load.
        # TODO: Remove after published checkpoint is updated without these weights.
        self.linear_3 = Linear(self.c, self.c, init="final")
        self.linear_final = Linear(
            self.c, self.num_torsions * 2, init="final")

        self.relu = nn.ReLU()

    def forward(self, s):
        hidden = self.relu(self.linear_1(s))
        hidden = self.linear_2(hidden)
        hidden = hidden + s  # residual connection
        raw = self.linear_final(hidden)
        # Normalize the whole output vector to unit length (clamped sqrt
        # for numerical stability near zero).
        denom = torch.sqrt(
            torch.clamp(
                torch.sum(raw ** 2, dim=-1, keepdim=True),
                min=self.eps,
            )
        )
        return raw, raw / denom
521
+
522
+
523
class RotationVFLayer(nn.Module):
    """Residual MLP head mapping node features to a 6-D rotation
    vector-field output."""

    def __init__(self, dim):
        super().__init__()
        self.linear_1 = Linear(dim, dim, init="relu")
        self.linear_2 = Linear(dim, dim, init="relu")
        self.linear_3 = Linear(dim, dim)
        self.final_linear = Linear(dim, 6, init="final")
        self.relu = nn.ReLU()

    def forward(self, s):
        h = self.relu(self.linear_1(s))
        h = self.relu(self.linear_2(h))
        h = self.linear_3(h) + s  # residual connection
        return self.final_linear(h)
542
+
543
+
544
class BackboneUpdate(nn.Module):
    """
    Implements part of Algorithm 23: project node features to a rigid
    frame update vector.
    """

    def __init__(self, c_s, use_rot_updates=True):
        """
        Args:
            c_s:
                Single representation channel dimension.
            use_rot_updates:
                If True, emit a 6-D update (3 rotation + 3 translation
                components) as consumed by Rigid.compose_q_update_vec;
                if False, a 3-D translation-only update. Defaults to True
                so call sites that pass only `c_s` (e.g. IpaScore's
                `BackboneUpdate(ipa_conf.c_s)`) work instead of raising
                a TypeError for the missing argument.
        """
        super(BackboneUpdate, self).__init__()

        self.c_s = c_s
        self._use_rot_updates = use_rot_updates
        update_dim = 6 if use_rot_updates else 3
        self.linear = Linear(self.c_s, update_dim, init="final")

    def forward(self, s: torch.Tensor):
        """
        Args:
            s: [*, N_res, C_s] single representation.
        Returns:
            [*, N_res, 6] (or [*, N_res, 3]) update vector.
        """
        update = self.linear(s)

        return update
573
+
574
class IpaScore(nn.Module):
    """IPA trunk that predicts rotation/translation scores and psi torsions
    for a diffusion model over rigid backbone frames."""

    def __init__(self, model_conf, diffuser):
        super(IpaScore, self).__init__()
        self._model_conf = model_conf
        ipa_conf = model_conf.ipa
        self._ipa_conf = ipa_conf
        # Diffusion process object; used to turn predicted frames into scores.
        self.diffuser = diffuser

        # Work in scaled coordinates inside the trunk, unscale on the way out.
        self.scale_pos = lambda x: x * ipa_conf.coordinate_scaling
        self.scale_rigids = lambda x: x.apply_trans_fn(self.scale_pos)

        self.unscale_pos = lambda x: x / ipa_conf.coordinate_scaling
        self.unscale_rigids = lambda x: x.apply_trans_fn(self.unscale_pos)
        self.trunk = nn.ModuleDict()

        for b in range(ipa_conf.num_blocks):
            self.trunk[f'ipa_{b}'] = InvariantPointAttention(ipa_conf)
            self.trunk[f'ipa_ln_{b}'] = nn.LayerNorm(ipa_conf.c_s)
            # Skip connection from the initial node embedding into each block.
            self.trunk[f'skip_embed_{b}'] = Linear(
                self._model_conf.node_embed_size,
                self._ipa_conf.c_skip,
                init="final"
            )
            tfmr_in = ipa_conf.c_s + self._ipa_conf.c_skip
            tfmr_layer = torch.nn.TransformerEncoderLayer(
                d_model=tfmr_in,
                nhead=ipa_conf.seq_tfmr_num_heads,
                dim_feedforward=tfmr_in,
                batch_first=True,
                dropout=0.0,
                norm_first=False
            )
            self.trunk[f'seq_tfmr_{b}'] = torch.nn.TransformerEncoder(
                tfmr_layer, ipa_conf.seq_tfmr_num_layers)
            self.trunk[f'post_tfmr_{b}'] = Linear(
                tfmr_in, ipa_conf.c_s, init="final")
            self.trunk[f'node_transition_{b}'] = StructureModuleTransition(
                c=ipa_conf.c_s)
            # NOTE(review): BackboneUpdate is called with a single argument;
            # confirm its __init__ provides a default for use_rot_updates,
            # otherwise this raises TypeError at construction.
            self.trunk[f'bb_update_{b}'] = BackboneUpdate(ipa_conf.c_s)

            if b < ipa_conf.num_blocks-1:
                # No edge update on the last block.
                edge_in = self._model_conf.edge_embed_size
                self.trunk[f'edge_transition_{b}'] = EdgeTransition(
                    node_embed_size=ipa_conf.c_s,
                    edge_embed_in=edge_in,
                    edge_embed_out=self._model_conf.edge_embed_size,
                )

        self.torsion_pred = TorsionAngles(ipa_conf.c_s, 1)

    def forward(self, init_node_embed, edge_embed, input_feats):
        """
        Args:
            init_node_embed: (B, N, node_embed_size) initial node features.
            edge_embed: (B, N, N, edge_embed_size) edge features.
            input_feats: dict with 'res_mask', 'fixed_mask', 'rigids_t'
                (tensor-7 rigid frames at time t) and diffusion time 't'.
        Returns:
            dict with 'psi' torsion prediction, 'rot_score', 'trans_score'
            and the predicted 'final_rigids'.
        """
        node_mask = input_feats['res_mask'].type(torch.float32)
        # Residues that are diffused (not held fixed) and valid.
        diffuse_mask = (1 - input_feats['fixed_mask'].type(torch.float32)) * node_mask
        edge_mask = node_mask[..., None] * node_mask[..., None, :]
        init_frames = input_feats['rigids_t'].type(torch.float32)

        curr_rigids = Rigid.from_tensor_7(torch.clone(init_frames))
        init_rigids = Rigid.from_tensor_7(init_frames)
        init_rots = init_rigids.get_rots()

        # Main trunk
        curr_rigids = self.scale_rigids(curr_rigids)
        init_node_embed = init_node_embed * node_mask[..., None]
        node_embed = init_node_embed * node_mask[..., None]
        for b in range(self._ipa_conf.num_blocks):
            ipa_embed = self.trunk[f'ipa_{b}'](
                node_embed,
                edge_embed,
                curr_rigids,
                node_mask)
            ipa_embed *= node_mask[..., None]
            node_embed = self.trunk[f'ipa_ln_{b}'](node_embed + ipa_embed)
            seq_tfmr_in = torch.cat([
                node_embed, self.trunk[f'skip_embed_{b}'](init_node_embed)
            ], dim=-1)
            # NOTE(review): src_key_padding_mask is a float (1 - mask);
            # newer PyTorch expects a bool mask here — confirm version
            # compatibility.
            seq_tfmr_out = self.trunk[f'seq_tfmr_{b}'](
                seq_tfmr_in, src_key_padding_mask=1 - node_mask)
            node_embed = node_embed + self.trunk[f'post_tfmr_{b}'](seq_tfmr_out)
            node_embed = self.trunk[f'node_transition_{b}'](node_embed)
            node_embed = node_embed * node_mask[..., None]
            # Only diffused residues contribute a frame update.
            rigid_update = self.trunk[f'bb_update_{b}'](
                node_embed * diffuse_mask[..., None])
            curr_rigids = curr_rigids.compose_q_update_vec(
                rigid_update, diffuse_mask[..., None])

            if b < self._ipa_conf.num_blocks-1:
                edge_embed = self.trunk[f'edge_transition_{b}'](
                    node_embed, edge_embed)
                edge_embed *= edge_mask[..., None]
        # Scores are computed from (initial, predicted) frames via the diffuser.
        rot_score = self.diffuser.calc_rot_score(
            init_rigids.get_rots(),
            curr_rigids.get_rots(),
            input_feats['t']
        )
        rot_score = rot_score * node_mask[..., None]

        curr_rigids = self.unscale_rigids(curr_rigids)
        trans_score = self.diffuser.calc_trans_score(
            init_rigids.get_trans(),
            curr_rigids.get_trans(),
            input_feats['t'][:, None, None],
            use_torch=True,
        )
        trans_score = trans_score * node_mask[..., None]
        _, psi_pred = self.torsion_pred(node_embed)
        model_out = {
            'psi': psi_pred,
            'rot_score': rot_score,
            'trans_score': trans_score,
            'final_rigids': curr_rigids,
        }
        return model_out
models_con/node.py ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import torch
2
+ from torch import nn
3
+
4
+ from pepflow.modules.common.geometry import construct_3d_basis, global_to_local, get_backbone_dihedral_angles
5
+ from pepflow.modules.common.layers import AngularEncoding
6
+ from pepflow.modules.protein.constants import BBHeavyAtom, AA
7
+
8
+
9
class NodeEmbedder(nn.Module):
    """Per-residue node embedder.

    Combines amino-acid identity, per-amino-acid local atom coordinates,
    and backbone dihedral encodings into a single feature vector per
    residue via an MLP.
    """

    def __init__(self, feat_dim, max_num_atoms, max_aa_types=22):
        super().__init__()
        self.max_num_atoms = max_num_atoms
        self.max_aa_types = max_aa_types
        self.feat_dim = feat_dim
        self.aatype_embed = nn.Embedding(self.max_aa_types, feat_dim)
        self.dihed_embed = AngularEncoding()

        # aa embedding + per-aa-type local coordinates + 3 backbone dihedrals.
        infeat_dim = feat_dim + (self.max_aa_types*max_num_atoms*3) + self.dihed_embed.get_out_dim(3)
        self.mlp = nn.Sequential(
            nn.Linear(infeat_dim, feat_dim * 2), nn.ReLU(),
            nn.Linear(feat_dim * 2, feat_dim), nn.ReLU(),
            nn.Linear(feat_dim, feat_dim), nn.ReLU(),
            nn.Linear(feat_dim, feat_dim)
        )

    def forward(self, aa, res_nb, chain_nb, pos_atoms, mask_atoms, structure_mask=None, sequence_mask=None):
        """
        Args:
            aa: (N, L) amino-acid type indices.
            res_nb: (N, L) residue numbers.
            chain_nb: (N, L) chain numbers.
            pos_atoms: (N, L, A, 3) heavy-atom coordinates.
            mask_atoms: (N, L, A) heavy-atom validity mask.
            structure_mask: (N, L), mask out unknown structures to generate.
            sequence_mask: (N, L), mask out unknown amino acids to generate.
        Returns:
            (N, L, feat_dim) node features, zeroed where CA is absent.
        """
        N, L = aa.size()
        mask_residue = mask_atoms[:, :, BBHeavyAtom.CA]  # (N, L)

        # Remove other atoms beyond the first max_num_atoms slots.
        pos_atoms = pos_atoms[:, :, :self.max_num_atoms]
        mask_atoms = mask_atoms[:, :, :self.max_num_atoms]

        # Amino acid identity features
        if sequence_mask is not None:
            # Avoid data leakage at training time: hide residues to be generated.
            aa = torch.where(sequence_mask, aa, torch.full_like(aa, fill_value=AA.UNK))
        aa_feat = self.aatype_embed(aa)  # (N, L, feat)

        # Coordinate features: express heavy atoms in the residue's local
        # backbone frame (built from CA, C, N).
        R = construct_3d_basis(
            pos_atoms[:, :, BBHeavyAtom.CA],
            pos_atoms[:, :, BBHeavyAtom.C],
            pos_atoms[:, :, BBHeavyAtom.N]
        )
        t = pos_atoms[:, :, BBHeavyAtom.CA]
        crd = global_to_local(R, t, pos_atoms)  # (N, L, A, 3)
        crd_mask = mask_atoms[:, :, :, None].expand_as(crd)
        crd = torch.where(crd_mask, crd, torch.zeros_like(crd))

        # Scatter coordinates into a per-amino-acid-type slot so the MLP can
        # condition atom layout on residue identity.
        aa_expand = aa[:, :, None, None, None].expand(N, L, self.max_aa_types, self.max_num_atoms, 3)
        rng_expand = torch.arange(0, self.max_aa_types)[None, None, :, None, None].expand(N, L, self.max_aa_types, self.max_num_atoms, 3).to(aa_expand)
        place_mask = (aa_expand == rng_expand)
        crd_expand = crd[:, :, None, :, :].expand(N, L, self.max_aa_types, self.max_num_atoms, 3)
        crd_expand = torch.where(place_mask, crd_expand, torch.zeros_like(crd_expand))
        crd_feat = crd_expand.reshape(N, L, self.max_aa_types*self.max_num_atoms*3)
        if structure_mask is not None:
            # Avoid data leakage at training time
            crd_feat = crd_feat * structure_mask[:, :, None]

        # Backbone dihedral features
        bb_dihedral, mask_bb_dihed = get_backbone_dihedral_angles(pos_atoms, chain_nb=chain_nb, res_nb=res_nb, mask=mask_residue)
        dihed_feat = self.dihed_embed(bb_dihedral[:, :, :, None]) * mask_bb_dihed[:, :, :, None]  # (N, L, 3, dihed/3)
        dihed_feat = dihed_feat.reshape(N, L, -1)
        if structure_mask is not None:
            # Dihedrals couple neighboring residues, so also require both
            # neighbors to be known structure.
            dihed_mask = torch.logical_and(
                structure_mask,
                torch.logical_and(
                    torch.roll(structure_mask, shifts=+1, dims=1),
                    torch.roll(structure_mask, shifts=-1, dims=1)
                ),
            )  # Avoid slight data leakage via dihedral angles of anchor residues
            dihed_feat = dihed_feat * dihed_mask[:, :, None]

        out_feat = self.mlp(torch.cat([aa_feat, crd_feat, dihed_feat], dim=-1))  # (N, L, F)
        out_feat = out_feat * mask_residue[:, :, None]

        return out_feat
models_con/pep_dataloader.py ADDED
@@ -0,0 +1,212 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """pep-rec dataset"""
2
+ import os
3
+ import logging
4
+ import joblib
5
+ import pickle
6
+ import lmdb
7
+ from Bio import PDB
8
+ from Bio.PDB import PDBExceptions
9
+ from torch.utils.data import Dataset
10
+ from tqdm.auto import tqdm
11
+
12
+ from pepflow.modules.protein.parsers import parse_pdb
13
+ from pepflow.modules.common.geometry import *
14
+ from pepflow.modules.protein.constants import *
15
+ from pepflow.utils.data import mask_select_data, find_longest_true_segment, PaddingCollate
16
+ from torch.utils.data import DataLoader
17
+
18
+ from omegaconf import OmegaConf
19
+ from easydict import EasyDict
20
+
21
+ from torch.utils.data import DataLoader, Dataset
22
+ from torch.utils.data.distributed import DistributedSampler, dist
23
+
24
+ from pepflow.utils.misc import load_config
25
+ from pepflow.utils.train import recursive_to
26
+
27
+ from models_con.torsion import get_torsion_angle
28
+
29
+ import torch
30
+
31
+ from pepflow.modules.protein.writers import save_pdb
32
+
33
+ # bind_dic = torch.load("/datapool/data2/home/jiahan/ResProj/PepDiff/frame-flow/misc/affinity_dict.pt")
34
+
35
+ # testset
36
# Held-out test-set complex IDs; entries listed here are excluded from the
# training cache by preprocess_structure.
names = []
with open('/datapool/data2/home/ruihan/data/jiahan/ResProj/PepDiff/pepflowww/Data/names.txt','r') as f:
    names = [line.strip() for line in f]
40
+
41
def preprocess_structure(task):
    """Parse one peptide/receptor complex into a merged training example.

    Args:
        task: dict with 'id' and 'pdb_path'; the path must contain
            peptide.pdb and pocket.pdb.
    Returns:
        A feature dict (receptor residues first, then peptide, with
        'generate_mask' marking peptide positions), or None when the entry
        is skipped or fails to parse.
    """
    try:
        # Held-out test-set entries must not enter the training cache.
        # (Fixed: the old message said "not in names" although the
        # condition is `in names`, which made the skip log misleading.)
        if task['id'] in names:
            raise ValueError(f'{task["id"]} is in the held-out test set, skipped')
        pdb_path = task['pdb_path']

        # Peptide: parse, then center all coordinates on the peptide's
        # CA center of mass so the generated ligand sits at the origin.
        pep = parse_pdb(os.path.join(pdb_path,'peptide.pdb'))[0]
        center = torch.sum(pep['pos_heavyatom'][pep['mask_heavyatom'][:, BBHeavyAtom.CA], BBHeavyAtom.CA], dim=0) / (torch.sum(pep['mask_heavyatom'][:, BBHeavyAtom.CA]) + 1e-8)
        pep['pos_heavyatom'] = pep['pos_heavyatom'] - center[None, None, :]
        pep['torsion_angle'],pep['torsion_angle_mask'] = get_torsion_angle(pep['pos_heavyatom'],pep['aa']) # calc angles after translation
        if len(pep['aa'])<3 or len(pep['aa'])>25:
            raise ValueError('peptide length not in [3,25]')

        # Receptor pocket: apply the same centering; bump chain numbers so
        # receptor chains never collide with the peptide chain.
        rec = parse_pdb(os.path.join(pdb_path,'pocket.pdb'))[0]
        rec['pos_heavyatom'] = rec['pos_heavyatom'] - center[None, None, :]
        rec['torsion_angle'],rec['torsion_angle_mask'] = get_torsion_angle(rec['pos_heavyatom'],rec['aa']) # calc angles after translation
        rec['chain_nb'] += 1

        # Merge receptor + peptide; generate_mask is True on peptide residues.
        data = {}
        data['id'] = task['id']
        data['generate_mask'] = torch.cat([torch.zeros_like(rec['aa']), torch.ones_like(pep['aa'])], dim=0).bool()
        for k in rec.keys():
            if isinstance(rec[k], torch.Tensor):
                data[k] = torch.cat([rec[k], pep[k]], dim=0)
            elif isinstance(rec[k], list):
                data[k] = rec[k] + pep[k]
            else:
                raise ValueError(f'Unknown type of {rec[k]}')
        return data

    except (
        PDBExceptions.PDBConstructionException,
        KeyError,
        ValueError,
        TypeError
    ) as e:
        # Deliberate best-effort: a bad entry is logged and dropped, never fatal.
        logging.warning('[{}] {}: {}'.format(
            task['id'],
            e.__class__.__name__,
            str(e)
        ))
        return None
85
+
86
+
87
class PepDataset(Dataset):
    """Peptide-receptor complex dataset backed by an LMDB cache.

    On first use (or with reset=True) every structure directory under
    `structure_dir` is preprocessed in parallel and written to an LMDB
    file in `dataset_dir`; afterwards items are served straight from the
    cache.
    """

    MAP_SIZE = 32*(1024*1024*1024) # 32GB  -- LMDB maximum map size

    def __init__(self, structure_dir = "./Data/PepMerge_new/", dataset_dir = "./Data/",
                        name = 'pep', transform=None, reset=False):
        """
        Args:
            structure_dir: directory of per-complex subfolders (peptide.pdb / pocket.pdb).
            dataset_dir: directory where the LMDB cache file is stored.
            name: cache file prefix.
            transform: optional callable applied to each item in __getitem__.
            reset: if True, delete and rebuild the cache.
        """
        super().__init__()
        self.structure_dir = structure_dir
        self.dataset_dir = dataset_dir
        self.transform = transform
        self.name = name

        # LMDB handle is opened lazily (per access) so that DataLoader
        # worker processes each open their own environment after fork.
        self.db_conn = None
        self.db_ids = None
        self._load_structures(reset)

    @property
    def _cache_db_path(self):
        # Path of the LMDB cache file (subdir=False: single file, not a dir).
        return os.path.join(self.dataset_dir, f'{self.name}_structure_cache.lmdb')

    def _connect_db(self):
        # Re-open the environment read-only and refresh the id list.
        self._close_db()
        self.db_conn = lmdb.open(
            self._cache_db_path,
            map_size=self.MAP_SIZE,
            create=False,
            subdir=False,
            readonly=True,
            lock=False,
            readahead=False,
            meminit=False,
        )
        with self.db_conn.begin() as txn:
            keys = [k.decode() for k in txn.cursor().iternext(values=False)]
        self.db_ids = keys

    def _close_db(self):
        if self.db_conn is not None:
            self.db_conn.close()
        self.db_conn = None
        self.db_ids = None

    def _load_structures(self, reset):
        """Decide which PDB folders still need preprocessing and run it."""
        all_pdbs = os.listdir(self.structure_dir)

        if reset:
            # Drop the existing cache (and its lock file) and rebuild everything.
            if os.path.exists(self._cache_db_path):
                os.remove(self._cache_db_path)
                lock_file = self._cache_db_path + "-lock"
                if os.path.exists(lock_file):
                    os.remove(lock_file)
            self._close_db()
            todo_pdbs = all_pdbs
        else:
            if not os.path.exists(self._cache_db_path):
                todo_pdbs = all_pdbs
            else:
                # Cache exists: nothing to do (incremental update is disabled).
                todo_pdbs = []

        if len(todo_pdbs) > 0:
            self._preprocess_structures(todo_pdbs)

    def _preprocess_structures(self, pdb_list):
        """Preprocess `pdb_list` in parallel and write results to LMDB."""
        tasks = []
        for pdb_fname in pdb_list:
            pdb_path = os.path.join(self.structure_dir, pdb_fname)
            tasks.append({
                'id': pdb_fname,
                'pdb_path': pdb_path,
            })

        data_list = joblib.Parallel(
            n_jobs = max(joblib.cpu_count() // 2, 1),
        )(
            joblib.delayed(preprocess_structure)(task)
            for task in tqdm(tasks, dynamic_ncols=True, desc='Preprocess')
        )

        db_conn = lmdb.open(
            self._cache_db_path,
            map_size = self.MAP_SIZE,
            create=True,
            subdir=False,
            readonly=False,
        )
        # NOTE(review): `ids` is collected but never persisted or returned —
        # keys are re-read from LMDB in _connect_db instead.
        ids = []
        with db_conn.begin(write=True, buffers=True) as txn:
            for data in tqdm(data_list, dynamic_ncols=True, desc='Write to LMDB'):
                if data is None:
                    # Entry failed preprocessing (already logged); skip.
                    continue
                ids.append(data['id'])
                txn.put(data['id'].encode('utf-8'), pickle.dumps(data))

    def __len__(self):
        self._connect_db() # make sure db_ids is not None
        return len(self.db_ids)

    def __getitem__(self, index):
        self._connect_db()
        id = self.db_ids[index]
        with self.db_conn.begin() as txn:
            data = pickle.loads(txn.get(id.encode()))
        if self.transform is not None:
            data = self.transform(data)
        return data
197
+
198
+
199
+
200
if __name__ == '__main__':
    # Smoke test: (re)build the dataset cache with reset=True, then pull
    # one padded batch and check the torsion tensors' shapes.
    device = 'cuda:1'
    config,cfg_name = load_config("./configs/learn/learn_all.yaml")
    dataset = PepDataset(structure_dir = "./Data/PepMerge_new/", dataset_dir = "/Data/Fixed Data",
                            name = 'pep_pocket_test', transform=None, reset=True)
    print(len(dataset))
    print(dataset[0])

    dataloader = DataLoader(dataset, batch_size=4, shuffle=True, num_workers=4, collate_fn=PaddingCollate(eight=False))

    batch = next(iter(dataloader))
    print(batch['torsion_angle'].shape)
    print(batch['torsion_angle_mask'].shape)
models_con/sample.py ADDED
@@ -0,0 +1,145 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import numpy as np
2
+ import torch
3
+ import torch.nn as nn
4
+ import torch.nn.functional as F
5
+ from torch.utils.data import DataLoader
6
+
7
+ import copy
8
+ import math
9
+ from tqdm.auto import tqdm
10
+ import functools
11
+ import os
12
+ import argparse
13
+ import pandas as pd
14
+ from copy import deepcopy
15
+
16
+ from models_con.pep_dataloader import PepDataset
17
+
18
+ from pepflow.utils.train import recursive_to
19
+
20
+ from pepflow.modules.common.geometry import reconstruct_backbone, reconstruct_backbone_partially, align, batch_align
21
+ from pepflow.modules.protein.writers import save_pdb
22
+
23
+ from pepflow.utils.data import PaddingCollate
24
+
25
+ from models_con.utils import process_dic
26
+
27
+ from models_con.flow_model import FlowModel
28
+
29
+ from models_con.torsion import full_atom_reconstruction, get_heavyatom_mask
30
+
31
+ collate_fn = PaddingCollate(eight=False)
32
+
33
+ import argparse
34
+
35
+
36
def item_to_batch(item, nums=32):
    """Replicate one dataset item ``nums`` times and collate the copies into a batch."""
    replicas = [deepcopy(item) for _ in range(nums)]
    return collate_fn(replicas)
39
+
40
def sample_for_data_bb(data, model, device, save_root, num_steps=200, sample_structure=True, sample_sequence=True, nums=8):
    """Sample ``nums`` backbone-level designs for one item and write them as PDBs.

    Output: ``save_root/<id>/<id>_{i}.pdb`` per sample plus ``<id>_gt.pdb`` for
    the ground truth. Side-chain atoms of generated residues are zero-padded.
    """
    if not os.path.exists(os.path.join(save_root,data["id"])):
        os.makedirs(os.path.join(save_root,data["id"]))
    batch = recursive_to(item_to_batch(data, nums=nums),device=device)
    traj = model.sample(batch, num_steps=num_steps, sample_structure=sample_structure, sample_sequence=sample_sequence)
    final = recursive_to(traj[-1], device=device)  # last step of the sampling trajectory
    pos_bb = reconstruct_backbone(R=final['rotmats'],t=final['trans'],aa=final['seqs'],chain_nb=batch['chain_nb'],res_nb=batch['res_nb'],mask=batch['res_mask']) # (32,L,4,3)
    # Pad the 4 backbone atoms up to the 15-slot heavy-atom layout with zeros.
    pos_ha = F.pad(pos_bb, pad=(0,0,0,15-4), value=0.) # (32,L,A,3) pos14 A=14
    # Generated residues take the reconstructed coordinates; context keeps its own.
    pos_new = torch.where(batch['generate_mask'][:,:,None,None],pos_ha,batch['pos_heavyatom'])
    mask_bb_atoms = torch.zeros_like(batch['mask_heavyatom'])
    mask_bb_atoms[:,:,:4] = True  # only N, CA, C, O exist for generated residues
    mask_new = torch.where(batch['generate_mask'][:,:,None],mask_bb_atoms,batch['mask_heavyatom'])
    aa_new = final['seqs']

    # NOTE(review): chain_nb/chain_id/icode below are computed but not used in
    # data_saved — confirm whether they were meant to replace data's fields.
    chain_nb = torch.LongTensor([0 if gen_mask else 1 for gen_mask in data['generate_mask']])
    chain_id = ['A' if gen_mask else 'B' for gen_mask in data['generate_mask']]
    icode = [' ' for _ in range(len(data['icode']))]
    for i in range(nums):
        # NOTE(review): ref_bb_pos/pred_bb_pos are unused; also indexing
        # data['pos_heavyatom'] (a single item) by sample index i looks suspect.
        ref_bb_pos = data['pos_heavyatom'][i][:,:4].cpu()
        pred_bb_pos = pos_new[i][:,:4].cpu()
        data_saved = {
            'chain_nb':data['chain_nb'],'chain_id':data['chain_id'],'resseq':data['resseq'],'icode':data['icode'],
            'aa':aa_new[i].cpu(), 'mask_heavyatom':mask_new[i].cpu(), 'pos_heavyatom':pos_new[i].cpu(),
        }

        save_pdb(data_saved,path=os.path.join(save_root,data["id"],f'{data["id"]}_{i}.pdb'))
    save_pdb(data,path=os.path.join(save_root,data["id"],f'{data["id"]}_gt.pdb'))
67
+
68
def save_samples_bb(samples,save_dir):
    """Write a batch of backbone-level samples (and the ground truth) as PDB files.

    Args:
        samples: dict with 'batch' (the input batch) and per-sample 'rotmats',
            'trans', 'seqs' tensors from the model.
        save_dir: directory receiving ``sample_{i}.pdb`` and ``gt.pdb``.
    """
    # meta data
    batch = recursive_to(samples['batch'],'cpu')
    chain_id = [list(item) for item in zip(*batch['chain_id'])][0] # fix chain id in collate func
    icode = [' ' for _ in range(len(chain_id))] # batch icode have same problem
    nums = len(batch['id'])
    id = batch['id'][0]
    # batch convert
    # aa=batch['aa] if only bb level
    pos_bb = reconstruct_backbone(R=samples['rotmats'],t=samples['trans'],aa=samples['seqs'],chain_nb=batch['chain_nb'],res_nb=batch['res_nb'],mask=batch['res_mask']) # (32,L,4,3)
    # Pad backbone atoms up to the 15-slot heavy-atom layout with zeros.
    pos_ha = F.pad(pos_bb, pad=(0,0,0,15-4), value=0.) # (32,L,A,3) pos14 A=14
    pos_new = torch.where(batch['generate_mask'][:,:,None,None],pos_ha,batch['pos_heavyatom'])
    mask_bb_atoms = torch.zeros_like(batch['mask_heavyatom'])
    mask_bb_atoms[:,:,:4] = True  # only N, CA, C, O exist for generated residues
    mask_new = torch.where(batch['generate_mask'][:,:,None],mask_bb_atoms,batch['mask_heavyatom'])
    aa_new = samples['seqs']
    for i in range(nums):
        data_saved = {
            'chain_nb':batch['chain_nb'][0],'chain_id':chain_id,'resseq':batch['resseq'][0],'icode':icode,
            'aa':aa_new[i], 'mask_heavyatom':mask_new[i], 'pos_heavyatom':pos_new[i],
        }
        save_pdb(data_saved,path=os.path.join(save_dir,f'sample_{i}.pdb'))
    # All batch entries are replicas of one item, so entry 0 serves as ground truth.
    data_saved = {
        'chain_nb':batch['chain_nb'][0],'chain_id':chain_id,'resseq':batch['resseq'][0],'icode':icode,
        'aa':batch['aa'][0], 'mask_heavyatom':batch['mask_heavyatom'][0], 'pos_heavyatom':batch['pos_heavyatom'][0],
    }
    save_pdb(data_saved,path=os.path.join(save_dir,f'gt.pdb'))
95
+
96
def save_samples_sc(samples,save_dir):
    """Write full-atom (side-chain) samples and the ground truth as PDB files.

    Unlike save_samples_bb, side chains are rebuilt from the sampled torsion
    angles via full_atom_reconstruction.
    """
    # meta data
    batch = recursive_to(samples['batch'],'cpu')
    chain_id = [list(item) for item in zip(*batch['chain_id'])][0] # fix chain id in collate func
    icode = [' ' for _ in range(len(chain_id))] # batch icode have same problem
    nums = len(batch['id'])
    id = batch['id'][0]
    # batch convert
    # aa=batch['aa] if only bb level
    pos_ha,_,_ = full_atom_reconstruction(R_bb=samples['rotmats'],t_bb=samples['trans'],angles=samples['angles'],aa=samples['seqs']) # (32,L,14,3), instead of 15, ignore OXT masked
    # Pad atom14 up to the 15-slot heavy-atom layout (OXT slot left zero).
    pos_ha = F.pad(pos_ha, pad=(0,0,0,15-14), value=0.) # (32,L,A,3) pos14 A=14
    pos_new = torch.where(batch['generate_mask'][:,:,None,None],pos_ha,batch['pos_heavyatom'])
    mask_new = get_heavyatom_mask(samples['seqs'])
    aa_new = samples['seqs']
    for i in range(nums):
        data_saved = {
            'chain_nb':batch['chain_nb'][0],'chain_id':chain_id,'resseq':batch['resseq'][0],'icode':icode,
            'aa':aa_new[i], 'mask_heavyatom':mask_new[i], 'pos_heavyatom':pos_new[i],
        }
        save_pdb(data_saved,path=os.path.join(save_dir,f'sample_{i}.pdb'))
    # All batch entries are replicas of one item, so entry 0 serves as ground truth.
    data_saved = {
        'chain_nb':batch['chain_nb'][0],'chain_id':chain_id,'resseq':batch['resseq'][0],'icode':icode,
        'aa':batch['aa'][0], 'mask_heavyatom':batch['mask_heavyatom'][0], 'pos_heavyatom':batch['pos_heavyatom'][0],
    }
    save_pdb(data_saved,path=os.path.join(save_dir,f'gt.pdb'))
121
+
122
if __name__ == '__main__':
    # Convert every sampled tensor dump under <SAMPLEDIR>/outputs into
    # per-complex full-atom PDB files under <SAMPLEDIR>/pdbs/<name>/.
    cli = argparse.ArgumentParser()
    cli.add_argument('--SAMPLEDIR', type=str)
    opts = cli.parse_args()
    SAMPLE_DIR = opts.SAMPLEDIR

    dump_names = [fname.split('.')[0] for fname in os.listdir(os.path.join(SAMPLE_DIR, 'outputs'))]
    for name in tqdm(dump_names):
        sample = torch.load(os.path.join(SAMPLE_DIR, 'outputs', f'{name}.pt'))
        out_dir = os.path.join(SAMPLE_DIR, 'pdbs', name)
        os.makedirs(out_dir, exist_ok=True)
        save_samples_sc(sample, out_dir)
models_con/torsion.py ADDED
@@ -0,0 +1,239 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import torch
2
+ import math
3
+
4
+ from typing import Any, Optional, Union, cast
5
+
6
+ from pepflow.modules.common.geometry import *
7
+ import pepflow.modules.protein.constants as constants
8
+
9
+ """
10
+ calc torsion angles between (0,2pi)
11
+ """
12
+
13
+ def _get_torsion(p0, p1, p2, p3):
14
+ """
15
+ Args:
16
+ p0-3: (*, 3).
17
+ Returns:
18
+ Dihedral angles in radian, (*, ).
19
+ """
20
+ v0 = p2 - p1
21
+ v1 = p0 - p1
22
+ v2 = p3 - p2
23
+ u1 = torch.cross(v0, v1, dim=-1)
24
+ n1 = u1 / torch.linalg.norm(u1, dim=-1, keepdim=True)
25
+ u2 = torch.cross(v0, v2, dim=-1)
26
+ n2 = u2 / torch.linalg.norm(u2, dim=-1, keepdim=True)
27
+ sgn = torch.sign( (torch.cross(v1, v2, dim=-1) * v0).sum(-1) )
28
+ dihed = sgn*torch.acos( (n1 * n2).sum(-1).clamp(min=-0.999999, max=0.999999))
29
+ return dihed
30
+
31
def get_chi_angles(restype, pos14):
    """Compute the four chi torsions of a single residue from atom14 coordinates.

    Args:
        restype: residue-type index into constants.chi_angles_atoms.
        pos14: (14, 3) heavy-atom coordinates in atom14 ordering.
    Returns:
        (4,) tensor of chi angles in radians; chis that do not exist for this
        residue type remain +inf (callers filter them with isfinite()).
    """
    chi_angles = torch.full([4], fill_value=float("inf")).to(pos14)
    base_atom_names = constants.chi_angles_atoms[restype]
    for i, four_atom_names in enumerate(base_atom_names):
        atom_indices = [constants.restype_atom14_name_to_index[restype][a] for a in four_atom_names]
        p = torch.stack([pos14[i] for i in atom_indices])
        # if torch.eq(p, 99999).any():
        #     continue
        torsion = _get_torsion(*torch.unbind(p, dim=0))
        chi_angles[i] = torsion
    return chi_angles
42
+
43
+
44
def get_psi_angle(pos14: torch.Tensor) -> torch.Tensor:
    """AlphaFold-style psi torsion from backbone atoms N, CA, C, O (atom14 slots 0-3), shape (1,)."""
    return _get_torsion(pos14[0], pos14[1], pos14[2], pos14[3]).reshape([1]) # af style psi, N,CA,C,O
46
+
47
+
48
def get_torsion_angle(pos14: torch.Tensor, aa: torch.LongTensor):
    """Per-residue [psi, chi1-4] torsions mapped to [0, 2*pi).

    Args:
        pos14: (L, 14, 3) atom14 heavy-atom coordinates.
        aa: (L,) residue-type indices.
    Returns:
        torsion: (L, 5) angles in [0, 2*pi); undefined entries are 0.
        torsion_mask: (L, 5) bool, True where the torsion exists.
    """
    torsion, torsion_mask = [], []
    for i in range(pos14.shape[0]):
        if aa[i] < constants.AA.UNK: # 0-19: one of the 20 standard residues
            chi = get_chi_angles(aa[i].item(), pos14[i])
            psi = get_psi_angle(pos14[i])
            torsion_this = torch.cat([psi, chi], dim=0)
            # get_chi_angles marks missing chis with +inf; isfinite() masks them out.
            torsion_mask_this = torsion_this.isfinite()
        else:
            # UNK / padding: no torsions at all.
            torsion_this = torch.full([5], 0.)
            torsion_mask_this = torch.full([5], False)
        # Replace the +inf placeholders with 0 before stacking.
        torsion.append(torsion_this.nan_to_num(posinf=0.))
        torsion_mask.append(torsion_mask_this)

    torsion = torch.stack(torsion) % (2*math.pi)
    torsion_mask = torch.stack(torsion_mask).bool()

    return torsion, torsion_mask
66
+
67
+ def _make_psi_chi_rotation_matrices(angles: torch.Tensor) -> torch.Tensor:
68
+ """Compute psi and chi rotation matrices from torsional angles.
69
+
70
+ Here we provide angles instead of alpha in af2 between (0,2pi)
71
+
72
+ See alphafold supplementary Algorithm 25 for details.
73
+
74
+ Args:
75
+ angles: (B, N, 5), angles between (0,2pi)
76
+
77
+ Returns:
78
+ Torsional angle rotation matrices, (B, N, 5, 3, 3).
79
+ """
80
+ batch_size, n_res = angles.shape[:2]
81
+ sine,cosine = torch.sin(angles), torch.cos(angles)
82
+ sine = sine.reshape(batch_size, n_res, -1, 1, 1)
83
+ cosine = cosine.reshape(batch_size, n_res, -1, 1, 1)
84
+ zero = torch.zeros_like(sine)
85
+ one = torch.ones_like(sine)
86
+
87
+ row1 = torch.cat([one, zero, zero], dim=-1) # (B, N, 5, 1, 3)
88
+ row2 = torch.cat([zero, cosine, -sine], dim=-1) # (B, N, 5, 1, 3)
89
+ row3 = torch.cat([zero, sine, cosine], dim=-1) # (B, N, 5, 1, 3)
90
+ R = torch.cat([row1, row2, row3], dim=-2) # (B, N, 5, 3, 3)
91
+
92
+ return R
93
+
94
+
95
def _get_rigid_group(aa: torch.Tensor) -> tuple[torch.Tensor, torch.Tensor, torch.Tensor, torch.Tensor]:
    """Extract rigid group constants.

    Args:
        aa: Amino acid types, (B, N).

    Returns:
        A tuple of rigid group rotation, translation, atom14 group and atom14 position:
            rotation: (B, N, 8, 3, 3) per-frame rotations (backbone + 7 torsion frames).
            translation: (B, N, 8, 3) per-frame translations.
            atom14_group: (B, N, 14) index of the frame each atom14 slot belongs to.
            atom14_position: (B, N, 14, 3) atom coordinates in their local frame.
    """
    batch_size, n_res = aa.size()
    # Flatten so the constant tables can be indexed in one gather, then restore shape.
    aa = aa.flatten()
    rotation = constants.restype_rigid_group_rotation.to(aa.device)[aa].reshape(batch_size, n_res, 8, 3, 3)
    translation = constants.restype_rigid_group_translation.to(aa.device)[aa].reshape(batch_size, n_res, 8, 3)
    atom14_group = constants.restype_heavyatom_to_rigid_group.to(aa.device)[aa].reshape(batch_size, n_res, 14)
    atom14_position = constants.restype_heavyatom_rigid_group_positions.to(aa.device)[aa].reshape(
        batch_size, n_res, 14, 3
    )
    return rotation, translation, atom14_group, atom14_position
113
+
114
+
115
# construct heavy atom masks for generating
# restype_to_heavyatom_masks = {
#     restype: [name != "" and name !='OXT' for name in names]
#     for restype, names in constants.restype_to_heavyatom_names.items()
# }
# print(restype_to_heavyatom_masks[0])

# (22, 15) lookup: True where a heavy-atom slot exists for the residue type.
# OXT is deliberately excluded; rows 0-20 are filled, the last row (padding)
# stays all-False. Built once at import time.
restype_to_heavyatom_masks = torch.zeros([22,15]).bool()
for i in range(21):
    restype_to_heavyatom_masks[i] = torch.tensor([name != "" and name !='OXT' for name in constants.restype_to_heavyatom_names[i]]).bool()

def get_heavyatom_mask(aa: torch.Tensor) -> torch.Tensor:
    """Compute heavy atom masks from amino acid types.

    Args:
        aa: Amino acid types, (B, N).

    Returns:
        Heavy atom masks, (B, N, 15).
    """
    batch_size, n_res = aa.size()
    aa = aa.flatten()
    mask = restype_to_heavyatom_masks.to(aa.device)[aa].reshape(batch_size, n_res, 15)
    return mask
139
+
140
def full_atom_reconstruction(
    R_bb: torch.Tensor,
    t_bb: torch.Tensor,
    angles: torch.Tensor,
    aa: torch.Tensor,
) -> tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
    """Compute full atom positions from backbone frames and torsional angles.

    See alphafold supplementary Algorithm 24 for details.

    Args:
        R_bb: Rotation of backbone frames, (B, N, 3, 3).
        t_bb: Translation of backbone frames, (B, N, 3).
        angles: (B, N, 5), angles between (0,2pi)
        aa: Amino acid types, (B, N).

    Returns:
        A tuple of atom positions and full frames, (pos14, R, t).
        pos14: Full atom positions in pos14 representations, (B, N, 14, 3).
        R: Rotation of backbone, psi, chi1-4 frames, (B, N, 5, 3, 3).
        t: Rotation of backbone, psi, chi1-4 frames, (B, N, 5, 3).
    """
    N, L = aa.size()

    rot_psi, rot_chi1, rot_chi2, rot_chi3, rot_chi4 = _make_psi_chi_rotation_matrices(angles).unbind(dim=2)
    # (B, N, 3, 3)
    zeros = torch.zeros_like(t_bb)

    rigid_rotation, rigid_translation, atom14_group, atom14_position = _get_rigid_group(aa)

    # The psi frame hangs directly off the backbone; chi frames chain off each other.
    R_psi, t_psi = compose_chain(
        [
            (R_bb, t_bb),
            (rigid_rotation[:, :, constants.PSI_FRAME], rigid_translation[:, :, constants.PSI_FRAME]),
            (rot_psi, zeros),
        ]
    )

    R_chi1, t_chi1 = compose_chain(
        [
            (R_bb, t_bb),
            (rigid_rotation[:, :, constants.CHI1_FRAME], rigid_translation[:, :, constants.CHI1_FRAME]),
            (rot_chi1, zeros),
        ]
    )

    R_chi2, t_chi2 = compose_chain(
        [
            (R_chi1, t_chi1),
            (rigid_rotation[:, :, constants.CHI2_FRAME], rigid_translation[:, :, constants.CHI2_FRAME]),
            (rot_chi2, zeros),
        ]
    )

    R_chi3, t_chi3 = compose_chain(
        [
            (R_chi2, t_chi2),
            (rigid_rotation[:, :, constants.CHI3_FRAME], rigid_translation[:, :, constants.CHI3_FRAME]),
            (rot_chi3, zeros),
        ]
    )

    R_chi4, t_chi4 = compose_chain(
        [
            (R_chi3, t_chi3),
            (rigid_rotation[:, :, constants.CHI4_FRAME], rigid_translation[:, :, constants.CHI4_FRAME]),
            (rot_chi4, zeros),
        ]
    )

    # Return Frame
    R_ret = torch.stack([R_bb, R_psi, R_chi1, R_chi2, R_chi3, R_chi4], dim=2)
    t_ret = torch.stack([t_bb, t_psi, t_chi1, t_chi2, t_chi3, t_chi4], dim=2)

    # Backbone, Omega, Phi, Psi, Chi1,2,3,4 — omega/phi atoms reuse the backbone frame.
    R_all = torch.stack([R_bb, R_bb, R_bb, R_psi, R_chi1, R_chi2, R_chi3, R_chi4], dim=2) # (B, N, 8, 3, 3)
    t_all = torch.stack([t_bb, t_bb, t_bb, t_psi, t_chi1, t_chi2, t_chi3, t_chi4], dim=2) # (B, N, 8, 3)

    # Gather each atom's frame by its rigid-group index.
    index_R = atom14_group.reshape(N, L, 14, 1, 1).repeat(1, 1, 1, 3, 3) # (B, N, 14, 3, 3)
    index_t = atom14_group.reshape(N, L, 14, 1).repeat(1, 1, 1, 3) # (B, N, 14, 3)

    R_atom = torch.gather(R_all, dim=2, index=index_R) # (N, L, 14, 3, 3)
    t_atom = torch.gather(t_all, dim=2, index=index_t) # (N, L, 14, 3)
    p_atom = atom14_position # (N, L, 14, 3)

    # Map each atom's local coordinates into the global frame.
    pos14 = torch.matmul(R_atom, p_atom.unsqueeze(-1)).squeeze(-1) + t_atom
    return pos14, R_ret, t_ret
227
+
228
+
229
+
230
# (22, 5) availability mask over [psi, chi1-4]; psi is always available for
# rows 0-20, chi availability comes from constants.chi_angles_mask. The last
# row (padding) stays all-zero. Built once at import time.
torsions_mask = torch.zeros([22,5]).float() # 0-19, X, PAD
for i in range(21):
    torsions_mask[i] = torch.tensor([True] + constants.chi_angles_mask[i]).float()
# print(angles_mask)

if __name__ =='__main__':
    # Smoke test: an all-THR batch should produce THR's heavy-atom mask.
    aa = torch.full([3,8],fill_value=constants.AA.THR).long()
    mask = get_heavyatom_mask(aa)
    print(mask)
    print(mask.shape)
models_con/torus.py ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import math
2
+ import torch
3
+
4
+
5
def tor_expmap(x: torch.Tensor, u: torch.Tensor) -> torch.Tensor:
    """Exponential map on the flat torus: step from x along tangent u, wrapped into [0, 2*pi)."""
    stepped = x + u
    return stepped % (2 * math.pi)
7
+
8
def tor_logmap(x: torch.Tensor, y: torch.Tensor) -> torch.Tensor:
    """Log map on the torus: minimal signed angular difference y - x, in (-pi, pi]."""
    delta = y - x
    return torch.atan2(torch.sin(delta), torch.cos(delta))
10
+
11
def tor_projx(x: torch.Tensor) -> torch.Tensor:
    """Project arbitrary angles onto the canonical torus range [0, 2*pi)."""
    full_turn = 2 * math.pi
    return x % full_turn
13
+
14
def tor_random_uniform(*size, dtype=None, device=None) -> torch.Tensor:
    """Draw angles uniformly from [0, 2*pi) with the given shape."""
    unit_samples = torch.rand(*size, dtype=dtype, device=device)
    return unit_samples * 2 * math.pi
17
+
18
def tor_uniform_logprob(x):
    """Log-density of the uniform distribution on the d-torus, d = x.shape[-1]; shape x.shape[:-1]."""
    n_angles = x.size(-1)
    return torch.full_like(x[..., 0], -n_angles * math.log(2 * math.pi))
21
+
22
def tor_geodesic_t(t, angles_1, angles_0):
    """Point a fraction t along the toroidal geodesic from angles_0 (base) toward angles_1 (target).

    Equivalent to tor_expmap(angles_0, t * tor_logmap(angles_0, angles_1)),
    with the log/exp maps inlined.
    """
    diff = angles_1 - angles_0
    step = t * torch.atan2(torch.sin(diff), torch.cos(diff))
    return (angles_0 + step) % (2 * math.pi)
26
+ return points_at_time_t
27
+
28
if __name__ =='__main__':
    # Smoke test: interpolate 20% of the way from b toward a on the torus.
    a = tor_random_uniform((2,3,5))
    b = tor_random_uniform((2,3,5))
    t = torch.ones((2,1)) * 0.2
    c = tor_geodesic_t(t[...,None],a,b)
    print(c)
    print(c.shape)
models_con/utils.py ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import numpy as np
2
+ import torch
3
+ import torch.nn as nn
4
+ import torch.nn.functional as F
5
+
6
+ import copy
7
+ import math
8
+ from tqdm.auto import tqdm
9
+ import functools
10
+ from torch.utils.data import DataLoader
11
+ import os
12
+ import argparse
13
+
14
+ import pandas as pd
15
+
16
def process_dic(state_dict):
    """Strip the DataParallel/DDP 'module.' prefix from state-dict keys.

    The previous version tested ``'module' in k`` and then sliced ``k[7:]``,
    which mangled any key merely *containing* the substring "module"
    (e.g. 'submodule.x' -> 'le.x'). Only a true 'module.' prefix is stripped now.

    Args:
        state_dict: mapping of parameter names to tensors.
    Returns:
        A new dict with 'module.' prefixes removed; other keys unchanged.
    """
    prefix = 'module.'
    new_state_dict = {}
    for k, v in state_dict.items():
        if k.startswith(prefix):
            new_state_dict[k[len(prefix):]] = v
        else:
            new_state_dict[k] = v
    return new_state_dict
24
+
25
+
26
def calc_distogram(pos, min_bin, max_bin, num_bins):
    """One-hot distogram of pairwise distances.

    Args:
        pos: (B, N, 3) coordinates.
        min_bin, max_bin: lower edges of the first and last bin.
        num_bins: number of bins; the last bin extends to a large cap (1e8).

    Returns:
        (B, N, N, num_bins) one-hot encoding in pos.dtype. Distances landing
        exactly on a bin edge encode as all zeros (strict inequalities).
    """
    pairwise = torch.linalg.norm(
        pos[:, :, None, :] - pos[:, None, :, :], axis=-1)[..., None]
    lower_edges = torch.linspace(min_bin, max_bin, num_bins, device=pos.device)
    upper_edges = torch.cat([lower_edges[1:], lower_edges.new_tensor([1e8])], dim=-1)
    in_bin = (pairwise > lower_edges) * (pairwise < upper_edges)
    return in_bin.type(pos.dtype)
37
+
38
+
39
def get_index_embedding(indices, embed_size, max_len=2056):
    """Creates sine / cosine positional embeddings from a prespecified indices.

    Args:
        indices: offsets of size [..., N_edges] of type integer
        max_len: maximum length.
        embed_size: dimension of the embeddings to create

    Returns:
        positional embedding of shape [N, embed_size]
    """
    half = embed_size // 2
    freq_index = torch.arange(half, device=indices.device)
    # One geometric frequency per channel, scaled by pi / max_len^(2k/d).
    phase = indices[..., None] * math.pi / (max_len ** (2 * freq_index[None] / embed_size))
    sin_part = torch.sin(phase).to(indices.device)
    cos_part = torch.cos(phase).to(indices.device)
    return torch.cat([sin_part, cos_part], axis=-1)
58
+
59
+
60
def get_time_embedding(timesteps, embedding_dim, max_positions=2000):
    """Transformer-style sinusoidal embedding of (scaled) diffusion timesteps.

    Code adapted from
    https://github.com/hojonathanho/diffusion/blob/master/diffusion_tf/nn.py

    Args:
        timesteps: 1-D tensor of times (scaled internally by max_positions).
        embedding_dim: output feature size; zero-padded on the right if odd.
    Returns:
        (len(timesteps), embedding_dim) float tensor.
    """
    assert timesteps.dim() == 1
    scaled = timesteps * max_positions
    half_dim = embedding_dim // 2
    # Geometric frequency ladder from 1 down to 1/max_positions.
    log_step = math.log(max_positions) / (half_dim - 1)
    freqs = torch.exp(-log_step * torch.arange(half_dim, dtype=torch.float32, device=timesteps.device))
    phases = scaled.float()[:, None] * freqs[None, :]
    out = torch.cat([torch.sin(phases), torch.cos(phases)], dim=1)
    if embedding_dim % 2 == 1: # zero pad
        out = F.pad(out, (0, 1), mode='constant')
    assert out.shape == (timesteps.shape[0], embedding_dim)
    return out
openfold/config.py ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
# NOTE(review): these appear to be symbolic shape-placeholder strings used in
# feature-shape specifications (stand-ins for runtime-determined dimensions) —
# confirm against their usages elsewhere in openfold.
NUM_RES = "num residues placeholder"
NUM_MSA_SEQ = "msa placeholder"
NUM_EXTRA_SEQ = "extra msa placeholder"
NUM_TEMPLATES = "num templates placeholder"
openfold/model/__init__.py ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
import os
import glob
import importlib as importlib

# Eagerly import every sibling .py module in this package and re-export it on
# the package namespace, so submodules are available without listing them by hand.
_files = glob.glob(os.path.join(os.path.dirname(__file__), "*.py"))
__all__ = [
    os.path.basename(f)[:-3]
    for f in _files
    if os.path.isfile(f) and not f.endswith("__init__.py")
]
_modules = [(m, importlib.import_module("." + m, __name__)) for m in __all__]
for _m in _modules:
    globals()[_m[0]] = _m[1]

# Avoid needlessly cluttering the global namespace
del _files, _m, _modules
openfold/model/dropout.py ADDED
@@ -0,0 +1,78 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+
16
+ import torch
17
+ import torch.nn as nn
18
+ from functools import partialmethod
19
+ from typing import Union, List
20
+
21
+
22
class Dropout(nn.Module):
    """
    Implementation of dropout with the ability to share the dropout mask
    along a particular dimension.

    If not in training mode, this module computes the identity function.
    """

    def __init__(self, r: float, batch_dim: Union[int, List[int]]):
        """
        Args:
            r:
                Dropout rate
            batch_dim:
                Dimension(s) along which the dropout mask is shared
        """
        super(Dropout, self).__init__()

        self.r = r
        # isinstance instead of `type(...) == int`: also accepts int subclasses
        # and is the idiomatic type check. Normalize to a list so forward()
        # can iterate uniformly.
        if isinstance(batch_dim, int):
            batch_dim = [batch_dim]
        self.batch_dim = batch_dim
        self.dropout = nn.Dropout(self.r)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """
        Args:
            x:
                Tensor to which dropout is applied. Can have any shape
                compatible with self.batch_dim
        Returns:
            x with the (broadcast) dropout mask applied in place.
        """
        shape = list(x.shape)
        if self.batch_dim is not None:
            for bd in self.batch_dim:
                # Size-1 dims broadcast, so one mask is shared along them.
                shape[bd] = 1
        mask = x.new_ones(shape)
        mask = self.dropout(mask)
        # NOTE: in-place multiply — mutates the caller's tensor, matching the
        # original openfold behavior.
        x *= mask
        return x
61
+
62
+
63
class DropoutRowwise(Dropout):
    """
    Convenience class for rowwise dropout as described in subsection
    1.11.6.
    """

    # Shares the mask along dim -3 (the row dimension of a pair activation).
    __init__ = partialmethod(Dropout.__init__, batch_dim=-3)
70
+
71
+
72
class DropoutColumnwise(Dropout):
    """
    Convenience class for columnwise dropout as described in subsection
    1.11.6.
    """

    # Shares the mask along dim -2 (the column dimension of a pair activation).
    __init__ = partialmethod(Dropout.__init__, batch_dim=-2)
openfold/model/embedders.py ADDED
@@ -0,0 +1,352 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import torch
17
+ import torch.nn as nn
18
+ from typing import Tuple
19
+
20
+ from openfold.model.primitives import Linear, LayerNorm
21
+ from openfold.utils.tensor_utils import one_hot
22
+
23
+
24
class InputEmbedder(nn.Module):
    """
    Embeds a subset of the input features.

    Implements Algorithms 3 (InputEmbedder) and 4 (relpos).
    """

    def __init__(
        self,
        tf_dim: int,
        msa_dim: int,
        c_z: int,
        c_m: int,
        relpos_k: int,
        **kwargs,
    ):
        """
        Args:
            tf_dim:
                Final dimension of the target features
            msa_dim:
                Final dimension of the MSA features
            c_z:
                Pair embedding dimension
            c_m:
                MSA embedding dimension
            relpos_k:
                Window size used in relative positional encoding
        """
        super(InputEmbedder, self).__init__()

        self.tf_dim = tf_dim
        self.msa_dim = msa_dim

        self.c_z = c_z
        self.c_m = c_m

        self.linear_tf_z_i = Linear(tf_dim, c_z)
        self.linear_tf_z_j = Linear(tf_dim, c_z)
        self.linear_tf_m = Linear(tf_dim, c_m)
        self.linear_msa_m = Linear(msa_dim, c_m)

        # RPE stuff
        self.relpos_k = relpos_k
        self.no_bins = 2 * relpos_k + 1
        self.linear_relpos = Linear(self.no_bins, c_z)

    def relpos(self, ri: torch.Tensor):
        """
        Computes relative positional encodings

        Implements Algorithm 4.

        Args:
            ri:
                "residue_index" features of shape [*, N]
        """
        # [*, N, N] signed index offsets, one-hot against 2k+1 boundary bins.
        d = ri[..., None] - ri[..., None, :]
        boundaries = torch.arange(
            start=-self.relpos_k, end=self.relpos_k + 1, device=d.device
        )
        oh = one_hot(d, boundaries).type(ri.dtype)
        return self.linear_relpos(oh)

    def forward(
        self,
        tf: torch.Tensor,
        ri: torch.Tensor,
        msa: torch.Tensor,
    ) -> Tuple[torch.Tensor, torch.Tensor]:
        """
        Args:
            tf:
                "target_feat" features of shape [*, N_res, tf_dim]
            ri:
                "residue_index" features of shape [*, N_res]
            msa:
                "msa_feat" features of shape [*, N_clust, N_res, msa_dim]
        Returns:
            msa_emb:
                [*, N_clust, N_res, C_m] MSA embedding
            pair_emb:
                [*, N_res, N_res, C_z] pair embedding

        """
        # [*, N_res, c_z]
        tf_emb_i = self.linear_tf_z_i(tf)
        tf_emb_j = self.linear_tf_z_j(tf)

        # [*, N_res, N_res, c_z] — outer sum of the two projections, plus relpos.
        pair_emb = tf_emb_i[..., None, :] + tf_emb_j[..., None, :, :]
        pair_emb = pair_emb + self.relpos(ri.type(pair_emb.dtype))

        # [*, N_clust, N_res, c_m] — target-feature embedding broadcast to every
        # MSA cluster and added to the MSA embedding.
        n_clust = msa.shape[-3]
        tf_m = (
            self.linear_tf_m(tf)
            .unsqueeze(-3)
            .expand(((-1,) * len(tf.shape[:-2]) + (n_clust, -1, -1)))
        )
        msa_emb = self.linear_msa_m(msa) + tf_m

        return msa_emb, pair_emb
127
+
128
+
129
class RecyclingEmbedder(nn.Module):
    """
    Embeds the output of an iteration of the model for recycling.

    Implements Algorithm 32.
    """

    def __init__(
        self,
        c_m: int,
        c_z: int,
        min_bin: float,
        max_bin: float,
        no_bins: int,
        inf: float = 1e8,
        **kwargs,
    ):
        """
        Args:
            c_m:
                MSA channel dimension
            c_z:
                Pair embedding channel dimension
            min_bin:
                Smallest distogram bin (Angstroms)
            max_bin:
                Largest distogram bin (Angstroms)
            no_bins:
                Number of distogram bins
        """
        super(RecyclingEmbedder, self).__init__()

        self.c_m = c_m
        self.c_z = c_z
        self.min_bin = min_bin
        self.max_bin = max_bin
        self.no_bins = no_bins
        self.inf = inf

        # Lazily built on first forward() call.
        self.bins = None

        self.linear = Linear(self.no_bins, self.c_z)
        self.layer_norm_m = LayerNorm(self.c_m)
        self.layer_norm_z = LayerNorm(self.c_z)

    def forward(
        self,
        m: torch.Tensor,
        z: torch.Tensor,
        x: torch.Tensor,
    ) -> Tuple[torch.Tensor, torch.Tensor]:
        """
        Args:
            m:
                First row of the MSA embedding. [*, N_res, C_m]
            z:
                [*, N_res, N_res, C_z] pair embedding
            x:
                [*, N_res, 3] predicted C_beta coordinates
        Returns:
            m:
                [*, N_res, C_m] MSA embedding update
            z:
                [*, N_res, N_res, C_z] pair embedding update
        """
        # NOTE(review): self.bins is cached with the dtype/device of the FIRST
        # call; later calls on another device/dtype would mismatch — confirm
        # that inputs never change device after the first forward.
        if self.bins is None:
            self.bins = torch.linspace(
                self.min_bin,
                self.max_bin,
                self.no_bins,
                dtype=x.dtype,
                device=x.device,
                requires_grad=False,
            )

        # [*, N, C_m]
        m_update = self.layer_norm_m(m)

        # This squared method might become problematic in FP16 mode.
        # I'm using it because my homegrown method had a stubborn discrepancy I
        # couldn't find in time.
        squared_bins = self.bins ** 2
        upper = torch.cat(
            [squared_bins[1:], squared_bins.new_tensor([self.inf])], dim=-1
        )
        # Squared pairwise distances, kept in the last dim for bin comparison.
        d = torch.sum(
            (x[..., None, :] - x[..., None, :, :]) ** 2, dim=-1, keepdims=True
        )

        # [*, N, N, no_bins] one-hot distogram (strict inequalities).
        d = ((d > squared_bins) * (d < upper)).type(x.dtype)

        # [*, N, N, C_z]
        d = self.linear(d)
        z_update = d + self.layer_norm_z(z)

        return m_update, z_update
226
+
227
+
228
class TemplateAngleEmbedder(nn.Module):
    """
    Embeds the "template_angle_feat" feature.

    Implements Algorithm 2, line 7.
    """

    def __init__(
        self,
        c_in: int,
        c_out: int,
        **kwargs,
    ):
        """
        Args:
            c_in:
                Final dimension of "template_angle_feat"
            c_out:
                Output channel dimension
        """
        super(TemplateAngleEmbedder, self).__init__()

        self.c_out = c_out
        self.c_in = c_in

        # Two-layer MLP with a single ReLU in between.
        self.linear_1 = Linear(self.c_in, self.c_out, init="relu")
        self.relu = nn.ReLU()
        self.linear_2 = Linear(self.c_out, self.c_out, init="relu")

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """
        Args:
            x: [*, N_templ, N_res, c_in] "template_angle_feat" features
        Returns:
            x: [*, N_templ, N_res, C_out] embedding
        """
        return self.linear_2(self.relu(self.linear_1(x)))
+
270
+
271
class TemplatePairEmbedder(nn.Module):
    """
    Embeds "template_pair_feat" features.

    Implements Algorithm 2, line 9.
    """

    def __init__(
        self,
        c_in: int,
        c_out: int,
        **kwargs,
    ):
        """
        Args:
            c_in:
                Input channel dimension
            c_out:
                Output channel dimension
        """
        super(TemplatePairEmbedder, self).__init__()

        self.c_in = c_in
        self.c_out = c_out

        # Despite there being no relu nearby, the source uses that initializer
        self.linear = Linear(self.c_in, self.c_out, init="relu")

    def forward(
        self,
        x: torch.Tensor,
    ) -> torch.Tensor:
        """
        Args:
            x:
                [*, C_in] input tensor
        Returns:
            [*, C_out] output tensor
        """
        x = self.linear(x)

        return x
313
+
314
+
315
class ExtraMSAEmbedder(nn.Module):
    """
    Embeds unclustered MSA sequences.

    Implements Algorithm 2, line 15
    """

    def __init__(
        self,
        c_in: int,
        c_out: int,
        **kwargs,
    ):
        """
        Args:
            c_in:
                Input channel dimension
            c_out:
                Output channel dimension
        """
        super(ExtraMSAEmbedder, self).__init__()

        self.c_in = c_in
        self.c_out = c_out

        # Single linear projection; no activation.
        self.linear = Linear(self.c_in, self.c_out)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """
        Args:
            x:
                [*, N_extra_seq, N_res, C_in] "extra_msa_feat" features
        Returns:
            [*, N_extra_seq, N_res, C_out] embedding
        """
        return self.linear(x)
openfold/model/evoformer.py ADDED
@@ -0,0 +1,630 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import math
17
+ import torch
18
+ import torch.nn as nn
19
+ from typing import Tuple, Optional
20
+ from functools import partial
21
+
22
+ from openfold.model.primitives import Linear, LayerNorm
23
+ from openfold.model.dropout import DropoutRowwise, DropoutColumnwise
24
+ from openfold.model.msa import (
25
+ MSARowAttentionWithPairBias,
26
+ MSAColumnAttention,
27
+ MSAColumnGlobalAttention,
28
+ )
29
+ from openfold.model.outer_product_mean import OuterProductMean
30
+ from openfold.model.pair_transition import PairTransition
31
+ from openfold.model.triangular_attention import (
32
+ TriangleAttentionStartingNode,
33
+ TriangleAttentionEndingNode,
34
+ )
35
+ from openfold.model.triangular_multiplicative_update import (
36
+ TriangleMultiplicationOutgoing,
37
+ TriangleMultiplicationIncoming,
38
+ )
39
+ from openfold.utils.checkpointing import checkpoint_blocks, get_checkpoint_fn
40
+ from openfold.utils.tensor_utils import chunk_layer
41
+
42
+
43
class MSATransition(nn.Module):
    """
    Feed-forward network applied to MSA activations after attention.

    Implements Algorithm 9
    """

    def __init__(self, c_m, n):
        """
        Args:
            c_m:
                MSA channel dimension
            n:
                Factor multiplied to c_m to obtain the hidden channel
                dimension
        """
        super(MSATransition, self).__init__()

        self.c_m = c_m
        self.n = n

        hidden = self.n * self.c_m
        self.layer_norm = LayerNorm(self.c_m)
        self.linear_1 = Linear(self.c_m, hidden, init="relu")
        self.relu = nn.ReLU()
        self.linear_2 = Linear(hidden, self.c_m, init="final")

    def _transition(self, m, mask):
        # Two-layer MLP; the mask zeroes out padded positions in the output.
        return self.linear_2(self.relu(self.linear_1(m))) * mask

    @torch.jit.ignore
    def _chunk(self,
        m: torch.Tensor,
        mask: torch.Tensor,
        chunk_size: int,
    ) -> torch.Tensor:
        # Run the transition over sub-batches to bound peak memory.
        return chunk_layer(
            self._transition,
            {"m": m, "mask": mask},
            chunk_size=chunk_size,
            no_batch_dims=len(m.shape[:-2]),
        )

    def forward(
        self,
        m: torch.Tensor,
        mask: Optional[torch.Tensor] = None,
        chunk_size: Optional[int] = None,
    ) -> torch.Tensor:
        """
        Args:
            m:
                [*, N_seq, N_res, C_m] MSA activation
            mask:
                [*, N_seq, N_res] MSA mask (all-ones if omitted)
        Returns:
            m:
                [*, N_seq, N_res, C_m] MSA activation update
        """
        # DISCREPANCY: DeepMind forgets to apply the MSA mask here.
        if mask is None:
            mask = m.new_ones(m.shape[:-1])

        mask = mask.unsqueeze(-1)
        m = self.layer_norm(m)

        if chunk_size is None:
            return self._transition(m, mask)
        return self._chunk(m, mask, chunk_size)
118
+
119
+
120
class EvoformerBlockCore(nn.Module):
    """
    The portion of an Evoformer block shared by the main and extra-MSA
    stacks: MSA transition, outer product mean, and the pair-stack
    (triangular) updates.
    """

    def __init__(
        self,
        c_m: int,
        c_z: int,
        c_hidden_opm: int,
        c_hidden_mul: int,
        c_hidden_pair_att: int,
        no_heads_msa: int,
        no_heads_pair: int,
        transition_n: int,
        pair_dropout: float,
        inf: float,
        eps: float,
        _is_extra_msa_stack: bool = False,
    ):
        super(EvoformerBlockCore, self).__init__()

        self.msa_transition = MSATransition(c_m=c_m, n=transition_n)

        self.outer_product_mean = OuterProductMean(c_m, c_z, c_hidden_opm)

        self.tri_mul_out = TriangleMultiplicationOutgoing(c_z, c_hidden_mul)
        self.tri_mul_in = TriangleMultiplicationIncoming(c_z, c_hidden_mul)

        self.tri_att_start = TriangleAttentionStartingNode(
            c_z, c_hidden_pair_att, no_heads_pair, inf=inf
        )
        self.tri_att_end = TriangleAttentionEndingNode(
            c_z, c_hidden_pair_att, no_heads_pair, inf=inf
        )

        self.pair_transition = PairTransition(c_z, transition_n)

        self.ps_dropout_row_layer = DropoutRowwise(pair_dropout)
        self.ps_dropout_col_layer = DropoutColumnwise(pair_dropout)

    def forward(
        self,
        m: torch.Tensor,
        z: torch.Tensor,
        msa_mask: torch.Tensor,
        pair_mask: torch.Tensor,
        chunk_size: Optional[int] = None,
        _mask_trans: bool = True,
    ) -> Tuple[torch.Tensor, torch.Tensor]:
        """
        Args:
            m: [*, N_seq, N_res, C_m] MSA embedding
            z: [*, N_res, N_res, C_z] pair embedding
            msa_mask: [*, N_seq, N_res] MSA mask
            pair_mask: [*, N_res, N_res] pair mask
        Returns:
            The updated (m, z) pair.
        """
        # DeepMind doesn't mask these transitions in the source, so _mask_trans
        # should be disabled to better approximate the exact activations of
        # the original.
        trans_mask_m = msa_mask if _mask_trans else None
        trans_mask_z = pair_mask if _mask_trans else None

        # Residual MSA transition, then fold MSA information into the pair
        # representation via the outer product mean.
        m = m + self.msa_transition(m, mask=trans_mask_m, chunk_size=chunk_size)
        z = z + self.outer_product_mean(m, mask=msa_mask, chunk_size=chunk_size)

        # Pair-stack residual updates; dropout orientation matches each
        # triangular update's direction.
        z = z + self.ps_dropout_row_layer(self.tri_mul_out(z, mask=pair_mask))
        z = z + self.ps_dropout_row_layer(self.tri_mul_in(z, mask=pair_mask))
        z = z + self.ps_dropout_row_layer(
            self.tri_att_start(z, mask=pair_mask, chunk_size=chunk_size)
        )
        z = z + self.ps_dropout_col_layer(
            self.tri_att_end(z, mask=pair_mask, chunk_size=chunk_size)
        )
        z = z + self.pair_transition(z, mask=trans_mask_z, chunk_size=chunk_size)

        return m, z
213
+
214
+
215
class EvoformerBlock(nn.Module):
    """
    A full Evoformer block: MSA row/column attention followed by the
    shared EvoformerBlockCore updates.
    """

    def __init__(self,
        c_m: int,
        c_z: int,
        c_hidden_msa_att: int,
        c_hidden_opm: int,
        c_hidden_mul: int,
        c_hidden_pair_att: int,
        no_heads_msa: int,
        no_heads_pair: int,
        transition_n: int,
        msa_dropout: float,
        pair_dropout: float,
        inf: float,
        eps: float,
    ):
        super(EvoformerBlock, self).__init__()

        self.msa_att_row = MSARowAttentionWithPairBias(
            c_m=c_m,
            c_z=c_z,
            c_hidden=c_hidden_msa_att,
            no_heads=no_heads_msa,
            inf=inf,
        )

        self.msa_att_col = MSAColumnAttention(
            c_m,
            c_hidden_msa_att,
            no_heads_msa,
            inf=inf,
        )

        self.msa_dropout_layer = DropoutRowwise(msa_dropout)

        self.core = EvoformerBlockCore(
            c_m=c_m,
            c_z=c_z,
            c_hidden_opm=c_hidden_opm,
            c_hidden_mul=c_hidden_mul,
            c_hidden_pair_att=c_hidden_pair_att,
            no_heads_msa=no_heads_msa,
            no_heads_pair=no_heads_pair,
            transition_n=transition_n,
            pair_dropout=pair_dropout,
            inf=inf,
            eps=eps,
        )

    def forward(self,
        m: torch.Tensor,
        z: torch.Tensor,
        msa_mask: torch.Tensor,
        pair_mask: torch.Tensor,
        chunk_size: Optional[int] = None,
        _mask_trans: bool = True,
    ) -> Tuple[torch.Tensor, torch.Tensor]:
        """
        Args:
            m: [*, N_seq, N_res, C_m] MSA embedding
            z: [*, N_res, N_res, C_z] pair embedding
            msa_mask: [*, N_seq, N_res] MSA mask
            pair_mask: [*, N_res, N_res] pair mask
        Returns:
            Updated (m, z).
        """
        # Residual MSA attention updates (dropout only on the row update),
        # then the shared core.
        row_update = self.msa_att_row(m, z=z, mask=msa_mask, chunk_size=chunk_size)
        m = m + self.msa_dropout_layer(row_update)
        m = m + self.msa_att_col(m, mask=msa_mask, chunk_size=chunk_size)

        return self.core(
            m,
            z,
            msa_mask=msa_mask,
            pair_mask=pair_mask,
            chunk_size=chunk_size,
            _mask_trans=_mask_trans,
        )
286
+
287
+
288
class ExtraMSABlock(nn.Module):
    """
    Almost identical to the standard EvoformerBlock, except in that the
    ExtraMSABlock uses GlobalAttention for MSA column attention and
    requires more fine-grained control over checkpointing. Separated from
    its twin to preserve the TorchScript-ability of the latter.
    """
    def __init__(self,
        c_m: int,
        c_z: int,
        c_hidden_msa_att: int,
        c_hidden_opm: int,
        c_hidden_mul: int,
        c_hidden_pair_att: int,
        no_heads_msa: int,
        no_heads_pair: int,
        transition_n: int,
        msa_dropout: float,
        pair_dropout: float,
        inf: float,
        eps: float,
        ckpt: bool,
    ):
        super(ExtraMSABlock, self).__init__()

        # Whether to activation-checkpoint the column-attention + core part
        # of the forward pass (only effective when grad is enabled).
        self.ckpt = ckpt

        self.msa_att_row = MSARowAttentionWithPairBias(
            c_m=c_m,
            c_z=c_z,
            c_hidden=c_hidden_msa_att,
            no_heads=no_heads_msa,
            inf=inf,
        )

        # Global (rather than full) column attention; this is the main
        # difference from EvoformerBlock.
        self.msa_att_col = MSAColumnGlobalAttention(
            c_in=c_m,
            c_hidden=c_hidden_msa_att,
            no_heads=no_heads_msa,
            inf=inf,
            eps=eps,
        )

        self.msa_dropout_layer = DropoutRowwise(msa_dropout)

        self.core = EvoformerBlockCore(
            c_m=c_m,
            c_z=c_z,
            c_hidden_opm=c_hidden_opm,
            c_hidden_mul=c_hidden_mul,
            c_hidden_pair_att=c_hidden_pair_att,
            no_heads_msa=no_heads_msa,
            no_heads_pair=no_heads_pair,
            transition_n=transition_n,
            pair_dropout=pair_dropout,
            inf=inf,
            eps=eps,
        )

    def forward(self,
        m: torch.Tensor,
        z: torch.Tensor,
        msa_mask: torch.Tensor,
        pair_mask: torch.Tensor,
        chunk_size: Optional[int] = None,
        _chunk_logits: Optional[int] = 1024,
    ) -> Tuple[torch.Tensor, torch.Tensor]:
        """
        Args:
            m: [*, N_extra, N_res, C_m] extra-MSA embedding
            z: [*, N_res, N_res, C_z] pair embedding
            msa_mask: [*, N_extra, N_res] MSA mask
            pair_mask: [*, N_res, N_res] pair mask
            chunk_size: inference-time sub-batch size for chunked ops
            _chunk_logits: attention-logit chunk size passed to the row
                attention when grad is enabled (memory saving)
        Returns:
            Updated (m, z).
        """
        def add(m1, m2):
            # The first operation in a checkpoint can't be in-place, but it's
            # nice to have in-place addition during inference. Thus...
            if(torch.is_grad_enabled()):
                m1 = m1 + m2
            else:
                m1 += m2

            return m1

        # Row attention + dropout, added residually. The clones under grad
        # protect the checkpointed/chunked attention from in-place aliasing.
        m = add(m, self.msa_dropout_layer(
            self.msa_att_row(
                m.clone() if torch.is_grad_enabled() else m,
                z=z.clone() if torch.is_grad_enabled() else z,
                mask=msa_mask,
                chunk_size=chunk_size,
                _chunk_logits=_chunk_logits if torch.is_grad_enabled() else None,
                _checkpoint_chunks=
                    self.ckpt if torch.is_grad_enabled() else False,
            )
        ))

        # Column attention + core, optionally wrapped in a checkpoint.
        def fn(m, z):
            m = add(m, self.msa_att_col(m, mask=msa_mask, chunk_size=chunk_size))
            m, z = self.core(
                m, z, msa_mask=msa_mask, pair_mask=pair_mask, chunk_size=chunk_size
            )

            return m, z

        if(torch.is_grad_enabled() and self.ckpt):
            checkpoint_fn = get_checkpoint_fn()
            m, z = checkpoint_fn(fn, m, z)
        else:
            m, z = fn(m, z)

        return m, z
392
+
393
+
394
class EvoformerStack(nn.Module):
    """
    Main Evoformer trunk.

    Implements Algorithm 6.
    """

    def __init__(
        self,
        c_m: int,
        c_z: int,
        c_hidden_msa_att: int,
        c_hidden_opm: int,
        c_hidden_mul: int,
        c_hidden_pair_att: int,
        c_s: int,
        no_heads_msa: int,
        no_heads_pair: int,
        no_blocks: int,
        transition_n: int,
        msa_dropout: float,
        pair_dropout: float,
        blocks_per_ckpt: int,
        inf: float,
        eps: float,
        clear_cache_between_blocks: bool = False,
        **kwargs,
    ):
        """
        Args:
            c_m:
                MSA channel dimension
            c_z:
                Pair channel dimension
            c_hidden_msa_att:
                Hidden dimension in MSA attention
            c_hidden_opm:
                Hidden dimension in outer product mean module
            c_hidden_mul:
                Hidden dimension in multiplicative updates
            c_hidden_pair_att:
                Hidden dimension in triangular attention
            c_s:
                Channel dimension of the output "single" embedding
            no_heads_msa:
                Number of heads used for MSA attention
            no_heads_pair:
                Number of heads used for pair attention
            no_blocks:
                Number of Evoformer blocks in the stack
            transition_n:
                Factor by which to multiply c_m to obtain the MSATransition
                hidden dimension
            msa_dropout:
                Dropout rate for MSA activations
            pair_dropout:
                Dropout used for pair activations
            blocks_per_ckpt:
                Number of Evoformer blocks in each activation checkpoint
            clear_cache_between_blocks:
                Whether to clear CUDA's GPU memory cache between blocks of the
                stack. Slows down each block but can reduce fragmentation
        """
        super(EvoformerStack, self).__init__()

        self.blocks_per_ckpt = blocks_per_ckpt
        self.clear_cache_between_blocks = clear_cache_between_blocks

        # Identical EvoformerBlocks, applied sequentially in forward().
        self.blocks = nn.ModuleList()

        for _ in range(no_blocks):
            block = EvoformerBlock(
                c_m=c_m,
                c_z=c_z,
                c_hidden_msa_att=c_hidden_msa_att,
                c_hidden_opm=c_hidden_opm,
                c_hidden_mul=c_hidden_mul,
                c_hidden_pair_att=c_hidden_pair_att,
                no_heads_msa=no_heads_msa,
                no_heads_pair=no_heads_pair,
                transition_n=transition_n,
                msa_dropout=msa_dropout,
                pair_dropout=pair_dropout,
                inf=inf,
                eps=eps,
            )
            self.blocks.append(block)

        # Projects the first MSA row into the "single" representation s.
        self.linear = Linear(c_m, c_s)

    def forward(self,
        m: torch.Tensor,
        z: torch.Tensor,
        msa_mask: torch.Tensor,
        pair_mask: torch.Tensor,
        chunk_size: int,
        _mask_trans: bool = True,
    ) -> Tuple[torch.Tensor, torch.Tensor, Optional[torch.Tensor]]:
        """
        Args:
            m:
                [*, N_seq, N_res, C_m] MSA embedding
            z:
                [*, N_res, N_res, C_z] pair embedding
            msa_mask:
                [*, N_seq, N_res] MSA mask
            pair_mask:
                [*, N_res, N_res] pair mask
            chunk_size:
                Sub-batch size for chunked computation inside the blocks
        Returns:
            m:
                [*, N_seq, N_res, C_m] MSA embedding
            z:
                [*, N_res, N_res, C_z] pair embedding
            s:
                [*, N_res, C_s] single embedding (or None if extra MSA stack)
        """
        # Bind the masks/chunking args so each block is callable as b(m, z),
        # the shape checkpoint_blocks expects.
        blocks = [
            partial(
                b,
                msa_mask=msa_mask,
                pair_mask=pair_mask,
                chunk_size=chunk_size,
                _mask_trans=_mask_trans,
            )
            for b in self.blocks
        ]

        if(self.clear_cache_between_blocks):
            # Wrap every block so the CUDA cache is emptied before it runs.
            def block_with_cache_clear(block, *args):
                torch.cuda.empty_cache()
                return block(*args)

            blocks = [partial(block_with_cache_clear, b) for b in blocks]

        # Activation checkpointing is only applied during training;
        # blocks_per_ckpt=None disables it.
        m, z = checkpoint_blocks(
            blocks,
            args=(m, z),
            blocks_per_ckpt=self.blocks_per_ckpt if self.training else None,
        )

        # The single representation is a projection of the first MSA row.
        s = self.linear(m[..., 0, :, :])

        return m, z, s
537
+
538
+
539
class ExtraMSAStack(nn.Module):
    """
    Stack of ExtraMSABlocks applied to the unclustered ("extra") MSA.

    Implements Algorithm 18.
    """

    def __init__(self,
        c_m: int,
        c_z: int,
        c_hidden_msa_att: int,
        c_hidden_opm: int,
        c_hidden_mul: int,
        c_hidden_pair_att: int,
        no_heads_msa: int,
        no_heads_pair: int,
        no_blocks: int,
        transition_n: int,
        msa_dropout: float,
        pair_dropout: float,
        inf: float,
        eps: float,
        ckpt: bool,
        clear_cache_between_blocks: bool = False,
        **kwargs,
    ):
        """
        Args:
            c_m: extra-MSA channel dimension
            c_z: pair channel dimension
            no_blocks: number of ExtraMSABlocks in the stack
            ckpt: whether blocks checkpoint their column-attention/core pass
            clear_cache_between_blocks:
                Whether to clear CUDA's memory cache after each block
        """
        super(ExtraMSAStack, self).__init__()

        self.clear_cache_between_blocks = clear_cache_between_blocks
        self.blocks = nn.ModuleList()
        for _ in range(no_blocks):
            block = ExtraMSABlock(
                c_m=c_m,
                c_z=c_z,
                c_hidden_msa_att=c_hidden_msa_att,
                c_hidden_opm=c_hidden_opm,
                c_hidden_mul=c_hidden_mul,
                c_hidden_pair_att=c_hidden_pair_att,
                no_heads_msa=no_heads_msa,
                no_heads_pair=no_heads_pair,
                transition_n=transition_n,
                msa_dropout=msa_dropout,
                pair_dropout=pair_dropout,
                inf=inf,
                eps=eps,
                ckpt=ckpt,
            )
            self.blocks.append(block)

    def forward(self,
        m: torch.Tensor,
        z: torch.Tensor,
        chunk_size: int,
        msa_mask: Optional[torch.Tensor] = None,
        pair_mask: Optional[torch.Tensor] = None,
        _mask_trans: bool = True,
    ) -> torch.Tensor:
        """
        Args:
            m:
                [*, N_extra, N_res, C_m] extra MSA embedding
            z:
                [*, N_res, N_res, C_z] pair embedding
            msa_mask:
                Optional [*, N_extra, N_res] MSA mask
            pair_mask:
                Optional [*, N_res, N_res] pair mask
        Returns:
            [*, N_res, N_res, C_z] pair update
        """
        # NOTE(review): _mask_trans is accepted for signature parity with
        # EvoformerStack.forward but is not forwarded to the blocks
        # (ExtraMSABlock.forward takes no such argument).
        for b in self.blocks:
            m, z = b(m, z, msa_mask, pair_mask, chunk_size=chunk_size)

            if(self.clear_cache_between_blocks):
                torch.cuda.empty_cache()

        # Only the pair representation is consumed downstream.
        return z
openfold/model/heads.py ADDED
@@ -0,0 +1,251 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import torch
17
+ import torch.nn as nn
18
+
19
+ from openfold.model.primitives import Linear, LayerNorm
20
+ from openfold.utils.loss import (
21
+ compute_plddt,
22
+ compute_tm,
23
+ compute_predicted_aligned_error,
24
+ )
25
+
26
+
27
class AuxiliaryHeads(nn.Module):
    """
    Collection of output heads producing AlphaFold's auxiliary predictions:
    pLDDT, distogram, masked-MSA, experimentally-resolved and, when
    enabled, TM-score logits.
    """

    def __init__(self, config):
        super(AuxiliaryHeads, self).__init__()

        self.plddt = PerResidueLDDTCaPredictor(**config["lddt"])
        self.distogram = DistogramHead(**config["distogram"])
        self.masked_msa = MaskedMSAHead(**config["masked_msa"])
        self.experimentally_resolved = ExperimentallyResolvedHead(
            **config["experimentally_resolved"],
        )

        # The TM-score head is optional.
        if config.tm.enabled:
            self.tm = TMScoreHead(**config.tm)

        self.config = config

    def forward(self, outputs):
        aux_out = {}

        lddt_logits = self.plddt(outputs["sm"]["single"])
        aux_out["lddt_logits"] = lddt_logits
        # Required for relaxation later on
        aux_out["plddt"] = compute_plddt(lddt_logits)

        aux_out["distogram_logits"] = self.distogram(outputs["pair"])
        aux_out["masked_msa_logits"] = self.masked_msa(outputs["msa"])
        aux_out["experimentally_resolved_logits"] = (
            self.experimentally_resolved(outputs["single"])
        )

        if self.config.tm.enabled:
            tm_logits = self.tm(outputs["pair"])
            aux_out["tm_logits"] = tm_logits
            aux_out["predicted_tm_score"] = compute_tm(
                tm_logits, **self.config.tm
            )
            aux_out.update(
                compute_predicted_aligned_error(tm_logits, **self.config.tm)
            )

        return aux_out
89
+
90
+
91
class PerResidueLDDTCaPredictor(nn.Module):
    """
    Predicts per-residue binned lDDT-Ca logits (consumed by the pLDDT
    computation) from the structure module's single representation.
    """

    def __init__(self, no_bins, c_in, c_hidden):
        super(PerResidueLDDTCaPredictor, self).__init__()

        self.no_bins = no_bins
        self.c_in = c_in
        self.c_hidden = c_hidden

        self.layer_norm = LayerNorm(self.c_in)

        self.linear_1 = Linear(self.c_in, self.c_hidden, init="relu")
        self.linear_2 = Linear(self.c_hidden, self.c_hidden, init="relu")
        self.linear_3 = Linear(self.c_hidden, self.no_bins, init="final")

        self.relu = nn.ReLU()

    def forward(self, s):
        """
        Args:
            s: [*, N_res, C_in] single representation
        Returns:
            [*, N_res, no_bins] lDDT-Ca bin logits
        """
        # LayerNorm followed by a three-layer MLP with ReLU activations.
        hidden = self.relu(self.linear_1(self.layer_norm(s)))
        hidden = self.relu(self.linear_2(hidden))
        return self.linear_3(hidden)
116
+
117
+
118
class DistogramHead(nn.Module):
    """
    Computes a distogram probability distribution.

    For use in computation of distogram loss, subsection 1.9.8
    """

    def __init__(self, c_z, no_bins, **kwargs):
        """
        Args:
            c_z:
                Input channel dimension
            no_bins:
                Number of distogram bins
        """
        super(DistogramHead, self).__init__()

        self.c_z = c_z
        self.no_bins = no_bins

        self.linear = Linear(self.c_z, self.no_bins, init="final")

    def forward(self, z):
        """
        Args:
            z:
                [*, N_res, N_res, C_z] pair embedding
        Returns:
            [*, N_res, N_res, no_bins] distogram logits
        """
        # Project, then symmetrize over the two residue dimensions so that
        # logits[..., i, j, :] == logits[..., j, i, :].
        projected = self.linear(z)
        return projected + projected.transpose(-2, -3)
152
+
153
+
154
class TMScoreHead(nn.Module):
    """
    For use in computation of TM-score, subsection 1.9.7
    """

    def __init__(self, c_z, no_bins, **kwargs):
        """
        Args:
            c_z:
                Input channel dimension
            no_bins:
                Number of bins
        """
        super(TMScoreHead, self).__init__()

        self.c_z = c_z
        self.no_bins = no_bins

        self.linear = Linear(self.c_z, self.no_bins, init="final")

    def forward(self, z):
        """
        Args:
            z:
                [*, N_res, N_res, C_z] pairwise embedding
        Returns:
            [*, N_res, N_res, no_bins] prediction
        """
        # Single linear projection of the pair representation.
        return self.linear(z)
185
+
186
+
187
class MaskedMSAHead(nn.Module):
    """
    For use in computation of masked MSA loss, subsection 1.9.9
    """

    def __init__(self, c_m, c_out, **kwargs):
        """
        Args:
            c_m:
                MSA channel dimension
            c_out:
                Output channel dimension
        """
        super(MaskedMSAHead, self).__init__()

        self.c_m = c_m
        self.c_out = c_out

        self.linear = Linear(self.c_m, self.c_out, init="final")

    def forward(self, m):
        """
        Args:
            m:
                [*, N_seq, N_res, C_m] MSA embedding
        Returns:
            [*, N_seq, N_res, C_out] reconstruction logits
        """
        # Single linear projection of the MSA representation.
        return self.linear(m)
218
+
219
+
220
class ExperimentallyResolvedHead(nn.Module):
    """
    For use in computation of "experimentally resolved" loss, subsection
    1.9.10
    """

    def __init__(self, c_s, c_out, **kwargs):
        """
        Args:
            c_s:
                Input channel dimension
            c_out:
                Output channel dimension
        """
        super(ExperimentallyResolvedHead, self).__init__()

        self.c_s = c_s
        self.c_out = c_out

        self.linear = Linear(self.c_s, self.c_out, init="final")

    def forward(self, s):
        """
        Args:
            s:
                [*, N_res, C_s] single embedding
        Returns:
            [*, N_res, C_out] logits
        """
        # Single linear projection of the single representation.
        return self.linear(s)
openfold/model/model.py ADDED
@@ -0,0 +1,446 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ from functools import partial
17
+ import torch
18
+ import torch.nn as nn
19
+
20
+ from openfold.utils.feats import (
21
+ pseudo_beta_fn,
22
+ build_extra_msa_feat,
23
+ build_template_angle_feat,
24
+ build_template_pair_feat,
25
+ atom14_to_atom37,
26
+ )
27
+ from openfold.model.embedders import (
28
+ InputEmbedder,
29
+ RecyclingEmbedder,
30
+ TemplateAngleEmbedder,
31
+ TemplatePairEmbedder,
32
+ ExtraMSAEmbedder,
33
+ )
34
+ from openfold.model.evoformer import EvoformerStack, ExtraMSAStack
35
+ from openfold.model.heads import AuxiliaryHeads
36
+ import openfold.np.residue_constants as residue_constants
37
+ from openfold.model.structure_module import StructureModule
38
+ from openfold.model.template import (
39
+ TemplatePairStack,
40
+ TemplatePointwiseAttention,
41
+ )
42
+ from openfold.utils.loss import (
43
+ compute_plddt,
44
+ )
45
+ from openfold.utils.tensor_utils import (
46
+ dict_multimap,
47
+ tensor_tree_map,
48
+ )
49
+
50
+
51
+ class AlphaFold(nn.Module):
52
+ """
53
+ Alphafold 2.
54
+
55
+ Implements Algorithm 2 (but with training).
56
+ """
57
+
58
    def __init__(self, config):
        """
        Args:
            config:
                A dict-like config object (like the one in config.py)
        """
        super(AlphaFold, self).__init__()

        # Keep only the sub-configs needed to build the modules; self.config
        # below is config.model, not the full config.
        self.globals = config.globals
        config = config.model
        template_config = config.template
        extra_msa_config = config.extra_msa

        # Main trunk + structure module
        self.input_embedder = InputEmbedder(
            **config["input_embedder"],
        )
        self.recycling_embedder = RecyclingEmbedder(
            **config["recycling_embedder"],
        )
        # Template feature embedders + template trunk
        self.template_angle_embedder = TemplateAngleEmbedder(
            **template_config["template_angle_embedder"],
        )
        self.template_pair_embedder = TemplatePairEmbedder(
            **template_config["template_pair_embedder"],
        )
        self.template_pair_stack = TemplatePairStack(
            **template_config["template_pair_stack"],
        )
        self.template_pointwise_att = TemplatePointwiseAttention(
            **template_config["template_pointwise_attention"],
        )
        # Extra (unclustered) MSA pathway
        self.extra_msa_embedder = ExtraMSAEmbedder(
            **extra_msa_config["extra_msa_embedder"],
        )
        self.extra_msa_stack = ExtraMSAStack(
            **extra_msa_config["extra_msa_stack"],
        )
        self.evoformer = EvoformerStack(
            **config["evoformer_stack"],
        )
        self.structure_module = StructureModule(
            **config["structure_module"],
        )

        # Auxiliary prediction heads (pLDDT, distogram, masked MSA, ...)
        self.aux_heads = AuxiliaryHeads(
            config["heads"],
        )

        self.config = config
108
+
109
    def embed_templates(self, batch, z, pair_mask, templ_dim):
        """
        Embed template features and attend them into the pair representation.

        Args:
            batch: feature dict containing "template_*" features
            z: [*, N, N, C_z] pair embedding
            pair_mask: [*, N, N] pair mask
            templ_dim: index of the template dimension in the template feats
        Returns:
            dict with "template_pair_embedding" and, if angle embedding is
            enabled, "template_angle_embedding"
        """
        # Embed the templates one at a time (with a poor man's vmap)
        template_embeds = []
        n_templ = batch["template_aatype"].shape[templ_dim]
        for i in range(n_templ):
            # Slice out template i from every template feature tensor.
            idx = batch["template_aatype"].new_tensor(i)
            single_template_feats = tensor_tree_map(
                lambda t: torch.index_select(t, templ_dim, idx),
                batch,
            )

            single_template_embeds = {}
            if self.config.template.embed_angles:
                template_angle_feat = build_template_angle_feat(
                    single_template_feats,
                )

                # [*, S_t, N, C_m]
                a = self.template_angle_embedder(template_angle_feat)

                single_template_embeds["angle"] = a

            # [*, S_t, N, N, C_t]
            t = build_template_pair_feat(
                single_template_feats,
                inf=self.config.template.inf,
                eps=self.config.template.eps,
                **self.config.template.distogram,
            ).to(z.dtype)
            t = self.template_pair_embedder(t)

            single_template_embeds.update({"pair": t})

            template_embeds.append(single_template_embeds)

        # Re-assemble the per-template embeddings along the template dim.
        template_embeds = dict_multimap(
            partial(torch.cat, dim=templ_dim),
            template_embeds,
        )

        # [*, S_t, N, N, C_z]
        t = self.template_pair_stack(
            template_embeds["pair"],
            pair_mask.unsqueeze(-3).to(dtype=z.dtype),
            chunk_size=self.globals.chunk_size,
            _mask_trans=self.config._mask_trans,
        )

        # [*, N, N, C_z]
        t = self.template_pointwise_att(
            t,
            z,
            template_mask=batch["template_mask"].to(dtype=z.dtype),
            chunk_size=self.globals.chunk_size,
        )
        # Zero the update when no templates are present at all.
        t = t * (torch.sum(batch["template_mask"]) > 0)

        ret = {}
        if self.config.template.embed_angles:
            ret["template_angle_embedding"] = template_embeds["angle"]

        ret.update({"template_pair_embedding": t})

        return ret
173
+
174
def iteration(self, feats, m_1_prev, z_prev, x_prev, _recycle=True):
    """Run one recycling iteration of the model trunk + structure module.

    Args:
        feats: Feature dict for the current recycling cycle (no recycling
            dimension). Keys accessed here include "target_feat",
            "msa_feat", "seq_mask", "msa_mask", "aatype", etc.
        m_1_prev: [*, N, C_m] first-row MSA embedding from the previous
            cycle, or None on the first cycle.
        z_prev: [*, N, N, C_z] pair embedding from the previous cycle,
            or None on the first cycle.
        x_prev: [*, N, 37, 3] predicted atom positions from the previous
            cycle, or None on the first cycle.
        _recycle: If False, the recycling embeddings are zeroed out. They
            are still computed so every parameter is used (see comment
            below about DDP).

    Returns:
        A tuple (outputs, m_1_prev, z_prev, x_prev): the output dict of
        this iteration plus the three tensors to feed into the next cycle.
    """
    # Primary output dictionary
    outputs = {}

    # This needs to be done manually for DeepSpeed's sake
    dtype = next(self.parameters()).dtype
    for k in feats:
        if(feats[k].dtype == torch.float32):
            feats[k] = feats[k].to(dtype=dtype)

    # Grab some data about the input
    batch_dims = feats["target_feat"].shape[:-2]
    no_batch_dims = len(batch_dims)
    n = feats["target_feat"].shape[-2]
    n_seq = feats["msa_feat"].shape[-3]
    device = feats["target_feat"].device

    # Prep some features
    seq_mask = feats["seq_mask"]
    pair_mask = seq_mask[..., None] * seq_mask[..., None, :]
    msa_mask = feats["msa_mask"]

    # Initialize the MSA and pair representations

    # m: [*, S_c, N, C_m]
    # z: [*, N, N, C_z]
    m, z = self.input_embedder(
        feats["target_feat"],
        feats["residue_index"],
        feats["msa_feat"],
    )

    # Initialize the recycling embeddings, if needs be
    if None in [m_1_prev, z_prev, x_prev]:
        # [*, N, C_m]
        m_1_prev = m.new_zeros(
            (*batch_dims, n, self.config.input_embedder.c_m),
            requires_grad=False,
        )

        # [*, N, N, C_z]
        z_prev = z.new_zeros(
            (*batch_dims, n, n, self.config.input_embedder.c_z),
            requires_grad=False,
        )

        # [*, N, atom_type_num, 3]
        x_prev = z.new_zeros(
            (*batch_dims, n, residue_constants.atom_type_num, 3),
            requires_grad=False,
        )

    # Recycled coordinates enter the network only through the
    # pseudo-beta positions derived here.
    x_prev = pseudo_beta_fn(
        feats["aatype"], x_prev, None
    ).to(dtype=z.dtype)

    # m_1_prev_emb: [*, N, C_m]
    # z_prev_emb: [*, N, N, C_z]
    m_1_prev_emb, z_prev_emb = self.recycling_embedder(
        m_1_prev,
        z_prev,
        x_prev,
    )

    # If the number of recycling iterations is 0, skip recycling
    # altogether. We zero them this way instead of computing them
    # conditionally to avoid leaving parameters unused, which has annoying
    # implications for DDP training.
    if(not _recycle):
        m_1_prev_emb *= 0
        z_prev_emb *= 0

    # [*, S_c, N, C_m]
    m[..., 0, :, :] += m_1_prev_emb

    # [*, N, N, C_z]
    z += z_prev_emb

    # Possibly prevents memory fragmentation
    del m_1_prev, z_prev, x_prev, m_1_prev_emb, z_prev_emb

    # Embed the templates + merge with MSA/pair embeddings
    if self.config.template.enabled:
        template_feats = {
            k: v for k, v in feats.items() if k.startswith("template_")
        }
        template_embeds = self.embed_templates(
            template_feats,
            z,
            pair_mask.to(dtype=z.dtype),
            no_batch_dims,
        )

        # [*, N, N, C_z]
        z = z + template_embeds["template_pair_embedding"]

        if self.config.template.embed_angles:
            # [*, S = S_c + S_t, N, C_m]
            m = torch.cat(
                [m, template_embeds["template_angle_embedding"]],
                dim=-3
            )

            # [*, S, N] — extend the MSA mask to cover template rows
            torsion_angles_mask = feats["template_torsion_angles_mask"]
            msa_mask = torch.cat(
                [feats["msa_mask"], torsion_angles_mask[..., 2]],
                dim=-2
            )

    # Embed extra MSA features + merge with pairwise embeddings
    if self.config.extra_msa.enabled:
        # [*, S_e, N, C_e]
        a = self.extra_msa_embedder(build_extra_msa_feat(feats))

        # [*, N, N, C_z]
        z = self.extra_msa_stack(
            a,
            z,
            msa_mask=feats["extra_msa_mask"].to(dtype=a.dtype),
            chunk_size=self.globals.chunk_size,
            pair_mask=pair_mask.to(dtype=z.dtype),
            _mask_trans=self.config._mask_trans,
        )

    # Run MSA + pair embeddings through the trunk of the network
    # m: [*, S, N, C_m]
    # z: [*, N, N, C_z]
    # s: [*, N, C_s]
    m, z, s = self.evoformer(
        m,
        z,
        msa_mask=msa_mask.to(dtype=m.dtype),
        pair_mask=pair_mask.to(dtype=z.dtype),
        chunk_size=self.globals.chunk_size,
        _mask_trans=self.config._mask_trans,
    )

    # Only the first n_seq rows are genuine MSA rows (template angle rows
    # may have been concatenated above).
    outputs["msa"] = m[..., :n_seq, :, :]
    outputs["pair"] = z
    outputs["single"] = s

    # Predict 3D structure
    outputs["sm"] = self.structure_module(
        s,
        z,
        feats["aatype"],
        mask=feats["seq_mask"].to(dtype=s.dtype),
    )
    outputs["final_atom_positions"] = atom14_to_atom37(
        outputs["sm"]["positions"][-1], feats
    )
    outputs["final_atom_mask"] = feats["atom37_atom_exists"]
    outputs["final_affine_tensor"] = outputs["sm"]["frames"][-1]

    # Save embeddings for use during the next recycling iteration

    # [*, N, C_m]
    m_1_prev = m[..., 0, :, :]

    # [*, N, N, C_z]
    z_prev = z

    # [*, N, 37, 3]
    x_prev = outputs["final_atom_positions"]

    return outputs, m_1_prev, z_prev, x_prev
341
+
342
+ def _disable_activation_checkpointing(self):
343
+ self.template_pair_stack.blocks_per_ckpt = None
344
+ self.evoformer.blocks_per_ckpt = None
345
+
346
+ for b in self.extra_msa_stack.blocks:
347
+ b.ckpt = False
348
+
349
+ def _enable_activation_checkpointing(self):
350
+ self.template_pair_stack.blocks_per_ckpt = (
351
+ self.config.template.template_pair_stack.blocks_per_ckpt
352
+ )
353
+ self.evoformer.blocks_per_ckpt = (
354
+ self.config.evoformer_stack.blocks_per_ckpt
355
+ )
356
+
357
+ for b in self.extra_msa_stack.blocks:
358
+ b.ckpt = self.config.extra_msa.extra_msa_stack.ckpt
359
+
360
def forward(self, batch):
    """
    Args:
        batch:
            Dictionary of arguments outlined in Algorithm 2. Keys must
            include the official names of the features in the
            supplement subsection 1.2.9.

            The final dimension of each input must have length equal to
            the number of recycling iterations.

            Features (without the recycling dimension):

                "aatype" ([*, N_res]):
                    Contrary to the supplement, this tensor of residue
                    indices is not one-hot.
                "target_feat" ([*, N_res, C_tf])
                    One-hot encoding of the target sequence. C_tf is
                    config.model.input_embedder.tf_dim.
                "residue_index" ([*, N_res])
                    Tensor whose final dimension consists of
                    consecutive indices from 0 to N_res.
                "msa_feat" ([*, N_seq, N_res, C_msa])
                    MSA features, constructed as in the supplement.
                    C_msa is config.model.input_embedder.msa_dim.
                "seq_mask" ([*, N_res])
                    1-D sequence mask
                "msa_mask" ([*, N_seq, N_res])
                    MSA mask
                "pair_mask" ([*, N_res, N_res])
                    2-D pair mask
                "extra_msa_mask" ([*, N_extra, N_res])
                    Extra MSA mask
                "template_mask" ([*, N_templ])
                    Template mask (on the level of templates, not
                    residues)
                "template_aatype" ([*, N_templ, N_res])
                    Tensor of template residue indices (indices greater
                    than 19 are clamped to 20 (Unknown))
                "template_all_atom_positions"
                    ([*, N_templ, N_res, 37, 3])
                    Template atom coordinates in atom37 format
                "template_all_atom_mask" ([*, N_templ, N_res, 37])
                    Template atom coordinate mask
                "template_pseudo_beta" ([*, N_templ, N_res, 3])
                    Positions of template carbon "pseudo-beta" atoms
                    (i.e. C_beta for all residues but glycine, for
                    which C_alpha is used instead)
                "template_pseudo_beta_mask" ([*, N_templ, N_res])
                    Pseudo-beta mask

    Returns:
        The output dict of the final recycling iteration, updated with
        the auxiliary-head outputs.
    """
    # Initialize recycling embeddings
    m_1_prev, z_prev, x_prev = None, None, None

    # Disable activation checkpointing for the first few recycling iters
    is_grad_enabled = torch.is_grad_enabled()
    self._disable_activation_checkpointing()

    # Main recycling loop
    num_iters = batch["aatype"].shape[-1]
    for cycle_no in range(num_iters):
        # Select the features for the current recycling cycle.
        # (The lambda is consumed immediately by tensor_tree_map, so the
        # late-binding of cycle_no is not an issue here.)
        fetch_cur_batch = lambda t: t[..., cycle_no]
        feats = tensor_tree_map(fetch_cur_batch, batch)

        # Enable grad iff we're training and it's the final recycling layer
        is_final_iter = cycle_no == (num_iters - 1)
        with torch.set_grad_enabled(is_grad_enabled and is_final_iter):
            if is_final_iter:
                self._enable_activation_checkpointing()
                # Sidestep AMP bug (PyTorch issue #65766)
                if torch.is_autocast_enabled():
                    torch.clear_autocast_cache()

            # Run the next iteration of the model
            outputs, m_1_prev, z_prev, x_prev = self.iteration(
                feats,
                m_1_prev,
                z_prev,
                x_prev,
                _recycle=(num_iters > 1)
            )

    # Run auxiliary heads (confidence, distogram, etc. — defined by
    # self.aux_heads, which is constructed elsewhere in this class)
    outputs.update(self.aux_heads(outputs))

    return outputs
openfold/model/msa.py ADDED
@@ -0,0 +1,392 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ import math
17
+ import torch
18
+ import torch.nn as nn
19
+ from typing import Optional, List, Tuple
20
+
21
+ from openfold.model.primitives import (
22
+ Linear,
23
+ LayerNorm,
24
+ Attention,
25
+ GlobalAttention,
26
+ _attention_chunked_trainable,
27
+ )
28
+ from openfold.utils.checkpointing import get_checkpoint_fn
29
+ from openfold.utils.tensor_utils import (
30
+ chunk_layer,
31
+ permute_final_dims,
32
+ flatten_final_dims,
33
+ )
34
+
35
+
36
class MSAAttention(nn.Module):
    """Gated MSA self-attention, optionally biased by the pair embedding.

    Used row-wise (with pair bias) or column-wise (without) by the
    subclasses/wrappers defined below in this module.
    """

    def __init__(
        self,
        c_in,
        c_hidden,
        no_heads,
        pair_bias=False,
        c_z=None,
        inf=1e9,
    ):
        """
        Args:
            c_in:
                Input channel dimension
            c_hidden:
                Per-head hidden channel dimension
            no_heads:
                Number of attention heads
            pair_bias:
                Whether to use pair embedding bias
            c_z:
                Pair embedding channel dimension. Ignored unless pair_bias
                is true
            inf:
                A large number to be used in computing the attention mask
        """
        super(MSAAttention, self).__init__()

        self.c_in = c_in
        self.c_hidden = c_hidden
        self.no_heads = no_heads
        self.pair_bias = pair_bias
        self.c_z = c_z
        self.inf = inf

        self.layer_norm_m = LayerNorm(self.c_in)

        # Only materialized when pair_bias is enabled; kept as explicit
        # None attributes for TorchScript's benefit.
        self.layer_norm_z = None
        self.linear_z = None
        if self.pair_bias:
            self.layer_norm_z = LayerNorm(self.c_z)
            self.linear_z = Linear(
                self.c_z, self.no_heads, bias=False, init="normal"
            )

        self.mha = Attention(
            self.c_in, self.c_in, self.c_in, self.c_hidden, self.no_heads
        )

    @torch.jit.ignore
    def _chunk(self,
        m: torch.Tensor,
        biases: List[torch.Tensor],
        chunk_size: int,
    ) -> torch.Tensor:
        # Apply self-attention in chunks along the batch-like dimensions
        # to bound peak memory.
        return chunk_layer(
            self.mha,
            {"q_x": m, "kv_x": m, "biases": biases},
            chunk_size=chunk_size,
            no_batch_dims=len(m.shape[:-2]),
        )

    def _prep_inputs(self,
        m: torch.Tensor,
        z: Optional[torch.Tensor],
        mask: Optional[torch.Tensor]
    ) -> Tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
        """Normalize the MSA embedding and build the additive biases.

        Returns the normalized MSA embedding, the mask bias, and (when
        pair_bias is active) the per-head pair bias (otherwise z is passed
        through unchanged).
        """
        # [*, N_seq, N_res, C_m]
        m = self.layer_norm_m(m)

        n_seq, n_res = m.shape[-3:-1]
        if mask is None:
            # [*, N_seq, N_res]
            mask = m.new_ones(
                m.shape[:-3] + (n_seq, n_res),
            )

        # [*, N_seq, 1, 1, N_res] — masked positions get -inf-like logits
        mask_bias = (self.inf * (mask - 1))[..., :, None, None, :]

        # This step simply returns a larger view of the bias, and does not
        # consume additional memory.
        # [*, N_seq, no_heads, N_res, N_res]
        #bias = bias.expand(
        #    ((-1,) * len(bias.shape[:-4])) + (-1, self.no_heads, n_res, -1)
        #)

        if (self.pair_bias and
            z is not None and                       # For the
            self.layer_norm_z is not None and       # benefit of
            self.linear_z is not None               # TorchScript
        ):
            # [*, N_res, N_res, C_z]
            z = self.layer_norm_z(z)

            # [*, N_res, N_res, no_heads]
            z = self.linear_z(z)

            # [*, 1, no_heads, N_res, N_res]
            z = permute_final_dims(z, (2, 0, 1)).unsqueeze(-4)

        return m, mask_bias, z

    @torch.jit.ignore
    def _chunked_msa_attn(self,
        m: torch.Tensor,
        z: Optional[torch.Tensor],
        mask: Optional[torch.Tensor],
        chunk_logits: int,
        checkpoint: bool,
    ) -> torch.Tensor:
        """Attention with the logits themselves chunked along the MSA dim.

        Optionally checkpoints the QKV projection and output wrap-up to
        trade compute for activation memory.
        """
        MSA_DIM = -4

        def _get_qkv(m, z):
            m, mask_bias, z = self._prep_inputs(m, z, mask)
            q, k, v = self.mha._prep_qkv(m, m)
            return m, q, k, v, mask_bias, z

        checkpoint_fn = get_checkpoint_fn()

        if(torch.is_grad_enabled() and checkpoint):
            m, q, k, v, mask_bias, z = checkpoint_fn(_get_qkv, m, z)
        else:
            m, q, k, v, mask_bias, z = _get_qkv(m, z)

        o = _attention_chunked_trainable(
            query=q,
            key=k,
            value=v,
            biases=[mask_bias, z],
            chunk_size=chunk_logits,
            chunk_dim=MSA_DIM,
            checkpoint=checkpoint,
        )

        if(torch.is_grad_enabled() and checkpoint):
            # Storing an additional m here is far from ideal
            m = checkpoint_fn(self.mha._wrap_up, o, m)
        else:
            m = self.mha._wrap_up(o, m)

        return m

    def forward(self,
        m: torch.Tensor,
        z: Optional[torch.Tensor] = None,
        mask: Optional[torch.Tensor] = None,
        chunk_size: Optional[int] = None,
        _chunk_logits: Optional[int] = None,
        _checkpoint_chunks: Optional[bool] = None,
    ) -> torch.Tensor:
        """
        Args:
            m:
                [*, N_seq, N_res, C_m] MSA embedding
            z:
                [*, N_res, N_res, C_z] pair embedding. Required only if
                pair_bias is True
            mask:
                [*, N_seq, N_res] MSA mask
            chunk_size:
                Size of chunks into which the inputs are split along their
                batch dimensions. A low value decreases memory overhead at the
                cost of slower execution. Chunking is not performed by default.
            _chunk_logits:
                If set, routes through the memory-lean logit-chunked path.
            _checkpoint_chunks:
                Whether to checkpoint chunks in the logit-chunked path.
        """
        if(_chunk_logits is not None):
            return self._chunked_msa_attn(
                m=m, z=z, mask=mask,
                chunk_logits=_chunk_logits, checkpoint=_checkpoint_chunks
            )

        m, mask_bias, z = self._prep_inputs(m, z, mask)

        biases = [mask_bias]
        if(z is not None):
            biases.append(z)

        if chunk_size is not None:
            m = self._chunk(m, biases, chunk_size)
        else:
            m = self.mha(
                q_x=m,
                kv_x=m,
                biases=biases
            )

        return m
224
+
225
+
226
class MSARowAttentionWithPairBias(MSAAttention):
    """
    Implements Algorithm 7.

    A thin specialization of MSAAttention with the pair-embedding bias
    always enabled.
    """

    def __init__(self, c_m, c_z, c_hidden, no_heads, inf=1e9):
        """
        Args:
            c_m:
                Input channel dimension
            c_z:
                Pair embedding channel dimension
            c_hidden:
                Per-head hidden channel dimension
            no_heads:
                Number of attention heads
            inf:
                Large number used to construct attention masks
        """
        super(MSARowAttentionWithPairBias, self).__init__(
            c_in=c_m,
            c_hidden=c_hidden,
            no_heads=no_heads,
            pair_bias=True,
            c_z=c_z,
            inf=inf,
        )
253
+
254
+
255
class MSAColumnAttention(nn.Module):
    """
    Implements Algorithm 8.

    By rights, this should also be a subclass of MSAAttention. Alas,
    most inheritance isn't supported by TorchScript.
    """

    def __init__(self, c_m, c_hidden, no_heads, inf=1e9):
        """
        Args:
            c_m:
                MSA channel dimension
            c_hidden:
                Per-head hidden channel dimension
            no_heads:
                Number of attention heads
            inf:
                Large number used to construct attention masks
        """
        super(MSAColumnAttention, self).__init__()

        self.c_m = c_m
        self.c_hidden = c_hidden
        self.no_heads = no_heads
        self.inf = inf

        # Delegate to a plain (unbiased) MSAAttention on transposed input.
        self._msa_att = MSAAttention(
            c_in=c_m,
            c_hidden=c_hidden,
            no_heads=no_heads,
            pair_bias=False,
            c_z=None,
            inf=inf,
        )

    def forward(self,
        m: torch.Tensor,
        mask: Optional[torch.Tensor] = None,
        chunk_size: Optional[int] = None
    ) -> torch.Tensor:
        """
        Args:
            m:
                [*, N_seq, N_res, C_m] MSA embedding
            mask:
                [*, N_seq, N_res] MSA mask
            chunk_size:
                Size of chunks into which the inputs are split along their
                batch dimensions. A low value decreases memory overhead at the
                cost of slower execution. Chunking is not performed by default.
        """
        # Attend along columns by swapping the sequence and residue axes,
        # running row-wise attention, then swapping back.
        # [*, N_res, N_seq, C_in]
        m = m.transpose(-2, -3)
        mask = None if mask is None else mask.transpose(-1, -2)

        m = self._msa_att(m, mask=mask, chunk_size=chunk_size)

        # [*, N_seq, N_res, C_in]
        m = m.transpose(-2, -3)
        # Restore the mask layout too (kept for parity with the original;
        # the value is not used after this point).
        mask = None if mask is None else mask.transpose(-1, -2)

        return m
320
+
321
+
322
class MSAColumnGlobalAttention(nn.Module):
    """Column-wise global MSA attention (used for the extra-MSA stack)."""

    def __init__(
        self, c_in, c_hidden, no_heads, inf=1e9, eps=1e-10,
    ):
        """
        Args:
            c_in: Input channel dimension
            c_hidden: Per-head hidden channel dimension
            no_heads: Number of attention heads
            inf: Large number used to construct attention masks
            eps: Small constant forwarded to GlobalAttention
        """
        super(MSAColumnGlobalAttention, self).__init__()

        self.c_in = c_in
        self.c_hidden = c_hidden
        self.no_heads = no_heads
        self.inf = inf
        self.eps = eps

        self.layer_norm_m = nn.LayerNorm(c_in)

        self.global_attention = GlobalAttention(
            c_in=c_in,
            c_hidden=c_hidden,
            no_heads=no_heads,
            inf=inf,
            eps=eps,
        )

    @torch.jit.ignore
    def _chunk(self,
        m: torch.Tensor,
        mask: torch.Tensor,
        chunk_size: int,
    ) -> torch.Tensor:
        # Chunked application of global attention over batch-like dims.
        return chunk_layer(
            self.global_attention,
            {"m": m, "mask": mask},
            chunk_size=chunk_size,
            no_batch_dims=len(m.shape[:-2]),
        )

    def forward(
        self,
        m: torch.Tensor,
        mask: Optional[torch.Tensor] = None,
        chunk_size: Optional[int] = None,
    ) -> torch.Tensor:
        """
        Args:
            m: [*, N_seq, N_res, C_in] MSA embedding
            mask: [*, N_seq, N_res] MSA mask (all-ones if omitted)
            chunk_size: Optional chunk size along the batch-like dims
        """
        n_seq, n_res, c_in = m.shape[-3:]

        if mask is None:
            # [*, N_seq, N_res]
            mask = torch.ones(
                m.shape[:-1],
                dtype=m.dtype,
                device=m.device,
            ).detach()

        # Swap to column-major layout: [*, N_res, N_seq, C_in]
        m = m.transpose(-2, -3)
        mask = mask.transpose(-1, -2)

        # [*, N_res, N_seq, C_in]
        m = self.layer_norm_m(m)

        if chunk_size is None:
            m = self.global_attention(m=m, mask=mask)
        else:
            m = self._chunk(m, mask, chunk_size)

        # Back to [*, N_seq, N_res, C_in]
        m = m.transpose(-2, -3)

        return m
openfold/model/outer_product_mean.py ADDED
@@ -0,0 +1,129 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ from functools import partial
17
+ from typing import Optional
18
+
19
+ import torch
20
+ import torch.nn as nn
21
+
22
+ from openfold.model.primitives import Linear
23
+ from openfold.utils.tensor_utils import chunk_layer
24
+
25
+
26
class OuterProductMean(nn.Module):
    """
    Implements Algorithm 10.
    """

    def __init__(self, c_m, c_z, c_hidden, eps=1e-3):
        """
        Args:
            c_m:
                MSA embedding channel dimension
            c_z:
                Pair embedding channel dimension
            c_hidden:
                Hidden channel dimension
            eps:
                Small constant added to the mask normalizer for stability
        """
        super(OuterProductMean, self).__init__()

        self.c_m = c_m
        self.c_z = c_z
        self.c_hidden = c_hidden
        self.eps = eps

        self.layer_norm = nn.LayerNorm(c_m)
        self.linear_1 = Linear(c_m, c_hidden)
        self.linear_2 = Linear(c_m, c_hidden)
        self.linear_out = Linear(c_hidden ** 2, c_z, init="final")

    def _opm(self, a, b):
        # Outer product of the two projections, summed over the sequence
        # dimension; the mean's normalization happens in forward().
        # [*, N_res, N_res, C, C]
        outer = torch.einsum("...bac,...dae->...bdce", a, b)

        # [*, N_res, N_res, C * C]
        outer = outer.reshape(outer.shape[:-2] + (-1,))

        # [*, N_res, N_res, C_z]
        outer = self.linear_out(outer)

        return outer

    @torch.jit.ignore
    def _chunk(self,
        a: torch.Tensor,
        b: torch.Tensor,
        chunk_size: int
    ) -> torch.Tensor:
        # Since the "batch dim" in this case is not a true batch dimension
        # (in that the shape of the output depends on it), we need to
        # iterate over it ourselves
        a_reshape = a.reshape((-1,) + a.shape[-3:])
        b_reshape = b.reshape((-1,) + b.shape[-3:])
        out = []
        for a_prime, b_prime in zip(a_reshape, b_reshape):
            outer = chunk_layer(
                partial(self._opm, b=b_prime),
                {"a": a_prime},
                chunk_size=chunk_size,
                no_batch_dims=1,
            )
            out.append(outer)
        outer = torch.stack(out, dim=0)
        outer = outer.reshape(a.shape[:-3] + outer.shape[1:])

        return outer

    def forward(self,
        m: torch.Tensor,
        mask: Optional[torch.Tensor] = None,
        chunk_size: Optional[int] = None
    ) -> torch.Tensor:
        """
        Args:
            m:
                [*, N_seq, N_res, C_m] MSA embedding
            mask:
                [*, N_seq, N_res] MSA mask
            chunk_size:
                Optional chunk size for the outer-product computation
        Returns:
            [*, N_res, N_res, C_z] pair embedding update
        """
        if mask is None:
            mask = m.new_ones(m.shape[:-1])

        # [*, N_seq, N_res, C_m]
        m = self.layer_norm(m)

        # [*, N_seq, N_res, C]
        mask = mask.unsqueeze(-1)
        a = self.linear_1(m) * mask
        b = self.linear_2(m) * mask

        a = a.transpose(-2, -3)
        b = b.transpose(-2, -3)

        if chunk_size is not None:
            outer = self._chunk(a, b, chunk_size)
        else:
            outer = self._opm(a, b)

        # [*, N_res, N_res, 1] — count of jointly unmasked sequences,
        # turning the masked sum into a masked mean
        norm = torch.einsum("...abc,...adc->...bdc", mask, mask)

        # [*, N_res, N_res, C_z]
        outer = outer / (self.eps + norm)

        return outer
openfold/model/pair_transition.py ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+ from typing import Optional
16
+
17
+ import torch
18
+ import torch.nn as nn
19
+
20
+ from openfold.model.primitives import Linear, LayerNorm
21
+ from openfold.utils.tensor_utils import chunk_layer
22
+
23
+
24
class PairTransition(nn.Module):
    """
    Implements Algorithm 15 (pair feed-forward transition).
    """

    def __init__(self, c_z, n):
        """
        Args:
            c_z:
                Pair transition channel dimension
            n:
                Factor by which c_z is multiplied to obtain hidden channel
                dimension
        """
        super(PairTransition, self).__init__()

        self.c_z = c_z
        self.n = n

        hidden = self.n * self.c_z
        self.layer_norm = LayerNorm(self.c_z)
        self.linear_1 = Linear(self.c_z, hidden, init="relu")
        self.relu = nn.ReLU()
        self.linear_2 = Linear(hidden, c_z, init="final")

    def _transition(self, z, mask):
        # linear -> ReLU -> linear, masked; the LayerNorm is applied by
        # the caller (forward) before dispatching here.
        # [*, N_res, N_res, C_z]
        return self.linear_2(self.relu(self.linear_1(z))) * mask

    @torch.jit.ignore
    def _chunk(self,
        z: torch.Tensor,
        mask: torch.Tensor,
        chunk_size: int,
    ) -> torch.Tensor:
        # Chunked application of the transition over batch-like dims.
        return chunk_layer(
            self._transition,
            {"z": z, "mask": mask},
            chunk_size=chunk_size,
            no_batch_dims=len(z.shape[:-2]),
        )

    def forward(self,
        z: torch.Tensor,
        mask: Optional[torch.Tensor] = None,
        chunk_size: Optional[int] = None,
    ) -> torch.Tensor:
        """
        Args:
            z:
                [*, N_res, N_res, C_z] pair embedding
            mask:
                [*, N_res, N_res] pair mask (all-ones if omitted)
            chunk_size:
                Optional chunk size along the batch-like dims
        Returns:
            [*, N_res, N_res, C_z] pair embedding update
        """
        # DISCREPANCY: DeepMind forgets to apply the mask in this module.
        if mask is None:
            mask = z.new_ones(z.shape[:-1])

        # [*, N_res, N_res, 1]
        mask = mask.unsqueeze(-1)

        # [*, N_res, N_res, C_z]
        z = self.layer_norm(z)

        if chunk_size is None:
            z = self._transition(z=z, mask=mask)
        else:
            z = self._chunk(z, mask, chunk_size)

        return z
openfold/model/primitives.py ADDED
@@ -0,0 +1,587 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ from functools import partial
17
+ import math
18
+ from typing import Optional, Callable, List, Tuple, Sequence
19
+ import numpy as np
20
+
21
+ import deepspeed
22
+ import torch
23
+ import torch.nn as nn
24
+ from scipy.stats import truncnorm
25
+
26
+ from openfold.utils.checkpointing import get_checkpoint_fn
27
+ from openfold.utils.tensor_utils import (
28
+ permute_final_dims,
29
+ flatten_final_dims,
30
+ _chunk_slice,
31
+ )
32
+
33
+
34
+ def _prod(nums):
35
+ out = 1
36
+ for n in nums:
37
+ out = out * n
38
+ return out
39
+
40
+
41
+ def _calculate_fan(linear_weight_shape, fan="fan_in"):
42
+ fan_out, fan_in = linear_weight_shape
43
+
44
+ if fan == "fan_in":
45
+ f = fan_in
46
+ elif fan == "fan_out":
47
+ f = fan_out
48
+ elif fan == "fan_avg":
49
+ f = (fan_in + fan_out) / 2
50
+ else:
51
+ raise ValueError("Invalid fan option")
52
+
53
+ return f
54
+
55
+
56
def trunc_normal_init_(weights, scale=1.0, fan="fan_in"):
    """Fill ``weights`` in place from a fan-scaled truncated normal.

    Samples are drawn from a unit normal truncated at +/- 2 standard
    units, then rescaled so the resulting standard deviation equals
    sqrt(scale / fan). The helper fan computation is inlined here so the
    function is self-contained.
    """
    shape = weights.shape

    # Fan over the (fan_out, fan_in) weight shape.
    fan_out, fan_in = shape
    if fan == "fan_in":
        f = fan_in
    elif fan == "fan_out":
        f = fan_out
    elif fan == "fan_avg":
        f = (fan_in + fan_out) / 2
    else:
        raise ValueError("Invalid fan option")

    effective_scale = scale / max(1, f)
    lower, upper = -2, 2
    # Divide by the truncated unit normal's std so the final std is exact.
    std = math.sqrt(effective_scale) / truncnorm.std(a=lower, b=upper, loc=0, scale=1)

    n_elem = 1
    for dim in shape:
        n_elem *= dim
    samples = truncnorm.rvs(a=lower, b=upper, loc=0, scale=std, size=n_elem)
    samples = np.reshape(samples, shape)

    with torch.no_grad():
        weights.copy_(torch.tensor(samples, device=weights.device))
68
+
69
+
70
def lecun_normal_init_(weights):
    """LeCun initialization: fan-in truncated normal with unit scale."""
    trunc_normal_init_(weights, scale=1.0, fan="fan_in")
72
+
73
+
74
+ def he_normal_init_(weights):
75
+ trunc_normal_init_(weights, scale=2.0)
76
+
77
+
78
def glorot_uniform_init_(weights):
    """Glorot (Xavier) fan-average uniform initialization with gain 1."""
    nn.init.xavier_uniform_(weights, gain=1.0)
80
+
81
+
82
def final_init_(weights):
    """Zero initialization, used for output ("final") projections."""
    with torch.no_grad():
        weights.zero_()
85
+
86
+
87
def gating_init_(weights):
    """Zero initialization for gating weights.

    The corresponding bias is set to 1 by the Linear "gating" init branch.
    """
    with torch.no_grad():
        weights.zero_()
90
+
91
+
92
def normal_init_(weights):
    """Kaiming normal initialization with a linear nonlinearity.

    With the "linear" gain this yields std = 1/sqrt(fan_in).
    """
    nn.init.kaiming_normal_(weights, nonlinearity="linear")
94
+
95
+
96
+ def ipa_point_weights_init_(weights):
97
+ with torch.no_grad():
98
+ softplus_inverse_1 = 0.541324854612918
99
+ weights.fill_(softplus_inverse_1)
100
+
101
+
102
class Linear(nn.Linear):
    """
    A Linear layer with built-in nonstandard initializations. Called just
    like torch.nn.Linear.

    Implements the initializers in 1.11.4, plus some additional ones found
    in the code.
    """

    def __init__(
        self,
        in_dim: int,
        out_dim: int,
        bias: bool = True,
        init: str = "default",
        init_fn: Optional[Callable[[torch.Tensor, torch.Tensor], None]] = None,
    ):
        """
        Args:
            in_dim:
                The final dimension of inputs to the layer
            out_dim:
                The final dimension of layer outputs
            bias:
                Whether to learn an additive bias. True by default
            init:
                The initializer to use. Choose from:

                "default": LeCun fan-in truncated normal initialization
                "relu": He initialization w/ truncated normal distribution
                "glorot": Fan-average Glorot uniform initialization
                "gating": Weights=0, Bias=1
                "normal": Normal initialization with std=1/sqrt(fan_in)
                "final": Weights=0, Bias=0

                Overridden by init_fn if the latter is not None.
            init_fn:
                A custom initializer taking weight and bias as inputs.
                Overrides init if not None.

        Raises:
            ValueError: If ``init`` is not one of the recognized options.
        """
        super(Linear, self).__init__(in_dim, out_dim, bias=bias)

        # Bias starts at zero for every named scheme; the "gating" branch
        # below overwrites it with ones.
        if bias:
            with torch.no_grad():
                self.bias.fill_(0)

        # A custom init_fn takes precedence over the named schemes.
        if init_fn is not None:
            init_fn(self.weight, self.bias)
        else:
            if init == "default":
                lecun_normal_init_(self.weight)
            elif init == "relu":
                he_normal_init_(self.weight)
            elif init == "glorot":
                glorot_uniform_init_(self.weight)
            elif init == "gating":
                gating_init_(self.weight)
                if bias:
                    with torch.no_grad():
                        self.bias.fill_(1.0)
            elif init == "normal":
                normal_init_(self.weight)
            elif init == "final":
                final_init_(self.weight)
            else:
                raise ValueError("Invalid init string.")
169
+
170
class LayerNorm(nn.Module):
    """Layer normalization with a bfloat16-safe forward pass."""

    def __init__(self, c_in, eps=1e-5):
        super(LayerNorm, self).__init__()

        # Stored as a 1-tuple: the normalized_shape argument of layer_norm.
        self.c_in = (c_in,)
        self.eps = eps

        self.weight = nn.Parameter(torch.ones(c_in))
        self.bias = nn.Parameter(torch.zeros(c_in))

    def forward(self, x):
        dtype = x.dtype
        # For bfloat16 inputs outside of deepspeed, autocast would silently
        # upcast the computation; disable it and keep the affine parameters
        # in the input dtype instead.
        if (dtype is torch.bfloat16 and not deepspeed.utils.is_initialized()):
            with torch.cuda.amp.autocast(enabled=False):
                return nn.functional.layer_norm(
                    x,
                    self.c_in,
                    self.weight.to(dtype=dtype),
                    self.bias.to(dtype=dtype),
                    self.eps,
                )

        return nn.functional.layer_norm(
            x,
            self.c_in,
            self.weight,
            self.bias,
            self.eps,
        )
201
+
202
@torch.jit.ignore
def softmax(t: torch.Tensor, dim: int = -1) -> torch.Tensor:
    """
    Softmax, but without automatic casting to fp32 when the input is of
    type bfloat16
    """
    if t.dtype is torch.bfloat16 and not deepspeed.utils.is_initialized():
        # Keep the computation in bfloat16 by disabling autocast.
        with torch.cuda.amp.autocast(enabled=False):
            return torch.nn.functional.softmax(t, dim=dim)

    return torch.nn.functional.softmax(t, dim=dim)
216
+
217
+
218
#@torch.jit.script
def _attention(query: torch.Tensor, key: torch.Tensor, value: torch.Tensor, biases: List[torch.Tensor]) -> torch.Tensor:
    """
    Plain multi-head attention.

    Args:
        query/key/value: [*, Q/K/V, H, C_hidden] tensors
        biases: bias tensors broadcastable to the [*, H, Q, K] logits
    Returns:
        [*, Q, H, C_hidden] attention output
    """
    # Bring heads in front of the sequence dims:
    # q: [*, H, Q, C_hidden], k: [*, H, C_hidden, K], v: [*, H, V, C_hidden]
    q = permute_final_dims(query, (1, 0, 2))
    k = permute_final_dims(key, (1, 2, 0))
    v = permute_final_dims(value, (1, 0, 2))

    # Raw attention logits: [*, H, Q, K]
    logits = torch.matmul(q, k)
    for bias in biases:
        logits += bias

    # Normalize and take the weighted sum of values: [*, H, Q, C_hidden]
    weights = softmax(logits, -1)
    out = torch.matmul(weights, v)

    # Restore the [*, Q, H, C_hidden] layout.
    return out.transpose(-2, -3)
244
+
245
+
246
@torch.jit.ignore
def _attention_chunked_trainable(
    query, key, value, biases, chunk_size, chunk_dim, checkpoint,
):
    """
    Memory-friendly attention that processes the inputs in chunks along
    chunk_dim, optionally gradient-checkpointing each chunk.

    Args:
        query/key/value:
            Attention inputs of shape [*, Q/K/V, H, C_hidden]
        biases:
            List of bias tensors broadcastable to the attention logits
        chunk_size:
            Number of slices per chunk along chunk_dim
        chunk_dim:
            Dimension along which to chunk the inputs
        checkpoint:
            Whether to gradient-checkpoint each chunk. The checkpointed
            path supports at most two bias terms.
    Returns:
        The attention output, re-concatenated over chunks along chunk_dim.
    """
    if(checkpoint and len(biases) > 2):
        # Fix: the original message read "permits only permits two".
        raise ValueError(
            "Checkpointed version permits only two bias terms"
        )

    def _checkpointable_attention(q, k, v, b1, b2):
        # Checkpoint functions need a fixed argument list, so the (up to
        # two) biases are passed positionally and None-filtered here.
        bs = [b for b in [b1, b2] if b is not None]
        return _attention(q, k, v, bs)

    o_chunks = []
    checkpoint_fn = get_checkpoint_fn()
    count = query.shape[chunk_dim]
    for start in range(0, count, chunk_size):
        end = start + chunk_size
        idx = [slice(None)] * len(query.shape)
        idx[chunk_dim] = slice(start, end)
        idx_tup = tuple(idx)
        q_chunk = query[idx_tup]
        k_chunk = key[idx_tup]
        v_chunk = value[idx_tup]

        def _slice_bias(b):
            # Size-1 biases broadcast along chunk_dim; leave them whole.
            idx[chunk_dim] = (
                slice(start, end) if b.shape[chunk_dim] != 1 else slice(None)
            )
            return b[tuple(idx)]

        if(checkpoint):
            bias_1_chunk, bias_2_chunk = [
                _slice_bias(b) if b is not None else None
                for b in (biases + [None, None])[:2]
            ]

            o_chunk = checkpoint_fn(_checkpointable_attention,
                q_chunk, k_chunk, v_chunk, bias_1_chunk, bias_2_chunk
            )
        else:
            bias_chunks = [
                _slice_bias(b) for b in biases
            ]

            o_chunk = _attention(q_chunk, k_chunk, v_chunk, bias_chunks)

        o_chunks.append(o_chunk)

    o = torch.cat(o_chunks, dim=chunk_dim)
    return o
297
+
298
+
299
class Attention(nn.Module):
    """
    Standard multi-head attention using AlphaFold's default layer
    initialization. Allows multiple bias vectors.
    """
    def __init__(
        self,
        c_q: int,
        c_k: int,
        c_v: int,
        c_hidden: int,
        no_heads: int,
        gating: bool = True,
    ):
        """
        Args:
            c_q:
                Input dimension of query data
            c_k:
                Input dimension of key data
            c_v:
                Input dimension of value data
            c_hidden:
                Per-head hidden dimension
            no_heads:
                Number of attention heads
            gating:
                Whether the output should be gated using query data
        """
        super(Attention, self).__init__()

        self.c_q = c_q
        self.c_k = c_k
        self.c_v = c_v
        self.c_hidden = c_hidden
        self.no_heads = no_heads
        self.gating = gating

        # DISCREPANCY: c_hidden is not the per-head channel dimension, as
        # stated in the supplement, but the overall channel dimension.

        # Q/K/V projections are bias-free with Glorot init; the output
        # projection is zero-initialized ("final") so the module starts
        # as an identity-like residual update.
        self.linear_q = Linear(
            self.c_q, self.c_hidden * self.no_heads, bias=False, init="glorot"
        )
        self.linear_k = Linear(
            self.c_k, self.c_hidden * self.no_heads, bias=False, init="glorot"
        )
        self.linear_v = Linear(
            self.c_v, self.c_hidden * self.no_heads, bias=False, init="glorot"
        )
        self.linear_o = Linear(
            self.c_hidden * self.no_heads, self.c_q, init="final"
        )

        # Optional sigmoid gate computed from the query input; "gating"
        # init (weights 0, bias 1) makes the gate start fully open.
        self.linear_g = None
        if self.gating:
            self.linear_g = Linear(
                self.c_q, self.c_hidden * self.no_heads, init="gating"
            )

        self.sigmoid = nn.Sigmoid()

    def _prep_qkv(self,
        q_x: torch.Tensor,
        kv_x: torch.Tensor
    ) -> Tuple[
        torch.Tensor, torch.Tensor, torch.Tensor
    ]:
        # Project inputs and split the flat channel dim into heads.
        # [*, Q/K/V, H * C_hidden]
        q = self.linear_q(q_x)
        k = self.linear_k(kv_x)
        v = self.linear_v(kv_x)

        # [*, Q/K, H, C_hidden]
        q = q.view(q.shape[:-1] + (self.no_heads, -1))
        k = k.view(k.shape[:-1] + (self.no_heads, -1))
        v = v.view(v.shape[:-1] + (self.no_heads, -1))

        # Scale queries up front instead of scaling the logits.
        q /= math.sqrt(self.c_hidden)

        return q, k, v

    def _wrap_up(self,
        o: torch.Tensor,
        q_x: torch.Tensor
    ) -> torch.Tensor:
        # Optionally gate the per-head outputs with a sigmoid of q_x.
        if(self.linear_g is not None):
            g = self.sigmoid(self.linear_g(q_x))

            # [*, Q, H, C_hidden]
            g = g.view(g.shape[:-1] + (self.no_heads, -1))
            o = o * g

        # [*, Q, H * C_hidden]
        o = flatten_final_dims(o, 2)

        # [*, Q, C_q]
        o = self.linear_o(o)

        return o

    def forward(
        self,
        q_x: torch.Tensor,
        kv_x: torch.Tensor,
        biases: Optional[List[torch.Tensor]] = None,
        use_lma: bool = False,
        q_chunk_size: Optional[int] = None,
        kv_chunk_size: Optional[int] = None,
    ) -> torch.Tensor:
        """
        Args:
            q_x:
                [*, Q, C_q] query data
            kv_x:
                [*, K, C_k] key data
            biases:
                List of biases that broadcast to [*, H, Q, K]
            use_lma:
                Whether to use low-memory attention
            q_chunk_size:
                Query chunk size (for LMA)
            kv_chunk_size:
                Key/Value chunk size (for LMA)
        Returns
            [*, Q, C_q] attention update
        """
        if(biases is None):
            biases = []
        if(use_lma and (q_chunk_size is None or kv_chunk_size is None)):
            raise ValueError(
                "If use_lma is specified, q_chunk_size and kv_chunk_size must "
                "be provided"
            )

        q, k, v = self._prep_qkv(q_x, kv_x)

        if(use_lma):
            # _lma slices biases along both Q and K, so broadcastable
            # biases must be materialized to full [*, H, Q, K] first.
            biases = [
                b.expand(b.shape[:-2] + (q_x.shape[-2],) + (kv_x.shape[-2],))
                for b in biases
            ]

            o = _lma(q, k, v, biases, q_chunk_size, kv_chunk_size)
        else:
            o = _attention(q, k, v, biases)

        o = self._wrap_up(o, q_x)

        return o
449
+
450
+
451
class GlobalAttention(nn.Module):
    """
    Global attention in which a single mask-weighted mean query attends
    over the N_seq dimension of the input (shapes per the inline
    comments below). Used for the MSA global column attention.
    """

    def __init__(self, c_in, c_hidden, no_heads, inf, eps):
        """
        Args:
            c_in: input channel dimension
            c_hidden: per-head hidden dimension
            no_heads: number of attention heads
            inf: large value used to mask out padded positions
            eps: small constant guarding the mean-query division
        """
        super(GlobalAttention, self).__init__()

        self.c_in = c_in
        self.c_hidden = c_hidden
        self.no_heads = no_heads
        self.inf = inf
        self.eps = eps

        self.linear_q = Linear(
            c_in, c_hidden * no_heads, bias=False, init="glorot"
        )

        # Keys/values are shared across heads (single c_hidden, no head
        # factor), unlike the queries above.
        self.linear_k = Linear(
            c_in, c_hidden, bias=False, init="glorot",
        )
        self.linear_v = Linear(
            c_in, c_hidden, bias=False, init="glorot",
        )
        self.linear_g = Linear(c_in, c_hidden * no_heads, init="gating")
        self.linear_o = Linear(c_hidden * no_heads, c_in, init="final")

        self.sigmoid = nn.Sigmoid()

    def forward(self, m: torch.Tensor, mask: torch.Tensor) -> torch.Tensor:
        # Mask-weighted mean over the attended dimension produces one
        # query vector per residue.
        # [*, N_res, C_in]
        q = torch.sum(m * mask.unsqueeze(-1), dim=-2) / (
            torch.sum(mask, dim=-1)[..., None] + self.eps
        )

        # [*, N_res, H * C_hidden]
        q = self.linear_q(q)
        q *= (self.c_hidden ** (-0.5))

        # [*, N_res, H, C_hidden]
        q = q.view(q.shape[:-1] + (self.no_heads, -1))

        # [*, N_res, N_seq, C_hidden]
        k = self.linear_k(m)
        v = self.linear_v(m)

        # [*, N_res, H, N_seq]
        a = torch.matmul(
            q,
            k.transpose(-1, -2),  # [*, N_res, C_hidden, N_seq]
        )
        # Masked positions get a -inf-like additive bias before softmax.
        bias = (self.inf * (mask - 1))[..., :, None, :]
        a += bias
        a = softmax(a)

        # [*, N_res, H, C_hidden]
        o = torch.matmul(
            a,
            v,
        )

        # [*, N_res, N_seq, C_hidden]
        g = self.sigmoid(self.linear_g(m))

        # [*, N_res, N_seq, H, C_hidden]
        g = g.view(g.shape[:-1] + (self.no_heads, -1))

        # Broadcast the single attended output back over N_seq via the
        # per-position gate.
        # [*, N_res, N_seq, H, C_hidden]
        o = o.unsqueeze(-3) * g

        # [*, N_res, N_seq, H * C_hidden]
        o = o.reshape(o.shape[:-2] + (-1,))

        # [*, N_res, N_seq, C_in]
        m = self.linear_o(o)

        return m
524
+
525
+
526
def _lma(
    q: torch.Tensor,
    k: torch.Tensor,
    v: torch.Tensor,
    biases: List[torch.Tensor],
    q_chunk_size: int,
    kv_chunk_size: int,
):
    """
    Low-memory attention: computes softmax(qk + biases)v in chunks over
    both the query and key/value dimensions, combining partial results
    with a streaming (max-shifted) softmax so the full [Q, K] logit
    matrix is never materialized.

    Args:
        q/k/v: [*, Q/K/V, H, C_hidden] tensors
        biases: bias tensors of full shape [*, H, Q, K] (pre-expanded
            by the caller; they are sliced along both Q and K here)
        q_chunk_size: chunk length along the query dimension
        kv_chunk_size: chunk length along the key/value dimension
    Returns:
        [*, Q, H, C_hidden] attention output
    """
    no_q, no_kv = q.shape[-3], k.shape[-3]

    # [*, Q, H, C_hidden]
    o = q.new_zeros(q.shape)
    for q_s in range(0, no_q, q_chunk_size):
        q_chunk = q[..., q_s: q_s + q_chunk_size, :, :]
        large_bias_chunks = [
            b[..., q_s: q_s + q_chunk_size, :] for b in biases
        ]

        # Per-kv-chunk partial softmax statistics.
        maxes = []
        weights = []
        values = []
        for kv_s in range(0, no_kv, kv_chunk_size):
            k_chunk = k[..., kv_s: kv_s + kv_chunk_size, :, :]
            v_chunk = v[..., kv_s: kv_s + kv_chunk_size, :, :]
            small_bias_chunks = [
                b[..., kv_s: kv_s + kv_chunk_size] for b in large_bias_chunks
            ]

            a = torch.einsum(
                "...qhd,...khd->...hqk", q_chunk, k_chunk,
            )

            for b in small_bias_chunks:
                a += b

            a = a.transpose(-2, -3)

            # Shift by the chunk max before exponentiating for numerical
            # stability; the shift is undone when chunks are merged below.
            max_a = torch.max(a, dim=-1, keepdim=True)[0]
            exp_a = torch.exp(a - max_a)
            exp_v = torch.einsum("...vhf,...qhv->...qhf", v_chunk, exp_a)

            maxes.append(max_a.detach().squeeze(-1))
            weights.append(torch.sum(exp_a, dim=-1))
            values.append(exp_v)

        chunk_max = torch.stack(maxes, dim=-3)
        chunk_weights = torch.stack(weights, dim=-3)
        chunk_values = torch.stack(values, dim=-4)

        # Re-reference every chunk to the global max, then combine the
        # partial numerators/denominators of the softmax.
        global_max = torch.max(chunk_max, dim=-3, keepdim=True)[0]
        max_diffs = torch.exp(chunk_max - global_max)
        chunk_values *= max_diffs.unsqueeze(-1)
        chunk_weights *= max_diffs

        all_values = torch.sum(chunk_values, dim=-4)
        all_weights = torch.sum(chunk_weights.unsqueeze(-1), dim=-4)

        q_chunk_out = all_values / all_weights

        o[..., q_s: q_s + q_chunk_size, :, :] = q_chunk_out

    return o
openfold/model/structure_module.py ADDED
@@ -0,0 +1,820 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+ from functools import reduce
16
+ import importlib
17
+ import math
18
+ import sys
19
+ from operator import mul
20
+
21
+ import torch
22
+ import torch.nn as nn
23
+ from typing import Optional, Tuple, Sequence
24
+
25
+ from openfold.model.primitives import Linear, LayerNorm, ipa_point_weights_init_
26
+ from openfold.np.residue_constants import (
27
+ restype_rigid_group_default_frame,
28
+ restype_atom14_to_rigid_group,
29
+ restype_atom14_mask,
30
+ restype_atom14_rigid_group_positions,
31
+ )
32
+ from openfold.utils.feats import (
33
+ frames_and_literature_positions_to_atom14_pos,
34
+ torsion_angles_to_frames,
35
+ )
36
+ from openfold.utils.precision_utils import is_fp16_enabled
37
+ from openfold.utils.rigid_utils import Rotation, Rigid
38
+ from openfold.utils.tensor_utils import (
39
+ dict_multimap,
40
+ permute_final_dims,
41
+ flatten_final_dims,
42
+ )
43
+
44
+ # attn_core_inplace_cuda = importlib.import_module("attn_core_inplace_cuda")
45
+
46
+
47
+ class AngleResnetBlock(nn.Module):
48
+ def __init__(self, c_hidden):
49
+ """
50
+ Args:
51
+ c_hidden:
52
+ Hidden channel dimension
53
+ """
54
+ super(AngleResnetBlock, self).__init__()
55
+
56
+ self.c_hidden = c_hidden
57
+
58
+ self.linear_1 = Linear(self.c_hidden, self.c_hidden, init="relu")
59
+ self.linear_2 = Linear(self.c_hidden, self.c_hidden, init="final")
60
+
61
+ self.relu = nn.ReLU()
62
+
63
+ def forward(self, a: torch.Tensor) -> torch.Tensor:
64
+
65
+ s_initial = a
66
+
67
+ a = self.relu(a)
68
+ a = self.linear_1(a)
69
+ a = self.relu(a)
70
+ a = self.linear_2(a)
71
+
72
+ return a + s_initial
73
+
74
+
75
+ class AngleResnet(nn.Module):
76
+ """
77
+ Implements Algorithm 20, lines 11-14
78
+ """
79
+
80
+ def __init__(self, c_in, c_hidden, no_blocks, no_angles, epsilon):
81
+ """
82
+ Args:
83
+ c_in:
84
+ Input channel dimension
85
+ c_hidden:
86
+ Hidden channel dimension
87
+ no_blocks:
88
+ Number of resnet blocks
89
+ no_angles:
90
+ Number of torsion angles to generate
91
+ epsilon:
92
+ Small constant for normalization
93
+ """
94
+ super(AngleResnet, self).__init__()
95
+
96
+ self.c_in = c_in
97
+ self.c_hidden = c_hidden
98
+ self.no_blocks = no_blocks
99
+ self.no_angles = no_angles
100
+ self.eps = epsilon
101
+
102
+ self.linear_in = Linear(self.c_in, self.c_hidden)
103
+ self.linear_initial = Linear(self.c_in, self.c_hidden)
104
+
105
+ self.layers = nn.ModuleList()
106
+ for _ in range(self.no_blocks):
107
+ layer = AngleResnetBlock(c_hidden=self.c_hidden)
108
+ self.layers.append(layer)
109
+
110
+ self.linear_out = Linear(self.c_hidden, self.no_angles * 2)
111
+
112
+ self.relu = nn.ReLU()
113
+
114
+ def forward(
115
+ self, s: torch.Tensor, s_initial: torch.Tensor
116
+ ) -> Tuple[torch.Tensor, torch.Tensor]:
117
+ """
118
+ Args:
119
+ s:
120
+ [*, C_hidden] single embedding
121
+ s_initial:
122
+ [*, C_hidden] single embedding as of the start of the
123
+ StructureModule
124
+ Returns:
125
+ [*, no_angles, 2] predicted angles
126
+ """
127
+ # NOTE: The ReLU's applied to the inputs are absent from the supplement
128
+ # pseudocode but present in the source. For maximal compatibility with
129
+ # the pretrained weights, I'm going with the source.
130
+
131
+ # [*, C_hidden]
132
+ s_initial = self.relu(s_initial)
133
+ s_initial = self.linear_initial(s_initial)
134
+ s = self.relu(s)
135
+ s = self.linear_in(s)
136
+ s = s + s_initial
137
+
138
+ for l in self.layers:
139
+ s = l(s)
140
+
141
+ s = self.relu(s)
142
+
143
+ # [*, no_angles * 2]
144
+ s = self.linear_out(s)
145
+
146
+ # [*, no_angles, 2]
147
+ s = s.view(s.shape[:-1] + (-1, 2))
148
+
149
+ unnormalized_s = s
150
+ norm_denom = torch.sqrt(
151
+ torch.clamp(
152
+ torch.sum(s ** 2, dim=-1, keepdim=True),
153
+ min=self.eps,
154
+ )
155
+ )
156
+ s = s / norm_denom
157
+
158
+ return unnormalized_s, s
159
+
160
+
161
class InvariantPointAttention(nn.Module):
    """
    Implements Algorithm 22.

    Attention over the single representation in which each head also
    emits 3D points; the points are mapped through the per-residue rigid
    frames, and squared point distances contribute (negatively) to the
    attention logits alongside the scalar qk term and a pair-derived
    bias.
    """
    def __init__(
        self,
        c_s: int,
        c_z: int,
        c_hidden: int,
        no_heads: int,
        no_qk_points: int,
        no_v_points: int,
        inf: float = 1e5,
        eps: float = 1e-8,
    ):
        """
        Args:
            c_s:
                Single representation channel dimension
            c_z:
                Pair representation channel dimension
            c_hidden:
                Hidden channel dimension
            no_heads:
                Number of attention heads
            no_qk_points:
                Number of query/key points to generate
            no_v_points:
                Number of value points to generate
            inf:
                Large value used for masking attention logits
            eps:
                Small constant guarding the point-norm sqrt
        """
        super(InvariantPointAttention, self).__init__()

        self.c_s = c_s
        self.c_z = c_z
        self.c_hidden = c_hidden
        self.no_heads = no_heads
        self.no_qk_points = no_qk_points
        self.no_v_points = no_v_points
        self.inf = inf
        self.eps = eps

        # These linear layers differ from their specifications in the
        # supplement. There, they lack bias and use Glorot initialization.
        # Here as in the official source, they have bias and use the default
        # Lecun initialization.
        hc = self.c_hidden * self.no_heads
        self.linear_q = Linear(self.c_s, hc)
        self.linear_kv = Linear(self.c_s, 2 * hc)

        hpq = self.no_heads * self.no_qk_points * 3
        self.linear_q_points = Linear(self.c_s, hpq)

        hpkv = self.no_heads * (self.no_qk_points + self.no_v_points) * 3
        self.linear_kv_points = Linear(self.c_s, hpkv)

        # NOTE(review): hpv is computed but never used here — value points
        # come out of linear_kv_points above (same as upstream OpenFold).
        hpv = self.no_heads * self.no_v_points * 3

        self.linear_b = Linear(self.c_z, self.no_heads)

        # Learned per-head weights for the point-distance term.
        self.head_weights = nn.Parameter(torch.zeros((no_heads)))
        ipa_point_weights_init_(self.head_weights)

        # Output concatenates scalar values, value points (3 coords +
        # norm), and the pair-attended features, per head.
        concat_out_dim = self.no_heads * (
            self.c_z + self.c_hidden + self.no_v_points * 4
        )
        self.linear_out = Linear(concat_out_dim, self.c_s, init="final")

        self.softmax = nn.Softmax(dim=-1)
        self.softplus = nn.Softplus()

    def forward(
        self,
        s: torch.Tensor,
        z: Optional[torch.Tensor],
        r: Rigid,
        mask: torch.Tensor,
        inplace_safe: bool = False,
        _offload_inference: bool = False,
        _z_reference_list: Optional[Sequence[torch.Tensor]] = None,
    ) -> torch.Tensor:
        """
        Args:
            s:
                [*, N_res, C_s] single representation
            z:
                [*, N_res, N_res, C_z] pair representation
            r:
                [*, N_res] transformation object
            mask:
                [*, N_res] mask
        Returns:
            [*, N_res, C_s] single representation update
        """
        # z is wrapped in a one-element list so the offloaded-inference
        # path can move the single reference between CPU and device.
        if(_offload_inference and inplace_safe):
            z = _z_reference_list
        else:
            z = [z]

        #######################################
        # Generate scalar and point activations
        #######################################
        # [*, N_res, H * C_hidden]
        q = self.linear_q(s)
        kv = self.linear_kv(s)

        # [*, N_res, H, C_hidden]
        q = q.view(q.shape[:-1] + (self.no_heads, -1))

        # [*, N_res, H, 2 * C_hidden]
        kv = kv.view(kv.shape[:-1] + (self.no_heads, -1))

        # [*, N_res, H, C_hidden]
        k, v = torch.split(kv, self.c_hidden, dim=-1)

        # [*, N_res, H * P_q * 3]
        q_pts = self.linear_q_points(s)

        # This is kind of clunky, but it's how the original does it
        # [*, N_res, H * P_q, 3]
        q_pts = torch.split(q_pts, q_pts.shape[-1] // 3, dim=-1)
        q_pts = torch.stack(q_pts, dim=-1)
        # Map the predicted local-frame points into the global frame.
        q_pts = r[..., None].apply(q_pts)

        # [*, N_res, H, P_q, 3]
        q_pts = q_pts.view(
            q_pts.shape[:-2] + (self.no_heads, self.no_qk_points, 3)
        )

        # [*, N_res, H * (P_q + P_v) * 3]
        kv_pts = self.linear_kv_points(s)

        # [*, N_res, H * (P_q + P_v), 3]
        kv_pts = torch.split(kv_pts, kv_pts.shape[-1] // 3, dim=-1)
        kv_pts = torch.stack(kv_pts, dim=-1)
        kv_pts = r[..., None].apply(kv_pts)

        # [*, N_res, H, (P_q + P_v), 3]
        kv_pts = kv_pts.view(kv_pts.shape[:-2] + (self.no_heads, -1, 3))

        # [*, N_res, H, P_q/P_v, 3]
        k_pts, v_pts = torch.split(
            kv_pts, [self.no_qk_points, self.no_v_points], dim=-2
        )

        ##########################
        # Compute attention scores
        ##########################
        # [*, N_res, N_res, H]
        b = self.linear_b(z[0])

        if(_offload_inference):
            assert(sys.getrefcount(z[0]) == 2)
            z[0] = z[0].cpu()

        # Scalar qk logits; computed in fp32 under mixed precision.
        # [*, H, N_res, N_res]
        if(is_fp16_enabled()):
            with torch.cuda.amp.autocast(enabled=False):
                a = torch.matmul(
                    permute_final_dims(q.float(), (1, 0, 2)),  # [*, H, N_res, C_hidden]
                    permute_final_dims(k.float(), (1, 2, 0)),  # [*, H, C_hidden, N_res]
                )
        else:
            a = torch.matmul(
                permute_final_dims(q, (1, 0, 2)),  # [*, H, N_res, C_hidden]
                permute_final_dims(k, (1, 2, 0)),  # [*, H, C_hidden, N_res]
            )

        # The sqrt(1/3) factors weight the three logit terms (scalar,
        # pair bias, points) as in Algorithm 22.
        a *= math.sqrt(1.0 / (3 * self.c_hidden))
        a += (math.sqrt(1.0 / 3) * permute_final_dims(b, (2, 0, 1)))

        # Squared distances between all query and key points.
        # [*, N_res, N_res, H, P_q, 3]
        pt_att = q_pts.unsqueeze(-4) - k_pts.unsqueeze(-5)
        if(inplace_safe):
            pt_att *= pt_att
        else:
            pt_att = pt_att ** 2

        # [*, N_res, N_res, H, P_q]
        pt_att = sum(torch.unbind(pt_att, dim=-1))
        head_weights = self.softplus(self.head_weights).view(
            *((1,) * len(pt_att.shape[:-2]) + (-1, 1))
        )
        head_weights = head_weights * math.sqrt(
            1.0 / (3 * (self.no_qk_points * 9.0 / 2))
        )
        if(inplace_safe):
            pt_att *= head_weights
        else:
            pt_att = pt_att * head_weights

        # [*, N_res, N_res, H]
        pt_att = torch.sum(pt_att, dim=-1) * (-0.5)
        # [*, N_res, N_res]
        square_mask = mask.unsqueeze(-1) * mask.unsqueeze(-2)
        square_mask = self.inf * (square_mask - 1)

        # [*, H, N_res, N_res]
        pt_att = permute_final_dims(pt_att, (2, 0, 1))

        if(inplace_safe):
            a += pt_att
            del pt_att
            a += square_mask.unsqueeze(-3)
            # in-place softmax
            # NOTE(review): the attn_core_inplace_cuda import is commented
            # out at the top of this module, so this branch would raise a
            # NameError if inplace_safe=True is used — confirm before
            # enabling the in-place path.
            attn_core_inplace_cuda.forward_(
                a,
                reduce(mul, a.shape[:-1]),
                a.shape[-1],
            )
        else:
            a = a + pt_att
            a = a + square_mask.unsqueeze(-3)
            a = self.softmax(a)

        ################
        # Compute output
        ################
        # [*, N_res, H, C_hidden]
        o = torch.matmul(
            a, v.transpose(-2, -3).to(dtype=a.dtype)
        ).transpose(-2, -3)

        # [*, N_res, H * C_hidden]
        o = flatten_final_dims(o, 2)

        # [*, H, 3, N_res, P_v]
        if(inplace_safe):
            v_pts = permute_final_dims(v_pts, (1, 3, 0, 2))
            o_pt = [
                torch.matmul(a, v.to(a.dtype))
                for v in torch.unbind(v_pts, dim=-3)
            ]
            o_pt = torch.stack(o_pt, dim=-3)
        else:
            o_pt = torch.sum(
                (
                    a[..., None, :, :, None]
                    * permute_final_dims(v_pts, (1, 3, 0, 2))[..., None, :, :]
                ),
                dim=-2,
            )

        # Map attended points back into each residue's local frame.
        # [*, N_res, H, P_v, 3]
        o_pt = permute_final_dims(o_pt, (2, 0, 3, 1))
        o_pt = r[..., None, None].invert_apply(o_pt)

        # [*, N_res, H * P_v]
        o_pt_norm = flatten_final_dims(
            torch.sqrt(torch.sum(o_pt ** 2, dim=-1) + self.eps), 2
        )

        # [*, N_res, H * P_v, 3]
        o_pt = o_pt.reshape(*o_pt.shape[:-3], -1, 3)

        if(_offload_inference):
            z[0] = z[0].to(o_pt.device)

        # [*, N_res, H, C_z]
        o_pair = torch.matmul(a.transpose(-2, -3), z[0].to(dtype=a.dtype))

        # [*, N_res, H * C_z]
        o_pair = flatten_final_dims(o_pair, 2)

        # [*, N_res, C_s]
        s = self.linear_out(
            torch.cat(
                (o, *torch.unbind(o_pt, dim=-1), o_pt_norm, o_pair), dim=-1
            ).to(dtype=z[0].dtype)
        )

        return s
432
+
433
+
434
class BackboneUpdate(nn.Module):
    """
    Implements part of Algorithm 23.

    Projects the single representation down to a 6-dimensional rigid
    update vector per residue.
    """

    def __init__(self, c_s):
        """
        Args:
            c_s:
                Single representation channel dimension
        """
        super(BackboneUpdate, self).__init__()

        self.c_s = c_s

        # "final" init zeroes the projection weights, so the update
        # starts at zero.
        self.linear = Linear(self.c_s, 6, init="final")

    def forward(self, s: torch.Tensor) -> torch.Tensor:
        """
        Args:
            s:
                [*, N_res, C_s] single representation
        Returns:
            [*, N_res, 6] update vector
        """
        # Fix: the return annotation previously claimed
        # Tuple[torch.Tensor, torch.Tensor], but a single tensor is
        # returned (and consumed as such by compose_q_update_vec).
        # [*, 6]
        update = self.linear(s)

        return update
462
+
463
+
464
+ class StructureModuleTransitionLayer(nn.Module):
465
+ def __init__(self, c):
466
+ super(StructureModuleTransitionLayer, self).__init__()
467
+
468
+ self.c = c
469
+
470
+ self.linear_1 = Linear(self.c, self.c, init="relu")
471
+ self.linear_2 = Linear(self.c, self.c, init="relu")
472
+ self.linear_3 = Linear(self.c, self.c, init="final")
473
+
474
+ self.relu = nn.ReLU()
475
+
476
+ def forward(self, s):
477
+ s_initial = s
478
+ s = self.linear_1(s)
479
+ s = self.relu(s)
480
+ s = self.linear_2(s)
481
+ s = self.relu(s)
482
+ s = self.linear_3(s)
483
+
484
+ s = s + s_initial
485
+
486
+ return s
487
+
488
+
489
+ class StructureModuleTransition(nn.Module):
490
+ def __init__(self, c, num_layers, dropout_rate):
491
+ super(StructureModuleTransition, self).__init__()
492
+
493
+ self.c = c
494
+ self.num_layers = num_layers
495
+ self.dropout_rate = dropout_rate
496
+
497
+ self.layers = nn.ModuleList()
498
+ for _ in range(self.num_layers):
499
+ l = StructureModuleTransitionLayer(self.c)
500
+ self.layers.append(l)
501
+
502
+ self.dropout = nn.Dropout(self.dropout_rate)
503
+ self.layer_norm = LayerNorm(self.c)
504
+
505
+ def forward(self, s):
506
+ for l in self.layers:
507
+ s = l(s)
508
+
509
+ s = self.dropout(s)
510
+ s = self.layer_norm(s)
511
+
512
+ return s
513
+
514
+
515
class StructureModule(nn.Module):
    """
    Iteratively refines per-residue rigid frames and torsion angles from
    the evoformer single/pair representations, producing all-atom
    (atom14) coordinates at each block (Algorithm 20).
    """
    def __init__(
        self,
        c_s,
        c_z,
        c_ipa,
        c_resnet,
        no_heads_ipa,
        no_qk_points,
        no_v_points,
        dropout_rate,
        no_blocks,
        no_transition_layers,
        no_resnet_blocks,
        no_angles,
        trans_scale_factor,
        epsilon,
        inf,
        **kwargs,
    ):
        """
        Args:
            c_s:
                Single representation channel dimension
            c_z:
                Pair representation channel dimension
            c_ipa:
                IPA hidden channel dimension
            c_resnet:
                Angle resnet (Alg. 23 lines 11-14) hidden channel dimension
            no_heads_ipa:
                Number of IPA heads
            no_qk_points:
                Number of query/key points to generate during IPA
            no_v_points:
                Number of value points to generate during IPA
            dropout_rate:
                Dropout rate used throughout the layer
            no_blocks:
                Number of structure module blocks
            no_transition_layers:
                Number of layers in the single representation transition
                (Alg. 23 lines 8-9)
            no_resnet_blocks:
                Number of blocks in the angle resnet
            no_angles:
                Number of angles to generate in the angle resnet
            trans_scale_factor:
                Factor by which predicted translations are scaled before
                being emitted (see scale_translation calls in forward)
            epsilon:
                Small number used in angle resnet normalization
            inf:
                Large number used for attention masking
        """
        super(StructureModule, self).__init__()

        self.c_s = c_s
        self.c_z = c_z
        self.c_ipa = c_ipa
        self.c_resnet = c_resnet
        self.no_heads_ipa = no_heads_ipa
        self.no_qk_points = no_qk_points
        self.no_v_points = no_v_points
        self.dropout_rate = dropout_rate
        self.no_blocks = no_blocks
        self.no_transition_layers = no_transition_layers
        self.no_resnet_blocks = no_resnet_blocks
        self.no_angles = no_angles
        self.trans_scale_factor = trans_scale_factor
        self.epsilon = epsilon
        self.inf = inf

        # Buffers to be lazily initialized later
        # self.default_frames
        # self.group_idx
        # self.atom_mask
        # self.lit_positions

        self.layer_norm_s = LayerNorm(self.c_s)
        self.layer_norm_z = LayerNorm(self.c_z)

        self.linear_in = Linear(self.c_s, self.c_s)

        self.ipa = InvariantPointAttention(
            self.c_s,
            self.c_z,
            self.c_ipa,
            self.no_heads_ipa,
            self.no_qk_points,
            self.no_v_points,
            inf=self.inf,
            eps=self.epsilon,
        )

        self.ipa_dropout = nn.Dropout(self.dropout_rate)
        self.layer_norm_ipa = LayerNorm(self.c_s)

        self.transition = StructureModuleTransition(
            self.c_s,
            self.no_transition_layers,
            self.dropout_rate,
        )

        self.bb_update = BackboneUpdate(self.c_s)

        self.angle_resnet = AngleResnet(
            self.c_s,
            self.c_resnet,
            self.no_resnet_blocks,
            self.no_angles,
            self.epsilon,
        )

    def forward(
        self,
        evoformer_output_dict,
        aatype,
        mask=None,
        inplace_safe=False,
        _offload_inference=False,
    ):
        """
        Args:
            evoformer_output_dict:
                Dictionary containing:
                    "single":
                        [*, N_res, C_s] single representation
                    "pair":
                        [*, N_res, N_res, C_z] pair representation
            aatype:
                [*, N_res] amino acid indices
            mask:
                Optional [*, N_res] sequence mask
        Returns:
            A dictionary of outputs: per-block stacks of "frames",
            "sidechain_frames", "unnormalized_angles", "angles",
            "positions", "states", plus the final "single"
            representation.
        """
        s = evoformer_output_dict["single"]

        if mask is None:
            # [*, N]
            mask = s.new_ones(s.shape[:-1])

        # [*, N, C_s]
        s = self.layer_norm_s(s)

        # [*, N, N, C_z]
        z = self.layer_norm_z(evoformer_output_dict["pair"])

        # For offloaded inference, the (only) pair reference is moved to
        # CPU and the normalized z is handed to IPA through a list.
        z_reference_list = None
        if(_offload_inference):
            assert(sys.getrefcount(evoformer_output_dict["pair"]) == 2)
            evoformer_output_dict["pair"] = evoformer_output_dict["pair"].cpu()
            z_reference_list = [z]
            z = None

        # [*, N, C_s]
        s_initial = s
        s = self.linear_in(s)

        # All frames start at the identity transform.
        # [*, N]
        rigids = Rigid.identity(
            s.shape[:-1],
            s.dtype,
            s.device,
            self.training,
            fmt="quat",
        )
        outputs = []
        for i in range(self.no_blocks):
            # [*, N, C_s]
            s = s + self.ipa(
                s,
                z,
                rigids,
                mask,
                inplace_safe=inplace_safe,
                _offload_inference=_offload_inference,
                _z_reference_list=z_reference_list
            )
            s = self.ipa_dropout(s)
            s = self.layer_norm_ipa(s)
            s = self.transition(s)

            # [*, N]
            rigids = rigids.compose_q_update_vec(self.bb_update(s))

            # To hew as closely as possible to AlphaFold, we convert our
            # quaternion-based transformations to rotation-matrix ones
            # here
            backb_to_global = Rigid(
                Rotation(
                    rot_mats=rigids.get_rots().get_rot_mats(),
                    quats=None
                ),
                rigids.get_trans(),
            )

            backb_to_global = backb_to_global.scale_translation(
                self.trans_scale_factor
            )

            # [*, N, 7, 2]
            unnormalized_angles, angles = self.angle_resnet(s, s_initial)

            all_frames_to_global = self.torsion_angles_to_frames(
                backb_to_global,
                angles,
                aatype,
            )

            pred_xyz = self.frames_and_literature_positions_to_atom14_pos(
                all_frames_to_global,
                aatype,
            )

            scaled_rigids = rigids.scale_translation(self.trans_scale_factor)

            preds = {
                "frames": scaled_rigids.to_tensor_7(),
                "sidechain_frames": all_frames_to_global.to_tensor_4x4(),
                "unnormalized_angles": unnormalized_angles,
                "angles": angles,
                "positions": pred_xyz,
                "states": s,
            }

            outputs.append(preds)

            # Rotation gradients are stopped between blocks; only the
            # last block's rotations receive gradients directly.
            rigids = rigids.stop_rot_gradient()

        del z, z_reference_list

        if(_offload_inference):
            evoformer_output_dict["pair"] = (
                evoformer_output_dict["pair"].to(s.device)
            )

        # Stack the per-block predictions along a new leading dimension.
        outputs = dict_multimap(torch.stack, outputs)
        outputs["single"] = s

        return outputs

    def _init_residue_constants(self, float_dtype, device):
        # Residue-constant buffers are registered lazily (non-persistent)
        # on first use, on the dtype/device of the incoming tensors.
        if not hasattr(self, "default_frames"):
            self.register_buffer(
                "default_frames",
                torch.tensor(
                    restype_rigid_group_default_frame,
                    dtype=float_dtype,
                    device=device,
                    requires_grad=False,
                ),
                persistent=False,
            )
        if not hasattr(self, "group_idx"):
            self.register_buffer(
                "group_idx",
                torch.tensor(
                    restype_atom14_to_rigid_group,
                    device=device,
                    requires_grad=False,
                ),
                persistent=False,
            )
        if not hasattr(self, "atom_mask"):
            self.register_buffer(
                "atom_mask",
                torch.tensor(
                    restype_atom14_mask,
                    dtype=float_dtype,
                    device=device,
                    requires_grad=False,
                ),
                persistent=False,
            )
        if not hasattr(self, "lit_positions"):
            self.register_buffer(
                "lit_positions",
                torch.tensor(
                    restype_atom14_rigid_group_positions,
                    dtype=float_dtype,
                    device=device,
                    requires_grad=False,
                ),
                persistent=False,
            )

    def torsion_angles_to_frames(self, r, alpha, f):
        # Lazily initialize the residue constants on the correct device
        self._init_residue_constants(alpha.dtype, alpha.device)
        # Separated purely to make testing less annoying
        return torsion_angles_to_frames(r, alpha, f, self.default_frames)

    def frames_and_literature_positions_to_atom14_pos(
        self, r, f  # [*, N, 8]  # [*, N]
    ):
        # Lazily initialize the residue constants on the correct device
        self._init_residue_constants(r.get_rots().dtype, r.get_rots().device)
        return frames_and_literature_positions_to_atom14_pos(
            r,
            f,
            self.default_frames,
            self.group_idx,
            self.atom_mask,
            self.lit_positions,
        )
openfold/model/template.py ADDED
@@ -0,0 +1,333 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+ from functools import partial
16
+ import math
17
+ from typing import Optional, List
18
+
19
+ import torch
20
+ import torch.nn as nn
21
+
22
+ from openfold.model.primitives import Linear, LayerNorm, Attention
23
+ from openfold.model.dropout import (
24
+ DropoutRowwise,
25
+ DropoutColumnwise,
26
+ )
27
+ from openfold.model.pair_transition import PairTransition
28
+ from openfold.model.triangular_attention import (
29
+ TriangleAttentionStartingNode,
30
+ TriangleAttentionEndingNode,
31
+ )
32
+ from openfold.model.triangular_multiplicative_update import (
33
+ TriangleMultiplicationOutgoing,
34
+ TriangleMultiplicationIncoming,
35
+ )
36
+ from openfold.utils.checkpointing import checkpoint_blocks
37
+ from openfold.utils.tensor_utils import (
38
+ chunk_layer,
39
+ permute_final_dims,
40
+ flatten_final_dims,
41
+ )
42
+
43
+
44
class TemplatePointwiseAttention(nn.Module):
    """
    Implements Algorithm 17.

    Each entry of the pair representation attends over the matching
    entries of all template embeddings; absent templates are removed
    via a large negative attention bias.
    """
    def __init__(self, c_t, c_z, c_hidden, no_heads, inf, **kwargs):
        """
        Args:
            c_t:
                Template embedding channel dimension
            c_z:
                Pair embedding channel dimension
            c_hidden:
                Hidden channel dimension
            no_heads:
                Number of attention heads
            inf:
                Large constant used to build the template mask bias
        """
        super(TemplatePointwiseAttention, self).__init__()

        self.c_t = c_t
        self.c_z = c_z
        self.c_hidden = c_hidden
        self.no_heads = no_heads
        self.inf = inf

        # Queries come from the pair rep; keys/values from the templates.
        self.mha = Attention(
            self.c_z,
            self.c_t,
            self.c_t,
            self.c_hidden,
            self.no_heads,
            gating=False,
        )

    def _chunk(self,
        z: torch.Tensor,
        t: torch.Tensor,
        biases: List[torch.Tensor],
        chunk_size: int,
    ) -> torch.Tensor:
        # Chunked attention evaluation to bound peak memory.
        return chunk_layer(
            self.mha,
            {"q_x": z, "kv_x": t, "biases": biases},
            chunk_size=chunk_size,
            no_batch_dims=len(z.shape[:-2]),
        )

    def forward(self,
        t: torch.Tensor,
        z: torch.Tensor,
        template_mask: Optional[torch.Tensor] = None,
        chunk_size: Optional[int] = None
    ) -> torch.Tensor:
        """
        Args:
            t:
                [*, N_templ, N_res, N_res, C_t] template embedding
            z:
                [*, N_res, N_res, C_t] pair embedding
            template_mask:
                [*, N_templ] template mask
            chunk_size:
                Optional chunk size for memory-bounded attention
        Returns:
            [*, N_res, N_res, C_z] pair embedding update
        """
        if template_mask is None:
            template_mask = t.new_ones(t.shape[:-3])

        # 0 bias for present templates, -inf-like for missing ones.
        bias = self.inf * (template_mask[..., None, None, None, None, :] - 1)
        biases = [bias]

        # [*, N_res, N_res, 1, C_z]: one query "token" per pair entry
        z = z.unsqueeze(-2)

        # [*, N_res, N_res, N_templ, C_t]: templates form the kv sequence
        t = permute_final_dims(t, (1, 2, 0, 3))

        if chunk_size is not None:
            z = self._chunk(z, t, biases, chunk_size)
        else:
            z = self.mha(q_x=z, kv_x=t, biases=biases)

        # Drop the singleton query dimension: [*, N_res, N_res, C_z]
        return z.squeeze(-2)
133
+
134
+
135
class TemplatePairStackBlock(nn.Module):
    """One block of the template pair stack (used by Algorithm 16).

    Applies triangular attention, triangular multiplicative updates and
    a pair transition to each template independently.
    """
    def __init__(
        self,
        c_t: int,
        c_hidden_tri_att: int,
        c_hidden_tri_mul: int,
        no_heads: int,
        pair_transition_n: int,
        dropout_rate: float,
        inf: float,
        **kwargs,
    ):
        super(TemplatePairStackBlock, self).__init__()

        self.c_t = c_t
        self.c_hidden_tri_att = c_hidden_tri_att
        self.c_hidden_tri_mul = c_hidden_tri_mul
        self.no_heads = no_heads
        self.pair_transition_n = pair_transition_n
        self.dropout_rate = dropout_rate
        self.inf = inf

        self.dropout_row = DropoutRowwise(self.dropout_rate)
        self.dropout_col = DropoutColumnwise(self.dropout_rate)

        self.tri_att_start = TriangleAttentionStartingNode(
            self.c_t,
            self.c_hidden_tri_att,
            self.no_heads,
            inf=inf,
        )
        self.tri_att_end = TriangleAttentionEndingNode(
            self.c_t,
            self.c_hidden_tri_att,
            self.no_heads,
            inf=inf,
        )

        self.tri_mul_out = TriangleMultiplicationOutgoing(
            self.c_t,
            self.c_hidden_tri_mul,
        )
        self.tri_mul_in = TriangleMultiplicationIncoming(
            self.c_t,
            self.c_hidden_tri_mul,
        )

        self.pair_transition = PairTransition(
            self.c_t,
            self.pair_transition_n,
        )

    def forward(self,
        z: torch.Tensor,
        mask: torch.Tensor,
        chunk_size: Optional[int] = None,
        _mask_trans: bool = True
    ):
        """
        Args:
            z:
                [*, N_templ, N_res, N_res, C_t] template pair embeddings
            mask:
                [*, N_templ, N_res, N_res] mask
        Returns:
            [*, N_templ, N_res, N_res, C_t] updated embeddings
        """
        # Process templates one at a time to limit peak memory.
        singles = [t.unsqueeze(-4) for t in torch.unbind(z, dim=-4)]
        single_masks = [m.unsqueeze(-3) for m in torch.unbind(mask, dim=-3)]

        for idx, (single, single_mask) in enumerate(
            zip(singles, single_masks)
        ):
            single = single + self.dropout_row(
                self.tri_att_start(
                    single, chunk_size=chunk_size, mask=single_mask
                )
            )
            single = single + self.dropout_col(
                self.tri_att_end(
                    single, chunk_size=chunk_size, mask=single_mask
                )
            )
            single = single + self.dropout_row(
                self.tri_mul_out(single, mask=single_mask)
            )
            single = single + self.dropout_row(
                self.tri_mul_in(single, mask=single_mask)
            )
            single = single + self.pair_transition(
                single,
                mask=single_mask if _mask_trans else None,
                chunk_size=chunk_size,
            )
            singles[idx] = single

        return torch.cat(singles, dim=-4)
240
+
241
+
242
class TemplatePairStack(nn.Module):
    """
    Implements Algorithm 16.
    """
    def __init__(
        self,
        c_t,
        c_hidden_tri_att,
        c_hidden_tri_mul,
        no_blocks,
        no_heads,
        pair_transition_n,
        dropout_rate,
        blocks_per_ckpt,
        inf=1e9,
        **kwargs,
    ):
        """
        Args:
            c_t:
                Template embedding channel dimension
            c_hidden_tri_att:
                Per-head hidden dimension for triangular attention
            c_hidden_tri_mul:
                Hidden dimension for triangular multiplication
            no_blocks:
                Number of blocks in the stack
            no_heads:
                Number of triangular-attention heads
            pair_transition_n:
                Scale of pair transition (Alg. 15) hidden dimension
            dropout_rate:
                Dropout rate used throughout the stack
            blocks_per_ckpt:
                Number of blocks per activation checkpoint. None disables
                activation checkpointing
            inf:
                Large constant used for masking
        """
        super(TemplatePairStack, self).__init__()

        self.blocks_per_ckpt = blocks_per_ckpt

        self.blocks = nn.ModuleList(
            [
                TemplatePairStackBlock(
                    c_t=c_t,
                    c_hidden_tri_att=c_hidden_tri_att,
                    c_hidden_tri_mul=c_hidden_tri_mul,
                    no_heads=no_heads,
                    pair_transition_n=pair_transition_n,
                    dropout_rate=dropout_rate,
                    inf=inf,
                )
                for _ in range(no_blocks)
            ]
        )

        self.layer_norm = LayerNorm(c_t)

    def forward(
        self,
        t: torch.tensor,
        mask: torch.tensor,
        chunk_size: int,
        _mask_trans: bool = True,
    ):
        """
        Args:
            t:
                [*, N_templ, N_res, N_res, C_t] template embedding
            mask:
                [*, N_templ, N_res, N_res] mask
        Returns:
            [*, N_templ, N_res, N_res, C_t] template embedding update
        """
        # A single shared mask may be passed; broadcast it over templates.
        if mask.shape[-3] == 1:
            expand_idx = list(mask.shape)
            expand_idx[-3] = t.shape[-4]
            mask = mask.expand(*expand_idx)

        # Bind the per-call arguments so each block is a function of t
        # alone, as required by checkpoint_blocks. Checkpointing is only
        # enabled during training.
        wrapped_blocks = [
            partial(
                block,
                mask=mask,
                chunk_size=chunk_size,
                _mask_trans=_mask_trans,
            )
            for block in self.blocks
        ]
        t, = checkpoint_blocks(
            blocks=wrapped_blocks,
            args=(t,),
            blocks_per_ckpt=self.blocks_per_ckpt if self.training else None,
        )

        return self.layer_norm(t)
openfold/model/torchscript.py ADDED
@@ -0,0 +1,215 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ from typing import Optional, Sequence, Tuple
16
+
17
+ import torch
18
+ import torch.nn as nn
19
+
20
+ from openfold.model.dropout import (
21
+ DropoutRowwise,
22
+ DropoutColumnwise,
23
+ )
24
+ from openfold.model.evoformer import (
25
+ EvoformerBlock,
26
+ EvoformerStack,
27
+ )
28
+ from openfold.model.outer_product_mean import OuterProductMean
29
+ from openfold.model.msa import (
30
+ MSARowAttentionWithPairBias,
31
+ MSAColumnAttention,
32
+ MSAColumnGlobalAttention,
33
+ )
34
+ from openfold.model.pair_transition import PairTransition
35
+ from openfold.model.primitives import Attention, GlobalAttention
36
+ from openfold.model.structure_module import (
37
+ InvariantPointAttention,
38
+ BackboneUpdate,
39
+ )
40
+ from openfold.model.template import TemplatePairStackBlock
41
+ from openfold.model.triangular_attention import (
42
+ TriangleAttentionStartingNode,
43
+ TriangleAttentionEndingNode,
44
+ )
45
+ from openfold.model.triangular_multiplicative_update import (
46
+ TriangleMultiplicationOutgoing,
47
+ TriangleMultiplicationIncoming,
48
+ )
49
+
50
+
51
def script_preset_(model: torch.nn.Module):
    """
    TorchScript a handful of low-level but frequently used submodule types
    that are known to be scriptable.

    Args:
        model:
            A torch.nn.Module. It should contain at least some modules from
            this repository, or this function won't do anything.
    """
    known_scriptable = [
        nn.Dropout,
        Attention,
        GlobalAttention,
        EvoformerBlock,
        #TemplatePairStackBlock,
    ]
    script_submodules_(
        model,
        known_scriptable,
        attempt_trace=False,
        batch_dims=None,
    )
73
+
74
+
75
def _get_module_device(module: torch.nn.Module) -> torch.device:
    """
    Fetches the device of a module, assuming that all of the module's
    parameters reside on a single device.

    Args:
        module: A torch.nn.Module (must have at least one parameter)
    Returns:
        The device of the module's first parameter
    """
    first_param = next(module.parameters())
    return first_param.device
86
+
87
+
88
def _trace_module(module, batch_dims=None):
    """
    Trace a single supported module using stand-in inputs.

    Args:
        module:
            One of the module types explicitly handled below
        batch_dims:
            Optional leading batch dimensions for the stand-in inputs
    Returns:
        The torch.jit-traced equivalent of the module
    Raises:
        TypeError: If the module type has no stand-in input recipe
    """
    if batch_dims is None:
        batch_dims = ()

    # Stand-in sizes for the sequence/residue dimensions
    n_seq = 10
    n_res = 10

    device = _get_module_device(module)

    def msa(channel_dim):
        return torch.rand(
            (*batch_dims, n_seq, n_res, channel_dim),
            device=device,
        )

    def pair(channel_dim):
        return torch.rand(
            (*batch_dims, n_res, n_res, channel_dim),
            device=device,
        )

    def msa_mask():
        # BUGFIX: allocate the mask on the module's device like the other
        # stand-in inputs. Previously the masks were created on the CPU,
        # which broke tracing of modules living on any other device.
        return torch.randint(
            0, 2,
            (*batch_dims, n_seq, n_res),
            device=device,
        )

    if isinstance(module, MSARowAttentionWithPairBias):
        inputs = {
            "forward": (
                msa(module.c_in),  # m
                pair(module.c_z),  # z
                msa_mask(),  # mask
            ),
        }
    elif isinstance(module, MSAColumnAttention):
        inputs = {
            "forward": (
                msa(module.c_in),  # m
                msa_mask(),  # mask
            ),
        }
    elif isinstance(module, OuterProductMean):
        inputs = {
            "forward": (
                msa(module.c_m),
                msa_mask(),
            ),
        }
    else:
        raise TypeError(
            f"tracing is not supported for modules of type {type(module)}"
        )

    return torch.jit.trace_module(module, inputs)
147
+
148
+
149
def _script_submodules_helper_(
    model,
    types,
    attempt_trace,
    to_trace,
):
    """
    Recursively script matching child modules of ``model`` in place.

    Children whose scripting fails are either recorded in ``to_trace``
    (when ``attempt_trace`` is set) for later tracing, or the error is
    propagated.
    """
    for name, child in model.named_children():
        matches = types is None or any(isinstance(child, t) for t in types)
        if matches:
            try:
                setattr(model, name, torch.jit.script(child))
                # Successfully scripted; no need to descend further.
                continue
            except (RuntimeError, torch.jit.frontend.NotSupportedError):
                if not attempt_trace:
                    raise
                to_trace.add(type(child))

        _script_submodules_helper_(child, types, attempt_trace, to_trace)
168
+
169
+
170
def _trace_submodules_(
    model,
    types,
    batch_dims=None,
):
    """
    Recursively replace child modules of the given types with traced
    equivalents in place.
    """
    for name, child in model.named_children():
        if any(isinstance(child, t) for t in types):
            setattr(model, name, _trace_module(child, batch_dims=batch_dims))
        else:
            _trace_submodules_(child, types, batch_dims=batch_dims)
181
+
182
+
183
def script_submodules_(
    model: nn.Module,
    types: Optional[Sequence[type]] = None,
    attempt_trace: Optional[bool] = True,
    batch_dims: Optional[Tuple[int]] = None,
):
    """
    Convert all submodules whose types match one of those in the input
    list to recursively scripted equivalents in place. To script the entire
    model, just call torch.jit.script on it directly.

    When types is None, all submodules are scripted.

    Args:
        model:
            A torch.nn.Module
        types:
            A list of types of submodules to script
        attempt_trace:
            Whether to attempt to trace specified modules if scripting
            fails. Recall that tracing eliminates all conditional
            logic---with great tracing comes the mild responsibility of
            having to remember to ensure that the modules in question
            perform the same computations no matter what.
        batch_dims:
            Batch dimensions of the stand-in inputs used when tracing
    """
    to_trace = set()

    # Aggressively script as much as possible first...
    _script_submodules_helper_(model, types, attempt_trace, to_trace)

    # ... and then trace the stragglers that refused to script.
    if attempt_trace and to_trace:
        _trace_submodules_(model, to_trace, batch_dims=batch_dims)
openfold/model/triangular_attention.py ADDED
@@ -0,0 +1,139 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ from functools import partialmethod, partial
17
+ import math
18
+ from typing import Optional, List
19
+
20
+ import torch
21
+ import torch.nn as nn
22
+
23
+ from openfold.model.primitives import Linear, LayerNorm, Attention
24
+ from openfold.utils.tensor_utils import (
25
+ chunk_layer,
26
+ permute_final_dims,
27
+ flatten_final_dims,
28
+ )
29
+
30
+
31
class TriangleAttention(nn.Module):
    """Triangular self-attention over the pair representation.

    With ``starting=True`` this is Algorithm 13; with ``starting=False``
    the input is transposed first, which yields Algorithm 14.
    """
    def __init__(
        self, c_in, c_hidden, no_heads, starting, inf=1e9
    ):
        """
        Args:
            c_in:
                Input channel dimension
            c_hidden:
                Overall hidden channel dimension (not per-head)
            no_heads:
                Number of attention heads
            starting:
                Whether this is the "starting node" (True) or
                "ending node" (False) variant
            inf:
                Large constant used to build the mask bias
        """
        super(TriangleAttention, self).__init__()

        self.c_in = c_in
        self.c_hidden = c_hidden
        self.no_heads = no_heads
        self.starting = starting
        self.inf = inf

        self.layer_norm = LayerNorm(self.c_in)

        # Projects the pair rep into a per-head additive attention bias.
        self.linear = Linear(c_in, self.no_heads, bias=False, init="normal")

        self.mha = Attention(
            self.c_in, self.c_in, self.c_in, self.c_hidden, self.no_heads
        )

    @torch.jit.ignore
    def _chunk(self,
        x: torch.Tensor,
        biases: List[torch.Tensor],
        chunk_size: int,
    ) -> torch.Tensor:
        # Chunked attention evaluation to bound peak memory.
        return chunk_layer(
            self.mha,
            {"q_x": x, "kv_x": x, "biases": biases},
            chunk_size=chunk_size,
            no_batch_dims=len(x.shape[:-2]),
        )

    def forward(self,
        x: torch.Tensor,
        mask: Optional[torch.Tensor] = None,
        chunk_size: Optional[int] = None
    ) -> torch.Tensor:
        """
        Args:
            x:
                [*, I, J, C_in] input tensor (e.g. the pair representation)
            mask:
                [*, I, J] mask
        Returns:
            [*, I, J, C_in] output tensor
        """
        if mask is None:
            # [*, I, J]
            mask = x.new_ones(x.shape[:-1])

        # Shape annotations assume self.starting. Else, I and J are flipped
        if not self.starting:
            x = x.transpose(-2, -3)
            mask = mask.transpose(-1, -2)

        # [*, I, J, C_in]
        x = self.layer_norm(x)

        # [*, I, 1, 1, J] additive mask bias
        mask_bias = (self.inf * (mask - 1))[..., :, None, None, :]

        # [*, 1, H, I, J] pair-derived attention bias
        triangle_bias = permute_final_dims(
            self.linear(x), (2, 0, 1)
        ).unsqueeze(-4)

        biases = [mask_bias, triangle_bias]

        if chunk_size is not None:
            x = self._chunk(x, biases, chunk_size)
        else:
            x = self.mha(q_x=x, kv_x=x, biases=biases)

        # Undo the transposition for the ending-node variant.
        if not self.starting:
            x = x.transpose(-2, -3)

        return x
124
+
125
+
126
class TriangleAttentionStartingNode(TriangleAttention):
    """
    Implements Algorithm 13 (triangle attention around the starting node).

    Identical to TriangleAttention with ``starting`` pre-bound to True.
    """

    __init__ = partialmethod(TriangleAttention.__init__, starting=True)
132
+
133
+
134
class TriangleAttentionEndingNode(TriangleAttention):
    """
    Implements Algorithm 14 (triangle attention around the ending node).

    Identical to TriangleAttention with ``starting`` pre-bound to False.
    """

    __init__ = partialmethod(TriangleAttention.__init__, starting=False)
openfold/model/triangular_multiplicative_update.py ADDED
@@ -0,0 +1,127 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ from functools import partialmethod
17
+ from typing import Optional
18
+
19
+ import torch
20
+ import torch.nn as nn
21
+
22
+ from openfold.model.primitives import Linear, LayerNorm
23
+ from openfold.utils.tensor_utils import permute_final_dims
24
+
25
+
26
class TriangleMultiplicativeUpdate(nn.Module):
    """
    Implements Algorithms 11 and 12.

    Abstract base: subclasses define how the two gated projections are
    combined (outgoing vs. incoming edges).
    """
    def __init__(self, c_z, c_hidden, _outgoing=True):
        """
        Args:
            c_z:
                Input channel dimension
            c_hidden:
                Hidden channel dimension
        """
        super(TriangleMultiplicativeUpdate, self).__init__()
        self.c_z = c_z
        self.c_hidden = c_hidden
        self._outgoing = _outgoing

        # Value ("_p") and gate ("_g") projections for both operands.
        self.linear_a_p = Linear(self.c_z, self.c_hidden)
        self.linear_a_g = Linear(self.c_z, self.c_hidden, init="gating")
        self.linear_b_p = Linear(self.c_z, self.c_hidden)
        self.linear_b_g = Linear(self.c_z, self.c_hidden, init="gating")
        self.linear_g = Linear(self.c_z, self.c_z, init="gating")
        self.linear_z = Linear(self.c_hidden, self.c_z, init="final")

        self.layer_norm_in = LayerNorm(self.c_z)
        self.layer_norm_out = LayerNorm(self.c_hidden)

        self.sigmoid = nn.Sigmoid()

    def _combine_projections(self,
        a: torch.Tensor,
        b: torch.Tensor,
    ) -> torch.Tensor:
        raise NotImplementedError("This method needs to be overridden")

    def forward(self,
        z: torch.Tensor,
        mask: Optional[torch.Tensor] = None
    ) -> torch.Tensor:
        """
        Args:
            z:
                [*, N_res, N_res, C_z] input tensor
            mask:
                [*, N_res, N_res] input mask
        Returns:
            [*, N_res, N_res, C_z] output tensor
        """
        if mask is None:
            mask = z.new_ones(z.shape[:-1])
        mask = mask.unsqueeze(-1)

        z = self.layer_norm_in(z)

        # Two gated, masked projections of the normalized input.
        proj_a = self.linear_a_p(z) * self.sigmoid(self.linear_a_g(z))
        proj_a = proj_a * mask
        proj_b = self.linear_b_p(z) * self.sigmoid(self.linear_b_g(z))
        proj_b = proj_b * mask

        # Combine (subclass-specific), renormalize, project back to C_z.
        combined = self._combine_projections(proj_a, proj_b)
        combined = self.linear_z(self.layer_norm_out(combined))

        # Output gate derived from the normalized input.
        out_gate = self.sigmoid(self.linear_g(z))
        return combined * out_gate
91
+
92
+
93
class TriangleMultiplicationOutgoing(TriangleMultiplicativeUpdate):
    """
    Implements Algorithm 11.
    """
    def _combine_projections(self,
        a: torch.Tensor,  # [*, N_i, N_k, C]
        b: torch.Tensor,  # [*, N_j, N_k, C]
    ):
        # Move channels to the front so the shared edge k can be
        # contracted with one batched matmul: [*, C, N_i, N_j]
        left = permute_final_dims(a, (2, 0, 1))
        right = permute_final_dims(b, (2, 1, 0))
        product = torch.matmul(left, right)

        # Back to channels-last: [*, N_i, N_j, C]
        return permute_final_dims(product, (1, 2, 0))
109
+
110
+
111
class TriangleMultiplicationIncoming(TriangleMultiplicativeUpdate):
    """
    Implements Algorithm 12.
    """
    def _combine_projections(self,
        a: torch.Tensor,  # [*, N_k, N_i, C]
        b: torch.Tensor,  # [*, N_k, N_j, C]
    ):
        # Move channels to the front so the shared edge k can be
        # contracted with one batched matmul: [*, C, N_i, N_j]
        left = permute_final_dims(a, (2, 1, 0))
        right = permute_final_dims(b, (2, 0, 1))
        product = torch.matmul(left, right)

        # Back to channels-last: [*, N_i, N_j, C]
        return permute_final_dims(product, (1, 2, 0))
+ return permute_final_dims(p, (1, 2, 0))
127
+
openfold/np/__init__.py ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
# Dynamically import every sibling .py module of this package and re-export
# each one at package level, so e.g. submodules are reachable as attributes
# of the package without explicit imports.
import os
import glob
import importlib as importlib

_files = glob.glob(os.path.join(os.path.dirname(__file__), "*.py"))
__all__ = [
    os.path.basename(_path)[:-3]  # strip the ".py" suffix
    for _path in _files
    if os.path.isfile(_path) and not _path.endswith("__init__.py")
]
_modules = [
    (_name, importlib.import_module("." + _name, __name__))
    for _name in __all__
]
for _m in _modules:
    globals()[_m[0]] = _m[1]

# Avoid needlessly cluttering the global namespace
del _files, _m, _modules
openfold/np/protein.py ADDED
@@ -0,0 +1,438 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ """Protein data type."""
17
+ import dataclasses
18
+ import io
19
+ from typing import Any, Sequence, Mapping, Optional
20
+ import re
21
+ import string
22
+
23
+ from openfold.np import residue_constants
24
+ from Bio.PDB import PDBParser
25
+ import numpy as np
26
+
27
+
28
+ FeatureDict = Mapping[str, np.ndarray]
29
+ ModelOutput = Mapping[str, Any] # Is a nested dict.
30
+ PICO_TO_ANGSTROM = 0.01
31
+
32
@dataclasses.dataclass(frozen=True)
class Protein:
    """Immutable protein structure representation.

    Arrays are indexed by residue; per-atom axes follow the ordering of
    residue_constants.atom_types.
    """

    # Cartesian atom coordinates in angstroms.
    atom_positions: np.ndarray  # [num_res, num_atom_type, 3]

    # Integer amino-acid type per residue, in [0, 20]; 20 means 'X'/unknown.
    aatype: np.ndarray  # [num_res]

    # 1.0 where an atom is present, 0.0 otherwise; intended for loss masking.
    atom_mask: np.ndarray  # [num_res, num_atom_type]

    # Residue numbering as used in the PDB; not necessarily contiguous
    # or 0-based.
    residue_index: np.ndarray  # [num_res]

    # Per-atom temperature (B-) factors, in square angstroms.
    b_factors: np.ndarray  # [num_res, num_atom_type]

    # Chain index per residue, for multi-chain predictions.
    chain_index: Optional[np.ndarray] = None

    # Free-text remark, emitted as a comment in written PDB files.
    remark: Optional[str] = None

    # Templates used to generate this protein (prediction-only).
    parents: Optional[Sequence[str]] = None

    # Chain index each parent belongs to.
    parents_chain_index: Optional[Sequence[int]] = None
68
+
69
+
70
def from_pdb_string(pdb_str: str, chain_id: Optional[str] = None) -> Protein:
    """Takes a PDB string and constructs a Protein object.

    WARNING: All non-standard residue types will be converted into UNK. All
    non-standard atoms will be ignored.

    Args:
        pdb_str: The contents of the pdb file
        chain_id: If None, every chain in the file is parsed. If chain_id is
            specified (e.g. A), then only that chain is parsed.

    Returns:
        A new `Protein` parsed from the pdb contents.

    Raises:
        ValueError: If the file contains more than one model, or any
            insertion codes.
    """
    pdb_fh = io.StringIO(pdb_str)
    parser = PDBParser(QUIET=True)
    structure = parser.get_structure("none", pdb_fh)
    models = list(structure.get_models())
    if len(models) != 1:
        raise ValueError(
            f"Only single model PDBs are supported. Found {len(models)} models."
        )
    model = models[0]

    atom_positions = []
    aatype = []
    atom_mask = []
    residue_index = []
    chain_ids = []
    b_factors = []

    for chain in model:
        if chain_id is not None and chain.id != chain_id:
            continue
        for res in chain:
            if res.id[2] != " ":
                raise ValueError(
                    f"PDB contains an insertion code at chain {chain.id} and residue "
                    f"index {res.id[1]}. These are not supported."
                )
            res_shortname = residue_constants.restype_3to1.get(res.resname, "X")
            restype_idx = residue_constants.restype_order.get(
                res_shortname, residue_constants.restype_num
            )
            pos = np.zeros((residue_constants.atom_type_num, 3))
            mask = np.zeros((residue_constants.atom_type_num,))
            res_b_factors = np.zeros((residue_constants.atom_type_num,))
            for atom in res:
                if atom.name not in residue_constants.atom_types:
                    continue
                atom_idx = residue_constants.atom_order[atom.name]
                pos[atom_idx] = atom.coord
                mask[atom_idx] = 1.0
                res_b_factors[atom_idx] = atom.bfactor
            if np.sum(mask) < 0.5:
                # If no known atom positions are reported for the residue
                # then skip it.
                continue
            aatype.append(restype_idx)
            atom_positions.append(pos)
            atom_mask.append(mask)
            residue_index.append(res.id[1])
            chain_ids.append(chain.id)
            b_factors.append(res_b_factors)

    # Optional PARENT records (template provenance), one line per chain.
    parents = None
    parents_chain_index = None
    if "PARENT" in pdb_str:
        parents = []
        parents_chain_index = []
        # Use a dedicated counter instead of clobbering the chain_id
        # parameter (which previously held a chain letter).
        parent_chain_idx = 0
        for l in pdb_str.split("\n"):
            if "PARENT" in l:
                if "N/A" not in l:
                    parent_names = l.split()[1:]
                    parents.extend(parent_names)
                    parents_chain_index.extend(
                        [parent_chain_idx for _ in parent_names]
                    )
                parent_chain_idx += 1

    # Map chain letters (A..Z) to integer chain indices.
    chain_id_mapping = {cid: n for n, cid in enumerate(string.ascii_uppercase)}
    chain_index = np.array([chain_id_mapping[cid] for cid in chain_ids])

    return Protein(
        atom_positions=np.array(atom_positions),
        atom_mask=np.array(atom_mask),
        aatype=np.array(aatype),
        residue_index=np.array(residue_index),
        chain_index=chain_index,
        b_factors=np.array(b_factors),
        parents=parents,
        parents_chain_index=parents_chain_index,
    )
+ )
166
+
167
+
168
def from_proteinnet_string(proteinnet_str: str) -> Protein:
    """Parse a ProteinNet-format record into a Protein.

    Only the [PRIMARY], [TERTIARY] and [MASK] sections are consumed;
    b_factors are left unset and only N/CA/C positions are filled.

    Args:
        proteinnet_str: The contents of a single ProteinNet record
    Returns:
        A new `Protein` built from the record.
    """
    tag_re = r'(\[[A-Z]+\]\n)'
    tags = [
        tag.strip() for tag in re.split(tag_re, proteinnet_str) if len(tag) > 0
    ]
    groups = zip(tags[0::2], [l.split('\n') for l in tags[1::2]])

    atoms = ['N', 'CA', 'C']
    aatype = None
    atom_positions = None
    atom_mask = None
    for g in groups:
        if "[PRIMARY]" == g[0]:
            # BUGFIX: str is immutable, so work on a list of characters.
            # The previous `seq[i] = 'X'` on a str raised TypeError for
            # any residue symbol outside the standard alphabet.
            seq = list(g[1][0].strip())
            for i in range(len(seq)):
                if seq[i] not in residue_constants.restypes:
                    seq[i] = 'X'
            aatype = np.array([
                residue_constants.restype_order.get(
                    res_symbol, residue_constants.restype_num
                ) for res_symbol in seq
            ])
        elif "[TERTIARY]" == g[0]:
            # Three lines of coordinates (x, y, z axes), in picometers.
            tertiary = []
            for axis in range(3):
                tertiary.append(list(map(float, g[1][axis].split())))
            tertiary_np = np.array(tertiary)
            atom_positions = np.zeros(
                (len(tertiary[0]) // 3, residue_constants.atom_type_num, 3)
            ).astype(np.float32)
            for i, atom in enumerate(atoms):
                atom_positions[:, residue_constants.atom_order[atom], :] = (
                    np.transpose(tertiary_np[:, i::3])
                )
            atom_positions *= PICO_TO_ANGSTROM
        elif "[MASK]" == g[0]:
            mask = np.array(list(map({'-': 0, '+': 1}.get, g[1][0].strip())))
            atom_mask = np.zeros(
                (len(mask), residue_constants.atom_type_num,)
            ).astype(np.float32)
            for i, atom in enumerate(atoms):
                atom_mask[:, residue_constants.atom_order[atom]] = 1
            atom_mask *= mask[..., None]

    return Protein(
        atom_positions=atom_positions,
        atom_mask=atom_mask,
        aatype=aatype,
        residue_index=np.arange(len(aatype)),
        b_factors=None,
    )
+ )
219
+
220
+
221
def get_pdb_headers(prot: Protein, chain_id: int = 0) -> Sequence[str]:
    """Build the REMARK/PARENT header lines for one chain of `prot`."""
    headers = []

    if prot.remark is not None:
        headers.append(f"REMARK {prot.remark}")

    parents = prot.parents
    if prot.parents_chain_index is not None:
        # Keep only the parents belonging to the requested chain.
        parents = [
            name
            for idx, name in zip(prot.parents_chain_index, parents)
            if idx == chain_id
        ]

    # Covers both "no parents at all" and "none for this chain".
    if not parents:
        parents = ["N/A"]

    headers.append(f"PARENT {' '.join(parents)}")
    return headers
241
+
242
+
243
def add_pdb_headers(prot: Protein, pdb_str: str) -> str:
    """ Add pdb headers to an existing PDB string. Useful during multi-chain
        recycling

    Args:
        prot: Protein carrying the remark/parents metadata to splice in.
        pdb_str: Existing PDB text; its own REMARK/PARENT lines are replaced.

    Returns:
        The PDB string with per-chain REMARK/PARENT headers inserted.
    """
    out_pdb_lines = []
    lines = pdb_str.split('\n')

    remark = prot.remark
    if(remark is not None):
        out_pdb_lines.append(f"REMARK {remark}")

    # Group parent template names by chain index.
    parents_per_chain = None
    if(prot.parents is not None and len(prot.parents) > 0):
        parents_per_chain = []
        if(prot.parents_chain_index is not None):
            # NOTE: the original also kept an unused `cur_chain` local here.
            parent_dict = {}
            for p, i in zip(prot.parents, prot.parents_chain_index):
                parent_dict.setdefault(str(i), [])
                parent_dict[str(i)].append(p)

            max_idx = max([int(chain_idx) for chain_idx in parent_dict])
            for i in range(max_idx + 1):
                chain_parents = parent_dict.get(str(i), ["N/A"])
                parents_per_chain.append(chain_parents)
        else:
            parents_per_chain.append(prot.parents)
    else:
        parents_per_chain = [["N/A"]]

    make_parent_line = lambda p: f"PARENT {' '.join(p)}"

    out_pdb_lines.append(make_parent_line(parents_per_chain[0]))

    chain_counter = 0
    for i, l in enumerate(lines):
        # Drop pre-existing header lines; copy everything else through.
        if("PARENT" not in l and "REMARK" not in l):
            out_pdb_lines.append(l)
        # BUG FIX: guard the lines[i + 1] lookahead so a "TER" on the very
        # last line no longer raises IndexError.
        if("TER" in l and (i + 1 >= len(lines) or not "END" in lines[i + 1])):
            chain_counter += 1
            if(not chain_counter >= len(parents_per_chain)):
                chain_parents = parents_per_chain[chain_counter]
            else:
                chain_parents = ["N/A"]

            out_pdb_lines.append(make_parent_line(chain_parents))

    return '\n'.join(out_pdb_lines)
291
+
292
+
293
def to_pdb(prot: Protein) -> str:
    """Converts a `Protein` instance to a PDB string.

    Args:
      prot: The protein to convert to PDB.

    Returns:
      PDB string.

    Raises:
      ValueError: If any aatype index exceeds the known residue types.
    """
    restypes = residue_constants.restypes + ["X"]
    # Residue-type index -> 3-letter name; out-of-vocabulary becomes "UNK".
    res_1to3 = lambda r: residue_constants.restype_1to3.get(restypes[r], "UNK")
    atom_types = residue_constants.atom_types

    pdb_lines = []

    atom_mask = prot.atom_mask
    aatype = prot.aatype
    atom_positions = prot.atom_positions
    residue_index = prot.residue_index.astype(int)
    b_factors = prot.b_factors
    chain_index = prot.chain_index

    if np.any(aatype > residue_constants.restype_num):
        raise ValueError("Invalid aatypes.")

    # REMARK / PARENT headers for the first chain.
    headers = get_pdb_headers(prot)
    if(len(headers) > 0):
        pdb_lines.extend(headers)

    n = aatype.shape[0]
    atom_index = 1
    prev_chain_index = 0
    chain_tags = string.ascii_uppercase
    # Add all atom sites.
    for i in range(n):
        res_name_3 = res_1to3(aatype[i])
        for atom_name, pos, mask, b_factor in zip(
            atom_types, atom_positions[i], atom_mask[i], b_factors[i]
        ):
            # Skip atom37 slots that do not exist for this residue.
            if mask < 0.5:
                continue

            record_type = "ATOM"
            name = atom_name if len(atom_name) == 4 else f" {atom_name}"
            alt_loc = ""
            insertion_code = ""
            occupancy = 1.00
            element = atom_name[
                0
            ]  # Protein supports only C, N, O, S, this works.
            charge = ""

            # NOTE(review): chain_tag is assigned inside the atom loop; a
            # residue with all atoms masked would leave it stale for the
            # TER record below — upstream parsing skips empty residues,
            # but confirm for other construction paths.
            chain_tag = "A"
            if(chain_index is not None):
                chain_tag = chain_tags[chain_index[i]]

            # PDB is a columnar format, every space matters here!
            atom_line = (
                f"{record_type:<6}{atom_index:>5} {name:<4}{alt_loc:>1}"
                f"{res_name_3:>3} {chain_tag:>1}"
                f"{residue_index[i]:>4}{insertion_code:>1}   "
                f"{pos[0]:>8.3f}{pos[1]:>8.3f}{pos[2]:>8.3f}"
                f"{occupancy:>6.2f}{b_factor:>6.2f}          "
                f"{element:>2}{charge:>2}"
            )
            pdb_lines.append(atom_line)
            atom_index += 1

        # Terminate at the last residue or at a chain boundary.
        should_terminate = (i == n - 1)
        if(chain_index is not None):
            if(i != n - 1 and chain_index[i + 1] != prev_chain_index):
                should_terminate = True
                prev_chain_index = chain_index[i + 1]

        if(should_terminate):
            # Close the chain.
            chain_end = "TER"
            chain_termination_line = (
                f"{chain_end:<6}{atom_index:>5}      "
                f"{res_1to3(aatype[i]):>3} "
                f"{chain_tag:>1}{residue_index[i]:>4}"
            )
            pdb_lines.append(chain_termination_line)
            atom_index += 1

            if(i != n - 1):
                # "prev" is a misnomer here. This happens at the beginning of
                # each new chain.
                pdb_lines.extend(get_pdb_headers(prot, prev_chain_index))

    pdb_lines.append("END")
    pdb_lines.append("")
    return "\n".join(pdb_lines)
386
+
387
+
388
def ideal_atom_mask(prot: Protein) -> np.ndarray:
    """Computes an ideal atom mask.

    `Protein.atom_mask` typically is defined according to the atoms that are
    reported in the PDB. This function computes a mask according to heavy atoms
    that should be present in the given sequence of amino acids.

    Args:
      prot: `Protein` whose fields are `numpy.ndarray` objects.

    Returns:
      An ideal atom mask.
    """
    # Row lookup of the canonical per-restype heavy-atom mask by aatype.
    return residue_constants.STANDARD_ATOM_MASK[prot.aatype]
402
+
403
+
404
def from_prediction(
    features: FeatureDict,
    result: ModelOutput,
    b_factors: Optional[np.ndarray] = None,
    chain_index: Optional[np.ndarray] = None,
    remark: Optional[str] = None,
    parents: Optional[Sequence[str]] = None,
    parents_chain_index: Optional[Sequence[int]] = None
) -> Protein:
    """Builds a `Protein` from model inputs and outputs.

    Args:
        features: Model input dict; "aatype" and "residue_index" are used.
        result: Model output dict; "final_atom_positions" and
            "final_atom_mask" are used.
        b_factors: Optional per-atom B-factors; defaults to all zeros.
        chain_index: Optional chain indices for multi-chain predictions.
        remark: Optional REMARK string for the prediction.
        parents: Optional list of template names.
        parents_chain_index: Optional chain index per template name.

    Returns:
        A `Protein` instance.
    """
    final_mask = result["final_atom_mask"]
    if b_factors is None:
        # One zero B-factor per atom slot.
        b_factors = np.zeros_like(final_mask)

    return Protein(
        aatype=features["aatype"],
        atom_positions=result["final_atom_positions"],
        atom_mask=final_mask,
        # PDB residue numbering is 1-based.
        residue_index=features["residue_index"] + 1,
        b_factors=b_factors,
        chain_index=chain_index,
        remark=remark,
        parents=parents,
        parents_chain_index=parents_chain_index,
    )
openfold/np/relax/__init__.py ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
# Dynamically discover, import, and re-export every sibling module of this
# package so `from openfold.np.relax import amber_minimize` etc. all work.
import os
import glob
import importlib as importlib

# Absolute paths of all .py files that live next to this __init__.py.
_files = glob.glob(os.path.join(os.path.dirname(__file__), "*.py"))
__all__ = [
    os.path.basename(f)[:-3]  # strip the ".py" suffix to get the module name
    for f in _files
    if os.path.isfile(f) and not f.endswith("__init__.py")
]
# Import each submodule relative to this package and bind it here.
_modules = [(m, importlib.import_module("." + m, __name__)) for m in __all__]
for _m in _modules:
    globals()[_m[0]] = _m[1]

# Avoid needlessly cluttering the global namespace
del _files, _m, _modules
openfold/np/relax/amber_minimize.py ADDED
@@ -0,0 +1,612 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ """Restrained Amber Minimization of a structure."""
17
+
18
+ import io
19
+ import time
20
+ from typing import Collection, Optional, Sequence
21
+
22
+ from absl import logging
23
+ from openfold.np import (
24
+ protein,
25
+ residue_constants,
26
+ )
27
+ import openfold.utils.loss as loss
28
+ from openfold.np.relax import cleanup, utils
29
+ import ml_collections
30
+ import numpy as np
31
+ import openmm
32
+ from openmm import unit
33
+ from openmm import app as openmm_app
34
+ from openmm.app.internal.pdbstructure import PdbStructure
35
+
36
+ ENERGY = unit.kilocalories_per_mole
37
+ LENGTH = unit.angstroms
38
+
39
+
40
def will_restrain(atom: openmm_app.Atom, rset: str) -> bool:
    """Returns True if the atom will be restrained by the given restraint set.

    Args:
        atom: The OpenMM atom under consideration.
        rset: Restraint-set name: "non_hydrogen" or "c_alpha".

    Raises:
        ValueError: If `rset` is not a recognized restraint set.
    """
    if rset == "non_hydrogen":
        return atom.element.name != "hydrogen"
    elif rset == "c_alpha":
        return atom.name == "CA"
    # BUG FIX: previously an unknown rset fell through and returned None,
    # silently restraining nothing. Fail loudly instead.
    raise ValueError(f"Unknown restraint set: {rset}")
47
+
48
+
49
def _add_restraints(
    system: openmm.System,
    reference_pdb: openmm_app.PDBFile,
    stiffness: unit.Unit,
    rset: str,
    exclude_residues: Sequence[int],
):
    """Adds a harmonic potential that restrains the system to a structure.

    Args:
        system: OpenMM system the restraint force is added to (mutated).
        reference_pdb: Structure supplying the reference atom positions.
        stiffness: Spring constant `k` of the harmonic restraint.
        rset: Restraint set, "non_hydrogen" or "c_alpha".
        exclude_residues: Zero-indexed residues exempt from restraints.
    """
    assert rset in ["non_hydrogen", "c_alpha"]

    # Harmonic well centered on each restrained atom's reference position.
    force = openmm.CustomExternalForce(
        "0.5 * k * ((x-x0)^2 + (y-y0)^2 + (z-z0)^2)"
    )
    force.addGlobalParameter("k", stiffness)
    for p in ["x0", "y0", "z0"]:
        force.addPerParticleParameter(p)

    for i, atom in enumerate(reference_pdb.topology.atoms()):
        if atom.residue.index in exclude_residues:
            continue
        if will_restrain(atom, rset):
            # Per-particle parameters are the (x0, y0, z0) reference point.
            force.addParticle(i, reference_pdb.positions[i])
    logging.info(
        "Restraining %d / %d particles.",
        force.getNumParticles(),
        system.getNumParticles(),
    )
    system.addForce(force)
77
+
78
+
79
def _openmm_minimize(
    pdb_str: str,
    max_iterations: int,
    tolerance: unit.Unit,
    stiffness: unit.Unit,
    restraint_set: str,
    exclude_residues: Sequence[int],
    use_gpu: bool,
):
    """Minimize energy via openmm.

    Args:
        pdb_str: PDB-format structure to minimize.
        max_iterations: Max L-BFGS iterations; 0 means no limit.
        tolerance: Energy convergence tolerance.
        stiffness: Restraint spring constant; restraints are only added
            when stiffness > 0.
        restraint_set: Which atoms to restrain ("non_hydrogen"/"c_alpha").
        exclude_residues: Zero-indexed residues exempt from restraints.
        use_gpu: Use the CUDA platform instead of CPU.

    Returns:
        Dict with initial/final potential energies ("einit"/"efinal"),
        initial/final positions ("posinit"/"pos"), and the minimized
        structure as PDB text ("min_pdb").
    """
    pdb_file = io.StringIO(pdb_str)
    pdb = openmm_app.PDBFile(pdb_file)

    force_field = openmm_app.ForceField("amber99sb.xml")
    constraints = openmm_app.HBonds
    system = force_field.createSystem(pdb.topology, constraints=constraints)
    if stiffness > 0 * ENERGY / (LENGTH ** 2):
        _add_restraints(system, pdb, stiffness, restraint_set, exclude_residues)

    # Integrator parameters are irrelevant here: only minimization is run,
    # no dynamics.
    integrator = openmm.LangevinIntegrator(0, 0.01, 0.0)
    platform = openmm.Platform.getPlatformByName("CUDA" if use_gpu else "CPU")
    simulation = openmm_app.Simulation(
        pdb.topology, system, integrator, platform
    )
    simulation.context.setPositions(pdb.positions)

    ret = {}
    # Snapshot the state before minimization for reporting.
    state = simulation.context.getState(getEnergy=True, getPositions=True)
    ret["einit"] = state.getPotentialEnergy().value_in_unit(ENERGY)
    ret["posinit"] = state.getPositions(asNumpy=True).value_in_unit(LENGTH)
    simulation.minimizeEnergy(maxIterations=max_iterations, tolerance=tolerance)
    state = simulation.context.getState(getEnergy=True, getPositions=True)
    ret["efinal"] = state.getPotentialEnergy().value_in_unit(ENERGY)
    ret["pos"] = state.getPositions(asNumpy=True).value_in_unit(LENGTH)
    ret["min_pdb"] = _get_pdb_string(simulation.topology, state.getPositions())
    return ret
116
+
117
+
118
def _get_pdb_string(topology: openmm_app.Topology, positions: unit.Quantity):
    """Serialize an OpenMM topology plus positions to PDB-format text."""
    buffer = io.StringIO()
    try:
        openmm_app.PDBFile.writeFile(topology, positions, buffer)
        return buffer.getvalue()
    finally:
        # Mirror the context-manager cleanup of the original.
        buffer.close()
123
+
124
+
125
def _check_cleaned_atoms(pdb_cleaned_string: str, pdb_ref_string: str):
    """Checks that no atom positions have been altered by cleaning.

    Args:
        pdb_cleaned_string: PDB text after cleanup (may contain added atoms).
        pdb_ref_string: Original PDB text, the ground truth positions.

    Raises:
        ValueError: If any atom present in both structures has moved.
    """
    cleaned = openmm_app.PDBFile(io.StringIO(pdb_cleaned_string))
    reference = openmm_app.PDBFile(io.StringIO(pdb_ref_string))

    cl_xyz = np.array(cleaned.getPositions().value_in_unit(LENGTH))
    ref_xyz = np.array(reference.getPositions().value_in_unit(LENGTH))

    # Residues are assumed to correspond one-to-one, in order.
    for ref_res, cl_res in zip(
        reference.topology.residues(), cleaned.topology.residues()
    ):
        assert ref_res.name == cl_res.name
        # Match atoms by name; atoms that cleanup added have no reference
        # counterpart and are skipped implicitly.
        for rat in ref_res.atoms():
            for cat in cl_res.atoms():
                if cat.name == rat.name:
                    if not np.array_equal(
                        cl_xyz[cat.index], ref_xyz[rat.index]
                    ):
                        raise ValueError(
                            f"Coordinates of cleaned atom {cat} do not match "
                            f"coordinates of reference atom {rat}."
                        )
147
+
148
+
149
def _check_residues_are_well_defined(prot: protein.Protein):
    """Checks that all residues contain non-empty atom sets."""
    # A residue with a zero row-sum in the atom mask has no atoms at all.
    atoms_per_residue = prot.atom_mask.sum(axis=-1)
    if np.any(atoms_per_residue == 0):
        raise ValueError(
            "Amber minimization can only be performed on proteins with"
            " well-defined residues. This protein contains at least"
            " one residue with no atoms."
        )
157
+
158
+
159
def _check_atom_mask_is_ideal(prot):
    """Sanity-check the atom mask is ideal, up to a possible OXT.

    Raises (via the utils assertion) if `prot.atom_mask` differs from the
    heavy-atom mask implied by the sequence, except at terminal atoms.
    """
    atom_mask = prot.atom_mask
    # Mask of heavy atoms that *should* be present for this sequence.
    ideal_atom_mask = protein.ideal_atom_mask(prot)
    utils.assert_equal_nonterminal_atom_types(atom_mask, ideal_atom_mask)
164
+
165
+
166
def clean_protein(prot: protein.Protein, checks: bool = True):
    """Adds missing atoms to Protein instance.

    Args:
      prot: A `protein.Protein` instance.
      checks: A `bool` specifying whether to add additional checks to the cleaning
        process.

    Returns:
      pdb_string: A string of the cleaned protein.
    """
    _check_atom_mask_is_ideal(prot)

    # Clean pdb.
    prot_pdb_string = protein.to_pdb(prot)
    pdb_file = io.StringIO(prot_pdb_string)
    # Populated in place by the cleanup helpers with details of every change.
    alterations_info = {}
    fixed_pdb = cleanup.fix_pdb(pdb_file, alterations_info)
    fixed_pdb_file = io.StringIO(fixed_pdb)
    pdb_structure = PdbStructure(fixed_pdb_file)
    cleanup.clean_structure(pdb_structure, alterations_info)

    logging.info("alterations info: %s", alterations_info)

    # Write pdb file of cleaned structure.
    as_file = openmm_app.PDBFile(pdb_structure)
    pdb_string = _get_pdb_string(as_file.getTopology(), as_file.getPositions())
    if checks:
        # Verify cleanup did not move any pre-existing atom.
        _check_cleaned_atoms(pdb_string, prot_pdb_string)
    return pdb_string
196
+
197
+
198
def make_atom14_positions(prot):
    """Constructs denser atom positions (14 dimensions instead of 37).

    Args:
        prot: Feature dict with at least "aatype", "all_atom_positions" and
            "all_atom_mask" in atom37 layout. Mutated in place.

    Returns:
        The same dict, extended with atom14 ground-truth positions/masks,
        the atom14<->atom37 index maps, and alternative ("renamed") ground
        truth for residues with ambiguous atom naming.
    """
    restype_atom14_to_atom37 = []  # mapping (restype, atom14) --> atom37
    restype_atom37_to_atom14 = []  # mapping (restype, atom37) --> atom14
    restype_atom14_mask = []

    for rt in residue_constants.restypes:
        atom_names = residue_constants.restype_name_to_atom14_names[
            residue_constants.restype_1to3[rt]
        ]

        # Empty atom-name slots map to index 0 (masked out below).
        restype_atom14_to_atom37.append(
            [
                (residue_constants.atom_order[name] if name else 0)
                for name in atom_names
            ]
        )

        atom_name_to_idx14 = {name: i for i, name in enumerate(atom_names)}
        restype_atom37_to_atom14.append(
            [
                (atom_name_to_idx14[name] if name in atom_name_to_idx14 else 0)
                for name in residue_constants.atom_types
            ]
        )

        restype_atom14_mask.append(
            [(1.0 if name else 0.0) for name in atom_names]
        )

    # Add dummy mapping for restype 'UNK'.
    restype_atom14_to_atom37.append([0] * 14)
    restype_atom37_to_atom14.append([0] * 37)
    restype_atom14_mask.append([0.0] * 14)

    restype_atom14_to_atom37 = np.array(
        restype_atom14_to_atom37, dtype=int
    )
    restype_atom37_to_atom14 = np.array(
        restype_atom37_to_atom14, dtype=int
    )
    restype_atom14_mask = np.array(restype_atom14_mask, dtype=np.float32)

    # Create the mapping for (residx, atom14) --> atom37, i.e. an array
    # with shape (num_res, 14) containing the atom37 indices for this protein.
    residx_atom14_to_atom37 = restype_atom14_to_atom37[prot["aatype"]]
    residx_atom14_mask = restype_atom14_mask[prot["aatype"]]

    # Create a mask for known ground truth positions.
    residx_atom14_gt_mask = residx_atom14_mask * np.take_along_axis(
        prot["all_atom_mask"], residx_atom14_to_atom37, axis=1
    ).astype(np.float32)

    # Gather the ground truth positions.
    residx_atom14_gt_positions = residx_atom14_gt_mask[:, :, None] * (
        np.take_along_axis(
            prot["all_atom_positions"],
            residx_atom14_to_atom37[..., None],
            axis=1,
        )
    )

    prot["atom14_atom_exists"] = residx_atom14_mask
    prot["atom14_gt_exists"] = residx_atom14_gt_mask
    prot["atom14_gt_positions"] = residx_atom14_gt_positions

    prot["residx_atom14_to_atom37"] = residx_atom14_to_atom37.astype(np.int64)

    # Create the gather indices for mapping back.
    residx_atom37_to_atom14 = restype_atom37_to_atom14[prot["aatype"]]
    prot["residx_atom37_to_atom14"] = residx_atom37_to_atom14.astype(np.int64)

    # Create the corresponding mask.
    restype_atom37_mask = np.zeros([21, 37], dtype=np.float32)
    for restype, restype_letter in enumerate(residue_constants.restypes):
        restype_name = residue_constants.restype_1to3[restype_letter]
        atom_names = residue_constants.residue_atoms[restype_name]
        for atom_name in atom_names:
            atom_type = residue_constants.atom_order[atom_name]
            restype_atom37_mask[restype, atom_type] = 1

    residx_atom37_mask = restype_atom37_mask[prot["aatype"]]
    prot["atom37_atom_exists"] = residx_atom37_mask

    # As the atom naming is ambiguous for 7 of the 20 amino acids, provide
    # alternative ground truth coordinates where the naming is swapped
    restype_3 = [
        residue_constants.restype_1to3[res]
        for res in residue_constants.restypes
    ]
    restype_3 += ["UNK"]

    # Matrices for renaming ambiguous atoms.
    all_matrices = {res: np.eye(14, dtype=np.float32) for res in restype_3}
    for resname, swap in residue_constants.residue_atom_renaming_swaps.items():
        correspondences = np.arange(14)
        for source_atom_swap, target_atom_swap in swap.items():
            source_index = residue_constants.restype_name_to_atom14_names[
                resname
            ].index(source_atom_swap)
            target_index = residue_constants.restype_name_to_atom14_names[
                resname
            ].index(target_atom_swap)
            correspondences[source_index] = target_index
            correspondences[target_index] = source_index
        # Build a permutation matrix realizing the swap.
        renaming_matrix = np.zeros((14, 14), dtype=np.float32)
        for index, correspondence in enumerate(correspondences):
            renaming_matrix[index, correspondence] = 1.0
        all_matrices[resname] = renaming_matrix.astype(np.float32)
    renaming_matrices = np.stack(
        [all_matrices[restype] for restype in restype_3]
    )

    # Pick the transformation matrices for the given residue sequence
    # shape (num_res, 14, 14).
    renaming_transform = renaming_matrices[prot["aatype"]]

    # Apply it to the ground truth positions. shape (num_res, 14, 3).
    alternative_gt_positions = np.einsum(
        "rac,rab->rbc", residx_atom14_gt_positions, renaming_transform
    )
    prot["atom14_alt_gt_positions"] = alternative_gt_positions

    # Create the mask for the alternative ground truth (differs from the
    # ground truth mask, if only one of the atoms in an ambiguous pair has a
    # ground truth position).
    alternative_gt_mask = np.einsum(
        "ra,rab->rb", residx_atom14_gt_mask, renaming_transform
    )

    prot["atom14_alt_gt_exists"] = alternative_gt_mask

    # Create an ambiguous atoms mask. shape: (21, 14).
    restype_atom14_is_ambiguous = np.zeros((21, 14), dtype=np.float32)
    for resname, swap in residue_constants.residue_atom_renaming_swaps.items():
        for atom_name1, atom_name2 in swap.items():
            restype = residue_constants.restype_order[
                residue_constants.restype_3to1[resname]
            ]
            atom_idx1 = residue_constants.restype_name_to_atom14_names[
                resname
            ].index(atom_name1)
            atom_idx2 = residue_constants.restype_name_to_atom14_names[
                resname
            ].index(atom_name2)
            restype_atom14_is_ambiguous[restype, atom_idx1] = 1
            restype_atom14_is_ambiguous[restype, atom_idx2] = 1

    # From this create an ambiguous_mask for the given sequence.
    prot["atom14_atom_is_ambiguous"] = restype_atom14_is_ambiguous[
        prot["aatype"]
    ]

    return prot
352
+
353
+
354
def find_violations(prot_np: protein.Protein):
    """Analyzes a protein and returns structural violation information.

    Args:
      prot_np: A protein.

    Returns:
      violations: A `dict` of structure components with structural violations.
      violation_metrics: A `dict` of violation metrics.
    """
    # Assemble the feature dict expected by the loss utilities.
    batch = {
        "aatype": prot_np.aatype,
        "all_atom_positions": prot_np.atom_positions.astype(np.float32),
        "all_atom_mask": prot_np.atom_mask.astype(np.float32),
        "residue_index": prot_np.residue_index,
    }

    batch["seq_mask"] = np.ones_like(batch["aatype"], np.float32)
    # Adds atom14 positions/masks in place.
    batch = make_atom14_positions(batch)

    violations = loss.find_structural_violations_np(
        batch=batch,
        atom14_pred_positions=batch["atom14_gt_positions"],
        config=ml_collections.ConfigDict(
            {
                "violation_tolerance_factor": 12,  # Taken from model config.
                "clash_overlap_tolerance": 1.5,  # Taken from model config.
            }
        ),
    )
    violation_metrics = loss.compute_violation_metrics_np(
        batch=batch,
        atom14_pred_positions=batch["atom14_gt_positions"],
        violations=violations,
    )

    return violations, violation_metrics
391
+
392
+
393
def get_violation_metrics(prot: protein.Protein):
    """Computes violation and alignment metrics."""
    violations, metrics = find_violations(prot)
    # Indices of residues flagged by any structural-violation check.
    flagged = np.flatnonzero(
        violations["total_per_residue_violations_mask"]
    )
    metrics["residue_violations"] = flagged
    metrics["num_residue_violations"] = len(flagged)
    metrics["structural_violations"] = violations
    return metrics
404
+
405
+
406
def _run_one_iteration(
    *,
    pdb_string: str,
    max_iterations: int,
    tolerance: float,
    stiffness: float,
    restraint_set: str,
    max_attempts: int,
    exclude_residues: Optional[Collection[int]] = None,
    use_gpu: bool,
):
    """Runs the minimization pipeline.

    Args:
      pdb_string: A pdb string.
      max_iterations: An `int` specifying the maximum number of L-BFGS iterations.
        A value of 0 specifies no limit.
      tolerance: kcal/mol, the energy tolerance of L-BFGS.
      stiffness: kcal/mol A**2, spring constant of heavy atom restraining
        potential.
      restraint_set: The set of atoms to restrain.
      max_attempts: The maximum number of minimization attempts.
      exclude_residues: An optional list of zero-indexed residues to exclude from
        restraints.
      use_gpu: Whether to run relaxation on GPU
    Returns:
      A `dict` of minimization info.

    Raises:
      ValueError: If minimization fails on every attempt; the last OpenMM
        error is chained as the cause.
    """
    exclude_residues = exclude_residues or []

    # Assign physical dimensions.
    tolerance = tolerance * ENERGY
    stiffness = stiffness * ENERGY / (LENGTH ** 2)

    start = time.perf_counter()
    minimized = False
    attempts = 0
    last_exception = None
    while not minimized and attempts < max_attempts:
        attempts += 1
        try:
            logging.info(
                "Minimizing protein, attempt %d of %d.", attempts, max_attempts
            )
            ret = _openmm_minimize(
                pdb_string,
                max_iterations=max_iterations,
                tolerance=tolerance,
                stiffness=stiffness,
                restraint_set=restraint_set,
                exclude_residues=exclude_residues,
                use_gpu=use_gpu,
            )
            minimized = True
        except Exception as e:  # pylint: disable=broad-except
            # IDIOM FIX: report failures through logging only (the original
            # also print()-ed to stdout) and keep the exception so the final
            # error can be chained to its cause.
            last_exception = e
            logging.info(e)
    if not minimized:
        raise ValueError(
            f"Minimization failed after {max_attempts} attempts."
        ) from last_exception
    ret["opt_time"] = time.perf_counter() - start
    ret["min_attempts"] = attempts
    return ret
467
+
468
+
469
def run_pipeline(
    prot: protein.Protein,
    stiffness: float,
    use_gpu: bool,
    max_outer_iterations: int = 1,
    place_hydrogens_every_iteration: bool = True,
    max_iterations: int = 0,
    tolerance: float = 2.39,
    restraint_set: str = "non_hydrogen",
    max_attempts: int = 100,
    checks: bool = True,
    exclude_residues: Optional[Sequence[int]] = None,
):
    """Run iterative amber relax.

    Successive relax iterations are performed until all violations have been
    resolved. Each iteration involves a restrained Amber minimization, with
    restraint exclusions determined by violation-participating residues.

    Args:
      prot: A protein to be relaxed.
      stiffness: kcal/mol A**2, the restraint stiffness.
      use_gpu: Whether to run on GPU
      max_outer_iterations: The maximum number of iterative minimization.
      place_hydrogens_every_iteration: Whether hydrogens are re-initialized
          prior to every minimization.
      max_iterations: An `int` specifying the maximum number of L-BFGS steps
          per relax iteration. A value of 0 specifies no limit.
      tolerance: kcal/mol, the energy tolerance of L-BFGS.
          The default value is the OpenMM default.
      restraint_set: The set of atoms to restrain.
      max_attempts: The maximum number of minimization attempts per iteration.
      checks: Whether to perform cleaning checks.
      exclude_residues: An optional list of zero-indexed residues to exclude from
          restraints.

    Returns:
      out: A dictionary of output values.
    """

    # `protein.to_pdb` will strip any poorly-defined residues so we need to
    # perform this check before `clean_protein`.
    _check_residues_are_well_defined(prot)
    pdb_string = clean_protein(prot, checks=checks)

    exclude_residues = exclude_residues or []
    exclude_residues = set(exclude_residues)
    # Sentinel so the loop always runs at least once.
    violations = np.inf
    iteration = 0

    while violations > 0 and iteration < max_outer_iterations:
        ret = _run_one_iteration(
            pdb_string=pdb_string,
            exclude_residues=exclude_residues,
            max_iterations=max_iterations,
            tolerance=tolerance,
            stiffness=stiffness,
            restraint_set=restraint_set,
            max_attempts=max_attempts,
            use_gpu=use_gpu,
        )
        # Re-parse the minimized structure for the next round.
        prot = protein.from_pdb_string(ret["min_pdb"])
        if place_hydrogens_every_iteration:
            pdb_string = clean_protein(prot, checks=True)
        else:
            pdb_string = ret["min_pdb"]
        ret.update(get_violation_metrics(prot))
        ret.update(
            {
                "num_exclusions": len(exclude_residues),
                "iteration": iteration,
            }
        )
        violations = ret["violations_per_residue"]
        # Residues that still violate are freed from restraints next round.
        exclude_residues = exclude_residues.union(ret["residue_violations"])

        logging.info(
            "Iteration completed: Einit %.2f Efinal %.2f Time %.2f s "
            "num residue violations %d num residue exclusions %d ",
            ret["einit"],
            ret["efinal"],
            ret["opt_time"],
            ret["num_residue_violations"],
            ret["num_exclusions"],
        )
        iteration += 1
    return ret
556
+
557
+
558
def get_initial_energies(
    pdb_strs: Sequence[str],
    stiffness: float = 0.0,
    restraint_set: str = "non_hydrogen",
    exclude_residues: Optional[Sequence[int]] = None,
):
    """Returns initial potential energies for a sequence of PDBs.

    Assumes the input PDBs are ready for minimization, and all have the same
    topology.
    Allows time to be saved by not pdbfixing / rebuilding the system.

    Args:
      pdb_strs: List of PDB strings.
      stiffness: kcal/mol A**2, spring constant of heavy atom restraining
        potential.
      restraint_set: Which atom types to restrain.
      exclude_residues: An optional list of zero-indexed residues to exclude from
        restraints.

    Returns:
      A list of initial energies in the same order as pdb_strs.
    """
    exclude_residues = exclude_residues or []

    openmm_pdbs = [
        openmm_app.PDBFile(PdbStructure(io.StringIO(p))) for p in pdb_strs
    ]
    # Build system/simulation once from the first structure; only positions
    # change per PDB (shared topology is assumed, see docstring).
    force_field = openmm_app.ForceField("amber99sb.xml")
    system = force_field.createSystem(
        openmm_pdbs[0].topology, constraints=openmm_app.HBonds
    )
    stiffness = stiffness * ENERGY / (LENGTH ** 2)
    if stiffness > 0 * ENERGY / (LENGTH ** 2):
        _add_restraints(
            system, openmm_pdbs[0], stiffness, restraint_set, exclude_residues
        )
    simulation = openmm_app.Simulation(
        openmm_pdbs[0].topology,
        system,
        openmm.LangevinIntegrator(0, 0.01, 0.0),
        openmm.Platform.getPlatformByName("CPU"),
    )
    energies = []
    for pdb in openmm_pdbs:
        try:
            simulation.context.setPositions(pdb.positions)
            state = simulation.context.getState(getEnergy=True)
            energies.append(state.getPotentialEnergy().value_in_unit(ENERGY))
        except Exception as e:  # pylint: disable=broad-except
            # Best-effort: a failed structure gets a huge sentinel energy
            # instead of aborting the whole batch.
            logging.error(
                "Error getting initial energy, returning large value %s", e
            )
            energies.append(unit.Quantity(1e20, ENERGY))
    return energies
openfold/np/relax/cleanup.py ADDED
@@ -0,0 +1,131 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 DeepMind Technologies Limited
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ """Cleans up a PDB file using pdbfixer in preparation for OpenMM simulations.
16
+
17
+ fix_pdb uses a third-party tool. We also support fixing some additional edge
18
+ cases like removing chains of length one (see clean_structure).
19
+ """
20
+ import io
21
+
22
+ import pdbfixer
23
+ from simtk.openmm import app
24
+ from simtk.openmm.app import element
25
+
26
+
27
def fix_pdb(pdbfile, alterations_info):
    """Run pdbfixer over a PDB file handle; return the repaired PDB string.

    The fixer pipeline, in order:
      1) replaces nonstandard residues,
      2) strips heterogens (non-protein residues) including water,
      3) adds missing residues and missing atoms within existing residues,
      4) adds hydrogens assuming pH=7.0,
      5) writes with keepIds=True, so the fixer must keep the existing chain
         and residue identifiers (this will fail for some wider-PDB files
         that have invalid IDs).

    Args:
      pdbfile: Input PDB file handle.
      alterations_info: A dict that will store details of changes made.

    Returns:
      A PDB string representing the fixed structure.
    """
    fixer = pdbfixer.PDBFixer(pdbfile=pdbfile)
    # Record, then normalize, nonstandard residues.
    fixer.findNonstandardResidues()
    alterations_info["nonstandard_residues"] = fixer.nonstandardResidues
    fixer.replaceNonstandardResidues()
    _remove_heterogens(fixer, alterations_info, keep_water=False)
    # Record what is missing, then rebuild it (seeded for determinism).
    fixer.findMissingResidues()
    alterations_info["missing_residues"] = fixer.missingResidues
    fixer.findMissingAtoms()
    alterations_info["missing_heavy_atoms"] = fixer.missingAtoms
    alterations_info["missing_terminals"] = fixer.missingTerminals
    fixer.addMissingAtoms(seed=0)
    fixer.addMissingHydrogens()
    buffer = io.StringIO()
    app.PDBFile.writeFile(fixer.topology, fixer.positions, buffer, keepIds=True)
    return buffer.getvalue()
62
+
63
+
64
def clean_structure(pdb_structure, alterations_info):
    """Apply structure-level fixes that pdbfixer does not handle.

    Currently this de-selenates unmarked selenomethionines and drops
    single-residue chains, two edge cases that break downstream force-field
    setup.

    Args:
      pdb_structure: An OpenMM structure to modify and fix (in place).
      alterations_info: A dict that will store details of changes made.
    """
    _replace_met_se(pdb_structure, alterations_info)
    _remove_chains_of_length_one(pdb_structure, alterations_info)
73
+
74
+
75
+ def _remove_heterogens(fixer, alterations_info, keep_water):
76
+ """Removes the residues that Pdbfixer considers to be heterogens.
77
+
78
+ Args:
79
+ fixer: A Pdbfixer instance.
80
+ alterations_info: A dict that will store details of changes made.
81
+ keep_water: If True, water (HOH) is not considered to be a heterogen.
82
+ """
83
+ initial_resnames = set()
84
+ for chain in fixer.topology.chains():
85
+ for residue in chain.residues():
86
+ initial_resnames.add(residue.name)
87
+ fixer.removeHeterogens(keepWater=keep_water)
88
+ final_resnames = set()
89
+ for chain in fixer.topology.chains():
90
+ for residue in chain.residues():
91
+ final_resnames.add(residue.name)
92
+ alterations_info["removed_heterogens"] = initial_resnames.difference(
93
+ final_resnames
94
+ )
95
+
96
+
97
+ def _replace_met_se(pdb_structure, alterations_info):
98
+ """Replace the Se in any MET residues that were not marked as modified."""
99
+ modified_met_residues = []
100
+ for res in pdb_structure.iter_residues():
101
+ name = res.get_name_with_spaces().strip()
102
+ if name == "MET":
103
+ s_atom = res.get_atom("SD")
104
+ if s_atom.element_symbol == "Se":
105
+ s_atom.element_symbol = "S"
106
+ s_atom.element = element.get_by_symbol("S")
107
+ modified_met_residues.append(s_atom.residue_number)
108
+ alterations_info["Se_in_MET"] = modified_met_residues
109
+
110
+
111
+ def _remove_chains_of_length_one(pdb_structure, alterations_info):
112
+ """Removes chains that correspond to a single amino acid.
113
+
114
+ A single amino acid in a chain is both N and C terminus. There is no force
115
+ template for this case.
116
+
117
+ Args:
118
+ pdb_structure: An OpenMM pdb_structure to modify and fix.
119
+ alterations_info: A dict that will store details of changes made.
120
+ """
121
+ removed_chains = {}
122
+ for model in pdb_structure.iter_models():
123
+ valid_chains = [c for c in model.iter_chains() if len(c) > 1]
124
+ invalid_chain_ids = [
125
+ c.chain_id for c in model.iter_chains() if len(c) <= 1
126
+ ]
127
+ model.chains = valid_chains
128
+ for chain_id in invalid_chain_ids:
129
+ model.chains_by_id.pop(chain_id)
130
+ removed_chains[model.number] = invalid_chain_ids
131
+ alterations_info["removed_chains"] = removed_chains
openfold/np/relax/relax.py ADDED
@@ -0,0 +1,90 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ """Amber relaxation."""
17
+ from typing import Any, Dict, Sequence, Tuple
18
+ from openfold.np import protein
19
+ from openfold.np.relax import amber_minimize, utils
20
+ import numpy as np
21
+
22
+
23
class AmberRelaxation(object):
    """Runs AMBER relaxation on a predicted structure."""

    def __init__(
        self,
        *,
        max_iterations: int,
        tolerance: float,
        stiffness: float,
        exclude_residues: Sequence[int],
        max_outer_iterations: int,
        use_gpu: bool,
    ):
        """Initialize Amber Relaxer.

        Args:
          max_iterations: Maximum number of L-BFGS iterations. 0 means no max.
          tolerance: kcal/mol, the energy tolerance of L-BFGS.
          stiffness: kcal/mol A**2, spring constant of the heavy-atom
            restraining potential.
          exclude_residues: Residues to exclude from per-atom restraining.
            Zero-indexed.
          max_outer_iterations: Maximum number of violation-informed relax
            iterations. A value of 1 runs the non-iterative procedure used in
            CASP14. Use 20 so that >95% of the bad cases are relaxed. Relax
            finishes as soon as there are no violations, hence in most cases
            this causes no slowdown; in the worst case 20 outer iterations
            are run.
          use_gpu: Whether to run on GPU.
        """
        self._max_iterations = max_iterations
        self._tolerance = tolerance
        self._stiffness = stiffness
        self._exclude_residues = exclude_residues
        self._max_outer_iterations = max_outer_iterations
        self._use_gpu = use_gpu

    def process(
        self, *, prot: protein.Protein
    ) -> Tuple[str, Dict[str, Any], np.ndarray]:
        """Runs Amber relax on a prediction, adds hydrogens, returns PDB string."""
        out = amber_minimize.run_pipeline(
            prot=prot,
            max_iterations=self._max_iterations,
            tolerance=self._tolerance,
            stiffness=self._stiffness,
            exclude_residues=self._exclude_residues,
            max_outer_iterations=self._max_outer_iterations,
            use_gpu=self._use_gpu,
        )
        minimized = out["pos"]
        initial = out["posinit"]
        # RMSD between pre- and post-minimization coordinates, for debugging.
        rmsd = np.sqrt(((initial - minimized) ** 2).sum() / initial.shape[0])
        debug_data = {
            "initial_energy": out["einit"],
            "final_energy": out["efinal"],
            "attempts": out["min_attempts"],
            "rmsd": rmsd,
        }
        # Rebuild a clean PDB, then splice in the minimized coordinates and
        # the original per-residue B-factors.
        pdb_str = amber_minimize.clean_protein(prot)
        min_pdb = utils.overwrite_pdb_coordinates(pdb_str, minimized)
        min_pdb = utils.overwrite_b_factors(min_pdb, prot.b_factors)
        # Sanity check: relaxation must not add/remove non-terminal atoms.
        utils.assert_equal_nonterminal_atom_types(
            protein.from_pdb_string(min_pdb).atom_mask, prot.atom_mask
        )
        violations = out["structural_violations"][
            "total_per_residue_violations_mask"
        ]
        return min_pdb, debug_data, violations
openfold/np/relax/utils.py ADDED
@@ -0,0 +1,88 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ """Utils for minimization."""
17
+ import io
18
+ from openfold.np import residue_constants
19
+ from Bio import PDB
20
+ import numpy as np
21
+ # simtk.openmm is not supported anymore. Remove simtk.
22
+ # https://github.com/openmm/openmm/releases
23
+ from openmm import app as openmm_app
24
+ from openmm.app.internal.pdbstructure import PdbStructure
25
+
26
+
27
def overwrite_pdb_coordinates(pdb_str: str, pos) -> str:
    """Return a PDB string with the topology of pdb_str but coordinates pos.

    Args:
      pdb_str: Source PDB string; only its topology is reused.
      pos: Replacement atom positions, in the order OpenMM expects.
    """
    structure = PdbStructure(io.StringIO(pdb_str))
    topology = openmm_app.PDBFile(structure).getTopology()
    buffer = io.StringIO()
    openmm_app.PDBFile.writeFile(topology, pos, buffer)
    return buffer.getvalue()
34
+
35
+
36
def overwrite_b_factors(pdb_str: str, bfactors: np.ndarray) -> str:
    """Overwrites the B-factors in pdb_str with contents of bfactors array.

    Args:
      pdb_str: An input PDB string.
      bfactors: A numpy array whose last dimension is atom_type_num (37),
        indexed as bfactors[residue, atom]. We assume the B-factors are per
        residue; only the CA column is read and applied to every atom of the
        residue. (NOTE(review): the upstream docstring claims shape
        [1, n_residues, 37], but the indexing below is 2-D — confirm callers
        pass [n_residues, 37].)

    Returns:
      A new PDB string with the B-factors replaced.

    Raises:
      ValueError: If the last bfactors dimension is wrong, or the structure
        has more residues than bfactors has rows.
    """
    if bfactors.shape[-1] != residue_constants.atom_type_num:
        raise ValueError(
            f"Invalid final dimension size for bfactors: {bfactors.shape[-1]}."
        )

    parser = PDB.PDBParser(QUIET=True)
    handle = io.StringIO(pdb_str)
    structure = parser.get_structure("", handle)

    curr_resid = ("", "", "")
    idx = -1
    for atom in structure.get_atoms():
        atom_resid = atom.parent.get_id()
        if atom_resid != curr_resid:
            idx += 1
            if idx >= bfactors.shape[0]:
                # BUG FIX: the original used "{shape}"/"{idx}" placeholders in
                # a plain (non-f) string, so they were never substituted.
                raise ValueError(
                    "Index into bfactors exceeds number of residues. "
                    f"B-factors shape: {bfactors.shape}, idx: {idx}."
                )
            curr_resid = atom_resid
        # Every atom of the residue gets the residue's CA B-factor.
        atom.bfactor = bfactors[idx, residue_constants.atom_order["CA"]]

    new_pdb = io.StringIO()
    pdb_io = PDB.PDBIO()
    pdb_io.set_structure(structure)
    pdb_io.save(new_pdb)
    return new_pdb.getvalue()
76
+
77
+
78
def assert_equal_nonterminal_atom_types(
    atom_mask: np.ndarray, ref_atom_mask: np.ndarray
):
    """Checks that pre- and post-minimized proteins have same atom set.

    Terminal OXT atoms, which minimization may add, are ignored.

    Args:
      atom_mask: Post-minimization atom mask, last dimension indexed by
        atom type.
      ref_atom_mask: Pre-minimization reference mask of the same shape.

    Raises:
      AssertionError: If the masks differ anywhere outside the OXT column.
    """
    # Ignore any terminal OXT atoms which may have been added by minimization.
    oxt = residue_constants.atom_order["OXT"]
    # BUG FIX: the deprecated alias np.bool was removed in NumPy 1.24 and
    # raised AttributeError; the builtin bool is the documented replacement.
    no_oxt_mask = np.ones(shape=atom_mask.shape, dtype=bool)
    no_oxt_mask[..., oxt] = False
    np.testing.assert_almost_equal(
        ref_atom_mask[no_oxt_mask], atom_mask[no_oxt_mask]
    )
openfold/np/residue_constants.py ADDED
@@ -0,0 +1,1310 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Copyright 2021 AlQuraishi Laboratory
2
+ # Copyright 2021 DeepMind Technologies Limited
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ """Constants used in AlphaFold."""
17
+
18
+ import collections
19
+ import functools
20
+ from typing import Mapping, List, Tuple
21
+ from importlib import resources
22
+
23
+ import numpy as np
24
+ import tree
25
+
26
+ # Internal import (35fd).
27
+
28
+
29
+ # Distance from one CA to next CA [trans configuration: omega = 180].
30
+ ca_ca = 3.80209737096
31
+
32
+ # Format: The list for each AA type contains chi1, chi2, chi3, chi4 in
33
+ # this order (or a relevant subset from chi1 onwards). ALA and GLY don't have
34
+ # chi angles so their chi angle lists are empty.
35
+ chi_angles_atoms = {
36
+ "ALA": [],
37
+ # Chi5 in arginine is always 0 +- 5 degrees, so ignore it.
38
+ "ARG": [
39
+ ["N", "CA", "CB", "CG"],
40
+ ["CA", "CB", "CG", "CD"],
41
+ ["CB", "CG", "CD", "NE"],
42
+ ["CG", "CD", "NE", "CZ"],
43
+ ],
44
+ "ASN": [["N", "CA", "CB", "CG"], ["CA", "CB", "CG", "OD1"]],
45
+ "ASP": [["N", "CA", "CB", "CG"], ["CA", "CB", "CG", "OD1"]],
46
+ "CYS": [["N", "CA", "CB", "SG"]],
47
+ "GLN": [
48
+ ["N", "CA", "CB", "CG"],
49
+ ["CA", "CB", "CG", "CD"],
50
+ ["CB", "CG", "CD", "OE1"],
51
+ ],
52
+ "GLU": [
53
+ ["N", "CA", "CB", "CG"],
54
+ ["CA", "CB", "CG", "CD"],
55
+ ["CB", "CG", "CD", "OE1"],
56
+ ],
57
+ "GLY": [],
58
+ "HIS": [["N", "CA", "CB", "CG"], ["CA", "CB", "CG", "ND1"]],
59
+ "ILE": [["N", "CA", "CB", "CG1"], ["CA", "CB", "CG1", "CD1"]],
60
+ "LEU": [["N", "CA", "CB", "CG"], ["CA", "CB", "CG", "CD1"]],
61
+ "LYS": [
62
+ ["N", "CA", "CB", "CG"],
63
+ ["CA", "CB", "CG", "CD"],
64
+ ["CB", "CG", "CD", "CE"],
65
+ ["CG", "CD", "CE", "NZ"],
66
+ ],
67
+ "MET": [
68
+ ["N", "CA", "CB", "CG"],
69
+ ["CA", "CB", "CG", "SD"],
70
+ ["CB", "CG", "SD", "CE"],
71
+ ],
72
+ "PHE": [["N", "CA", "CB", "CG"], ["CA", "CB", "CG", "CD1"]],
73
+ "PRO": [["N", "CA", "CB", "CG"], ["CA", "CB", "CG", "CD"]],
74
+ "SER": [["N", "CA", "CB", "OG"]],
75
+ "THR": [["N", "CA", "CB", "OG1"]],
76
+ "TRP": [["N", "CA", "CB", "CG"], ["CA", "CB", "CG", "CD1"]],
77
+ "TYR": [["N", "CA", "CB", "CG"], ["CA", "CB", "CG", "CD1"]],
78
+ "VAL": [["N", "CA", "CB", "CG1"]],
79
+ }
80
+
81
# If chi angles given in fixed-length array, this matrix determines how to mask
# them for each AA type. The order is as per restype_order (see below).
# Rows: the 20 standard restypes; columns: chi1..chi4 (1.0 = angle exists).
chi_angles_mask = [
    [0.0, 0.0, 0.0, 0.0],  # ALA
    [1.0, 1.0, 1.0, 1.0],  # ARG
    [1.0, 1.0, 0.0, 0.0],  # ASN
    [1.0, 1.0, 0.0, 0.0],  # ASP
    [1.0, 0.0, 0.0, 0.0],  # CYS
    [1.0, 1.0, 1.0, 0.0],  # GLN
    [1.0, 1.0, 1.0, 0.0],  # GLU
    [0.0, 0.0, 0.0, 0.0],  # GLY
    [1.0, 1.0, 0.0, 0.0],  # HIS
    [1.0, 1.0, 0.0, 0.0],  # ILE
    [1.0, 1.0, 0.0, 0.0],  # LEU
    [1.0, 1.0, 1.0, 1.0],  # LYS
    [1.0, 1.0, 1.0, 0.0],  # MET
    [1.0, 1.0, 0.0, 0.0],  # PHE
    [1.0, 1.0, 0.0, 0.0],  # PRO
    [1.0, 0.0, 0.0, 0.0],  # SER
    [1.0, 0.0, 0.0, 0.0],  # THR
    [1.0, 1.0, 0.0, 0.0],  # TRP
    [1.0, 1.0, 0.0, 0.0],  # TYR
    [1.0, 0.0, 0.0, 0.0],  # VAL
]

# The following chi angles are pi periodic: they can be rotated by a multiple
# of pi without affecting the structure.
# NOTE(review): this table has 21 rows (includes UNK) while chi_angles_mask
# above has 20 — presumably consumers index chi_pi_periodic by a 21-restype
# ordering; verify against restype usage before relying on row parity.
chi_pi_periodic = [
    [0.0, 0.0, 0.0, 0.0],  # ALA
    [0.0, 0.0, 0.0, 0.0],  # ARG
    [0.0, 0.0, 0.0, 0.0],  # ASN
    [0.0, 1.0, 0.0, 0.0],  # ASP
    [0.0, 0.0, 0.0, 0.0],  # CYS
    [0.0, 0.0, 0.0, 0.0],  # GLN
    [0.0, 0.0, 1.0, 0.0],  # GLU
    [0.0, 0.0, 0.0, 0.0],  # GLY
    [0.0, 0.0, 0.0, 0.0],  # HIS
    [0.0, 0.0, 0.0, 0.0],  # ILE
    [0.0, 0.0, 0.0, 0.0],  # LEU
    [0.0, 0.0, 0.0, 0.0],  # LYS
    [0.0, 0.0, 0.0, 0.0],  # MET
    [0.0, 1.0, 0.0, 0.0],  # PHE
    [0.0, 0.0, 0.0, 0.0],  # PRO
    [0.0, 0.0, 0.0, 0.0],  # SER
    [0.0, 0.0, 0.0, 0.0],  # THR
    [0.0, 0.0, 0.0, 0.0],  # TRP
    [0.0, 1.0, 0.0, 0.0],  # TYR
    [0.0, 0.0, 0.0, 0.0],  # VAL
    [0.0, 0.0, 0.0, 0.0],  # UNK
]
131
+
132
+ # Atoms positions relative to the 8 rigid groups, defined by the pre-omega, phi,
133
+ # psi and chi angles:
134
+ # 0: 'backbone group',
135
+ # 1: 'pre-omega-group', (empty)
136
+ # 2: 'phi-group', (currently empty, because it defines only hydrogens)
137
+ # 3: 'psi-group',
138
+ # 4,5,6,7: 'chi1,2,3,4-group'
139
+ # The atom positions are relative to the axis-end-atom of the corresponding
140
+ # rotation axis. The x-axis is in direction of the rotation axis, and the y-axis
141
+ # is defined such that the dihedral-angle-definiting atom (the last entry in
142
+ # chi_angles_atoms above) is in the xy-plane (with a positive y-coordinate).
143
+ # format: [atomname, group_idx, rel_position]
144
+ rigid_group_atom_positions = {
145
+ "ALA": [
146
+ ["N", 0, (-0.525, 1.363, 0.000)],
147
+ ["CA", 0, (0.000, 0.000, 0.000)],
148
+ ["C", 0, (1.526, -0.000, -0.000)],
149
+ ["CB", 0, (-0.529, -0.774, -1.205)],
150
+ ["O", 3, (0.627, 1.062, 0.000)],
151
+ ],
152
+ "ARG": [
153
+ ["N", 0, (-0.524, 1.362, -0.000)],
154
+ ["CA", 0, (0.000, 0.000, 0.000)],
155
+ ["C", 0, (1.525, -0.000, -0.000)],
156
+ ["CB", 0, (-0.524, -0.778, -1.209)],
157
+ ["O", 3, (0.626, 1.062, 0.000)],
158
+ ["CG", 4, (0.616, 1.390, -0.000)],
159
+ ["CD", 5, (0.564, 1.414, 0.000)],
160
+ ["NE", 6, (0.539, 1.357, -0.000)],
161
+ ["NH1", 7, (0.206, 2.301, 0.000)],
162
+ ["NH2", 7, (2.078, 0.978, -0.000)],
163
+ ["CZ", 7, (0.758, 1.093, -0.000)],
164
+ ],
165
+ "ASN": [
166
+ ["N", 0, (-0.536, 1.357, 0.000)],
167
+ ["CA", 0, (0.000, 0.000, 0.000)],
168
+ ["C", 0, (1.526, -0.000, -0.000)],
169
+ ["CB", 0, (-0.531, -0.787, -1.200)],
170
+ ["O", 3, (0.625, 1.062, 0.000)],
171
+ ["CG", 4, (0.584, 1.399, 0.000)],
172
+ ["ND2", 5, (0.593, -1.188, 0.001)],
173
+ ["OD1", 5, (0.633, 1.059, 0.000)],
174
+ ],
175
+ "ASP": [
176
+ ["N", 0, (-0.525, 1.362, -0.000)],
177
+ ["CA", 0, (0.000, 0.000, 0.000)],
178
+ ["C", 0, (1.527, 0.000, -0.000)],
179
+ ["CB", 0, (-0.526, -0.778, -1.208)],
180
+ ["O", 3, (0.626, 1.062, -0.000)],
181
+ ["CG", 4, (0.593, 1.398, -0.000)],
182
+ ["OD1", 5, (0.610, 1.091, 0.000)],
183
+ ["OD2", 5, (0.592, -1.101, -0.003)],
184
+ ],
185
+ "CYS": [
186
+ ["N", 0, (-0.522, 1.362, -0.000)],
187
+ ["CA", 0, (0.000, 0.000, 0.000)],
188
+ ["C", 0, (1.524, 0.000, 0.000)],
189
+ ["CB", 0, (-0.519, -0.773, -1.212)],
190
+ ["O", 3, (0.625, 1.062, -0.000)],
191
+ ["SG", 4, (0.728, 1.653, 0.000)],
192
+ ],
193
+ "GLN": [
194
+ ["N", 0, (-0.526, 1.361, -0.000)],
195
+ ["CA", 0, (0.000, 0.000, 0.000)],
196
+ ["C", 0, (1.526, 0.000, 0.000)],
197
+ ["CB", 0, (-0.525, -0.779, -1.207)],
198
+ ["O", 3, (0.626, 1.062, -0.000)],
199
+ ["CG", 4, (0.615, 1.393, 0.000)],
200
+ ["CD", 5, (0.587, 1.399, -0.000)],
201
+ ["NE2", 6, (0.593, -1.189, -0.001)],
202
+ ["OE1", 6, (0.634, 1.060, 0.000)],
203
+ ],
204
+ "GLU": [
205
+ ["N", 0, (-0.528, 1.361, 0.000)],
206
+ ["CA", 0, (0.000, 0.000, 0.000)],
207
+ ["C", 0, (1.526, -0.000, -0.000)],
208
+ ["CB", 0, (-0.526, -0.781, -1.207)],
209
+ ["O", 3, (0.626, 1.062, 0.000)],
210
+ ["CG", 4, (0.615, 1.392, 0.000)],
211
+ ["CD", 5, (0.600, 1.397, 0.000)],
212
+ ["OE1", 6, (0.607, 1.095, -0.000)],
213
+ ["OE2", 6, (0.589, -1.104, -0.001)],
214
+ ],
215
+ "GLY": [
216
+ ["N", 0, (-0.572, 1.337, 0.000)],
217
+ ["CA", 0, (0.000, 0.000, 0.000)],
218
+ ["C", 0, (1.517, -0.000, -0.000)],
219
+ ["O", 3, (0.626, 1.062, -0.000)],
220
+ ],
221
+ "HIS": [
222
+ ["N", 0, (-0.527, 1.360, 0.000)],
223
+ ["CA", 0, (0.000, 0.000, 0.000)],
224
+ ["C", 0, (1.525, 0.000, 0.000)],
225
+ ["CB", 0, (-0.525, -0.778, -1.208)],
226
+ ["O", 3, (0.625, 1.063, 0.000)],
227
+ ["CG", 4, (0.600, 1.370, -0.000)],
228
+ ["CD2", 5, (0.889, -1.021, 0.003)],
229
+ ["ND1", 5, (0.744, 1.160, -0.000)],
230
+ ["CE1", 5, (2.030, 0.851, 0.002)],
231
+ ["NE2", 5, (2.145, -0.466, 0.004)],
232
+ ],
233
+ "ILE": [
234
+ ["N", 0, (-0.493, 1.373, -0.000)],
235
+ ["CA", 0, (0.000, 0.000, 0.000)],
236
+ ["C", 0, (1.527, -0.000, -0.000)],
237
+ ["CB", 0, (-0.536, -0.793, -1.213)],
238
+ ["O", 3, (0.627, 1.062, -0.000)],
239
+ ["CG1", 4, (0.534, 1.437, -0.000)],
240
+ ["CG2", 4, (0.540, -0.785, -1.199)],
241
+ ["CD1", 5, (0.619, 1.391, 0.000)],
242
+ ],
243
+ "LEU": [
244
+ ["N", 0, (-0.520, 1.363, 0.000)],
245
+ ["CA", 0, (0.000, 0.000, 0.000)],
246
+ ["C", 0, (1.525, -0.000, -0.000)],
247
+ ["CB", 0, (-0.522, -0.773, -1.214)],
248
+ ["O", 3, (0.625, 1.063, -0.000)],
249
+ ["CG", 4, (0.678, 1.371, 0.000)],
250
+ ["CD1", 5, (0.530, 1.430, -0.000)],
251
+ ["CD2", 5, (0.535, -0.774, 1.200)],
252
+ ],
253
+ "LYS": [
254
+ ["N", 0, (-0.526, 1.362, -0.000)],
255
+ ["CA", 0, (0.000, 0.000, 0.000)],
256
+ ["C", 0, (1.526, 0.000, 0.000)],
257
+ ["CB", 0, (-0.524, -0.778, -1.208)],
258
+ ["O", 3, (0.626, 1.062, -0.000)],
259
+ ["CG", 4, (0.619, 1.390, 0.000)],
260
+ ["CD", 5, (0.559, 1.417, 0.000)],
261
+ ["CE", 6, (0.560, 1.416, 0.000)],
262
+ ["NZ", 7, (0.554, 1.387, 0.000)],
263
+ ],
264
+ "MET": [
265
+ ["N", 0, (-0.521, 1.364, -0.000)],
266
+ ["CA", 0, (0.000, 0.000, 0.000)],
267
+ ["C", 0, (1.525, 0.000, 0.000)],
268
+ ["CB", 0, (-0.523, -0.776, -1.210)],
269
+ ["O", 3, (0.625, 1.062, -0.000)],
270
+ ["CG", 4, (0.613, 1.391, -0.000)],
271
+ ["SD", 5, (0.703, 1.695, 0.000)],
272
+ ["CE", 6, (0.320, 1.786, -0.000)],
273
+ ],
274
+ "PHE": [
275
+ ["N", 0, (-0.518, 1.363, 0.000)],
276
+ ["CA", 0, (0.000, 0.000, 0.000)],
277
+ ["C", 0, (1.524, 0.000, -0.000)],
278
+ ["CB", 0, (-0.525, -0.776, -1.212)],
279
+ ["O", 3, (0.626, 1.062, -0.000)],
280
+ ["CG", 4, (0.607, 1.377, 0.000)],
281
+ ["CD1", 5, (0.709, 1.195, -0.000)],
282
+ ["CD2", 5, (0.706, -1.196, 0.000)],
283
+ ["CE1", 5, (2.102, 1.198, -0.000)],
284
+ ["CE2", 5, (2.098, -1.201, -0.000)],
285
+ ["CZ", 5, (2.794, -0.003, -0.001)],
286
+ ],
287
+ "PRO": [
288
+ ["N", 0, (-0.566, 1.351, -0.000)],
289
+ ["CA", 0, (0.000, 0.000, 0.000)],
290
+ ["C", 0, (1.527, -0.000, 0.000)],
291
+ ["CB", 0, (-0.546, -0.611, -1.293)],
292
+ ["O", 3, (0.621, 1.066, 0.000)],
293
+ ["CG", 4, (0.382, 1.445, 0.0)],
294
+ # ['CD', 5, (0.427, 1.440, 0.0)],
295
+ ["CD", 5, (0.477, 1.424, 0.0)], # manually made angle 2 degrees larger
296
+ ],
297
+ "SER": [
298
+ ["N", 0, (-0.529, 1.360, -0.000)],
299
+ ["CA", 0, (0.000, 0.000, 0.000)],
300
+ ["C", 0, (1.525, -0.000, -0.000)],
301
+ ["CB", 0, (-0.518, -0.777, -1.211)],
302
+ ["O", 3, (0.626, 1.062, -0.000)],
303
+ ["OG", 4, (0.503, 1.325, 0.000)],
304
+ ],
305
+ "THR": [
306
+ ["N", 0, (-0.517, 1.364, 0.000)],
307
+ ["CA", 0, (0.000, 0.000, 0.000)],
308
+ ["C", 0, (1.526, 0.000, -0.000)],
309
+ ["CB", 0, (-0.516, -0.793, -1.215)],
310
+ ["O", 3, (0.626, 1.062, 0.000)],
311
+ ["CG2", 4, (0.550, -0.718, -1.228)],
312
+ ["OG1", 4, (0.472, 1.353, 0.000)],
313
+ ],
314
+ "TRP": [
315
+ ["N", 0, (-0.521, 1.363, 0.000)],
316
+ ["CA", 0, (0.000, 0.000, 0.000)],
317
+ ["C", 0, (1.525, -0.000, 0.000)],
318
+ ["CB", 0, (-0.523, -0.776, -1.212)],
319
+ ["O", 3, (0.627, 1.062, 0.000)],
320
+ ["CG", 4, (0.609, 1.370, -0.000)],
321
+ ["CD1", 5, (0.824, 1.091, 0.000)],
322
+ ["CD2", 5, (0.854, -1.148, -0.005)],
323
+ ["CE2", 5, (2.186, -0.678, -0.007)],
324
+ ["CE3", 5, (0.622, -2.530, -0.007)],
325
+ ["NE1", 5, (2.140, 0.690, -0.004)],
326
+ ["CH2", 5, (3.028, -2.890, -0.013)],
327
+ ["CZ2", 5, (3.283, -1.543, -0.011)],
328
+ ["CZ3", 5, (1.715, -3.389, -0.011)],
329
+ ],
330
+ "TYR": [
331
+ ["N", 0, (-0.522, 1.362, 0.000)],
332
+ ["CA", 0, (0.000, 0.000, 0.000)],
333
+ ["C", 0, (1.524, -0.000, -0.000)],
334
+ ["CB", 0, (-0.522, -0.776, -1.213)],
335
+ ["O", 3, (0.627, 1.062, -0.000)],
336
+ ["CG", 4, (0.607, 1.382, -0.000)],
337
+ ["CD1", 5, (0.716, 1.195, -0.000)],
338
+ ["CD2", 5, (0.713, -1.194, -0.001)],
339
+ ["CE1", 5, (2.107, 1.200, -0.002)],
340
+ ["CE2", 5, (2.104, -1.201, -0.003)],
341
+ ["OH", 5, (4.168, -0.002, -0.005)],
342
+ ["CZ", 5, (2.791, -0.001, -0.003)],
343
+ ],
344
+ "VAL": [
345
+ ["N", 0, (-0.494, 1.373, -0.000)],
346
+ ["CA", 0, (0.000, 0.000, 0.000)],
347
+ ["C", 0, (1.527, -0.000, -0.000)],
348
+ ["CB", 0, (-0.533, -0.795, -1.213)],
349
+ ["O", 3, (0.627, 1.062, -0.000)],
350
+ ["CG1", 4, (0.540, 1.429, -0.000)],
351
+ ["CG2", 4, (0.533, -0.776, 1.203)],
352
+ ],
353
+ }
354
+
355
+ # A list of atoms (excluding hydrogen) for each AA type. PDB naming convention.
356
+ residue_atoms = {
357
+ "ALA": ["C", "CA", "CB", "N", "O"],
358
+ "ARG": ["C", "CA", "CB", "CG", "CD", "CZ", "N", "NE", "O", "NH1", "NH2"],
359
+ "ASP": ["C", "CA", "CB", "CG", "N", "O", "OD1", "OD2"],
360
+ "ASN": ["C", "CA", "CB", "CG", "N", "ND2", "O", "OD1"],
361
+ "CYS": ["C", "CA", "CB", "N", "O", "SG"],
362
+ "GLU": ["C", "CA", "CB", "CG", "CD", "N", "O", "OE1", "OE2"],
363
+ "GLN": ["C", "CA", "CB", "CG", "CD", "N", "NE2", "O", "OE1"],
364
+ "GLY": ["C", "CA", "N", "O"],
365
+ "HIS": ["C", "CA", "CB", "CG", "CD2", "CE1", "N", "ND1", "NE2", "O"],
366
+ "ILE": ["C", "CA", "CB", "CG1", "CG2", "CD1", "N", "O"],
367
+ "LEU": ["C", "CA", "CB", "CG", "CD1", "CD2", "N", "O"],
368
+ "LYS": ["C", "CA", "CB", "CG", "CD", "CE", "N", "NZ", "O"],
369
+ "MET": ["C", "CA", "CB", "CG", "CE", "N", "O", "SD"],
370
+ "PHE": ["C", "CA", "CB", "CG", "CD1", "CD2", "CE1", "CE2", "CZ", "N", "O"],
371
+ "PRO": ["C", "CA", "CB", "CG", "CD", "N", "O"],
372
+ "SER": ["C", "CA", "CB", "N", "O", "OG"],
373
+ "THR": ["C", "CA", "CB", "CG2", "N", "O", "OG1"],
374
+ "TRP": [
375
+ "C",
376
+ "CA",
377
+ "CB",
378
+ "CG",
379
+ "CD1",
380
+ "CD2",
381
+ "CE2",
382
+ "CE3",
383
+ "CZ2",
384
+ "CZ3",
385
+ "CH2",
386
+ "N",
387
+ "NE1",
388
+ "O",
389
+ ],
390
+ "TYR": [
391
+ "C",
392
+ "CA",
393
+ "CB",
394
+ "CG",
395
+ "CD1",
396
+ "CD2",
397
+ "CE1",
398
+ "CE2",
399
+ "CZ",
400
+ "N",
401
+ "O",
402
+ "OH",
403
+ ],
404
+ "VAL": ["C", "CA", "CB", "CG1", "CG2", "N", "O"],
405
+ }
406
+
407
+ # Naming swaps for ambiguous atom names.
408
+ # Due to symmetries in the amino acids the naming of atoms is ambiguous in
409
+ # 4 of the 20 amino acids.
410
+ # (The LDDT paper lists 7 amino acids as ambiguous, but the naming ambiguities
411
+ # in LEU, VAL and ARG can be resolved by using the 3d constellations of
412
+ # the 'ambiguous' atoms and their neighbours)
413
+ # TODO: ^ interpret this
414
# Maps each affected restype to the atom-name pairs that may be swapped when
# resolving the 180-degree side-chain flip ambiguity.
residue_atom_renaming_swaps = {
    "ASP": {"OD1": "OD2"},
    "GLU": {"OE1": "OE2"},
    "PHE": {"CD1": "CD2", "CE1": "CE2"},
    "TYR": {"CD1": "CD2", "CE1": "CE2"},
}

# Van der Waals radii [Angstroem] of the atoms (from Wikipedia)
van_der_waals_radius = {
    "C": 1.7,
    "N": 1.55,
    "O": 1.52,
    "S": 1.8,
}

# Literature bond-length record: atom pair, mean length (Angstrom), stddev.
Bond = collections.namedtuple(
    "Bond", ["atom1_name", "atom2_name", "length", "stddev"]
)
# Literature bond-angle record (angle in radians).
# NOTE(review): the third field is spelled "atom3name" (missing underscore);
# downstream code accesses `ba.atom3name`, so the typo is load-bearing and
# must not be "fixed" in isolation.
BondAngle = collections.namedtuple(
    "BondAngle",
    ["atom1_name", "atom2_name", "atom3name", "angle_rad", "stddev"],
)
436
+
437
+
438
@functools.lru_cache(maxsize=None)
def load_stereo_chemical_props() -> Tuple[
    Mapping[str, List[Bond]],
    Mapping[str, List[Bond]],
    Mapping[str, List[BondAngle]],
]:
    """Load stereo_chemical_props.txt into a nice structure.

    Load literature values for bond lengths and bond angles and translate
    bond angles into the length of the opposite edge of the triangle
    ("residue_virtual_bonds").

    Returns:
        residue_bonds: dict that maps resname --> list of Bond tuples
        residue_virtual_bonds: dict that maps resname --> list of Bond tuples
        residue_bond_angles: dict that maps resname --> list of BondAngle tuples
    """
    # TODO: this file should be downloaded in a setup script
    # NOTE(review): assumes the packaged resource has two whitespace-delimited
    # sections (bond lengths, then bond angles), each terminated by a lone "-"
    # line — confirm against openfold/resources/stereo_chemical_props.txt.
    stereo_chemical_props = resources.read_text("openfold.resources", "stereo_chemical_props.txt")

    lines_iter = iter(stereo_chemical_props.splitlines())
    # Load bond lengths.
    residue_bonds = {}
    next(lines_iter)  # Skip header line.
    for line in lines_iter:
        if line.strip() == "-":
            break
        bond, resname, length, stddev = line.split()
        atom1, atom2 = bond.split("-")
        if resname not in residue_bonds:
            residue_bonds[resname] = []
        residue_bonds[resname].append(
            Bond(atom1, atom2, float(length), float(stddev))
        )
    residue_bonds["UNK"] = []  # UNK gets an explicit empty entry.

    # Load bond angles.
    residue_bond_angles = {}
    next(lines_iter)  # Skip empty line.
    next(lines_iter)  # Skip header line.
    for line in lines_iter:
        if line.strip() == "-":
            break
        bond, resname, angle_degree, stddev_degree = line.split()
        atom1, atom2, atom3 = bond.split("-")
        if resname not in residue_bond_angles:
            residue_bond_angles[resname] = []
        residue_bond_angles[resname].append(
            BondAngle(
                atom1,
                atom2,
                atom3,
                # Angles are stored in radians.
                float(angle_degree) / 180.0 * np.pi,
                float(stddev_degree) / 180.0 * np.pi,
            )
        )
    residue_bond_angles["UNK"] = []

    def make_bond_key(atom1_name, atom2_name):
        """Unique key to lookup bonds."""
        # Sorted so that the key is order-independent (A-B == B-A).
        return "-".join(sorted([atom1_name, atom2_name]))

    # Translate bond angles into distances ("virtual bonds").
    residue_virtual_bonds = {}
    for resname, bond_angles in residue_bond_angles.items():
        # Create a fast lookup dict for bond lengths.
        bond_cache = {}
        for b in residue_bonds[resname]:
            bond_cache[make_bond_key(b.atom1_name, b.atom2_name)] = b
        residue_virtual_bonds[resname] = []
        for ba in bond_angles:
            bond1 = bond_cache[make_bond_key(ba.atom1_name, ba.atom2_name)]
            bond2 = bond_cache[make_bond_key(ba.atom2_name, ba.atom3name)]

            # Compute distance between atom1 and atom3 using the law of cosines
            # c^2 = a^2 + b^2 - 2ab*cos(gamma).
            gamma = ba.angle_rad
            length = np.sqrt(
                bond1.length ** 2
                + bond2.length ** 2
                - 2 * bond1.length * bond2.length * np.cos(gamma)
            )

            # Propagation of uncertainty assuming uncorrelated errors.
            dl_outer = 0.5 / length
            dl_dgamma = (
                2 * bond1.length * bond2.length * np.sin(gamma)
            ) * dl_outer
            dl_db1 = (
                2 * bond1.length - 2 * bond2.length * np.cos(gamma)
            ) * dl_outer
            dl_db2 = (
                2 * bond2.length - 2 * bond1.length * np.cos(gamma)
            ) * dl_outer
            stddev = np.sqrt(
                (dl_dgamma * ba.stddev) ** 2
                + (dl_db1 * bond1.stddev) ** 2
                + (dl_db2 * bond2.stddev) ** 2
            )
            residue_virtual_bonds[resname].append(
                Bond(ba.atom1_name, ba.atom3name, length, stddev)
            )

    return (residue_bonds, residue_virtual_bonds, residue_bond_angles)
542
+
543
+
544
# Between-residue bond lengths for general bonds (first element) and for
# Proline (second element).
between_res_bond_length_c_n = [1.329, 1.341]
between_res_bond_length_stddev_c_n = [0.014, 0.016]

# Between-residue cos_angles.
between_res_cos_angles_c_n_ca = [-0.5203, 0.0353]  # degrees: 121.352 +- 2.315
between_res_cos_angles_ca_c_n = [-0.4473, 0.0311]  # degrees: 116.568 +- 1.995
552
+
553
# This mapping is used when we need to store atom data in a format that
# requires fixed atom data size for every residue (e.g. a numpy array).
# Order matters: indices into this list are the atom37 representation.
atom_types = (
    "N CA C CB O CG CG1 CG2 OG OG1 SG CD CD1 CD2 ND1 ND2 OD1 OD2 SD "
    "CE CE1 CE2 CE3 NE NE1 NE2 OE1 OE2 CH2 NH1 NH2 OH CZ CZ2 CZ3 NZ OXT"
).split()
atom_order = {atom_type: i for i, atom_type in enumerate(atom_types)}
atom_type_num = len(atom_types)  # := 37.
596
+
597
# A compact atom encoding with 14 columns
# pylint: disable=line-too-long
# pylint: disable=bad-whitespace
def _pad14(names):
    """Right-pad a per-residue atom-name list with "" up to 14 slots."""
    return names + [""] * (14 - len(names))


restype_name_to_atom14_names = {
    "ALA": _pad14(["N", "CA", "C", "O", "CB"]),
    "ARG": _pad14(["N", "CA", "C", "O", "CB", "CG", "CD", "NE", "CZ", "NH1", "NH2"]),
    "ASN": _pad14(["N", "CA", "C", "O", "CB", "CG", "OD1", "ND2"]),
    "ASP": _pad14(["N", "CA", "C", "O", "CB", "CG", "OD1", "OD2"]),
    "CYS": _pad14(["N", "CA", "C", "O", "CB", "SG"]),
    "GLN": _pad14(["N", "CA", "C", "O", "CB", "CG", "CD", "OE1", "NE2"]),
    "GLU": _pad14(["N", "CA", "C", "O", "CB", "CG", "CD", "OE1", "OE2"]),
    "GLY": _pad14(["N", "CA", "C", "O"]),
    "HIS": _pad14(["N", "CA", "C", "O", "CB", "CG", "ND1", "CD2", "CE1", "NE2"]),
    "ILE": _pad14(["N", "CA", "C", "O", "CB", "CG1", "CG2", "CD1"]),
    "LEU": _pad14(["N", "CA", "C", "O", "CB", "CG", "CD1", "CD2"]),
    "LYS": _pad14(["N", "CA", "C", "O", "CB", "CG", "CD", "CE", "NZ"]),
    "MET": _pad14(["N", "CA", "C", "O", "CB", "CG", "SD", "CE"]),
    "PHE": _pad14(["N", "CA", "C", "O", "CB", "CG", "CD1", "CD2", "CE1", "CE2", "CZ"]),
    "PRO": _pad14(["N", "CA", "C", "O", "CB", "CG", "CD"]),
    "SER": _pad14(["N", "CA", "C", "O", "CB", "OG"]),
    "THR": _pad14(["N", "CA", "C", "O", "CB", "OG1", "CG2"]),
    "TRP": _pad14(["N", "CA", "C", "O", "CB", "CG", "CD1", "CD2", "NE1", "CE2", "CE3", "CZ2", "CZ3", "CH2"]),
    "TYR": _pad14(["N", "CA", "C", "O", "CB", "CG", "CD1", "CD2", "CE1", "CE2", "CZ", "OH"]),
    "VAL": _pad14(["N", "CA", "C", "O", "CB", "CG1", "CG2"]),
    "UNK": _pad14([]),
}
# pylint: enable=line-too-long
# pylint: enable=bad-whitespace
850
+
851
+
852
# This is the standard residue order when coding AA type as a number.
# Reproduce it by taking 3-letter AA codes and sorting them alphabetically.
restypes = list("ARNDCQEGHILKMFPSTWYV")
restype_order = {restype: i for i, restype in enumerate(restypes)}
restype_num = len(restypes)  # := 20.
unk_restype_index = restype_num  # Catch-all index for unknown restypes.

restypes_with_x = restypes + ["X"]
restype_order_with_x = {restype: i for i, restype in enumerate(restypes_with_x)}
882
+
883
+
884
def sequence_to_onehot(
    sequence: str, mapping: Mapping[str, int], map_unknown_to_x: bool = False
) -> np.ndarray:
    """Maps the given sequence into a one-hot encoded matrix.

    Args:
      sequence: An amino acid sequence.
      mapping: A dictionary mapping amino acids to integers.
      map_unknown_to_x: If True, any amino acid that is not in the mapping will be
        mapped to the unknown amino acid 'X'. If the mapping doesn't contain
        amino acid 'X', an error will be thrown. If False, any amino acid not in
        the mapping will throw an error.

    Returns:
      A numpy array of shape (seq_len, num_unique_aas) with one-hot encoding of
      the sequence.

    Raises:
      ValueError: If the mapping doesn't contain values from 0 to
        num_unique_aas - 1 without any gaps.
    """
    num_entries = max(mapping.values()) + 1
    # The mapping must be a gap-free enumeration so each value is a column.
    if sorted(set(mapping.values())) != list(range(num_entries)):
        raise ValueError(
            "The mapping must have values from 0 to num_unique_aas-1 "
            "without any gaps. Got: %s" % sorted(mapping.values())
        )

    def _column_for(aa: str) -> int:
        """Resolve one residue letter to its one-hot column index."""
        if not map_unknown_to_x:
            return mapping[aa]
        if aa.isalpha() and aa.isupper():
            return mapping.get(aa, mapping["X"])
        raise ValueError(
            f"Invalid character in the sequence: {aa}"
        )

    one_hot_arr = np.zeros((len(sequence), num_entries), dtype=int)
    for row, aa_type in enumerate(sequence):
        one_hot_arr[row, _column_for(aa_type)] = 1
    return one_hot_arr
928
+
929
+
930
# One-letter -> three-letter residue names, in the standard restype order.
restype_1to3 = dict(
    zip(
        "ARNDCQEGHILKMFPSTWYV",
        [
            "ALA", "ARG", "ASN", "ASP", "CYS", "GLN", "GLU", "GLY", "HIS", "ILE",
            "LEU", "LYS", "MET", "PHE", "PRO", "SER", "THR", "TRP", "TYR", "VAL",
        ],
    )
)
952
+
953
+
954
# NB: restype_3to1 differs from Bio.PDB.protein_letters_3to1 by being a simple
# 1-to-1 mapping of 3 letter names to one letter names. The latter contains
# many more, and less common, three letter names as keys and maps many of these
# to the same one letter name (including 'X' and 'U' which we don't use here).
restype_3to1 = {three: one for one, three in restype_1to3.items()}

# Define a restype name for all unknown residues.
unk_restype = "UNK"

# 21 residue names: the 20 standard ones plus UNK, in restype order.
resnames = [restype_1to3[r] for r in restypes] + [unk_restype]
resname_to_idx = {resname: i for i, resname in enumerate(resnames)}
965
+
966
+
967
# The mapping here uses hhblits convention, so that B is mapped to D, J and O
# are mapped to X, U is mapped to C, and Z is mapped to E. Other than that the
# remaining 20 amino acids are kept in alphabetical order.
# There are 2 non-amino acid codes, X (representing any amino acid) and
# "-" representing a missing amino acid in an alignment. The id for these
# codes is put at the end (20 and 21) so that they can easily be ignored if
# desired.
HHBLITS_AA_TO_ID = {
    "A": 0, "B": 2, "C": 1, "D": 2, "E": 3, "F": 4, "G": 5, "H": 6,
    "I": 7, "J": 20, "K": 8, "L": 9, "M": 10, "N": 11, "O": 20, "P": 12,
    "Q": 13, "R": 14, "S": 15, "T": 16, "U": 1, "V": 17, "W": 18, "X": 20,
    "Y": 19, "Z": 3, "-": 21,
}
1003
+
1004
# Partial inversion of HHBLITS_AA_TO_ID: each id maps back to its canonical
# letter (1 also covers U, 2 also covers B, 3 also covers Z, 20 covers J/O).
ID_TO_HHBLITS_AA = {
    0: "A", 1: "C", 2: "D", 3: "E", 4: "F", 5: "G", 6: "H", 7: "I",
    8: "K", 9: "L", 10: "M", 11: "N", 12: "P", 13: "Q", 14: "R", 15: "S",
    16: "T", 17: "V", 18: "W", 19: "Y", 20: "X", 21: "-",
}
1029
+
1030
# Lookup table translating an hhblits aatype id into this module's restype id.
restypes_with_x_and_gap = restypes + ["X", "-"]
MAP_HHBLITS_AATYPE_TO_OUR_AATYPE = tuple(
    restypes_with_x_and_gap.index(ID_TO_HHBLITS_AA[hhblits_id])
    for hhblits_id in range(len(restypes_with_x_and_gap))
)
1035
+
1036
+
1037
def _make_standard_atom_mask() -> np.ndarray:
    """Returns [num_res_types, num_atom_types] mask array."""
    # The "+1" row (index restype_num) is left all-zero for unknown residues.
    mask = np.zeros([restype_num + 1, atom_type_num], dtype=int)
    for res_idx, one_letter in enumerate(restypes):
        for atom_name in residue_atoms[restype_1to3[one_letter]]:
            mask[res_idx, atom_order[atom_name]] = 1
    return mask


STANDARD_ATOM_MASK = _make_standard_atom_mask()
1051
+
1052
+
1053
# A one hot representation for the first and second atoms defining the axis
# of rotation for each chi-angle in each residue.
def chi_angle_atom(atom_index: int) -> np.ndarray:
    """Define chi-angle rigid groups via one-hot representations."""
    # Per residue name: the atom37 index of atom `atom_index` in each chi
    # group, padded with -1 up to 4 chi angles.
    axis_atom_indices = {}
    for resname, chi_groups in chi_angles_atoms.items():
        picked = [atom_types.index(group[atom_index]) for group in chi_groups]
        axis_atom_indices[resname] = picked + [-1] * (4 - len(picked))

    # Index -1 selects the last row of np.eye, as in the original lookup.
    per_restype = [
        np.eye(atom_type_num)[axis_atom_indices[restype_1to3[r]]]
        for r in restypes
    ]
    per_restype.append(np.zeros([4, atom_type_num]))  # Add zeros for residue `X`.
    stacked = np.stack(per_restype, axis=0)
    return np.transpose(stacked, [0, 2, 1])


chi_atom_1_one_hot = chi_angle_atom(1)
chi_atom_2_one_hot = chi_angle_atom(2)
1079
+
1080
# An array like chi_angles_atoms but using indices rather than names.
# (Plain nested comprehensions replace tree.map_structure; the structure is
# a list of lists of 4-atom name lists, so the result is identical.)
chi_angles_atom_indices = [
    [[atom_order[atom_name] for atom_name in chi] for chi in chi_angles_atoms[restype_1to3[r]]]
    for r in restypes
]
# Pad every residue out to 4 chi groups with dummy [0, 0, 0, 0] entries.
chi_angles_atom_indices = np.array(
    [
        chi_atoms + [[0, 0, 0, 0]] * (4 - len(chi_atoms))
        for chi_atoms in chi_angles_atom_indices
    ]
)
1091
+
1092
# Mapping from (res_name, atom_name) pairs to the atom's chi group index
# and atom index within that group.
chi_groups_for_atom = collections.defaultdict(list)
for _resname, _chi_groups in chi_angles_atoms.items():
    for _group_idx, _group in enumerate(_chi_groups):
        for _pos_idx, _atom in enumerate(_group):
            chi_groups_for_atom[(_resname, _atom)].append((_group_idx, _pos_idx))
chi_groups_for_atom = dict(chi_groups_for_atom)
1100
+
1101
+
1102
+ def _make_rigid_transformation_4x4(ex, ey, translation):
1103
+ """Create a rigid 4x4 transformation matrix from two axes and transl."""
1104
+ # Normalize ex.
1105
+ ex_normalized = ex / np.linalg.norm(ex)
1106
+
1107
+ # make ey perpendicular to ex
1108
+ ey_normalized = ey - np.dot(ey, ex_normalized) * ex_normalized
1109
+ ey_normalized /= np.linalg.norm(ey_normalized)
1110
+
1111
+ # compute ez as cross product
1112
+ eznorm = np.cross(ex_normalized, ey_normalized)
1113
+ m = np.stack(
1114
+ [ex_normalized, ey_normalized, eznorm, translation]
1115
+ ).transpose()
1116
+ m = np.concatenate([m, [[0.0, 0.0, 0.0, 1.0]]], axis=0)
1117
+ return m
1118
+
1119
+
1120
# create an array with (restype, atomtype) --> rigid_group_idx
# and an array with (restype, atomtype, coord) for the atom positions
# and compute affine transformation matrices (4,4) from one rigid group to the
# previous group. All are filled in by _make_rigid_group_constants() below.
restype_atom37_to_rigid_group = np.zeros((21, 37), dtype=int)
restype_atom37_mask = np.zeros((21, 37), dtype=np.float32)
restype_atom37_rigid_group_positions = np.zeros((21, 37, 3), dtype=np.float32)
restype_atom14_to_rigid_group = np.zeros((21, 14), dtype=int)
restype_atom14_mask = np.zeros((21, 14), dtype=np.float32)
restype_atom14_rigid_group_positions = np.zeros((21, 14, 3), dtype=np.float32)
restype_rigid_group_default_frame = np.zeros((21, 8, 4, 4), dtype=np.float32)
1131
+
1132
+
1133
def _make_rigid_group_constants():
    """Fill the arrays above.

    Populates, in place, the module-level restype_atom37_* / restype_atom14_*
    lookup arrays and restype_rigid_group_default_frame, using
    rigid_group_atom_positions / chi_angles_atoms / chi_angles_mask
    (defined earlier in this module).
    """
    # Pass 1: record, for every atom of every standard residue, its rigid
    # group index, presence mask and idealized position, in both the atom37
    # and atom14 layouts. Row 20 (UNK) is left at its zero initialization.
    for restype, restype_letter in enumerate(restypes):
        resname = restype_1to3[restype_letter]
        for atomname, group_idx, atom_position in rigid_group_atom_positions[
            resname
        ]:
            atomtype = atom_order[atomname]
            restype_atom37_to_rigid_group[restype, atomtype] = group_idx
            restype_atom37_mask[restype, atomtype] = 1
            restype_atom37_rigid_group_positions[
                restype, atomtype, :
            ] = atom_position

            atom14idx = restype_name_to_atom14_names[resname].index(atomname)
            restype_atom14_to_rigid_group[restype, atom14idx] = group_idx
            restype_atom14_mask[restype, atom14idx] = 1
            restype_atom14_rigid_group_positions[
                restype, atom14idx, :
            ] = atom_position

    # Pass 2: build the 8 default frames per residue (backbone, pre-omega,
    # phi, psi, chi1..chi4) as 4x4 rigid transforms to the previous group.
    for restype, restype_letter in enumerate(restypes):
        resname = restype_1to3[restype_letter]
        atom_positions = {
            name: np.array(pos)
            for name, _, pos in rigid_group_atom_positions[resname]
        }

        # backbone to backbone is the identity transform
        restype_rigid_group_default_frame[restype, 0, :, :] = np.eye(4)

        # pre-omega-frame to backbone (currently dummy identity matrix)
        restype_rigid_group_default_frame[restype, 1, :, :] = np.eye(4)

        # phi-frame to backbone
        mat = _make_rigid_transformation_4x4(
            ex=atom_positions["N"] - atom_positions["CA"],
            ey=np.array([1.0, 0.0, 0.0]),
            translation=atom_positions["N"],
        )
        restype_rigid_group_default_frame[restype, 2, :, :] = mat

        # psi-frame to backbone
        mat = _make_rigid_transformation_4x4(
            ex=atom_positions["C"] - atom_positions["CA"],
            ey=atom_positions["CA"] - atom_positions["N"],
            translation=atom_positions["C"],
        )
        restype_rigid_group_default_frame[restype, 3, :, :] = mat

        # chi1-frame to backbone
        if chi_angles_mask[restype][0]:
            base_atom_names = chi_angles_atoms[resname][0]
            base_atom_positions = [
                atom_positions[name] for name in base_atom_names
            ]
            mat = _make_rigid_transformation_4x4(
                ex=base_atom_positions[2] - base_atom_positions[1],
                ey=base_atom_positions[0] - base_atom_positions[1],
                translation=base_atom_positions[2],
            )
            restype_rigid_group_default_frame[restype, 4, :, :] = mat

        # chi2-frame to chi1-frame
        # chi3-frame to chi2-frame
        # chi4-frame to chi3-frame
        # luckily all rotation axes for the next frame start at (0,0,0) of the
        # previous frame
        for chi_idx in range(1, 4):
            if chi_angles_mask[restype][chi_idx]:
                axis_end_atom_name = chi_angles_atoms[resname][chi_idx][2]
                axis_end_atom_position = atom_positions[axis_end_atom_name]
                mat = _make_rigid_transformation_4x4(
                    ex=axis_end_atom_position,
                    ey=np.array([-1.0, 0.0, 0.0]),
                    translation=axis_end_atom_position,
                )
                restype_rigid_group_default_frame[
                    restype, 4 + chi_idx, :, :
                ] = mat


# Run once at import time to populate the lookup tables.
_make_rigid_group_constants()
1216
+
1217
+
1218
def make_atom14_dists_bounds(
    overlap_tolerance=1.5, bond_length_tolerance_factor=15
):
    """Compute upper and lower bounds for bonds to assess violations.

    Args:
        overlap_tolerance: Angstroem subtracted from the sum of two atoms'
            van der Waals radii to form the default clash lower bound.
        bond_length_tolerance_factor: number of standard deviations around a
            literature bond length used for the bonded lower/upper bounds.

    Returns:
        dict with keys "lower_bound", "upper_bound", "stddev", each a
        float32 array of shape (21, 14, 14) over (restype, atom14, atom14).
    """
    restype_atom14_bond_lower_bound = np.zeros([21, 14, 14], np.float32)
    restype_atom14_bond_upper_bound = np.zeros([21, 14, 14], np.float32)
    restype_atom14_bond_stddev = np.zeros([21, 14, 14], np.float32)
    residue_bonds, residue_virtual_bonds, _ = load_stereo_chemical_props()
    for restype, restype_letter in enumerate(restypes):
        resname = restype_1to3[restype_letter]
        atom_list = restype_name_to_atom14_names[resname]

        # create lower and upper bounds for clashes
        # (every real atom pair gets a vdW-based lower bound and an
        # effectively-infinite upper bound; empty "" slots are skipped)
        for atom1_idx, atom1_name in enumerate(atom_list):
            if not atom1_name:
                continue
            atom1_radius = van_der_waals_radius[atom1_name[0]]
            for atom2_idx, atom2_name in enumerate(atom_list):
                if (not atom2_name) or atom1_idx == atom2_idx:
                    continue
                atom2_radius = van_der_waals_radius[atom2_name[0]]
                lower = atom1_radius + atom2_radius - overlap_tolerance
                upper = 1e10
                restype_atom14_bond_lower_bound[
                    restype, atom1_idx, atom2_idx
                ] = lower
                restype_atom14_bond_lower_bound[
                    restype, atom2_idx, atom1_idx
                ] = lower
                restype_atom14_bond_upper_bound[
                    restype, atom1_idx, atom2_idx
                ] = upper
                restype_atom14_bond_upper_bound[
                    restype, atom2_idx, atom1_idx
                ] = upper

        # overwrite lower and upper bounds for bonds and angles
        # (bonded / angle-related pairs get tight, symmetric bounds derived
        # from literature length +- tolerance_factor * stddev)
        for b in residue_bonds[resname] + residue_virtual_bonds[resname]:
            atom1_idx = atom_list.index(b.atom1_name)
            atom2_idx = atom_list.index(b.atom2_name)
            lower = b.length - bond_length_tolerance_factor * b.stddev
            upper = b.length + bond_length_tolerance_factor * b.stddev
            restype_atom14_bond_lower_bound[
                restype, atom1_idx, atom2_idx
            ] = lower
            restype_atom14_bond_lower_bound[
                restype, atom2_idx, atom1_idx
            ] = lower
            restype_atom14_bond_upper_bound[
                restype, atom1_idx, atom2_idx
            ] = upper
            restype_atom14_bond_upper_bound[
                restype, atom2_idx, atom1_idx
            ] = upper
            restype_atom14_bond_stddev[restype, atom1_idx, atom2_idx] = b.stddev
            restype_atom14_bond_stddev[restype, atom2_idx, atom1_idx] = b.stddev
    return {
        "lower_bound": restype_atom14_bond_lower_bound,  # shape (21,14,14)
        "upper_bound": restype_atom14_bond_upper_bound,  # shape (21,14,14)
        "stddev": restype_atom14_bond_stddev,  # shape (21,14,14)
    }
1279
+
1280
+
1281
# Ambiguity tables in the atom14 layout, filled in by
# _make_atom14_ambiguity_feats() below. The swap-index table starts as the
# identity permutation (each atom maps to itself).
restype_atom14_ambiguous_atoms = np.zeros((21, 14), dtype=np.float32)
restype_atom14_ambiguous_atoms_swap_idx = np.tile(
    np.arange(14, dtype=int), (21, 1)
)
1285
+
1286
+
1287
def _make_atom14_ambiguity_feats():
    """Mark name-swappable atom14 slots and record each one's swap partner."""
    for resname, swaps in residue_atom_renaming_swaps.items():
        res_idx = restype_order[restype_3to1[resname]]
        for first_atom, second_atom in swaps.items():
            first_idx = restype_name_to_atom14_names[resname].index(first_atom)
            second_idx = restype_name_to_atom14_names[resname].index(second_atom)
            restype_atom14_ambiguous_atoms[res_idx, first_idx] = 1
            restype_atom14_ambiguous_atoms[res_idx, second_idx] = 1
            restype_atom14_ambiguous_atoms_swap_idx[res_idx, first_idx] = second_idx
            restype_atom14_ambiguous_atoms_swap_idx[res_idx, second_idx] = first_idx


# Run once at import time to fill the ambiguity tables above.
_make_atom14_ambiguity_feats()
1304
+
1305
+
1306
def aatype_to_str_sequence(aatype):
    """Convert residue-type indices to a one-letter amino-acid string.

    Args:
        aatype: iterable of integer indices into `restypes_with_x`
            (0-19 standard residues, 20 = 'X'); works for lists, tuples
            and 1-D numpy arrays alike.

    Returns:
        The sequence as a str, one letter per index.
    """
    # Iterate the elements directly instead of `range(len(...))`, and feed
    # join a generator instead of materializing an intermediate list.
    return ''.join(restypes_with_x[idx] for idx in aatype)