Files
foundry/configs/experiment/ncorley/af3-elements-as-ligand-atom-names.yaml
Nathaniel Corley 5a492032d5 refactor: new modelhub (#109)
* Initial commit of chiral changes

Initial checkin of chiral feature code

Add chiral metric

* Update the way chiral features are incorporated into the model

Move initialization to new func

use default pytorch reset parameters

fix initialization for chirals

config

rename argument of confidence head

fix initialization for chirals

* refactor: src nest, rename rf2aa to modelhub

* refactor: initial commit without projects

* Initial commit of chiral changes

* Initial checkin of chiral feature code

* Add chiral metric

* Remove option for double residual connection.  Add kq_norm oiptions to base (20250125) config.

* Restoring flag

* config

* rename argument of confidence head

* Update the way chiral features are incorporated into the model

* config

* rename argument of confidence head

* Update the way chiral features are incorporated into the model

* Initial commit of chiral changes

Initial checkin of chiral feature code

Add chiral metric

* Update the way chiral features are incorporated into the model

Move initialization to new func

use default pytorch reset parameters

fix initialization for chirals

config

rename argument of confidence head

fix initialization for chirals

* refactor: new modelhub

---------

Co-authored-by: fdimaio <dimaio@uw.edu>
Co-authored-by: HaotianZhangAI4Science <haotianzhang@zju.edu.cn>
2025-04-08 13:33:17 -07:00

84 lines
3.6 KiB
YAML

# @package _global_
name: af3-elements-as-ligand-atom-names
# For explanation of the "override" syntax, see: https://hydra.cc/docs/upgrades/1.0_to_1.1/defaults_list_override/
defaults:
- override /trainer: af3
- override /datasets: af3
- override /model: af3
tags:
# list of tags to add to the run ( & on wandb to easily find & filter runs)
- atom-names
- experiment
project: af3
ckpt_path: /projects/ml/modelhub/inference/weights_with_no_confidence_2025_1_21_new_modelhub.ckpt
model:
lr_scheduler:
base_lr: 0.9e-3 # 1/2 of original learning rate (1.8e-3)
datasets:
train:
pdb:
probability: 1.0
sub_datasets:
interface:
dataset:
transform:
use_element_for_atom_names_of_atomized_tokens: True
dataset:
# Same as AF-3 training, but limit to protein-ligand interfaces
filters:
# (from before)
- "deposition_date < '2021-09-30'"
- "resolution < 9.0"
- "num_polymer_pn_units <= 300"
- "cluster.notnull()"
- >
~(pn_unit_1_non_polymer_res_names.notnull() and
pn_unit_1_non_polymer_res_names.str.contains(
'${resolve_import:cifutils.constants,AF3_EXCLUDED_LIGANDS_REGEX}',
regex=True))
- >
~(pn_unit_2_non_polymer_res_names.notnull() and
pn_unit_2_non_polymer_res_names.str.contains(
'${resolve_import:cifutils.constants,AF3_EXCLUDED_LIGANDS_REGEX}',
regex=True))
- "is_inter_molecule"
# only protein-ligand interfaces
- "(n_prot == 1 and n_nuc == 0 and n_ligand == 1)"
pn_unit:
dataset:
transform:
use_element_for_atom_names_of_atomized_tokens: True
dataset:
# Same as AF-3 training, but limit to protein-ligand interfaces
filters:
# (from before)
- "deposition_date < '2021-09-30'"
- "resolution < 9.0"
- "num_polymer_pn_units <= 300"
- "cluster.notnull()"
- "~(q_pn_unit_non_polymer_res_names.notnull() and q_pn_unit_non_polymer_res_names.str.contains('${resolve_import:cifutils.constants,AF3_EXCLUDED_LIGANDS_REGEX}', regex=True))"
# only proteins or ligands
- "(n_prot == 1 or n_ligand == 1)"
# Datasets set to null are ignored
monomer_distillation: null
val:
af3_validation:
dataset:
transform:
use_element_for_atom_names_of_atomized_tokens: True
dataset:
filters:
- "n_tokens_total < 400"
- "interfaces_to_score.str.contains('protein-ligand')"
# Exclude example where RDKit errors
- example_id not in ["{['validation']}{7qbs}{1}{[]}"]