# FoldMark/configs/configs_base.py
# Copyright 2024 ByteDance and/or its affiliates.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# pylint: disable=C0114,C0301
from protenix.config.extend_types import (
GlobalConfigValue,
ListValue,
RequiredValue,
ValueMaybeNone,
)
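
# The wrapped config types above come from protenix.config.extend_types.
# Assumed semantics, inferred from their names and how they are used below:
#   RequiredValue(T)     - no default; the caller must supply a value of type T.
#   GlobalConfigValue(k) - a reference resolved against the top-level key k,
#                          e.g. "adam.lr" below tracks the global "lr".
#   ValueMaybeNone(v)    - defaults to v, but may be set to None.
#   ListValue(xs)        - a list-valued default.
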
basic_configs = {
"project": RequiredValue(str),
"run_name": RequiredValue(str),
"base_dir": RequiredValue(str),
# training
"eval_interval": RequiredValue(int),
"log_interval": RequiredValue(int),
"checkpoint_interval": -1,
"eval_first": False, # run evaluate() before training steps
"iters_to_accumulate": 1,
"eval_only": False,
"load_checkpoint_path": "",
"load_ema_checkpoint_path": "",
"load_strict": False,
"load_params_only": True,
"skip_load_step": False,
"skip_load_optimizer": False,
"skip_load_scheduler": False,
"train_confidence_only": False,
"use_wandb": True,
"wandb_id": "",
"seed": 66,
"deterministic": False,
"ema_decay": -1.0,
"eval_ema_only": False, # whether wandb only tracking ema checkpoint metrics
"ema_mutable_param_keywords": [""],
}

data_configs = {
# Data
"train_crop_size": 256,
"test_max_n_token": -1,
"train_lig_atom_rename": False,
"train_shuffle_mols": False,
"train_shuffle_sym_ids": False,
"test_lig_atom_rename": False,
"test_shuffle_mols": False,
"test_shuffle_sym_ids": False,
}

optim_configs = {
# Optim
"lr": 0.0018,
"lr_scheduler": "af3",
"warmup_steps": 10,
"max_steps": RequiredValue(int),
"min_lr_ratio": 0.1,
"decay_every_n_steps": 50000,
"grad_clip_norm": 10,
# Optim - Adam
"adam": {
"beta1": 0.9,
"beta2": 0.95,
"weight_decay": 1e-8,
"lr": GlobalConfigValue("lr"),
"use_adamw": False,
},
# Optim - LRScheduler
"af3_lr_scheduler": {
"warmup_steps": GlobalConfigValue("warmup_steps"),
"decay_every_n_steps": GlobalConfigValue("decay_every_n_steps"),
"decay_factor": 0.95,
"lr": GlobalConfigValue("lr"),
},
}
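
# A sketch of the schedule implied by "af3_lr_scheduler" above (assumed
# semantics following the AF3 training recipe; the actual implementation lives
# in protenix and may differ in detail):
#
#   def af3_lr(step: int, lr=0.0018, warmup=10, every=50_000, factor=0.95):
#       if step < warmup:
#           return lr * step / warmup  # linear warmup
#       return lr * factor ** ((step - warmup) // every)  # stepwise decay
#
# min_lr_ratio presumably floors the decayed value at lr * min_lr_ratio for
# schedulers that honor it.
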
model_configs = {
# Model
"c_s": 384,
"c_z": 128,
"c_s_inputs": 449, # c_s_inputs == c_token + 32 + 32 + 1
"watermark": 32,
"c_atom": 128,
"c_atompair": 16,
"c_token": 384,
"n_blocks": 48,
"max_atoms_per_token": 24, # DNA G max_atoms = 23
"no_bins": 64,
"sigma_data": 16.0,
"diffusion_batch_size": 48,
"diffusion_chunk_size": ValueMaybeNone(4), # chunksize of diffusion_batch_size
"blocks_per_ckpt": ValueMaybeNone(
1
), # NOTE: Number of blocks in each activation checkpoint, if None, no checkpointing is performed.
# switch of kernels
"use_memory_efficient_kernel": False,
"use_deepspeed_evo_attention": False,
"use_flash": False,
"use_lma": False,
"use_xformer": False,
"find_unused_parameters": False,
"dtype": "bf16", # default training dtype: bf16
"loss_metrics_sparse_enable": True, # the swicth for both sparse lddt metrics and sparse bond/smooth lddt loss
"skip_amp": {
"sample_diffusion": True,
"confidence_head": True,
"sample_diffusion_training": True,
"loss": True,
},
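# Modules listed under skip_amp are presumably run outside autocast (i.e., in
# full fp32) for numerical stability, even when the global dtype is bf16.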
"infer_setting": {
"chunk_size": ValueMaybeNone(
64
), # should set to null for normal training and small dataset eval [for efficiency]
"sample_diffusion_chunk_size": ValueMaybeNone(
1
), # should set to null for normal training and small dataset eval [for efficiency]
"lddt_metrics_sparse_enable": GlobalConfigValue("loss_metrics_sparse_enable"),
"lddt_metrics_chunk_size": ValueMaybeNone(
1
), # only works if loss_metrics_sparse_enable, can set as default 1
},
"train_noise_sampler": {
"p_mean": -1.2,
"p_std": 1.5,
"sigma_data": 16.0, # NOTE: in EDM, this is 1.0
},
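# Assumed training-noise sampling per EDM's log-normal scheme, rescaled by
# sigma_data as in AF3 (a sketch, not the protenix implementation):
#
#   sigma = sigma_data * exp(p_mean + p_std * randn())
#
# i.e. ln(sigma / sigma_data) ~ N(p_mean, p_std**2).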
"inference_noise_scheduler": {
"s_max": 160.0,
"s_min": 4e-4,
"rho": 7,
"sigma_data": 16.0, # NOTE: in EDM, this is 1.0
},
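# Assumed inference-noise schedule: EDM's rho-schedule scaled by sigma_data
# (per the AF3 supplement), for tau going from 0 to 1 over N_step steps:
#
#   sigma(tau) = sigma_data * (s_max**(1/rho)
#                + tau * (s_min**(1/rho) - s_max**(1/rho)))**rho
#
# so sampling starts at sigma_data * s_max and anneals toward sigma_data * s_min.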
"sample_diffusion": {
"gamma0": 0.8,
"gamma_min": 1.0,
"noise_scale_lambda": 1.003,
"step_scale_eta": 1.5,
"N_step": 200,
"N_sample": 5,
"N_step_mini_rollout": 20,
"N_sample_mini_rollout": 1,
},
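# Assumed mapping of the knobs above onto AF3's sampler (Algorithm 18 of the
# AF3 supplement): at each step, gamma = gamma0 when the current noise level
# exceeds gamma_min (else 0); fresh noise is injected with standard deviation
# noise_scale_lambda * sqrt(t_hat**2 - t_prev**2); and the denoiser update is
# scaled by step_scale_eta. The *_mini_rollout values configure the short
# rollout used during training (e.g. to supervise the confidence head).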
"model": {
"N_model_seed": 1, # for inference
"N_cycle": 4,
"input_embedder": {
"c_atom": GlobalConfigValue("c_atom"),
"c_atompair": GlobalConfigValue("c_atompair"),
"c_token": GlobalConfigValue("c_token"),
},
"relative_position_encoding": {
"r_max": 32,
"s_max": 2,
"c_z": GlobalConfigValue("c_z"),
},
"template_embedder": {
"c": 64,
"c_z": GlobalConfigValue("c_z"),
"n_blocks": 0,
"dropout": 0.25,
"blocks_per_ckpt": GlobalConfigValue("blocks_per_ckpt"),
},
"msa_module": {
"c_m": 64,
"c_z": GlobalConfigValue("c_z"),
"c_s_inputs": GlobalConfigValue("c_s_inputs"),
"n_blocks": 4,
"msa_dropout": 0.15,
"pair_dropout": 0.25,
"blocks_per_ckpt": GlobalConfigValue("blocks_per_ckpt"),
},
"pairformer": {
"n_blocks": GlobalConfigValue("n_blocks"),
"c_z": GlobalConfigValue("c_z"),
"c_s": GlobalConfigValue("c_s"),
"n_heads": 16,
"dropout": 0.25,
"blocks_per_ckpt": GlobalConfigValue("blocks_per_ckpt"),
},
"pairformer_encoder": {
"n_blocks": 6,
"c_z": GlobalConfigValue("c_z"),
"c_s": GlobalConfigValue("c_s"),
"n_heads": 16,
"dropout": 0.25,
"blocks_per_ckpt": GlobalConfigValue("blocks_per_ckpt"),
},
"pairformer_decoder": {
"n_blocks": 6,
"c_z": GlobalConfigValue("c_z"),
"c_s": GlobalConfigValue("c_s"),
"n_heads": 16,
"dropout": 0.25,
"blocks_per_ckpt": GlobalConfigValue("blocks_per_ckpt"),
},
"diffusion_module": {
"use_fine_grained_checkpoint": True,
"sigma_data": GlobalConfigValue("sigma_data"),
"c_token": 768,
"c_atom": GlobalConfigValue("c_atom"),
"c_atompair": GlobalConfigValue("c_atompair"),
"c_z": GlobalConfigValue("c_z"),
"c_s": GlobalConfigValue("c_s"),
"c_s_inputs": GlobalConfigValue("c_s_inputs"),
"initialization": {
"zero_init_condition_transition": False,
"zero_init_atom_encoder_residual_linear": False,
"he_normal_init_atom_encoder_small_mlp": False,
"he_normal_init_atom_encoder_output": False,
"glorot_init_self_attention": False,
"zero_init_adaln": True,
"zero_init_residual_condition_transition": False,
"zero_init_dit_output": True,
"zero_init_atom_decoder_linear": False,
},
"atom_encoder": {
"n_blocks": 3,
"n_heads": 4,
},
"transformer": {
"n_blocks": 24,
"n_heads": 16,
},
"atom_decoder": {
"n_blocks": 3,
"n_heads": 4,
},
"blocks_per_ckpt": GlobalConfigValue("blocks_per_ckpt"),
},
"diffusion_module_encoder_decoder": {
"use_fine_grained_checkpoint": True,
"sigma_data": GlobalConfigValue("sigma_data"),
"c_token": 768,
"c_atom": GlobalConfigValue("c_atom"),
"c_atompair": GlobalConfigValue("c_atompair"),
"c_z": GlobalConfigValue("c_z"),
"c_s": GlobalConfigValue("c_s"),
"c_s_inputs": GlobalConfigValue("c_s_inputs"),
"watermark": GlobalConfigValue("watermark"),
"initialization": {
"zero_init_condition_transition": False,
"zero_init_atom_encoder_residual_linear": False,
"he_normal_init_atom_encoder_small_mlp": False,
"he_normal_init_atom_encoder_output": False,
"glorot_init_self_attention": False,
"zero_init_adaln": True,
"zero_init_residual_condition_transition": False,
"zero_init_dit_output": True,
"zero_init_atom_decoder_linear": False,
},
"atom_encoder": {
"n_blocks": 3,
"n_heads": 4,
},
"transformer": {
"n_blocks": 6,
"n_heads": 16,
},
"atom_decoder": {
"n_blocks": 3,
"n_heads": 4,
},
"blocks_per_ckpt": GlobalConfigValue("blocks_per_ckpt"),
},
"confidence_head": {
"c_z": GlobalConfigValue("c_z"),
"c_s": GlobalConfigValue("c_s"),
"c_s_inputs": GlobalConfigValue("c_s_inputs"),
"n_blocks": 4,
"max_atoms_per_token": GlobalConfigValue("max_atoms_per_token"),
"pairformer_dropout": 0.0,
"blocks_per_ckpt": GlobalConfigValue("blocks_per_ckpt"),
"distance_bin_start": 3.25,
"distance_bin_end": 52.0,
"distance_bin_step": 1.25,
"stop_gradient": True,
},
"distogram_head": {
"c_z": GlobalConfigValue("c_z"),
"no_bins": GlobalConfigValue("no_bins"),
},
},
}

perm_configs = {
# Chain and Atom Permutation
"chain_permutation": {
"train": {
"mini_rollout": True,
"diffusion_sample": False,
},
"test": {
"diffusion_sample": True,
},
"permute_by_pocket": True,
"configs": {
"use_center_rmsd": False,
"find_gt_anchor_first": False,
"accept_it_as_it_is": False,
"enumerate_all_anchor_pairs": False,
"selection_metric": "aligned_rmsd",
},
},
"atom_permutation": {
"train": {
"mini_rollout": True,
"diffusion_sample": False,
},
"test": {
"diffusion_sample": True,
},
"permute_by_pocket": True,
"global_align_wo_symmetric_atom": False,
},
}

loss_configs = {
"loss": {
"diffusion_lddt_chunk_size": ValueMaybeNone(1),
"diffusion_bond_chunk_size": ValueMaybeNone(1),
"diffusion_chunk_size_outer": ValueMaybeNone(-1),
"diffusion_sparse_loss_enable": GlobalConfigValue("loss_metrics_sparse_enable"),
"diffusion_lddt_loss_dense": True, # only set true in initial training for training speed
"resolution": {"min": 0.1, "max": 4.0},
"weight": {
"alpha_confidence": 1e-4,
"alpha_pae": 0.0, # or 1 in finetuning stage 3
"alpha_except_pae": 1.0,
"alpha_diffusion": 4.0,
"alpha_distogram": 3e-2,
"alpha_bond": 0.0, # or 1 in finetuning stages
"smooth_lddt": 1.0, # or 0 in finetuning stages
"watermark": 1.0,
},
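# Assumed combination of the weights above, following AF3's overall loss:
#   L_total = alpha_distogram * L_distogram
#           + alpha_diffusion * L_diffusion    # MSE + bond + smooth_lddt terms
#           + alpha_confidence * L_confidence  # plddt / pde / pae / resolved
#           + weight["watermark"] * L_watermark  # FoldMark's watermark-recovery term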
"plddt": {
"min_bin": 0,
"max_bin": 1.0,
"no_bins": 50,
"normalize": True,
"eps": 1e-6,
},
"pde": {
"min_bin": 0,
"max_bin": 32,
"no_bins": 64,
"eps": 1e-6,
},
"resolved": {
"eps": 1e-6,
},
"pae": {
"min_bin": 0,
"max_bin": 32,
"no_bins": 64,
"eps": 1e-6,
},
"diffusion": {
"mse": {
"weight_mse": 1 / 3,
"weight_dna": 5.0,
"weight_rna": 5.0,
"weight_ligand": 10.0,
"eps": 1e-6,
},
"bond": {
"eps": 1e-6,
},
"smooth_lddt": {
"eps": 1e-6,
},
},
"watermark": {
"eps": 1e-6,
},
"distogram": {
"min_bin": 2.3125,
"max_bin": 21.6875,
"no_bins": 64,
"eps": 1e-6,
},
},
"metrics": {
"lddt": {
"eps": 1e-6,
},
"complex_ranker_keys": ListValue(["plddt", "gpde", "ranking_score"]),
"chain_ranker_keys": ListValue(["chain_ptm", "chain_plddt"]),
"interface_ranker_keys": ListValue(
["chain_pair_iptm", "chain_pair_iptm_global", "chain_pair_plddt"]
),
"clash": {"af3_clash_threshold": 1.1, "vdw_clash_threshold": 0.75},
},
}

configs = {
**basic_configs,
**data_configs,
**optim_configs,
**model_configs,
**perm_configs,
**loss_configs,
}
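
# Minimal usage sketch (hypothetical; the real entry point feeds these dicts
# through protenix's config machinery, which resolves GlobalConfigValue
# references and checks that every RequiredValue has been filled in):
#
#   from configs.configs_base import configs
#
#   configs["project"] = "foldmark"   # fill the RequiredValue fields
#   configs["run_name"] = "debug_run"
#   configs["base_dir"] = "./runs"
#   configs["max_steps"] = 100_000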