forked from Ligo-Biosciences/AlphaFold3
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Draft training pipeline and bug fixes
- Loading branch information
ardagoreci
committed
Jul 29, 2024
1 parent
6e01552
commit 96e9042
Showing
26 changed files
with
907 additions
and
400 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,20 +1,22 @@ | ||
_target_: src.data.protein_datamodule.ProteinDataModule | ||
_target_: src.data.components.protein_datamodule.ProteinDataModule | ||
data_dir: "./data/" | ||
resolution_thr: 3.5 # Resolution threshold for PDB structures | ||
min_seq_id: 0.3 # Minimum sequence identity for MMSeq2 clustering | ||
crop_size: 384 # The number of residues to crop the proteins to. | ||
crop_size: 128 # The number of residues to crop the proteins to. | ||
max_length: 10_000 # Entries with total length of chains larger than max_length will be disregarded. | ||
use_fraction: 1.0 # the fraction of the clusters to use (first N in alphabetic order) | ||
entry_type: "chain" # { "biounit", "chain", "pair" } the type of entries to generate | ||
classes_to_exclude: ['homomer', 'heteromer'] # a list of classes to exclude from the dataset | ||
mask_residues: False # if True, the masked residues will be added to the output | ||
classes_to_exclude: null # a list of classes to exclude from the dataset | ||
# - 'homomer' | ||
# - 'heteromer' | ||
mask_residues: false # if True, the masked residues will be added to the output | ||
lower_limit: 15 # the lower limit of the number of residues to mask | ||
upper_limit: 100 # the upper limit of the number of residues to mask | ||
mask_frac: None # if given, the number of residues to mask is mask_frac times the length of the chain | ||
mask_sequential: False # if True, the masked residues will be neighbors in the sequence; otherwise geometric mask | ||
mask_whole_chains: False # if True, the whole chain is masked | ||
force_binding_sites_frac: 0.15 | ||
batch_size: 12 # The batch size. Defaults to `64`. | ||
batch_size: 4 # The batch size. Defaults to `64`. | ||
num_workers: 7 # The number of workers. Defaults to `0`. | ||
pin_memory: True # Whether to pin memory. | ||
debug: True | ||
debug: False |
This file was deleted.
Oops, something went wrong.
This file was deleted.
Oops, something went wrong.
This file was deleted.
Oops, something went wrong.
Oops, something went wrong.