You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
split_type: "sequence_similarity"# Split sequences by sequence similarity clustering, other options are "random" and "time_cutoff"
14
-
split_sequence_similiarity: 0.3# Clustering at 30% sequence similarity (argument is ignored if split_type!="sequence_similarity")
15
-
overwrite_sequence_clusters: False # Previous clusterings at same sequence similarity are reused and not overwritten
16
-
split_time_frames: null # Time-cutoffs for train, val and test set (argument is ignored if split_type!="time_cutoff") - e.g., ["2020-01-01", "2021-01-01", "2023-03-01"]
17
-
train_val_test: [0.8, 0.1, 0.1] # Cross-validation ratios to use for train, val, and test splits
18
13
fraction: 1.0# Fraction of dataset to use
19
14
molecule_type: "protein"# Type of molecule for which to select
20
15
experiment_types: ["diffraction", "NMR", "EM", "other"] # All experiment types
@@ -28,4 +23,10 @@ datamodule:
28
23
remove_ligands: [] # Exclude specific ligands from any available protein-ligand complexes
29
24
remove_non_standard_residues: True # Include only proteins containing standard amino acid residues
30
25
remove_pdb_unavailable: True # Include only proteins that are available to download
26
+
train_val_test: [0.8, 0.1, 0.1] # Cross-validation ratios to use for train, val, and test splits
27
+
split_type: "sequence_similarity"# Split sequences by sequence similarity clustering, other options are "random" and "time_cutoff"
28
+
split_sequence_similiarity: 0.3# Clustering at 30% sequence similarity (argument is ignored if split_type!="sequence_similarity")
29
+
overwrite_sequence_clusters: False # Previous clusterings at same sequence similarity are reused and not overwritten
30
+
split_time_frames: null # Time-cutoffs for train, val and test set (argument is ignored if split_type!="time_cutoff") - e.g., ["2020-01-01", "2021-01-01", "2023-03-01"]
0 commit comments