1
+ # # Protein-ligand docking and docking poses re-ranking
2
+ # #
3
+ # # input: pdb structures from PDBbind refined dataset
4
+ # # output:
5
+ # # 1. docking poses
6
+ # # 2. scoring file (vina score, sfct correction, combined_score for re-ranking docking poses)
7
+
8
+ steps :
9
+ #
10
+ - extract_pdbbind_refined :
11
+ in :
12
+ # https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.query.html
13
+ # "The query() method uses a slightly modified Python syntax by default.
14
+ # For example, the & and | (bitwise) operators have the precedence of their boolean cousins, and and or.
15
+ # This is syntactically valid Python, however the semantics are different."
16
+ query : ' (Kd_Ki == "Kd") and (value < 0.000002)'
17
+ # to obtain a broader experimental dGs
18
+ max_row : 1
19
+ convert_Kd_dG : ' True'
20
+ output_txt_path : ' &binding_data.txt'
21
+ output_pdb_paths : ' &pdbbind_pdbs'
22
+ output_sdf_paths : ' &pdbbind_sdfs'
23
+ experimental_dGs : ' &exp_dGs'
24
+
25
+ - fix_side_chain :
26
+ scatter : [input_pdb_path]
27
+ in :
28
+ input_pdb_path : ' *pdbbind_pdbs'
29
+ output_pdb_path : ' &pdbbind_pdbs.pdb'
30
+
31
+ - minimize_ligand_only.yml :
32
+ scatter : [sdf_path]
33
+ in :
34
+ sdf_path : ' *pdbbind_sdfs'
35
+
36
+ - smina_docking :
37
+ scatter : [receptor_file, ligand_file, ligand_box]
38
+ scatterMethod : dotproduct
39
+ in :
40
+ receptor_file : ' *pdbbind_pdbs.pdb'
41
+ ligand_file : ' *ligand_min.mol2'
42
+ ligand_box : ' *ligand_min.mol2'
43
+ scoring : ' vina'
44
+ local_only : True
45
+ output_dock_file : ' &ligand_opt.pdb'
46
+ output_path : output
47
+
48
+ - clean_smina_pdb :
49
+ scatter : [input_pdb]
50
+ in :
51
+ input_pdb : ' *ligand_opt.pdb'
52
+ output_pdb : ' &ligand_opt_clean.pdb'
53
+
54
+ - cat_pdb :
55
+ scatter : [input_structure1, input_structure2]
56
+ scatterMethod : dotproduct
57
+ in :
58
+ input_structure1 : ' *pdbbind_pdbs.pdb'
59
+ input_structure2 : ' *ligand_opt_clean.pdb'
60
+ output_structure_path : ' &complex_pdbs.pdb'
61
+
62
+ - onionnet-feature :
63
+ scatter : [complex_path_file]
64
+ in :
65
+ complex_path_file : ' *complex_pdbs.pdb'
66
+ output_feature_file : ' &output_features.csv'
67
+
68
+ - onionnet-score :
69
+ scatter : [input_feature_file]
70
+ in :
71
+ input_feature_file : ' *output_features.csv'
72
+ output_score_file : ' &predicted_pKa.csv'
73
+ onionnet_score : ' &onionnet_score'
74
+
75
+ - scatter_plot :
76
+ in :
77
+ xs : ' *exp_dGs'
78
+ ys : ' *onionnet_score'
79
+
80
+ wic :
81
+ graphviz :
82
+ label : Protein-ligand docking (Smina) and docking poses re-ranking (OnionNet-sfct)
83
+ steps :
84
+ (1, extract_pdbbind_refined) :
85
+ wic :
86
+ graphviz :
87
+ label : extract protein-ligand structure (protein.pdb and ligand.sdf) from pdbbind_refined dataset
88
+ (2, fix_side_chain) :
89
+ wic :
90
+ graphviz :
91
+ label : fix_side_chain of protein structure.
92
+ (3, minimize_ligand_only.yml) :
93
+ wic :
94
+ inlineable : False
95
+ graphviz :
96
+ label : minimize (obminimize) ligand structure.
97
+ (4, smina_docking) :
98
+ wic :
99
+ graphviz :
100
+ label : Smina docking (flexible ligand - rigid protein docking)
0 commit comments