|
1 | 1 | {
|
2 |
| - "class": "CommandLineTool", |
3 |
| - "name": "diffdock", |
4 |
| - "description": "Docking of small molecules to a protein", |
5 |
| - "baseCommand": ["/bin/bash", "-c"], |
6 |
| - "arguments": [ |
7 |
| - "python datasets/esm_embedding_preparation.py --protein_path $(inputs.protein.filepath) --out_file /outputs/prepared_for_esm.fasta;", |
8 |
| - "HOME=esm/model_weights python esm/scripts/extract.py esm2_t33_650M_UR50D /outputs/prepared_for_esm.fasta /outputs/esm2_output --repr_layers $(inputs.repr_layers.default) --include per_tok && cp -r /outputs/esm2_output data/esm2_output;", |
9 |
| - "python -m inference --protein_path $(inputs.protein.filepath) --ligand $(inputs.small_molecule.filepath) --out_dir /outputs --inference_steps $(inputs.inference_steps.default) --samples_per_complex $(inputs.samples_per_complex.default) --batch_size $(inputs.batch_size.default) --actual_steps $(inputs.actual_steps.default) --no_final_step_noise;", |
10 |
| - "cp $(inputs.protein.filepath) /outputs" |
11 |
| - ], |
12 |
| - "dockerPull": "ghcr.io/labdao/diffdock:main@sha256:b00432de73478d3da578e4a16ee669178828109f3c7bf9c58d44bb7514f68629", |
13 |
| - "gpuBool": true, |
14 |
| - "networkBool": true, |
15 |
| - "memoryGB": 12, |
16 |
| - "inputs": { |
17 |
| - "protein": { |
18 |
| - "type": "File", |
19 |
| - "glob": ["*.pdb"] |
20 |
| - }, |
21 |
| - "small_molecule": { |
22 |
| - "type": "File", |
23 |
| - "glob": ["*.sdf", "*.mol2"] |
24 |
| - }, |
25 |
| - "repr_layers": { |
26 |
| - "type": "int", |
27 |
| - "default": "33" |
28 |
| - }, |
29 |
| - "inference_steps": { |
30 |
| - "type": "int", |
31 |
| - "default": "20" |
32 |
| - }, |
33 |
| - "samples_per_complex": { |
34 |
| - "type": "int", |
35 |
| - "default": "40" |
36 |
| - }, |
37 |
| - "batch_size": { |
38 |
| - "type": "int", |
39 |
| - "default": "10" |
40 |
| - }, |
41 |
| - "actual_steps": { |
42 |
| - "type": "int", |
43 |
| - "default": "18" |
44 |
| - } |
45 |
| - }, |
46 |
| - "outputs": { |
47 |
| - "best_docked_small_molecule": { |
48 |
| - "type": "File", |
49 |
| - "item": "", |
50 |
| - "glob": ["index*/rank1.sdf"] |
51 |
| - }, |
52 |
| - "all_docked_small_molecules": { |
53 |
| - "type": "Array", |
54 |
| - "item": "File", |
55 |
| - "glob": ["index*/rank*.sdf"] |
56 |
| - }, |
57 |
| - "protein": { |
58 |
| - "type": "File", |
59 |
| - "item": "", |
60 |
| - "glob": ["*.pdb"] |
61 |
| - } |
| 2 | + "class": "CommandLineTool", |
| 3 | + "name": "diffdock", |
| 4 | + "description": "Docking of small molecules to a protein", |
| 5 | + "author": "@misc{corso2023diffdock,\n title={DiffDock: Diffusion Steps, Twists, and Turns for Molecular Docking},\n author={Gabriele Corso and Hannes Stärk and Bowen Jing and Regina Barzilay and Tommi Jaakkola},\n year={2023},\n eprint={2210.01776},\n archivePrefix={arXiv},\n primaryClass={q-bio.BM}\n}", |
| 6 | + "baseCommand": ["/bin/bash", "-c"], |
| 7 | + "arguments": [ |
| 8 | + "python datasets/esm_embedding_preparation.py --protein_path $(inputs.protein.filepath) --out_file /outputs/prepared_for_esm.fasta;", |
| 9 | + "HOME=esm/model_weights python esm/scripts/extract.py esm2_t33_650M_UR50D /outputs/prepared_for_esm.fasta /outputs/esm2_output --repr_layers $(inputs.repr_layers.default) --include per_tok && cp -r /outputs/esm2_output data/esm2_output;", |
| 10 | + "python -m inference --protein_path $(inputs.protein.filepath) --ligand $(inputs.small_molecule.filepath) --out_dir /outputs --inference_steps $(inputs.inference_steps.default) --samples_per_complex $(inputs.samples_per_complex.default) --batch_size $(inputs.batch_size.default) --actual_steps $(inputs.actual_steps.default) --no_final_step_noise;", |
| 11 | + "cp $(inputs.protein.filepath) /outputs" |
| 12 | + ], |
| 13 | + "dockerPull": "ghcr.io/labdao/diffdock:main@sha256:b00432de73478d3da578e4a16ee669178828109f3c7bf9c58d44bb7514f68629", |
| 14 | + "gpuBool": true, |
| 15 | + "networkBool": true, |
| 16 | + "memoryGB": 12, |
| 17 | + "inputs": { |
| 18 | + "protein": { |
| 19 | + "type": "File", |
| 20 | + "glob": ["*.pdb"] |
| 21 | + }, |
| 22 | + "small_molecule": { |
| 23 | + "type": "File", |
| 24 | + "glob": ["*.sdf", "*.mol2"] |
| 25 | + }, |
| 26 | + "repr_layers": { |
| 27 | + "type": "int", |
| 28 | + "default": "33" |
| 29 | + }, |
| 30 | + "inference_steps": { |
| 31 | + "type": "int", |
| 32 | + "default": "20" |
| 33 | + }, |
| 34 | + "samples_per_complex": { |
| 35 | + "type": "int", |
| 36 | + "default": "40" |
| 37 | + }, |
| 38 | + "batch_size": { |
| 39 | + "type": "int", |
| 40 | + "default": "10" |
| 41 | + }, |
| 42 | + "actual_steps": { |
| 43 | + "type": "int", |
| 44 | + "default": "18" |
| 45 | + } |
| 46 | + }, |
| 47 | + "outputs": { |
| 48 | + "best_docked_small_molecule": { |
| 49 | + "type": "File", |
| 50 | + "item": "", |
| 51 | + "glob": ["index*/rank1.sdf"] |
| 52 | + }, |
| 53 | + "all_docked_small_molecules": { |
| 54 | + "type": "Array", |
| 55 | + "item": "File", |
| 56 | + "glob": ["index*/rank*.sdf"] |
| 57 | + }, |
| 58 | + "protein": { |
| 59 | + "type": "File", |
| 60 | + "item": "", |
| 61 | + "glob": ["*.pdb"] |
62 | 62 | }
|
| 63 | + } |
63 | 64 | }
|
0 commit comments