Fix (#806)

1b5820a5 · Mufei Li · Zihao Ye · 98b825e3 · 1b5820a5 · 1b5820a5
Commit 1b5820a5 authored Aug 29, 2019 by Mufei Li Committed by Zihao Ye Aug 29, 2019
Showing with 37 additions and 6 deletions

examples/pytorch/model_zoo/chem/README.md examples/pytorch/model_zoo/chem/README.md +34 -4

examples/pytorch/model_zoo/chem/generative_models/dgmg/utils.py ...es/pytorch/model_zoo/chem/generative_models/dgmg/utils.py +3 -2

No files found.
--- a/examples/pytorch/model_zoo/chem/README.md
+++ b/examples/pytorch/model_zoo/chem/README.md
@@ -23,8 +23,6 @@ The rest dependencies can be installed with `pip install -r requirements.txt`.
 ## Property Prediction
-[**Get started with our example code!**](https://github.com/dmlc/dgl/tree/master/examples/pytorch/model_zoo/chem/property_prediction)
 To evaluate molecules for drug candidates, we need to know their properties and activities. In practice, this is
 mostly achieved via wet lab experiments. We can cast the problem as a regression or classification problem.
 In practice, this can be quite difficult due to the scarcity of labeled data.
@@ -54,7 +52,22 @@ as front end and Set2Set for output prediction.
 ### Example Usage of Pre-trained Models
-![](https://s3.us-east-2.amazonaws.com/dgl.ai/model_zoo/drug_discovery/gcn_model_zoo_example.png)
+```python
+from dgl.data import Tox21
+from dgl import model_zoo
+dataset = Tox21()
+model = model_zoo.chem.load_pretrained('GCN_Tox21') # Pretrained model loaded
+model.eval()
+smiles, g, label, mask = dataset[0]
+feats = g.ndata.pop('h')
+label_pred = model(feats, g)
+print(smiles)                   # CCOc1ccc2nc(S(N)(=O)=O)sc2c1
+print(label_pred[:, mask != 0]) # Mask non-existing labels
+# tensor([[-0.7956,  0.4054,  0.4288, -0.5565, -0.0911,  
+# 0.9981, -0.1663,  0.2311, -0.2376,  0.9196]])
+```
 ## Generative Models
@@ -76,7 +89,24 @@ progressively adding atoms and bonds.
 ### Example Usage of Pre-trained Models
-![](https://s3.us-east-2.amazonaws.com/dgl.ai/model_zoo/drug_discovery/dgmg_model_zoo_example1.png)
+```python
+# We recommend running the code below with Jupyter notebooks
+from IPython.display import SVG
+from rdkit import Chem
+from rdkit.Chem import Draw
+from dgl import model_zoo
+model = model_zoo.chem.load_pretrained('DGMG_ZINC_canonical')
+model.eval()
+mols = []
+for i in range(4):
+    SMILES = model(rdkit_mol=True)
+    mols.append(Chem.MolFromSmiles(SMILES))
+# Generating 4 molecules takes less than a second.
+SVG(Draw.MolsToGridImage(mols, molsPerRow=4, subImgSize=(180, 150), useSVG=True))
+```
 ![](https://s3.us-east-2.amazonaws.com/dgl.ai/model_zoo/drug_discovery/dgmg_model_zoo_example2.png)

--- a/examples/pytorch/model_zoo/chem/generative_models/dgmg/utils.py
+++ b/examples/pytorch/model_zoo/chem/generative_models/dgmg/utils.py
@@ -578,6 +578,7 @@ def preprocess_dataset(atom_types, bond_types, smiles, max_num_atoms=23):
        mol = smiles_to_standard_mol(raw_s)
        if mol is None:
            continue
+        standard_s = Chem.MolToSmiles(mol)
        if (max_num_atoms is not None) and (mol.GetNumAtoms() > max_num_atoms):
            continue
@@ -586,10 +587,10 @@ def preprocess_dataset(atom_types, bond_types, smiles, max_num_atoms=23):
        canonical_mol = Chem.MolFromSmiles(canonical_s)
        random_mol = Chem.MolFromSmiles(random_s)
-        if (raw_s != canonical_s) or (canonical_s != random_s) or (canonical_mol is None) or (random_mol is None):
+        if (standard_s != canonical_s) or (canonical_s != random_s) or (canonical_mol is None) or (random_mol is None):
            continue
-        valid_smiles.append(Chem.MolToSmiles(mol))
+        valid_smiles.append(standard_s)
    valid_smiles = list(set(valid_smiles))
    return valid_smiles