Commit 3e011a10 authored by Joseph Gomes's avatar Joseph Gomes
Browse files

Fix SDF reader

parent 70016432
Loading
Loading
Loading
Loading
+1 −1
Original line number Diff line number Diff line
@@ -69,7 +69,7 @@ def load_sdf_files(input_files):
    raw_df = next(load_csv_files([input_file+".csv"], shard_size=None))
    # Structures are stored in .sdf file
    print("Reading structures from %s." % input_file)
    suppl = Chem.SDMolSupplier(str(input_file), removeHs=False)
    suppl = Chem.SDMolSupplier(str(input_file), False, False, False)
    df_rows = []
    for ind, mol in enumerate(suppl):
      if mol is not None:
+1 −1
Original line number Diff line number Diff line
echo "Pulling GDB7 dataset from deepchem"
#wget http://deepchem.io.s3-website-us-west-1.amazonaws.com/datasets/gdb7.tar.gz
wget http://deepchem.io.s3-website-us-west-1.amazonaws.com/datasets/gdb7.tar.gz
echo "Extracting gdb7 structures"
tar -zxvf gdb7.tar.gz