import urllib, sys,CoolProp, json sys.path.append('C:\RDKit_2014_09_2') from rdkit import Chem from collections import Counter for fluid in CoolProp.__fluids__: CAS = CoolProp.CoolProp.get_fluid_param_string(fluid, "CAS") print fluid, CAS, if '.ppf' in CAS or '.PPF' in CAS or 'o' in CAS or 'p' in CAS: print '' continue txt = urllib.urlretrieve('http://cactus.nci.nih.gov/chemical/structure/'+CAS+'/file?format=mol') with open(txt[0],'r') as fp: contents = fp.read() if '