Notebook
import pickle

import psycopg2

# Build a background set of ChEMBL compounds and cache it on disk as a pickle.
#
# The query pulls (chembl_id, serialized molecule) pairs from a BERNOULLI(5)
# table sample of rdk.mols (roughly 5% of the rows), joined to
# chembl_id_lookup for COMPOUND entries, and capped at 100000 rows.
# NOTE(review): the connection and cursor are intentionally left open because
# later code outside this block may reuse `cn` / `curs`; close them once
# nothing else needs them.
cn = psycopg2.connect(host='localhost', dbname='chembl_28')
curs = cn.cursor()
curs.execute('''select chembl_id,mol_send(m) from rdk.mols tablesample BERNOULLI(5) join chembl_id_lookup on (molregno=entity_id and entity_type='COMPOUND') limit 100000''')
chembl_data = curs.fetchall()

# Convert the second column to plain `bytes` before pickling.
# (presumably psycopg2 hands back a memoryview for the mol_send() output,
# which cannot be pickled directly -- confirm against the driver version)
chembl_data = [(x, y.tobytes()) for x, y in chembl_data]

# Use a context manager so the file is flushed and closed deterministically
# instead of relying on garbage collection of an anonymous file object.
with open('./results/chembl28_background_set.pkl', 'wb+') as outf:
    pickle.dump(chembl_data, outf)