diff --git a/.gitignore b/.gitignore index bbf65f7..f283f81 100644 --- a/.gitignore +++ b/.gitignore @@ -8,4 +8,6 @@ *.traj *__pycache__* **/.vscode/ -meta_production_sample.pkl \ No newline at end of file +meta_production_sample.pkl +development/**/*.csv +development/**/*.mol2 \ No newline at end of file diff --git a/architector/complex_construction.py b/architector/complex_construction.py index 40b43e4..1f236f5 100644 --- a/architector/complex_construction.py +++ b/architector/complex_construction.py @@ -487,7 +487,7 @@ def complex_driver(inputDict1): ligandDict = newligDict else: # Generate from scratch ligandDict = {} # - + coreCoordList = core_geo_class.geometry_dict[coreType] # Assign con atoms based on all ligands @@ -540,7 +540,7 @@ def complex_driver(inputDict1): out_energies.append(complexClass.calculator.energy) if inputDict['parameters']['return_only_1']: break - if not isinstance(complexClass, bool): # Catch cases where no conformation generated. + if not isinstance(complexClass, bool): # Catch cases where no conformation generated. order = np.argsort(out_energies) for ind, j in enumerate(order[0:inputDict[ 'parameters']['n_conformers']]): @@ -585,7 +585,7 @@ def complex_driver(inputDict1): return conf_dict,inputDict,core_preprocess_time,symmetry_preprocess_time,int_time1 else: return {},inputDict,0,0,0 - + def build_complex_driver(inputDict1): """build_complex_driver overall driver building of the complex @@ -787,12 +787,13 @@ def build_complex(inputDict): keys.append(key) vals.append(val) order = np.argsort(xtb_energies) - for j,i in enumerate(order): + for j, i in enumerate(order): if tmp_inputDict['parameters']['add_secondary_shell_species'] and \ (j < tmp_inputDict['parameters'][ 'secondary_shell_n_conformers']): if tmp_inputDict['parameters']['debug']: - print('Starting secondary shell addition on {} of {}!'.format(j+1,len(order))) + print('Starting secondary shell addition on {} of {}!'.format(j+1, + len(order))) print('Normally adds a chunk of time to generation.') # Use the docking function to add species specified in inputDict/parameters mol_plus_species, species_list = \ diff --git a/architector/io_process_input.py b/architector/io_process_input.py index 874d970..6f0f7bb 100644 --- a/architector/io_process_input.py +++ b/architector/io_process_input.py @@ -1094,12 +1094,13 @@ def inparse(inputDict): if metal in io_ptable.metal_charge_dict: outparams['metal_ox'] = io_ptable.metal_charge_dict[metal] else: # Pull lowest positive "main" oxidation state from mendeleev - elem = mendeleev.__dict__[newinpDict['core']['metal']] + elem = mendeleev.element(newinpDict['core']['metal']) outparams['metal_ox'] = [x.oxidation_state for x in elem._oxidation_states if (x.category == 'main') and (x.oxidation_state > 0)][0] if outparams['metal_spin'] is None: if outparams['metal_ox'] != io_ptable.metal_charge_dict.get(metal,100): # Calculate from mendeleev reference - Generally aufbau. - outparams['metal_spin'] = mendeleev.__dict__[newinpDict['core']['metal']].ec.ionize(outparams['metal_ox']).unpaired_electrons() + outparams['metal_spin'] = mendeleev.element( + newinpDict['core']['metal']).ec.ionize(outparams['metal_ox']).unpaired_electrons() else: # Otherwise use refdict. outparams['metal_spin'] = io_ptable.metal_spin_dict[metal] @@ -1434,12 +1435,13 @@ def inparse_2D(inputDict): if metal in io_ptable.metal_charge_dict: outparams['metal_ox'] = io_ptable.metal_charge_dict[metal] else: # Pull lowest positive "main" oxidation state from mendeleev - elem = mendeleev.__dict__[newinpDict['core']['metal']] + elem = mendeleev.element(newinpDict['core']['metal']) outparams['metal_ox'] = [x.oxidation_state for x in elem._oxidation_states if (x.category == 'main') and (x.oxidation_state > 0)][0] if outparams['metal_spin'] is None: if outparams['metal_ox'] != io_ptable.metal_charge_dict.get(metal,100): # Calculate from mendeleev reference - Generally aufbau. - outparams['metal_spin'] = mendeleev.__dict__[newinpDict['core']['metal']].ec.ionize(outparams['metal_ox']).unpaired_electrons() + outparams['metal_spin'] = mendeleev.element( + newinpDict['core']['metal']).ec.ionize(outparams['metal_ox']).unpaired_electrons() else: # Otherwise use refdict. outparams['metal_spin'] = io_ptable.metal_spin_dict[metal] diff --git a/development/dipole_conformers.ipynb b/development/dipole_conformers.ipynb new file mode 100644 index 0000000..d7c6f45 --- /dev/null +++ b/development/dipole_conformers.ipynb @@ -0,0 +1,301 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [], + "source": [ + "from architector.io_obabel import generate_obmol_conformers\n", + "from architector.io_calc import CalcExecutor\n", + "from architector import view_structures, convert_io_molecule\n", + "import numpy as np" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": {}, + "outputs": [], + "source": [ + "example_smi = '[O-]CCCCCCCC'" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "metadata": {}, + "outputs": [ + { + "data": { + "application/3dmoljs_load.v0": "
3Dmol.js failed to load for some reason. Please check your browser console for error messages.
3Dmol.js failed to load for some reason. Please check your browser console for error messages.
\n", + " | ID | \n", + "Name | \n", + "InChIKey | \n", + "SMILES | \n", + "Solubility | \n", + "
---|---|---|---|---|---|
0 | \n", + "A-3 | \n", + "N,N,N-trimethyloctadecan-1-aminium bromide | \n", + "SZEMGTQCPRNXEG-UHFFFAOYSA-M | \n", + "[Br-].CCCCCCCCCCCCCCCCCC[N+](C)(C)C | \n", + "-3.616127 | \n", + "
1 | \n", + "A-4 | \n", + "Benzo[cd]indol-2(1H)-one | \n", + "GPYLCFQEKPUWLD-UHFFFAOYSA-N | \n", + "O=C1Nc2cccc3cccc1c23 | \n", + "-3.254767 | \n", + "
2 | \n", + "A-5 | \n", + "4-chlorobenzaldehyde | \n", + "AVPYQKSLYISFPO-UHFFFAOYSA-N | \n", + "Clc1ccc(C=O)cc1 | \n", + "-2.177078 | \n", + "
3 | \n", + "A-8 | \n", + "zinc bis[2-hydroxy-3,5-bis(1-phenylethyl)benzo... | \n", + "XTUPUYCJWKHGSW-UHFFFAOYSA-L | \n", + "[Zn++].CC(c1ccccc1)c2cc(C(C)c3ccccc3)c(O)c(c2)... | \n", + "-3.924409 | \n", + "
4 | \n", + "A-9 | \n", + "4-({4-[bis(oxiran-2-ylmethyl)amino]phenyl}meth... | \n", + "FAUAZXVRLVIARB-UHFFFAOYSA-N | \n", + "C1OC1CN(CC2CO2)c3ccc(Cc4ccc(cc4)N(CC5CO5)CC6CO... | \n", + "-4.662065 | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
9977 | \n", + "I-84 | \n", + "tetracaine | \n", + "GKCBAIGFKIBETG-UHFFFAOYSA-N | \n", + "C(c1ccc(cc1)NCCCC)(=O)OCCN(C)C | \n", + "-3.010000 | \n", + "
9978 | \n", + "I-85 | \n", + "tetracycline | \n", + "OFVLGDICTFRJMM-WESIUVDSSA-N | \n", + "OC1=C(C(C2=C(O)[C@@](C(C(C(N)=O)=C(O)[C@H]3N(C... | \n", + "-2.930000 | \n", + "
9979 | \n", + "I-86 | \n", + "thymol | \n", + "MGSRCZKZVOBKFT-UHFFFAOYSA-N | \n", + "c1(cc(ccc1C(C)C)C)O | \n", + "-2.190000 | \n", + "
9980 | \n", + "I-93 | \n", + "verapamil | \n", + "SGTNSNPWRIOYBX-UHFFFAOYSA-N | \n", + "COc1ccc(CCN(C)CCCC(C#N)(C(C)C)c2ccc(OC)c(OC)c2... | \n", + "-3.980000 | \n", + "
9981 | \n", + "I-94 | \n", + "warfarin | \n", + "PJVWKTKQMONHTI-UHFFFAOYSA-N | \n", + "CC(=O)CC(c1ccccc1)c1c(O)c2ccccc2oc1=O | \n", + "-4.780000 | \n", + "
9982 rows × 5 columns
\n", + "3Dmol.js failed to load for some reason. Please check your browser console for error messages.
3Dmol.js failed to load for some reason. Please check your browser console for error messages.
3Dmol.js failed to load for some reason. Please check your browser console for error messages.
3Dmol.js failed to load for some reason. Please check your browser console for error messages.
3Dmol.js failed to load for some reason. Please check your browser console for error messages.
3Dmol.js failed to load for some reason. Please check your browser console for error messages.
\n", + " | energy | \n", + "free_energy | \n", + "forces | \n", + "dipole | \n", + "charges | \n", + "xtb_mol2 | \n", + "
---|---|---|---|---|---|---|
0 | \n", + "-941.953893 | \n", + "-941.953893 | \n", + "[[-0.0064054274805771675, 0.002893010498177088... | \n", + "[-0.04072509722616722, 0.4271721600245919, 0.5... | \n", + "[-0.11478628082344275, 0.003135417180573183, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
1 | \n", + "-941.950280 | \n", + "-941.950280 | \n", + "[[-0.005747968896342007, 0.0018745948789265158... | \n", + "[-0.17535441597366486, -0.4851559094552098, 0.... | \n", + "[-0.11412520265988979, 0.0030248534750732248, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
2 | \n", + "-942.042879 | \n", + "-942.042879 | \n", + "[[-0.004074275762437106, -0.004648667982582211... | \n", + "[-0.04347311031771758, -0.537465498185844, 0.1... | \n", + "[-0.11308169713123725, 0.0046844825432522524, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
3 | \n", + "-941.917303 | \n", + "-941.917303 | \n", + "[[0.02297184960918795, -0.007096980853435831, ... | \n", + "[-0.1081611768128786, 0.5700338757740078, 0.39... | \n", + "[-0.11282084473184698, 0.00343528545446857, -0... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
4 | \n", + "-941.925803 | \n", + "-941.925803 | \n", + "[[-0.00950542960255489, 0.0013225729101183279,... | \n", + "[0.03999807451346173, 0.5137888912027536, 0.43... | \n", + "[-0.1133431929759389, 0.004619124125817553, -0... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
5 | \n", + "-941.944995 | \n", + "-941.944995 | \n", + "[[-0.012649020593404663, 0.008891172917475326,... | \n", + "[-0.02019514472401081, 0.3534161701592894, 0.5... | \n", + "[-0.1132901094327726, 0.0038520755462167766, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
6 | \n", + "-941.963922 | \n", + "-941.963922 | \n", + "[[-0.004040395285581353, -0.005494595557095002... | \n", + "[-0.2760326399408978, -0.6226984118173071, 0.2... | \n", + "[-0.1132794690839442, 0.005506370801200339, -0... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
7 | \n", + "-941.933859 | \n", + "-941.933859 | \n", + "[[-0.03113600670791028, -0.012523592246384135,... | \n", + "[-0.4646939981518977, -0.4543851187179526, 0.2... | \n", + "[-0.11455749486667728, 0.004402608688685528, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
8 | \n", + "-941.933840 | \n", + "-941.933840 | \n", + "[[-0.0023090121795046, -0.0012468292679679693,... | \n", + "[-0.11902841857768293, 0.37839388841507415, 0.... | \n", + "[-0.11360419866355351, 0.0037736931269920365, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
9 | \n", + "-941.942060 | \n", + "-941.942060 | \n", + "[[-0.005573365585241426, 0.016333912964534444,... | \n", + "[0.008244584381401365, 0.3509699766971826, 0.3... | \n", + "[-0.11019970991046024, 0.005848684216261016, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
10 | \n", + "-941.982895 | \n", + "-941.982895 | \n", + "[[-0.005789551710469486, -0.005415001277539138... | \n", + "[-0.20080321600305756, -0.441855094329486, 0.2... | \n", + "[-0.11285473497350985, 0.005063549018848312, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
11 | \n", + "-941.989306 | \n", + "-941.989306 | \n", + "[[0.0023797569165056494, 0.0014927387150377607... | \n", + "[-0.34217775743938655, 0.206008261524908, 0.39... | \n", + "[-0.11232483049930286, 0.0042552854505437665, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
12 | \n", + "-941.996077 | \n", + "-941.996077 | \n", + "[[0.007872942006244004, -0.015973658216846945,... | \n", + "[-0.03057891685648984, -0.6035728943770056, 0.... | \n", + "[-0.11466408844107442, 0.0030596302840158046, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
13 | \n", + "-941.961751 | \n", + "-941.961751 | \n", + "[[0.013873978777933609, 0.008714346279801942, ... | \n", + "[-0.3090836179001432, -0.5710604396804403, 0.2... | \n", + "[-0.11457207094463301, 0.004317772363820485, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
14 | \n", + "-941.945587 | \n", + "-941.945587 | \n", + "[[0.02330201120535815, 0.0037549411116072928, ... | \n", + "[-0.06403308012802437, 0.4502260235518645, 0.3... | \n", + "[-0.11190094981249321, 0.006234969573618007, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
15 | \n", + "-941.959734 | \n", + "-941.959734 | \n", + "[[-0.004274421525671059, 0.00933781864063549, ... | \n", + "[-0.2996062613744575, 0.42448345272549765, 0.4... | \n", + "[-0.11448587052718476, 0.00301700806848354, -0... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
16 | \n", + "-941.957871 | \n", + "-941.957871 | \n", + "[[0.029044434923186434, -0.014841328242279772,... | \n", + "[-0.20993014063235144, 0.49726264633227535, 0.... | \n", + "[-0.11264407067753646, 0.0032690517505117173, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
17 | \n", + "-941.975852 | \n", + "-941.975852 | \n", + "[[0.013154518965379634, 0.00377022015669898, 0... | \n", + "[0.008486763537757912, 0.4417631514538985, 0.4... | \n", + "[-0.11406889911063403, 0.003555211048615295, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
18 | \n", + "-942.008965 | \n", + "-942.008965 | \n", + "[[-0.007688946886930841, 0.0037896335380984384... | \n", + "[0.10234664997307748, -0.5114196914304929, 0.2... | \n", + "[-0.11205578255935358, 0.004674101182466722, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
19 | \n", + "-941.966669 | \n", + "-941.966669 | \n", + "[[0.0026953435096534087, 0.002979370969931447,... | \n", + "[-0.2988712089214222, 0.4570317276286429, -0.1... | \n", + "[-0.11239806409192919, 0.0021378138634558785, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
20 | \n", + "-941.976303 | \n", + "-941.976303 | \n", + "[[0.00949072281355, -0.003257001332871327, 0.0... | \n", + "[-0.4087391157241313, 0.3738489962543335, 0.38... | \n", + "[-0.11341018058416302, 0.0010303001999083239, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
21 | \n", + "-941.957536 | \n", + "-941.957536 | \n", + "[[-0.006712128253738265, 0.003174343250744261,... | \n", + "[-0.07689631278551505, 0.49246974693425255, 0.... | \n", + "[-0.11285616336687668, 0.0006248046019975695, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
22 | \n", + "-941.986535 | \n", + "-941.986535 | \n", + "[[0.0031198718917791464, 0.0035276424727782303... | \n", + "[-0.13607065699767962, 0.32826054550023237, -0... | \n", + "[-0.11352561367974287, 0.0022344351214790142, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
23 | \n", + "-941.968502 | \n", + "-941.968502 | \n", + "[[-0.0008081220351732268, -0.02263822517147316... | \n", + "[-0.272093398576091, 0.4600825022722129, -0.12... | \n", + "[-0.11395220340664092, 0.00478164559167335, -0... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
24 | \n", + "-941.944514 | \n", + "-941.944514 | \n", + "[[-0.013292161034476373, 0.006266857420767831,... | \n", + "[-0.19348582923642033, 0.4954191617800937, -0.... | \n", + "[-0.11329557958925107, 0.004670431551598034, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
25 | \n", + "-941.967755 | \n", + "-941.967755 | \n", + "[[0.018707547630603883, -0.006985174117220028,... | \n", + "[-0.24485392634771252, 0.37875702621492124, 0.... | \n", + "[-0.11473579876678727, 0.0038344852950510933, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
26 | \n", + "-941.981779 | \n", + "-941.981779 | \n", + "[[0.0042593208766267395, -0.001137467886214728... | \n", + "[0.3710727954892336, 0.5068447243139468, 0.433... | \n", + "[-0.11302409334121935, 0.005889123355889356, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
27 | \n", + "-941.937742 | \n", + "-941.937742 | \n", + "[[-0.004415312469214524, -0.020941742452419677... | \n", + "[-0.33549841731401703, -0.21726389396929238, -... | \n", + "[-0.11295230012463539, 0.003917668476299971, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
28 | \n", + "-941.959590 | \n", + "-941.959590 | \n", + "[[-0.0019702566455652728, -0.00723399908969859... | \n", + "[-0.1692058793516984, 0.4845564511321144, -0.2... | \n", + "[-0.11328248251225162, 0.0031808024696459575, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
29 | \n", + "-941.932717 | \n", + "-941.932717 | \n", + "[[-0.028987095684595784, -0.002520984421162864... | \n", + "[0.11355148006057446, 0.31523511055311776, 0.5... | \n", + "[-0.11290935710169636, 0.0052879522534911155, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
30 | \n", + "-942.005847 | \n", + "-942.005847 | \n", + "[[-0.029631153712220554, 0.007592473178661552,... | \n", + "[0.017330046307516635, -0.3929130878068432, -0... | \n", + "[-0.11221807413984114, 0.004229490258218435, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
31 | \n", + "-941.901757 | \n", + "-941.901757 | \n", + "[[0.004824352437003144, -0.009401487785090024,... | \n", + "[0.25575055726103113, 0.40874344166617377, 0.3... | \n", + "[-0.11242996946527903, -0.0002510390197548451,... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
32 | \n", + "-941.950690 | \n", + "-941.950690 | \n", + "[[0.0026851207587491373, 0.0068610564945188945... | \n", + "[-0.2803754786065773, -0.5334886680474346, 0.3... | \n", + "[-0.1143846573356333, 0.0007603854631822171, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
33 | \n", + "-941.968843 | \n", + "-941.968843 | \n", + "[[-0.01867505201993493, 0.003181643012599281, ... | \n", + "[-0.15301724594136062, 0.2790231605693987, 0.4... | \n", + "[-0.11036408143591933, 0.004562874819385346, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
34 | \n", + "-941.960774 | \n", + "-941.960774 | \n", + "[[-0.011877644788936905, -0.026954376709123075... | \n", + "[-0.180940180910476, 0.5516790344836181, -0.03... | \n", + "[-0.11294364578269431, 0.0058543182899778445, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
35 | \n", + "-942.014285 | \n", + "-942.014285 | \n", + "[[0.0022976800395958846, -0.013589687592119109... | \n", + "[-0.1233117303197784, 0.404802148964335, -0.22... | \n", + "[-0.11307602877487552, 0.002501638750332616, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
36 | \n", + "-941.903403 | \n", + "-941.903403 | \n", + "[[-0.02331996214296517, 0.010685002632797171, ... | \n", + "[-0.332922798967579, -0.12642438605821282, -0.... | \n", + "[-0.11343353190285174, 0.0043780086253094735, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
37 | \n", + "-942.007395 | \n", + "-942.007395 | \n", + "[[0.0037780741836213076, 0.01902316925118944, ... | \n", + "[-0.1858311274812901, -0.21594710678209902, -0... | \n", + "[-0.11177213363081451, 0.004453577860408647, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
38 | \n", + "-941.988840 | \n", + "-941.988840 | \n", + "[[-0.03240830104540279, -0.02253494700723065, ... | \n", + "[-0.2555268008384709, -0.029942606439405283, -... | \n", + "[-0.11609808215104198, 0.006123767778125511, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
39 | \n", + "-941.969572 | \n", + "-941.969572 | \n", + "[[0.0040911268112533246, 0.012365663907514207,... | \n", + "[-0.2663932517587651, 0.26697139093640154, -0.... | \n", + "[-0.11165253467512878, 0.0049063381096841885, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
40 | \n", + "-941.927235 | \n", + "-941.927235 | \n", + "[[-0.008174874431749588, 0.013413745987587647,... | \n", + "[0.20904164456672533, 0.448837039860279, 0.397... | \n", + "[-0.1145075396193811, 0.0021868780484034234, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
41 | \n", + "-942.000749 | \n", + "-942.000749 | \n", + "[[0.01962134024504779, 0.003156185634012357, 0... | \n", + "[-0.06965001336782749, -0.3691016573623966, -0... | \n", + "[-0.11276189668287563, 0.004253667859406118, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
42 | \n", + "-941.971101 | \n", + "-941.971101 | \n", + "[[-0.004151267084641824, 0.00915523136618795, ... | \n", + "[-0.4321532218356113, 0.20033685859622585, 0.1... | \n", + "[-0.11322831382126233, 0.004611301130298395, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
43 | \n", + "-941.939776 | \n", + "-941.939776 | \n", + "[[-0.010520437363048455, 0.003726169169612492,... | \n", + "[0.06603613307825389, 0.40741966296805665, -0.... | \n", + "[-0.11132501957504222, 0.005441943149804271, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
44 | \n", + "-941.953197 | \n", + "-941.953197 | \n", + "[[0.0018059801146283656, -0.00335369257013824,... | \n", + "[-0.20444341850718695, -0.4359319005681523, -0... | \n", + "[-0.11333333683408459, 0.0009756690332999446, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
45 | \n", + "-941.946527 | \n", + "-941.946527 | \n", + "[[0.014795988019366456, 0.02189946451324612, 0... | \n", + "[-0.3175890531027094, 0.43342801047633495, -0.... | \n", + "[-0.11427698722596516, 0.0023814808037803115, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
46 | \n", + "-941.940041 | \n", + "-941.940041 | \n", + "[[0.00015349676460309794, -0.00903777215247311... | \n", + "[0.019740685879562958, 0.6193679712236572, 0.4... | \n", + "[-0.11393793263361515, 0.006143554757771022, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
47 | \n", + "-941.976173 | \n", + "-941.976173 | \n", + "[[-0.00358151778159043, 0.01569987890645837, 0... | \n", + "[-0.4206374798811715, 0.3549809044674297, 0.01... | \n", + "[-0.11447556030989668, 0.001317522791494885, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
48 | \n", + "-941.952127 | \n", + "-941.952127 | \n", + "[[-0.0028454505148780237, 0.014495838430332444... | \n", + "[-0.030667465591407494, -0.3920030947808661, -... | \n", + "[-0.11077041313482294, 0.0063098981597411175, ... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
49 | \n", + "-941.940078 | \n", + "-941.940078 | \n", + "[[0.005687163462374582, 0.009315960485936454, ... | \n", + "[-0.423702477923642, 0.1986383126846553, 0.494... | \n", + "[-0.11355494951655856, 0.001975819011750174, -... | \n", + "@<TRIPOS>MOLECULE\\nGFn2-XTB_relax Charge: 0 Un... | \n", + "
\n", + " | ID | \n", + "Name | \n", + "InChIKey | \n", + "SMILES | \n", + "Solubility | \n", + "
---|---|---|---|---|---|
1 | \n", + "A-4 | \n", + "Benzo[cd]indol-2(1H)-one | \n", + "GPYLCFQEKPUWLD-UHFFFAOYSA-N | \n", + "O=C1Nc2cccc3cccc1c23 | \n", + "-3.254767 | \n", + "
2 | \n", + "A-5 | \n", + "4-chlorobenzaldehyde | \n", + "AVPYQKSLYISFPO-UHFFFAOYSA-N | \n", + "Clc1ccc(C=O)cc1 | \n", + "-2.177078 | \n", + "
4 | \n", + "A-9 | \n", + "4-({4-[bis(oxiran-2-ylmethyl)amino]phenyl}meth... | \n", + "FAUAZXVRLVIARB-UHFFFAOYSA-N | \n", + "C1OC1CN(CC2CO2)c3ccc(Cc4ccc(cc4)N(CC5CO5)CC6CO... | \n", + "-4.662065 | \n", + "
5 | \n", + "A-10 | \n", + "vinyltoluene | \n", + "JZHGRUMIRATHIU-UHFFFAOYSA-N | \n", + "Cc1cccc(C=C)c1 | \n", + "-3.123150 | \n", + "
6 | \n", + "A-11 | \n", + "3-(3-ethylcyclopentyl)propanoic acid | \n", + "WVRFSLWCFASCIS-UHFFFAOYSA-N | \n", + "CCC1CCC(CCC(O)=O)C1 | \n", + "-3.286116 | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
9977 | \n", + "I-84 | \n", + "tetracaine | \n", + "GKCBAIGFKIBETG-UHFFFAOYSA-N | \n", + "C(c1ccc(cc1)NCCCC)(=O)OCCN(C)C | \n", + "-3.010000 | \n", + "
9978 | \n", + "I-85 | \n", + "tetracycline | \n", + "OFVLGDICTFRJMM-WESIUVDSSA-N | \n", + "OC1=C(C(C2=C(O)[C@@](C(C(C(N)=O)=C(O)[C@H]3N(C... | \n", + "-2.930000 | \n", + "
9979 | \n", + "I-86 | \n", + "thymol | \n", + "MGSRCZKZVOBKFT-UHFFFAOYSA-N | \n", + "c1(cc(ccc1C(C)C)C)O | \n", + "-2.190000 | \n", + "
9980 | \n", + "I-93 | \n", + "verapamil | \n", + "SGTNSNPWRIOYBX-UHFFFAOYSA-N | \n", + "COc1ccc(CCN(C)CCCC(C#N)(C(C)C)c2ccc(OC)c(OC)c2... | \n", + "-3.980000 | \n", + "
9981 | \n", + "I-94 | \n", + "warfarin | \n", + "PJVWKTKQMONHTI-UHFFFAOYSA-N | \n", + "CC(=O)CC(c1ccccc1)c1c(O)c2ccccc2oc1=O | \n", + "-4.780000 | \n", + "
8797 rows × 5 columns
\n", + "