Prediction of Aqueous Solubility of Organic Compounds from Molecular Structure. Mitchell, B. & Jurs, P. J.~Chem.~Inf.~Comput.~Sci., 38:489--496, 1998. abstract bibtex Multiple linear regression (MLR) and computational neural networks (CNN) are utilized to develop mathematical models to relate the structures of a diverse set of 332 organic compounds to their aqueous solubilities. Topological, geometric, and electronic descriptors are used to numerically represent structural features of the data set compounds. Genetic algorithm and simulated annealing routines, in conjunction with MLR and CNN, are used to select subsets of descriptors that accurately relate to aqueous solubility. Nonlinear models with nine calculated structural descriptors are developed that have a training set root-mean-square error of 0.394 log units for compounds which span a −log(molarity) range from −2 to +12 log units.
@article{Mitchell:1998pi,
Abstract = {Multiple linear regression (MLR) and computational neural networks (CNN) are utilized to develop mathematical models to relate the structures of a diverse set of 332 organic compounds to their aqueous solubilities. Topological, geometric, and electronic descriptors are used to numerically represent structural features of the data set compounds. Genetic algorithm and simulated annealing routines, in conjunction with MLR and CNN, are used to select subsets of descriptors that accurately relate to aqueous solubility. Nonlinear models with nine calculated structural descriptors are developed that have a training set root-mean-square error of 0.394 log units for compounds which span a −log(molarity) range from −2 to +12 log units.},
Author = {Mitchell, B.E. and Jurs, P.C.},
Date-Added = {2009-04-14 11:51:45 -0400},
Date-Modified = {2009-04-14 11:52:40 -0400},
Journal = {J.~Chem.~Inf.~Comput.~Sci.},
Keywords = {qsar; solubility},
Pages = {489--496},
Title = {Prediction of Aqueous Solubility of Organic Compounds from Molecular Structure},
Volume = {38},
Year = {1998},
Bdsk-File-1 = {YnBsaXN0MDDUAQIDBAUIJidUJHRvcFgkb2JqZWN0c1gkdmVyc2lvblkkYXJjaGl2ZXLRBgdUcm9vdIABqAkKFRYXGyIjVSRudWxs0wsMDQ4RElpOUy5vYmplY3RzViRjbGFzc1dOUy5rZXlzog8QgASABoAHohMUgAKAA1lhbGlhc0RhdGFccmVsYXRpdmVQYXRo0hgMGRpXTlMuZGF0YU8RAW4AAAAAAW4AAgAAA212IAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAMU5bQNIKwAAABCNbQ1jaTk3MDExN2YucGRmAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAALZmVxgooeAAAAAAAAAAAAAIAAwAACSAAAAAAAAAAAAAAAAAAAAAIYXJ0aWNsZXMAEAAIAADFObNTAAAAEQAIAADGCmC4AAAAAQAQABCNbQAKTIAACkxpAAB8EwACADBtdiA6VXNlcnM6cmd1aGE6RG9jdW1lbnRzOmFydGljbGVzOmNpOTcwMTE3Zi5wZGYADgAcAA0AYwBpADkANwAwADEAMQA3AGYALgBwAGQAZgAPAAgAAwBtAHYAIAASACxVc2Vycy9yZ3VoYS9Eb2N1bWVudHMvYXJ0aWNsZXMvY2k5NzAxMTdmLnBkZgATAAEvAAAVAAIADP//AACABdIcHR4fWCRjbGFzc2VzWiRjbGFzc25hbWWjHyAhXU5TTXV0YWJsZURhdGFWTlNEYXRhWE5TT2JqZWN0XxAmLi4vLi4vRG9jdW1lbnRzL2FydGljbGVzL2NpOTcwMTE3Zi5wZGbSHB0kJaIlIVxOU0RpY3Rpb25hcnkSAAGGoF8QD05TS2V5ZWRBcmNoaXZlcgAIABEAFgAfACgAMgA1ADoAPABFAEsAUgBdAGQAbABvAHEAcwB1AHgAegB8AIYAkwCYAKACEgIUAhkCIgItAjECPwJGAk8CeAJ9AoACjQKSAAAAAAAAAgEAAAAAAAAAKAAAAAAAAAAAAAAAAAAAAqQ=},
Bdsk-Url-1 = {http://dx.doi.org/10.1021/ci970117f}}
Downloads: 0
{"_id":"TG7T92TFgqTCpbkkJ","bibbaseid":"mitchell-jurs-predictionofaqueoussolubilityoforganiccompoundsfrommolecularstructure-1998","downloads":0,"creationDate":"2016-02-18T13:03:30.514Z","title":"Prediction of Aqueous Solubility of Organic Compounds from Molecular Structure","author_short":["Mitchell, B.","Jurs, P."],"year":1998,"bibtype":"article","biburl":"https://dl.dropboxusercontent.com/u/26998770/main.bib","bibdata":{"bibtype":"article","type":"article","abstract":"Multiple linear regression (MLR) and computational neural networks (CNN) are utilized to develop mathematical models to relate the structures of a diverse set of 332 organic compounds to their aqueous solubilities. Topological, geometric, and electronic descriptors are used to numerically represent structural features of the data set compounds. Genetic algorithm and simulated annealing routines, in conjunction with MLR and CNN, are used to select subsets of descriptors that accurately relate to aqueous solubility. Nonlinear models with nine calculated structural descriptors are developed that have a training set root-mean-square error of 0.394 log units for compounds which span a −log(molarity) range from −2 to +12 log units.","author":[{"propositions":[],"lastnames":["Mitchell"],"firstnames":["B.E."],"suffixes":[]},{"propositions":[],"lastnames":["Jurs"],"firstnames":["P.C."],"suffixes":[]}],"date-added":"2009-04-14 11:51:45 -0400","date-modified":"2009-04-14 11:52:40 -0400","journal":"J.~Chem.~Inf.~Comput.~Sci.","keywords":"qsar; solubility","pages":"489--496","title":"Prediction of Aqueous Solubility of Organic Compounds from Molecular Structure","volume":"38","year":"1998","bdsk-file-1":"YnBsaXN0MDDUAQIDBAUIJidUJHRvcFgkb2JqZWN0c1gkdmVyc2lvblkkYXJjaGl2ZXLRBgdUcm9vdIABqAkKFRYXGyIjVSRudWxs0wsMDQ4RElpOUy5vYmplY3RzViRjbGFzc1dOUy5rZXlzog8QgASABoAHohMUgAKAA1lhbGlhc0RhdGFccmVsYXRpdmVQYXRo0hgMGRpXTlMuZGF0YU8RAW4AAAAAAW4AAgAAA212IAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAMU5bQNIKwAAABCNbQ1jaTk3MDExN2YucGRmAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAALZmVxgooeAAAAAAAAAAAAAIAAwAACSAAAAAAAAAAAAAAAAAAAAAIYXJ0aWNsZXMAEAAIAADFObNTAAAAEQAIAADGCmC4AAAAAQAQABCNbQAKTIAACkxpAAB8EwACADBtdiA6VXNlcnM6cmd1aGE6RG9jdW1lbnRzOmFydGljbGVzOmNpOTcwMTE3Zi5wZGYADgAcAA0AYwBpADkANwAwADEAMQA3AGYALgBwAGQAZgAPAAgAAwBtAHYAIAASACxVc2Vycy9yZ3VoYS9Eb2N1bWVudHMvYXJ0aWNsZXMvY2k5NzAxMTdmLnBkZgATAAEvAAAVAAIADP//AACABdIcHR4fWCRjbGFzc2VzWiRjbGFzc25hbWWjHyAhXU5TTXV0YWJsZURhdGFWTlNEYXRhWE5TT2JqZWN0XxAmLi4vLi4vRG9jdW1lbnRzL2FydGljbGVzL2NpOTcwMTE3Zi5wZGbSHB0kJaIlIVxOU0RpY3Rpb25hcnkSAAGGoF8QD05TS2V5ZWRBcmNoaXZlcgAIABEAFgAfACgAMgA1ADoAPABFAEsAUgBdAGQAbABvAHEAcwB1AHgAegB8AIYAkwCYAKACEgIUAhkCIgItAjECPwJGAk8CeAJ9AoACjQKSAAAAAAAAAgEAAAAAAAAAKAAAAAAAAAAAAAAAAAAAAqQ=","bdsk-url-1":"http://dx.doi.org/10.1021/ci970117f","bibtex":"@article{Mitchell:1998pi,\n\tAbstract = {Multiple linear regression (MLR) and computational neural networks (CNN) are utilized to develop mathematical models to relate the structures of a diverse set of 332 organic compounds to their aqueous solubilities. Topological, geometric, and electronic descriptors are used to numerically represent structural features of the data set compounds. Genetic algorithm and simulated annealing routines, in conjunction with MLR and CNN, are used to select subsets of descriptors that accurately relate to aqueous solubility. Nonlinear models with nine calculated structural descriptors are developed that have a training set root-mean-square error of 0.394 log units for compounds which span a −log(molarity) range from −2 to +12 log units.},\n\tAuthor = {Mitchell, B.E. and Jurs, P.C.},\n\tDate-Added = {2009-04-14 11:51:45 -0400},\n\tDate-Modified = {2009-04-14 11:52:40 -0400},\n\tJournal = {J.~Chem.~Inf.~Comput.~Sci.},\n\tKeywords = {qsar; solubility},\n\tPages = {489--496},\n\tTitle = {Prediction of Aqueous Solubility of Organic Compounds from Molecular Structure},\n\tVolume = {38},\n\tYear = {1998},\n\tBdsk-File-1 = {YnBsaXN0MDDUAQIDBAUIJidUJHRvcFgkb2JqZWN0c1gkdmVyc2lvblkkYXJjaGl2ZXLRBgdUcm9vdIABqAkKFRYXGyIjVSRudWxs0wsMDQ4RElpOUy5vYmplY3RzViRjbGFzc1dOUy5rZXlzog8QgASABoAHohMUgAKAA1lhbGlhc0RhdGFccmVsYXRpdmVQYXRo0hgMGRpXTlMuZGF0YU8RAW4AAAAAAW4AAgAAA212IAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAMU5bQNIKwAAABCNbQ1jaTk3MDExN2YucGRmAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAALZmVxgooeAAAAAAAAAAAAAIAAwAACSAAAAAAAAAAAAAAAAAAAAAIYXJ0aWNsZXMAEAAIAADFObNTAAAAEQAIAADGCmC4AAAAAQAQABCNbQAKTIAACkxpAAB8EwACADBtdiA6VXNlcnM6cmd1aGE6RG9jdW1lbnRzOmFydGljbGVzOmNpOTcwMTE3Zi5wZGYADgAcAA0AYwBpADkANwAwADEAMQA3AGYALgBwAGQAZgAPAAgAAwBtAHYAIAASACxVc2Vycy9yZ3VoYS9Eb2N1bWVudHMvYXJ0aWNsZXMvY2k5NzAxMTdmLnBkZgATAAEvAAAVAAIADP//AACABdIcHR4fWCRjbGFzc2VzWiRjbGFzc25hbWWjHyAhXU5TTXV0YWJsZURhdGFWTlNEYXRhWE5TT2JqZWN0XxAmLi4vLi4vRG9jdW1lbnRzL2FydGljbGVzL2NpOTcwMTE3Zi5wZGbSHB0kJaIlIVxOU0RpY3Rpb25hcnkSAAGGoF8QD05TS2V5ZWRBcmNoaXZlcgAIABEAFgAfACgAMgA1ADoAPABFAEsAUgBdAGQAbABvAHEAcwB1AHgAegB8AIYAkwCYAKACEgIUAhkCIgItAjECPwJGAk8CeAJ9AoACjQKSAAAAAAAAAgEAAAAAAAAAKAAAAAAAAAAAAAAAAAAAAqQ=},\n\tBdsk-Url-1 = {http://dx.doi.org/10.1021/ci970117f}}\n\n","author_short":["Mitchell, B.","Jurs, P."],"key":"Mitchell:1998pi","id":"Mitchell:1998pi","bibbaseid":"mitchell-jurs-predictionofaqueoussolubilityoforganiccompoundsfrommolecularstructure-1998","role":"author","urls":{},"keyword":["qsar; solubility"],"downloads":0},"search_terms":["prediction","aqueous","solubility","organic","compounds","molecular","structure","mitchell","jurs"],"keywords":["qsar; solubility"],"authorIDs":[],"dataSources":["c5japf9eAQRaeMS4h"]}