GeneIndex: An Open Source Parallel Program for Enumerating and Locating Words in a Genome

GeneIndex: An Open Source Parallel Program for Enumerating and Locating Words in a Genome. Li, H., Hart, D., Mueller, M., Markwardt, U., & Stewart, C. In 2009 International Joint Conference on Bioinformatics, Systems Biology and Intelligent Computing, pages 98-102, 2009. IEEE.

Website doi abstract bibtex

GeneIndex is an open-source program that locates words of any length k specified by the user in a sequence. GeneIndex is useful for understanding the structure of entire genomes or very large sets of genetic sequences, particularly in finding highly repeated words and words that occur with low frequency. GeneIndex accepts DNA sequences in FASTA format input files, and performs computations and input/output in parallel. GeneIndex has been implemented on Linux, IBM AIX, and NEC SX-8, and is available with test data sets (the entire genomes of Drosophila melanogaster and Homo sapiens). The performance of the program scales well with processor count - that is, as the number of processors increases, the processing time required decreases proportionally. © 2009 IEEE.

@comment{Conference paper on GeneIndex (Li, Hart, Mueller, Markwardt, Stewart; 2009).
 The citation key is taken from the entry's own citation_key field.
 Standard bibliographic fields are listed first. The fields after them
 (websites, id, created, profile_id, folder_uuids, ...) are reference-manager
 bookkeeping that standard bibliography styles do not recognise and ignore.}
@inproceedings{Li2009,
 author = {Li, Huian and Hart, David and Mueller, Matthias and Markwardt, Ulf and Stewart, Craig},
 title = {{GeneIndex}: An Open Source Parallel Program for Enumerating and Locating Words in a Genome},
 booktitle = {2009 International Joint Conference on Bioinformatics, Systems Biology and Intelligent Computing},
 year = {2009},
 pages = {98--102},
 publisher = {IEEE},
 doi = {10.1109/IJCBS.2009.127},
 url = {http://ieeexplore.ieee.org/document/5260731/},
 abstract = {GeneIndex is an open-source program that locates words of any length k specified by the user in a sequence. GeneIndex is useful for understanding the structure of entire genomes or very large sets of genetic sequences, particularly in finding highly repeated words and words that occur with low frequency. GeneIndex accepts DNA sequences in FASTA format input files, and performs computations and input/output in parallel. GeneIndex has been implemented on Linux, IBM AIX, and NEC SX-8, and is available with test data sets (the entire genomes of Drosophila melanogaster and Homo sapiens). The performance of the program scales well with processor count - that is, as the number of processors increases, the processing time required decreases proportionally. © 2009 IEEE.},
 type = {inproceedings},
 bibtype = {inproceedings},
 websites = {http://ieeexplore.ieee.org/document/5260731/},
 id = {8df474a6-efa6-3931-ae8b-9da2f58cf3ad},
 created = {2019-10-01T17:20:42.472Z},
 file_attached = {false},
 profile_id = {42d295c0-0737-38d6-8b43-508cab6ea85d},
 last_modified = {2020-09-09T18:06:46.034Z},
 read = {false},
 starred = {false},
 authored = {true},
 confirmed = {true},
 hidden = {false},
 citation_key = {Li2009},
 folder_uuids = {2aba6c14-9027-4f47-8627-0902e1e2342b,ec6ad3c6-db7d-494d-863c-ef38d23f1f7e,22c3b665-9e84-4884-8172-710aa9082eaf},
 private_publication = {false}
}

Downloads: 0

{"_id":"rYfTm5kSttNpDRWBi","bibbaseid":"li-hart-mueller-markwardt-stewart-geneindexanopensourceparallelprogramforenumeratingandlocatingwordsinagenome-2009","downloads":0,"creationDate":"2018-03-12T19:10:27.120Z","title":"GeneIndex: An Open Source Parallel Program for Enumerating and Locating Words in a Genome","author_short":["Li, H.","Hart, D.","Mueller, M.","Markwardt, U.","Stewart, C."],"year":2009,"bibtype":"inproceedings","biburl":"https://bibbase.org/service/mendeley/42d295c0-0737-38d6-8b43-508cab6ea85d","bibdata":{"title":"GeneIndex: An Open Source Parallel Program for Enumerating and Locating Words in a Genome","type":"inproceedings","year":"2009","pages":"98-102","websites":"http://ieeexplore.ieee.org/document/5260731/","publisher":"IEEE","id":"8df474a6-efa6-3931-ae8b-9da2f58cf3ad","created":"2019-10-01T17:20:42.472Z","file_attached":false,"profile_id":"42d295c0-0737-38d6-8b43-508cab6ea85d","last_modified":"2020-09-09T18:06:46.034Z","read":false,"starred":false,"authored":"true","confirmed":"true","hidden":false,"citation_key":"Li2009","folder_uuids":"2aba6c14-9027-4f47-8627-0902e1e2342b,ec6ad3c6-db7d-494d-863c-ef38d23f1f7e,22c3b665-9e84-4884-8172-710aa9082eaf","private_publication":false,"abstract":"GeneIndex is an open-source program that locates words of any length k specified by the user in a sequence. GeneIndex is useful for understanding the structure of entire genomes or very large sets of genetic sequences, particularly in finding highly repeated words and words that occur with low frequency. GeneIndex accepts DNA sequences in FASTA format input files, and performs computations and input/output in parallel. GeneIndex has been implemented on Linux, IBM AIX, and NEC SX-8, and is available with test data sets (the entire genomes of Drosophila melanogaster and Homo sapiens). The performance of the program scales well with processor count - that is, as the number of processors increases, the processing time required decreases proportionally. 
© 2009 IEEE.","bibtype":"inproceedings","author":"Li, Huian and Hart, David and Mueller, Matthias and Markwardt, Ulf and Stewart, Craig","doi":"10.1109/IJCBS.2009.127","booktitle":"2009 International Joint Conference on Bioinformatics, Systems Biology and Intelligent Computing","bibtex":"@inproceedings{\n title = {GeneIndex: An Open Source Parallel Program for Enumerating and Locating Words in a Genome},\n type = {inproceedings},\n year = {2009},\n pages = {98-102},\n websites = {http://ieeexplore.ieee.org/document/5260731/},\n publisher = {IEEE},\n id = {8df474a6-efa6-3931-ae8b-9da2f58cf3ad},\n created = {2019-10-01T17:20:42.472Z},\n file_attached = {false},\n profile_id = {42d295c0-0737-38d6-8b43-508cab6ea85d},\n last_modified = {2020-09-09T18:06:46.034Z},\n read = {false},\n starred = {false},\n authored = {true},\n confirmed = {true},\n hidden = {false},\n citation_key = {Li2009},\n folder_uuids = {2aba6c14-9027-4f47-8627-0902e1e2342b,ec6ad3c6-db7d-494d-863c-ef38d23f1f7e,22c3b665-9e84-4884-8172-710aa9082eaf},\n private_publication = {false},\n abstract = {GeneIndex is an open-source program that locates words of any length k specified by the user in a sequence. GeneIndex is useful for understanding the structure of entire genomes or very large sets of genetic sequences, particularly in finding highly repeated words and words that occur with low frequency. GeneIndex accepts DNA sequences in FASTA format input files, and performs computations and input/output in parallel. GeneIndex has been implemented on Linux, IBM AIX, and NEC SX-8, and is available with test data sets (the entire genomes of Drosophila melanogaster and Homo sapiens). The performance of the program scales well with processor count - that is, as the number of processors increases, the processing time required decreases proportionally. 
© 2009 IEEE.},\n bibtype = {inproceedings},\n author = {Li, Huian and Hart, David and Mueller, Matthias and Markwardt, Ulf and Stewart, Craig},\n doi = {10.1109/IJCBS.2009.127},\n booktitle = {2009 International Joint Conference on Bioinformatics, Systems Biology and Intelligent Computing}\n}","author_short":["Li, H.","Hart, D.","Mueller, M.","Markwardt, U.","Stewart, C."],"urls":{"Website":"http://ieeexplore.ieee.org/document/5260731/"},"biburl":"https://bibbase.org/service/mendeley/42d295c0-0737-38d6-8b43-508cab6ea85d","bibbaseid":"li-hart-mueller-markwardt-stewart-geneindexanopensourceparallelprogramforenumeratingandlocatingwordsinagenome-2009","role":"author","metadata":{"authorlinks":{}},"downloads":0},"search_terms":["geneindex","open","source","parallel","program","enumerating","locating","words","genome","li","hart","mueller","markwardt","stewart"],"keywords":[],"authorIDs":[],"dataSources":["zgahneP4uAjKbudrQ","ya2CyA73rpZseyrZ8","2252seNhipfTmjEBQ"]}