doi abstract bibtex

MOTIVATION: Molecular diagnostics aims at classifying diseases into clinically relevant sub-entities based on molecular characteristics. Typically, the entities are split into subgroups, which might contain several variants yielding a hierarchical model of the disease. Recent years have introduced a plethora of new molecular screening technologies to molecular diagnostics. As a result molecular profiles of patients became complex and the classification task more difficult. RESULTS: We present a novel tool for detecting hierarchical structure in binary datasets. We aim for identifying molecular characteristics, which are stochastically implying other characteristics. The final hierarchical structure is encoded in a directed transitive graph where nodes represent molecular characteristics and a directed edge from a node A to a node B denotes that almost all cases with characteristic B also display characteristic A. Naturally, these graphs need to be transitive. In the core of our modeling approach lies the problem of calculating good transitive approximations of given directed but not necessarily transitive graphs. By good transitive approximation we understand transitive graphs, which differ from the reference graph in only a small number of edges. It is known that the problem of finding optimal transitive approximation is NP-complete. Here we develop an efficient heuristic for generating good transitive approximations. We evaluate the computational efficiency of the algorithm in simulations, and demonstrate its use in the context of a large genome-wide study on mature aggressive lymphomas. AVAILABILITY: The software used in our analysis is freely available from http://pc56269/software/transApproxs.shtml. CONTACT: Juby.Jacob@klinik.uni-regensburg.de, Rainer.Spang@klinik.uni-regensburg.de.

@Comment{
  jacob08detecting: journal article in Bioinformatics 24(7), 2008, on
  detecting hierarchical structure in molecular disease characteristics
  via transitive approximations of directed graphs.
  Field notes:
    - address holds the two author affiliations, not a publisher
      location; kept under the original field name.
    - owner and timestamp appear to be reference-manager bookkeeping
      fields and are preserved verbatim.
    - NOTE(review): the availability URL inside the abstract points at a
      bare host name (pc56269) and is reproduced as found; confirm
      against the published abstract.
}
@Article{jacob08detecting,
  author    = {Jacob, Juby and Jentsch, Marcel and Kostka, Dennis and Bentink, Stefan and Spang, Rainer},
  title     = {Detecting hierarchical structure in molecular characteristics of disease using transitive approximations of directed graphs},
  journal   = {Bioinformatics},
  year      = {2008},
  volume    = {24},
  number    = {7},
  pages     = {995--1001},
  issn      = {1460-2059},
  doi       = {10.1093/bioinformatics/btn056},
  abstract  = {MOTIVATION: Molecular diagnostics aims at classifying diseases into clinically relevant sub-entities based on molecular characteristics. Typically, the entities are split into subgroups, which might contain several variants yielding a hierarchical model of the disease. Recent years have introduced a plethora of new molecular screening technologies to molecular diagnostics. As a result molecular profiles of patients became complex and the classification task more difficult. RESULTS: We present a novel tool for detecting hierarchical structure in binary datasets. We aim for identifying molecular characteristics, which are stochastically implying other characteristics. The final hierarchical structure is encoded in a directed transitive graph where nodes represent molecular characteristics and a directed edge from a node A to a node B denotes that almost all cases with characteristic B also display characteristic A. Naturally, these graphs need to be transitive. In the core of our modeling approach lies the problem of calculating good transitive approximations of given directed but not necessarily transitive graphs. By good transitive approximation we understand transitive graphs, which differ from the reference graph in only a small number of edges. It is known that the problem of finding optimal transitive approximation is NP-complete. Here we develop an efficient heuristic for generating good transitive approximations. We evaluate the computational efficiency of the algorithm in simulations, and demonstrate its use in the context of a large genome-wide study on mature aggressive lymphomas. AVAILABILITY: The software used in our analysis is freely available from http://pc56269/software/transApproxs.shtml. CONTACT: Juby.Jacob@klinik.uni-regensburg.de, Rainer.Spang@klinik.uni-regensburg.de.},
  address   = {Computational Diagnostics Group, Institute of Functional Genomics, University of Regensburg, 93053 Regensburg, Germany; Max Planck Institute for Molecular Genetics, Ihnestra{\ss}e 63/73, 14195 Berlin, Germany.},
  keywords  = {approximation, dragan, graph, transitive},
  owner     = {Sebastian},
  timestamp = {2008.05.14},
}

Downloads: 0