BACKGROUND:Cluster analysis is an important technique for the exploratory analysis of biological data. Such data is often high-dimensional, inherently noisy and contains outliers. This makes clustering challenging. Mixtures are versatile and powerful statistical models which perform robustly for clustering in the presence of noise and have been successfully applied in a wide range of applications.RESULTS:PyMix implements algorithms and data structures for clustering with basic and advanced mixture models. The advanced models include context-specific independence mixtures, mixtures of dependence trees and semi-supervised learning. PyMix is licenced under the GNU General Public licence (GPL). PyMix has been successfully used for the analysis of biological sequence, complex disease and gene expression data.CONCLUSIONS:PyMix is a useful tool for cluster analysis of biological data. Due to the general nature of the framework, PyMix can be applied to a wide range of applications and data sets.
Description
Abstract | PyMix - The Python mixture package - a tool for clustering of heterogeneous biological data
%0 Journal Article
%1 20053276
%A Georgi, Benjamin
%A Costa, Ivan Gesteira
%A Schliep, Alexander
%D 2010
%J BMC Bioinformatics
%K bio clustering imported python software
%N 1
%P 9
%R 10.1186/1471-2105-11-9
%T PyMix - The Python mixture package - a tool for clustering of heterogeneous biological data
%U http://www.biomedcentral.com/1471-2105/11/9
%V 11
%X BACKGROUND:Cluster analysis is an important technique for the exploratory analysis of biological data. Such data is often high-dimensional, inherently noisy and contains outliers. This makes clustering challenging. Mixtures are versatile and powerful statistical models which perform robustly for clustering in the presence of noise and have been successfully applied in a wide range of applications.RESULTS:PyMix implements algorithms and data structures for clustering with basic and advanced mixture models. The advanced models include context-specific independence mixtures, mixtures of dependence trees and semi-supervised learning. PyMix is licenced under the GNU General Public licence (GPL). PyMix has been successfully used for the analysis of biological sequence, complex disease and gene expression data.CONCLUSIONS:PyMix is a useful tool for cluster analysis of biological data. Due to the general nature of the framework, PyMix can be applied to a wide range of applications and data sets.
@article{20053276,
abstract = {BACKGROUND:Cluster analysis is an important technique for the exploratory analysis of biological data. Such data is often high-dimensional, inherently noisy and contains outliers. This makes clustering challenging. Mixtures are versatile and powerful statistical models which perform robustly for clustering in the presence of noise and have been successfully applied in a wide range of applications.RESULTS:PyMix implements algorithms and data structures for clustering with basic and advanced mixture models. The advanced models include context-specific independence mixtures, mixtures of dependence trees and semi-supervised learning. PyMix is licenced under the GNU General Public licence (GPL). PyMix has been successfully used for the analysis of biological sequence, complex disease and gene expression data.CONCLUSIONS:PyMix is a useful tool for cluster analysis of biological data. Due to the general nature of the framework, PyMix can be applied to a wide range of applications and data sets.
},
added-at = {2010-02-16T15:58:26.000+0100},
author = {Georgi, Benjamin and Costa, Ivan Gesteira and Schliep, Alexander},
biburl = {https://www.bibsonomy.org/bibtex/25b5db200857ec73213d40b94d38a730e/wnpxrz},
description = {Abstract | PyMix - The Python mixture package - a tool for clustering of heterogeneous biological data},
doi = {10.1186/1471-2105-11-9},
interhash = {725d31ec46dde6dfd3708ee53a87d548},
intrahash = {5b5db200857ec73213d40b94d38a730e},
issn = {1471-2105},
journal = {BMC Bioinformatics},
keywords = {bio clustering imported python software},
number = 1,
pages = 9,
pubmedid = {20053276},
timestamp = {2010-02-16T15:58:26.000+0100},
title = {PyMix - The Python mixture package - a tool for clustering of heterogeneous biological data},
url = {http://www.biomedcentral.com/1471-2105/11/9},
volume = 11,
year = 2010
}