An accurate classifier with linguistic
interpretability using a small number of relevant genes
is beneficial to microarray data analysis and
development of inexpensive diagnostic tests. Several
frequently used techniques for designing classifiers of
microarray data, such as support vector machine, neural
networks, k-nearest neighbour, and logistic regression
model, suffer from low interpretabilities. This paper
proposes an interpretable gene expression classifier
(named iGEC) with an accurate and compact fuzzy rule
base for microarray data analysis. The design of iGEC
has three objectives to be simultaneously optimised:
maximal classification accuracy, minimal number of
rules, and minimal number of used genes. An
"intelligent" genetic algorithm IGA is used to
efficiently solve the design problem with a large
number of tuning parameters. The performance of iGEC is
evaluated using eight commonly-used data sets. It is
shown that iGEC has an accurate, concise, and
interpretable rule base (1.1 rules per class) on
average in terms of test classification accuracy
(87.9percent), rule number (3.9), and used gene number
(5.0). Moreover, iGEC not only has better performance
than the existing fuzzy rule-based classifier in terms
of the above-mentioned objectives, but also is more
accurate than some existing non-rule-based
classifiers.
%0 Journal Article
%1 ho:2006:biosystems
%A Ho, Shinn-Ying
%A Hsieh, Chih-Hung
%A Chen, Hung-Ming
%A Huang, Hui-Ling
%D 2006
%J Biosystems
%K algorithms, genetic programming
%N 3
%P 165--176
%R doi:10.1016/j.biosystems.2006.01.002
%T Interpretable gene expression classifier with an
accurate and compact fuzzy rule base for microarray
data analysis
%V 85
%X An accurate classifier with linguistic
interpretability using a small number of relevant genes
is beneficial to microarray data analysis and
development of inexpensive diagnostic tests. Several
frequently used techniques for designing classifiers of
microarray data, such as support vector machine, neural
networks, k-nearest neighbour, and logistic regression
model, suffer from low interpretabilities. This paper
proposes an interpretable gene expression classifier
(named iGEC) with an accurate and compact fuzzy rule
base for microarray data analysis. The design of iGEC
has three objectives to be simultaneously optimised:
maximal classification accuracy, minimal number of
rules, and minimal number of used genes. An
"intelligent" genetic algorithm IGA is used to
efficiently solve the design problem with a large
number of tuning parameters. The performance of iGEC is
evaluated using eight commonly-used data sets. It is
shown that iGEC has an accurate, concise, and
interpretable rule base (1.1 rules per class) on
average in terms of test classification accuracy
(87.9percent), rule number (3.9), and used gene number
(5.0). Moreover, iGEC not only has better performance
than the existing fuzzy rule-based classifier in terms
of the above-mentioned objectives, but also is more
accurate than some existing non-rule-based
classifiers.
@article{ho:2006:biosystems,
abstract = {An accurate classifier with linguistic
interpretability using a small number of relevant genes
is beneficial to microarray data analysis and
development of inexpensive diagnostic tests. Several
frequently used techniques for designing classifiers of
microarray data, such as support vector machine, neural
networks, k-nearest neighbour, and logistic regression
model, suffer from low interpretabilities. This paper
proposes an interpretable gene expression classifier
(named iGEC) with an accurate and compact fuzzy rule
base for microarray data analysis. The design of iGEC
has three objectives to be simultaneously optimised:
maximal classification accuracy, minimal number of
rules, and minimal number of used genes. An
{"}intelligent{"} genetic algorithm IGA is used to
efficiently solve the design problem with a large
number of tuning parameters. The performance of iGEC is
evaluated using eight commonly-used data sets. It is
shown that iGEC has an accurate, concise, and
interpretable rule base (1.1 rules per class) on
average in terms of test classification accuracy
(87.9percent), rule number (3.9), and used gene number
(5.0). Moreover, iGEC not only has better performance
than the existing fuzzy rule-based classifier in terms
of the above-mentioned objectives, but also is more
accurate than some existing non-rule-based
classifiers.},
added-at = {2008-06-19T17:35:00.000+0200},
author = {Ho, Shinn-Ying and Hsieh, Chih-Hung and Chen, Hung-Ming and Huang, Hui-Ling},
biburl = {https://www.bibsonomy.org/bibtex/2a168852df5095664a1fea37779a3490a/brazovayeye},
doi = {doi:10.1016/j.biosystems.2006.01.002},
interhash = {73f31705c8d70a64e967ba8085bd43d0},
intrahash = {a168852df5095664a1fea37779a3490a},
journal = {Biosystems},
keywords = {algorithms, genetic programming},
month = {September},
notes = {PMID: 16490299 [PubMed - in process]},
number = 3,
pages = {165--176},
timestamp = {2008-06-19T17:41:33.000+0200},
title = {Interpretable gene expression classifier with an
accurate and compact fuzzy rule base for microarray
data analysis},
volume = 85,
year = 2006
}