Large-Scale Multi-Label Text Classification (LMTC) includes tasks with
hierarchical label spaces, such as automatic assignment of ICD-9 codes to
discharge summaries. Performance of models in prior art is evaluated with
standard precision, recall, and F1 measures without regard for the rich
hierarchical structure. In this work we argue for hierarchical evaluation of
the predictions of neural LMTC models. With the example of the ICD-9 ontology
we describe a structural issue in the representation of the structured label
space in prior art, and propose an alternative representation based on the
depth of the ontology. We propose a set of metrics for hierarchical evaluation
using the depth-based representation. We compare the evaluation scores from the
proposed metrics with previously used metrics on prior art LMTC models for
ICD-9 coding in MIMIC-III. We also propose further avenues of research
involving the proposed ontological representation.
Description
[2109.04853v1] CoPHE: A Count-Preserving Hierarchical Evaluation Metric in Large-Scale Multi-Label Text Classification
%0 Generic
%1 falis2021cophe
%A Falis, Matúš
%A Dong, Hang
%A Birch, Alexandra
%A Alex, Beatrice
%D 2021
%K automated_medical_coding clinical_coding evluation hierarchy hlan icd icd9 medical_coding multi-label_classification myown subsumption
%T CoPHE: A Count-Preserving Hierarchical Evaluation Metric in Large-Scale
Multi-Label Text Classification
%U http://arxiv.org/abs/2109.04853
%X Large-Scale Multi-Label Text Classification (LMTC) includes tasks with
hierarchical label spaces, such as automatic assignment of ICD-9 codes to
discharge summaries. Performance of models in prior art is evaluated with
standard precision, recall, and F1 measures without regard for the rich
hierarchical structure. In this work we argue for hierarchical evaluation of
the predictions of neural LMTC models. With the example of the ICD-9 ontology
we describe a structural issue in the representation of the structured label
space in prior art, and propose an alternative representation based on the
depth of the ontology. We propose a set of metrics for hierarchical evaluation
using the depth-based representation. We compare the evaluation scores from the
proposed metrics with previously used metrics on prior art LMTC models for
ICD-9 coding in MIMIC-III. We also propose further avenues of research
involving the proposed ontological representation.
@misc{falis2021cophe,
abstract = {Large-Scale Multi-Label Text Classification (LMTC) includes tasks with
hierarchical label spaces, such as automatic assignment of ICD-9 codes to
discharge summaries. Performance of models in prior art is evaluated with
standard precision, recall, and F1 measures without regard for the rich
hierarchical structure. In this work we argue for hierarchical evaluation of
the predictions of neural LMTC models. With the example of the ICD-9 ontology
we describe a structural issue in the representation of the structured label
space in prior art, and propose an alternative representation based on the
depth of the ontology. We propose a set of metrics for hierarchical evaluation
using the depth-based representation. We compare the evaluation scores from the
proposed metrics with previously used metrics on prior art LMTC models for
ICD-9 coding in MIMIC-III. We also propose further avenues of research
involving the proposed ontological representation.},
added-at = {2021-09-13T16:56:29.000+0200},
author = {Falis, Matúš and Dong, Hang and Birch, Alexandra and Alex, Beatrice},
biburl = {https://www.bibsonomy.org/bibtex/2b4a94973c3a68ab7ad27528cc50bab6a/hangdong},
description = {[2109.04853v1] CoPHE: A Count-Preserving Hierarchical Evaluation Metric in Large-Scale Multi-Label Text Classification},
interhash = {79d1546b2b626a140d4033e6a04050a1},
intrahash = {b4a94973c3a68ab7ad27528cc50bab6a},
keywords = {automated_medical_coding clinical_coding evluation hierarchy hlan icd icd9 medical_coding multi-label_classification myown subsumption},
note = {cite arxiv:2109.04853Comment: 5 pages, 2 figures, EMNLP 2021},
timestamp = {2021-09-13T16:56:29.000+0200},
title = {CoPHE: A Count-Preserving Hierarchical Evaluation Metric in Large-Scale
Multi-Label Text Classification},
url = {http://arxiv.org/abs/2109.04853},
year = 2021
}