@inproceedings{7b6fd8b5c98e4d40983f43250faabeb4,
title = "Determining the Need for Multi-label Classifiers by Measuring Unexplained Covariance",
abstract = "Multi-label classifiers make use of associations between labels in multi-label data to increase the accuracy of prediction. Before using a multi-label classifier, the data should be analysed to identify if there are associations between labels. If sets of independent labels are found, the data can be split in to multiple smaller data sets for analysis. Unfortunately, each label is dependent on the set of observations and so measuring label dependence is futile. What we actually seek is independence after taking the observations into account. In this article, we examine the concepts of explained and unexplained label covariance for measuring label dependence. We explore the use of a Normal copula model for modelling the label dependence/covariance and show that it is not able to measure conditional covariance directly. We then propose a new statistical model that allows direct measurement of label covariance (both constant and conditional). The model is validated using generated data and it is also used to examine the label covariance in real world data, allowing us to build simpler multi-label models.",
author = "Park, \{Laurence A.F.\} and Jesse Read",
note = "Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Singapore Pte Ltd. 2025.; 29th Pacific-Asia Conference on Knowledge Discovery and Data Mining, PAKDD 2025 ; Conference date: 10-06-2025 Through 13-06-2025",
year = "2025",
month = jan,
day = "1",
doi = "10.1007/978-981-96-8295-9\_18",
language = "English",
isbn = "9789819682942",
series = "Lecture Notes in Computer Science",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "250--261",
editor = "Xintao Wu and Myra Spiliopoulou and Can Wang and Vipin Kumar and Longbing Cao and Xiangmin Zhou and Guansong Pang and Joao Gama",
booktitle = "Data Science",
}