Semi-supervised active learning for sound classification in hybrid learning environments

Semi-supervised active learning for sound classification in hybrid learning environments. Han, W., Coutinho, E., Ruan, H., Li, H., Schuller, B., Yu, X., & Zhu, X. PLoS ONE, 11(9):e0162075, 9, 2016.

Paper

Semi-supervised active learning for sound classification in hybrid learning environments [link]

Website doi abstract bibtex

Coping with scarcity of labeled data is a common problem in sound classification tasks. Approaches for classifying sounds are commonly based on supervised learning algorithms, which require labeled data that is often scarce, leading to models that do not generalize well. In this paper, we make an efficient combination of confidence-based Active Learning and Self-Training with the aim of minimizing the need for human annotation for sound classification model training. The proposed method pre-processes the instances that are ready for labeling by calculating their classifier confidence scores, and then delivers the candidates with lower scores to human annotators, and those with high scores are automatically labeled by the machine. We demonstrate the feasibility and efficacy of this method in two practical scenarios: pool-based and stream-based processing. Extensive experimental results indicate that our approach requires significantly fewer labeled instances to reach the same performance in both scenarios compared to Passive Learning, Active Learning and Self-Training. A reduction of 52.2% in human-labeled instances is achieved in both the pool-based and stream-based scenarios on a sound classification task considering 16,930 sound instances.

@article{han2016semisupervisedenvironments,
 title = {Semi-supervised active learning for sound classification in hybrid learning environments},
 type = {article},
 year = {2016},
 keywords = {article,journal},
 pages = {e0162075},
 volume = {11},
 websites = {http://gateway.webofknowledge.com/gateway/Gateway.cgi?GWVersion=2&SrcApp=PARTNER_APP&SrcAuth=LinksAMR&KeyUT=WOS:000383680600017&DestLinkType=FullRecord&DestApp=ALL_WOS&UsrCustomerID=f3ec48df247ee1138ccd8d3ba59bacc2 http://dx.plos.org/10.1371/journal.pone.0162075},
 month = {9},
 day = {14},
 id = {e1511f4d-9528-3cec-a591-ac665da796fe},
 created = {2024-08-09T12:19:56.089Z},
 file_attached = {true},
 profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1},
 group_id = {da2a8249-fdf4-3036-ba56-7358198a1600},
 last_modified = {2024-08-09T12:20:50.272Z},
 read = {false},
 starred = {false},
 authored = {false},
 confirmed = {true},
 hidden = {false},
 citation_key = {han2016semisupervisedenvironments},
 source_type = {article},
 private_publication = {false},
 abstract = {Coping with scarcity of labeled data is a common problem in sound classification tasks. Approaches for classifying sounds are commonly based on supervised learning algorithms, which require labeled data which is often scarce and leads to models that do not generalize well. In this paper, we make an efficient combination of confidence-based Active Learning and Self-Training with the aim of minimizing the need for human annotation for sound classification model training. The proposed method pre-processes the instances that are ready for labeling by calculating their classifier confidence scores, and then delivers the candidates with lower scores to human annotators, and those with high scores are automatically labeled by the machine. We demonstrate the feasibility and efficacy of this method in two practical scenarios: pool-based and stream-based processing. Extensive experimental results indicate that our approach requires significantly less labeled instances to reach the same performance in both scenarios compared to Passive Learning, Active Learning and Self-Training. A reduction of 52.2% in human labeled instances is achieved in both of the pool-based and stream-based scenarios on a sound classification task considering 16,930 sound instances.},
 bibtype = {article},
 author = {Han, Wenjing and Coutinho, Eduardo and Ruan, Huabin and Li, Haifeng and Schuller, Björn and Yu, Xiaojie and Zhu, Xuan},
 editor = {Schwenker, Friedhelm},
 doi = {10.1371/journal.pone.0162075},
 journal = {PLoS ONE},
 number = {9}
}

Downloads: 0

{"_id":"q3XNWkyQJYwd6Lj8T","bibbaseid":"han-coutinho-ruan-li-schuller-yu-zhu-semisupervisedactivelearningforsoundclassificationinhybridlearningenvironments-2016","downloads":0,"creationDate":"2017-04-06T12:03:59.141Z","title":"Semi-supervised active learning for sound classification in hybrid learning environments","author_short":["Han, W.","Coutinho, E.","Ruan, H.","Li, H.","Schuller, B.","Yu, X.","Zhu, X."],"year":2016,"bibtype":"article","biburl":"https://bibbase.org/service/mendeley/ffa9027c-806a-3827-93a1-02c42eb146a1","bibdata":{"title":"Semi-supervised active learning for sound classification in hybrid learning environments","type":"article","year":"2016","keywords":"article,journal","pages":"e0162075","volume":"11","websites":"http://gateway.webofknowledge.com/gateway/Gateway.cgi?GWVersion=2&SrcApp=PARTNER_APP&SrcAuth=LinksAMR&KeyUT=WOS:000383680600017&DestLinkType=FullRecord&DestApp=ALL_WOS&UsrCustomerID=f3ec48df247ee1138ccd8d3ba59bacc2 http://dx.plos.org/10.1371/journal.pone.","month":"9","day":"14","id":"e1511f4d-9528-3cec-a591-ac665da796fe","created":"2024-08-09T12:19:56.089Z","file_attached":"true","profile_id":"ffa9027c-806a-3827-93a1-02c42eb146a1","group_id":"da2a8249-fdf4-3036-ba56-7358198a1600","last_modified":"2024-08-09T12:20:50.272Z","read":false,"starred":false,"authored":false,"confirmed":"true","hidden":false,"citation_key":"han2016semisupervisedenvironments","source_type":"article","private_publication":false,"abstract":"Coping with scarcity of labeled data is a common problem in sound classification tasks. Approaches for classifying sounds are commonly based on supervised learning algorithms, which require labeled data which is often scarce and leads to models that do not generalize well. In this paper, we make an efficient combination of confidence-based Active Learning and Self-Training with the aim of minimizing the need for human annotation for sound classification model training. 
The proposed method pre-processes the instances that are ready for labeling by calculating their classifier confidence scores, and then delivers the candidates with lower scores to human annotators, and those with high scores are automatically labeled by the machine. We demonstrate the feasibility and efficacy of this method in two practical scenarios: pool-based and stream-based processing. Extensive experimental results indicate that our approach requires significantly less labeled instances to reach the same performance in both scenarios compared to Passive Learning, Active Learning and Self-Training. A reduction of 52.2% in human labeled instances is achieved in both of the pool-based and stream-based scenarios on a sound classification task considering 16,930 sound instances.","bibtype":"article","author":"Han, Wenjing and Coutinho, Eduardo and Ruan, Huabin and Li, Haifeng and Schuller, Björn and Yu, Xiaojie and Zhu, Xuan","editor":"Schwenker, Friedhelm","doi":"10.1371/journal.pone.0162075","journal":"PLoS ONE","number":"9","bibtex":"@article{\n title = {Semi-supervised active learning for sound classification in hybrid learning environments},\n type = {article},\n year = {2016},\n keywords = {article,journal},\n pages = {e0162075},\n volume = {11},\n websites = {http://gateway.webofknowledge.com/gateway/Gateway.cgi?GWVersion=2&SrcApp=PARTNER_APP&SrcAuth=LinksAMR&KeyUT=WOS:000383680600017&DestLinkType=FullRecord&DestApp=ALL_WOS&UsrCustomerID=f3ec48df247ee1138ccd8d3ba59bacc2 http://dx.plos.org/10.1371/journal.pone.},\n month = {9},\n day = {14},\n id = {e1511f4d-9528-3cec-a591-ac665da796fe},\n created = {2024-08-09T12:19:56.089Z},\n file_attached = {true},\n profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1},\n group_id = {da2a8249-fdf4-3036-ba56-7358198a1600},\n last_modified = {2024-08-09T12:20:50.272Z},\n read = {false},\n starred = {false},\n authored = {false},\n confirmed = {true},\n hidden = {false},\n citation_key = 
{han2016semisupervisedenvironments},\n source_type = {article},\n private_publication = {false},\n abstract = {Coping with scarcity of labeled data is a common problem in sound classification tasks. Approaches for classifying sounds are commonly based on supervised learning algorithms, which require labeled data which is often scarce and leads to models that do not generalize well. In this paper, we make an efficient combination of confidence-based Active Learning and Self-Training with the aim of minimizing the need for human annotation for sound classification model training. The proposed method pre-processes the instances that are ready for labeling by calculating their classifier confidence scores, and then delivers the candidates with lower scores to human annotators, and those with high scores are automatically labeled by the machine. We demonstrate the feasibility and efficacy of this method in two practical scenarios: pool-based and stream-based processing. Extensive experimental results indicate that our approach requires significantly less labeled instances to reach the same performance in both scenarios compared to Passive Learning, Active Learning and Self-Training. 
A reduction of 52.2% in human labeled instances is achieved in both of the pool-based and stream-based scenarios on a sound classification task considering 16,930 sound instances.},\n bibtype = {article},\n author = {Han, Wenjing and Coutinho, Eduardo and Ruan, Huabin and Li, Haifeng and Schuller, Björn and Yu, Xiaojie and Zhu, Xuan},\n editor = {Schwenker, Friedhelm},\n doi = {10.1371/journal.pone.0162075},\n journal = {PLoS ONE},\n number = {9}\n}","author_short":["Han, W.","Coutinho, E.","Ruan, H.","Li, H.","Schuller, B.","Yu, X.","Zhu, X."],"editor_short":["Schwenker, F."],"urls":{"Paper":"https://bibbase.org/service/mendeley/ffa9027c-806a-3827-93a1-02c42eb146a1/file/6052c374-c34f-0555-0b35-514417cd760b/2016___Han_et_al___Semi_supervised_active_learning_for_sound_classification_in_hybrid_learning_environments.pdf.pdf","Website":"http://gateway.webofknowledge.com/gateway/Gateway.cgi?GWVersion=2&SrcApp=PARTNER_APP&SrcAuth=LinksAMR&KeyUT=WOS:000383680600017&DestLinkType=FullRecord&DestApp=ALL_WOS&UsrCustomerID=f3ec48df247ee1138ccd8d3ba59bacc2 http://dx.plos.org/10.1371/journal.pone."},"biburl":"https://bibbase.org/service/mendeley/ffa9027c-806a-3827-93a1-02c42eb146a1","bibbaseid":"han-coutinho-ruan-li-schuller-yu-zhu-semisupervisedactivelearningforsoundclassificationinhybridlearningenvironments-2016","role":"author","keyword":["article","journal"],"metadata":{"authorlinks":{"coutinho, 
e":"https://amlab.liverpool.ac.uk/publications.html"}},"downloads":0},"search_terms":["semi","supervised","active","learning","sound","classification","hybrid","learning","environments","han","coutinho","ruan","li","schuller","yu","zhu"],"keywords":["article","journal"],"authorIDs":["58e62eafe417243f58000008","58e63ebe8f93a1ae58000053","5c0e7cf57d11e01000000150","6Z276FjCJdxu2qttA","7HsugpwDMrLzay5kC","FShD3dRw9yuvcgPCs","HmyGQqdmpxNriPHXS","LxZfJ4SZafxuJzeKG","S2CzJg64apkJsPsHA","gSef4eEL8c5wuNF7w","hzjyyz7CdSRZyRptY","mo4CFXJ7ukAMT9nho","nxyiocLrG567rGYAm","oenDqaFMmkBMZtjuK","tE6ysWmRvSH5uoPFW","tvZgz2JnB9BN8znPF"],"dataSources":["Tcd3cXtdQsiKHPZsW","ya2CyA73rpZseyrZ8","YqW8pMoihb7JazZcx","2252seNhipfTmjEBQ"]}