@inbook{lamont2023talking,
  author = {Lamont, Alexandra and Bannister, Scott and Coutinho, Eduardo},
  editor = {Rogers, Holly and Freitas, Joana and Porfírio, João Francisco},
  chapter = {‘Talking’ about Music},
  title = {YouTube and Music},
  year = {2023},
  pages = {230-254},
  publisher = {Bloomsbury Academic},
  address = {London},
  doi = {10.5040/9781501387302.0023},
  url = {http://www.bloomsburycollections.com/book/youtube-and-music-online-culture-and-everyday-life/ch11-talking-about-music}
}
@article{mira2023xota,
  author = {Mira, R. and Coutinho, Eduardo and Parada-Cabaleiro, E. and Schuller, Björn},
  title = {Automated composition of Galician Xota - tuning RNN-based composers for specific musical styles using Deep Q-Learning},
  journal = {PeerJ Computer Science},
  year = {2023},
  volume = {9},
  pages = {e1356},
  doi = {10.7717/peerj-cs.1356},
  url = {https://peerj.com/articles/cs-1356},
  keywords = {automated music composition, deep q-learning, galician xota, magenta, rl-tuner},
  abstract = {Music composition is a complex field that is difficult to automate because the computational definition of what is good or aesthetically pleasing is vague and subjective. Many neural network-based methods have been applied in the past, but they lack consistency and in most cases, their outputs fail to impress. The most common issues include excessive repetition and a lack of style and structure, which are hallmarks of artificial compositions. In this project, we build on a model created by Magenta—the RL Tuner—extending it to emulate a specific musical genre—the Galician Xota. To do this, we design a new rule-set containing rules that the composition should follow to adhere to this style. We then implement them using reward functions, which are used to train the Deep Q Network that will be used to generate the pieces. After extensive experimentation, we achieve an implementation of our rule-set that effectively enforces each rule on the generated compositions, and outline a solid research methodology for future researchers looking to use this architecture. Finally, we propose some promising future work regarding further applications for this model and improvements to the experimental procedure.}
}
@article{deberardinis2022structural,
  author = {De Berardinis, Jacopo and Cangelosi, Angelo and Coutinho, Eduardo},
  title = {Measuring the Structural Complexity of Music: From Structural Segmentations to the Automatic Evaluation of Models for Music Generation},
  journal = {IEEE/ACM Transactions on Audio, Speech, and Language Processing},
  year = {2022},
  volume = {30},
  pages = {1963-1976},
  doi = {10.1109/TASLP.2022.3178203},
  url = {https://ieeexplore.ieee.org/document/9787343/},
  keywords = {Music structure analysis, evaluation measures},
  abstract = {Composing musical ideas longer than motifs or figures is still rare in music generated by machine learning methods, a problem that is commonly referred to as the lack of long-term structure in the generated sequences. In addition, the evaluation of the structural complexity of artificial compositions is still a manual task, requiring expert knowledge, time and involving subjectivity which is inherent in the perception of musical structure. Based on recent advancements in music structure analysis, we automate the evaluation process by introducing a collection of metrics that can objectively describe structural properties of the music signal. This is done by segmenting music hierarchically, and computing our metrics on the resulting hierarchies to characterise the decomposition process of music into its structural components. We tested our method on a dataset collecting music with different degrees of structural complexity, from random and computer-generated pieces to real compositions of different genres and formats. Results indicate that our method can discriminate between these classes of complexity and identify further non-trivial subdivisions according to their structural properties. Our work contributes a simple yet effective framework for the evaluation of music generation models in regard to their ability to create structurally meaningful compositions.}
}
@article{coutinho2022musictherapy,
  author = {Coutinho, Eduardo and Van Criekinge, Tamaya and Hanford, Greg and Nathan, Rajan and Maden, Michelle and Hill, Ruaraidh},
  title = {Music therapy interventions for eating disorders: Lack of robust evidence and recommendations for future research},
  journal = {British Journal of Music Therapy},
  year = {2022},
  volume = {36},
  number = {2},
  pages = {84-93},
  doi = {10.1177/13594575221110193},
  url = {http://journals.sagepub.com/doi/10.1177/13594575221110193},
  abstract = {Music therapy (MT) has been used to support people with a variety of eating disorders (EDs), but it is unclear whether there is sufficient and robust evidence from controlled experimental studies. In this article, we report the results of a systematic review that summarises the evidence from published controlled studies where MT has been used to treat people diagnosed with any type of ED. Our results demonstrate that robust evidence concerning the effectiveness of MT for the treatment of EDs is severely lacking. Nonetheless, the evidence described in this paper warrants further investigation especially given that new treatment strategies for EDs are urgently needed. To this end, we offer a set of recommendations for future high-quality experimental studies that can inform the development of effective MT interventions and support for people with EDs.}
}
@article{cheah2022background,
  author = {Cheah, Yiting and Wong, Hoo Keat and Spitzer, Michael and Coutinho, Eduardo},
  title = {Background Music and Cognitive Task Performance: A Systematic Review of Task, Music, and Population Impact},
  journal = {Music and Science},
  year = {2022},
  volume = {5},
  pages = {205920432211343},
  doi = {10.1177/20592043221134392},
  url = {http://journals.sagepub.com/doi/10.1177/20592043221134392},
  keywords = {Background music, cognitive task performance, effects of music, individual differences, systematic review},
  abstract = {Research on the effect of background music (BgM) on cognitive task performance is marked by inconsistent methods and inconclusive findings. In order to provide clarity to this area, we performed a systematic review on the impact of BgM on performances in a variety of tasks whilst considering the contributions of various task, music, and population characteristics. Following the PRISMA and SWiM protocols, we identified 95 articles (154 experiments) that comprise cognitive tasks across six different cognitive domains—memory; language; thinking, reasoning, and problem-solving; inhibition; attention and processing speed. Extracted data were synthesized using vote counting based (solely) on the direction of effects and analyzed using a sign test analysis. Overall, our results demonstrate a general detrimental effect of BgM on memory and language-related tasks, and a tendency for BgM with lyrics to be more detrimental than instrumental BgM. Only one positive effect (of instrumental BgM) was found; and in most cases, we did not find any effect of BgM on task performance. We also identified a general detrimental impact of BgM towards difficult (but not easy) tasks; and towards introverts (but not extraverts). Taken together, our results show that task, music, and population-specific analyses are all necessary when studying the effects of BgM on cognitive task performance. They also call attention to the necessity to control for task difficulty as well as individual differences (especially level of extraversion) in empirical studies. Finally, our results also demonstrate that many areas remain understudied and therefore a lot more work still needs to be done to gain a comprehensive understanding of how BgM impacts cognitive task performance.}
}
@misc{cheah2022dataset,
  author = {Cheah, Yiting and Wong, Hoo Keat and Spitzer, Michael and Coutinho, Eduardo},
  title = {Background music and cognitive task performance: systematic review dataset},
  year = {2022},
  publisher = {Zenodo},
  doi = {10.5281/zenodo.6301061},
  url = {https://doi.org/10.5281/zenodo.6301061},
  abstract = {This repository contains the raw data used for a systematic review on the impact of background music on cognitive task performance (Cheah et al., 2022). Our intention is to facilitate future updates to this work. Cheah, Y., Wong, H. K., Spitzer, M., & Coutinho, E. (2022). Background music and cognitive task performance: A systematic review of task, music and population impact. Music & Science, 5(1), 1-38. https://doi.org/10.1177/20592043221134392}
}
@inproceedings{Coutinho2021,
  author = {Coutinho, Eduardo and Dowrick, Christopher},
  title = {POLYHYMNIA Mood – A pilot evaluation of a new app to empower people to cope with low mood and depression through music listening},
  booktitle = {Proceedings of the 16th International Conference on Music Perception and Cognition},
  year = {2021},
  address = {Sheffield, UK}
}
@article{VanCriekinge2021,
  author = {Van Criekinge, T. and D’Août, K. and O’Brien, J. and Coutinho, E.},
  title = {Music and Hypertonia: Can Music Listening Help Reduce Muscle Tension and Improve Movement Quality?},
  journal = {Music and Science},
  year = {2021},
  volume = {4},
  pages = {1-12},
  doi = {10.1177/20592043211015353},
  url = {http://journals.sagepub.com/doi/10.1177/20592043211015353},
  abstract = {Although there is a strong consensus that music listening is a common and effective means to induce states of relaxation, little attention has been given to the physical effects of such states and the potential health-related applications. In this article, we investigated whether music listening could induce affective states of relaxation and accelerate the recovery of fatigued muscles, through the analysis of quality of movement. Twenty healthy participants were asked to perform a fatigue induction protocol of the non-dominant arm followed by a resting period and the execution of a drinking task. During recovery periods, all participants were exposed to three experimental conditions: listening to relaxing music; arousing music; and no music. 3D motion capture and surface electromyography were used to record upper limb movements and muscle activity when performing the drinking task before and after the recovery periods. Movement quality was assessed by means of movement smoothness (jerk index) and muscle recovery (motor unit recruitment). Results showed that recovery of movement smoothness was significantly greater in the relaxing music condition (-35%) than with arousing music (-25%) or silence (-16%), which demonstrates that listening to relaxing music speeds up the recovery process of (fatigued) muscles. We discuss our findings in the context of potential applications of music listening for reducing muscle tension in people suffering from hypertonia.}
}
@inproceedings{Cheah2021,
  author = {Cheah, Yi-Ting and Spitzer, Michael and Coutinho, Eduardo},
  title = {Background Music and Performance on Memory-related Tasks: Preliminary Findings from a Systematic Review},
  booktitle = {Proceedings of the 16th International Conference on Music Perception and Cognition},
  year = {2021},
  address = {Sheffield, UK}
}
@inproceedings{CoutinhoPolyhymnia2021,
  author = {Coutinho, Eduardo and Alshukri, Ayesh and De Berardinis, Jacopo and Dowrick, Chris},
  title = {POLYHYMNIA Mood – Empowering people to cope with depression through music listening},
  booktitle = {UbiComp/ISWC 2021 - Adjunct Proceedings of the 2021 ACM International Joint Conference on Pervasive and Ubiquitous Computing and Proceedings of the 2021 ACM International Symposium on Wearable Computers},
  year = {2021},
  pages = {188-193},
  publisher = {ACM},
  address = {Virtual, USA},
  doi = {10.1145/3460418.3479334},
  keywords = {Depression, Health Intervention, Machine Learning, Mood Regulation, Music Listening, Web App},
  abstract = {Depression is one of the largest sources of burden of disease worldwide, and the development of flexible, timely and easily accessible interventions is considered to be a critical direction for the future. Mood Regulation (MR) via music listening may be a viable tool to support these aims if people have adequate support to make music selections that underpin healthy MR strategies. We developed a new app (POLYHYMNIA Mood) that automatically generates personalised music playlists for mood elevation and the reduction of depression symptoms. Here we provide an overview of POLYHYMNIA Mood and report the results of a preliminary evaluation of its effectiveness and acceptability. Results show that listening to POLYHYMNIA Mood playlists over a period of 4 weeks led to a large reduction in negative affect and a clinically significant reduction in depression symptoms. While these results should be interpreted cautiously due to the small sample size and the lack of control conditions, they provide strong support for our approach.}
}
@inbook{coutinho2021audicao,
  author = {Coutinho, Eduardo and Cheah, Yi-Ting},
  editor = {Martingo, Ângelo},
  chapter = {Audição musical e performance cognitiva [Music listening and cognitive performance]},
  title = {Musica Humana},
  year = {2021},
  edition = {1},
  publisher = {Húmus},
  address = {V. N. Famalicão, Portugal},
  url = {https://edicoeshumus.pt//index.php?route=product/product&product_id=1300&search=musica+humana&description=true},
  abstract = {In this chapter, we provide a brief overview of the available evidence concerning the impact of music listening on cognitive performance, i.e., how listening to music can affect mental abilities (e.g., memory, attention) and our performance in tasks that require them (e.g., writing, reading). The chapter is divided into two main sections which reflect two main research trends: cognitive performance after listening to music (a.k.a. Mozart effect) and cognitive performance whilst listening to music.}
}
@article{deberardinismscomdetection,
  author = {De Berardinis, Jacopo and Vamvakaris, Michail and Cangelosi, Angelo and Coutinho, Eduardo},
  title = {Unveiling the Hierarchical Structure of Music by Multi-Resolution Community Detection},
  journal = {Transactions of the International Society for Music Information Retrieval},
  year = {2020},
  volume = {3},
  number = {1},
  pages = {82-97},
  doi = {10.5334/tismir.41},
  url = {http://transactions.ismir.net/articles/10.5334/tismir.41/},
  abstract = {Human perception of musical structure is supposed to depend on the generation of hierarchies, which is inherently related to the actual organisation of sounds in music. Musical structures are indeed best retained by listeners when they form hierarchical patterns, with consequent implications on the appreciation of music and its performance. The automatic detection of musical structure in audio recordings is one of the most challenging problems in the field of music information retrieval, since even human experts tend to disagree on the structural decomposition of a piece of music. However, most of the current music segmentation algorithms in literature can only produce flat segmentations, meaning that they cannot segment music at different levels in order to reveal its hierarchical structure. We propose a novel methodology for the hierarchical analysis of music structure that is based on graph theory and multi-resolution community detection. This unsupervised method can perform both the tasks of boundary detection and structural grouping, without the need of particular constraints that would limit the resulting segmentation. To evaluate our approach, we designed an experiment that allowed us to compare its segmentation performance with that of the current state of the art algorithms for hierarchical segmentation. Our results indicate that the proposed methodology can achieve state of the art performance on a well-known benchmark dataset, thus providing a deeper analysis of musical structure.}
}
@misc{Cheah2020,
  author = {Cheah, Yiting and Spitzer, Michael and Coutinho, Eduardo},
  title = {The impact of background music on cognitive task performance: a systematic review protocol},
  year = {2020},
  publisher = {PROSPERO - International prospective register of systematic reviews},
  institution = {University of Liverpool},
  url = {https://www.crd.york.ac.uk/prospero/display_record.php?ID=CRD42020207193}
}
@inproceedings{DeBerardinis2020a,
  author = {de Berardinis, J. and Cangelosi, A. and Coutinho, E.},
  editor = {Cumming, Julie and Lee, Jin Ha and McFee, Brian and Schedl, Markus and Devaney, Johanna and McKay, Cory and Zangerle, Eva and de Reuse, Timothy},
  title = {The multiple voices of musical emotions: source separation for improving music emotion recognition models and their interpretability},
  booktitle = {Proceedings of the 21st International Society for Music Information Retrieval Conference},
  year = {2020},
  pages = {310-217},
  publisher = {International Society for Music Information Retrieval},
  address = {Montréal, Québec, Canada},
  url = {https://www.ismir2020.net/assets/img/proceedings/2020_ISMIR_Proceedings.pdf},
  abstract = {Despite the manifold developments in music emotion recognition and related areas, estimating the emotional impact of music still poses many challenges. These are often associated to the complexity of the acoustic codes to emotion and the lack of large amounts of data with robust golden standards. In this paper, we propose a new computational model (EmoMucs) that considers the role of different musical voices in the prediction of the emotions induced by music. We combine source separation algorithms for breaking up music signals into independent song elements (vocals, bass, drums, other) and end-to-end state-of-the-art machine learning techniques for feature extraction and emotion modelling (valence and arousal regression). Through a series of computational experiments on a benchmark dataset using source-specialised models trained independently and different fusion strategies, we demonstrate that EmoMucs outperforms state-of-the-art approaches with the advantage of providing insights into the relative contribution of different musical elements to the emotions perceived by listeners.}
}
@inproceedings{Lamont2020,
  author = {Lamont, A. and Bannister, S. and Coutinho, E. and Egermann, H.},
  title = {‘Talking’ about music - The emotional content of comments on YouTube videos},
  booktitle = {Music and cyberculture before and after the new decade},
  year = {2020},
  url = {https://youtcc2020.weebly.com/abstract-book.html}
}
@inproceedings{DeBerardinis2020,
  author = {de Berardinis, J. and Barrett, S. and Cangelosi, A. and Coutinho, E.},
  title = {Modelling long- and short-term structure in symbolic music with attention and recurrence},
  booktitle = {CSMC + MuMe 2020: 2020 Joint Conference on AI Music Creativity},
  year = {2020},
  address = {Stockholm, Sweden},
  url = {https://boblsturm.github.io/aimusic2020/},
  abstract = {The automatic composition of music with long-term structure is a central problem in music generation. Neural network-based models have been shown to perform relatively well in melody generation, but generating music with long-term structure is still a major challenge. This paper introduces a new approach for music modelling that combines recent advancements of transformer models with recurrent networks, the long-short term universal transformer (LSTUT), and compares its ability to predict music against current state-of-the-art music models. Our experiments are designed to push the boundaries of music models on considerably long music sequences, a crucial requirement for learning long-term structure effectively. Results show that the LSTUT outperforms all the other models and can potentially learn features related to music structure at different time scales. Overall, we show the importance of integrating both recurrence and attention in the architecture of music models, and their potential use in future automatic composition systems.}
}
@misc{Coutinho2020,
  author = {Coutinho, Eduardo and Van Criekinge, Tamaya and Hanford, Greg and Nathan, Rajan and Maden, Michelle and Hill, Ruaraidh},
  title = {The effectiveness of music therapy interventions for people with eating disorders: a systematic review protocol},
  year = {2020},
  publisher = {PROSPERO},
  url = {https://www.crd.york.ac.uk/prospero/display_record.php?ID=CRD42020169901},
  abstract = {Review question: Is music therapy an effective treatment for the reduction in eating disorder psychopathology and/or symptoms?
Searches: MEDLINE (OVID), Cochrane Library, CINAHL, Embase, RILM, BASE, PsycINFO, Scopus. No restrictions were applied during the searches.
Types of study to be included: Any study with an experimental design.
Condition or domain being studied: Eating disorders are severe disturbances in behaviors and related thoughts and emotions. People with eating disorders typically become pre-occupied with food and their body weight. A doctor or mental health professional will make a diagnosis based on physical examination (to rule out medical causes), psychological evaluation (questions about thoughts, feelings and eating habits), or other additional tests based on signs, symptoms and eating habits.
Participants/population: People diagnosed with any type of eating disorder, of any age.
Intervention(s), exposure(s): Music therapy executed by qualified music therapists (formal, manualised and facilitated music therapies, such as Nordoff-Robbins, and/or recognised by professional bodies, such as the British Association for Music Therapy).
Comparator(s)/control: Any other intervention, non-exposed control group, treatment as usual.
Main outcome(s): Reduction in eating disorder psychopathology and/or symptoms. No direction of the impact can be formulated as they can be moving in different directions. Measures of effect: mean change.
Additional outcome(s): This will not be the main objective of this systematic review. However, if reported, we will include economic evidence (cost-effectiveness) and quality of life beyond the disorder, and formulate a hierarchy of outcome measures. Measures of effect: mean change.
Data extraction (selection and coding): The following information was collected: the first author, the year of publication, the number and characteristics of the participants, the outcome measures, the interventions, the results and the conclusions. Two independent reviewers will extract the data and a third reviewer will resolve discrepancies when they occur.
Risk of bias (quality) assessment: The methodological scoring will be assessed by two independent reviewers. In case of uncertainty at any point during the screening or scoring process, consensus will be sought during a meeting. Risk of bias scales suggested by Cochrane will be used depending on the design of the study.
Strategy for data synthesis: A synthesis without meta-analysis (SWiM) will be provided to discuss the observed effect, as preliminary searches reveal a lack of homogeneous and qualitative studies to perform statistical analysis of standard effect sizes. The population in the study will be grouped based on conditions of eating disorders (other subgroups, as mentioned below, are also possible). The criteria for justification of the results will be based on the support of at least two studies with sufficient methodological quality (moderate to low risk of bias). Level of evidence will be determined for each study to support effect claims. The outcomes used will depend on the available literature, but the objective is to examine the change scores before and after music therapy. The data presentation methods used will consist of tables and graphs to act as supporting material to visualize the data.
Analysis of subgroups or subsets: Analysis of different conditions of eating disorders or other patient characteristics such as age, clinical/community/home setting, type of music therapy, etc.}
}
@article{VanCriekinge2019,
  author = {van Criekinge, Tamaya and D'Août, Kristiaan and O'Brien, Jonathon and Coutinho, Eduardo},
  title = {Effect of music listening on hypertonia in neurologically impaired patients-systematic review},
  journal = {PeerJ},
  year = {2019},
  volume = {7},
  pages = {e8228},
  doi = {10.7717/peerj.8228},
  url = {https://peerj.com/articles/8228},
  keywords = {Electromyography, Hypertonia, Music, Neurology, Relaxation, Spasticity},
  abstract = {Background. As music listening is able to induce self-perceived and physiological signs of relaxation, it might be an interesting tool to induce muscle relaxation in patients with hypertonia. To date, effective non-pharmacological rehabilitation strategies to treat hypertonia in neurologically impaired patients are lacking. Therefore the aim is to investigate the effectiveness of music listening on muscle activity and relaxation. Methodology. The search strategy was performed following the PRISMA guidelines and registered in the PROSPERO database (no. 42019128511). Seven databases were systematically searched until March 2019. Six of the 1,684 studies met the eligibility criteria and were included in this review. Risk of bias was assessed by the PEDro scale. In total 171 patients with a variety of neurological conditions were included, assessing hypertonia with both clinical and biomechanical measures. Results. The analysis showed that there was a large treatment effect of music listening on muscle performance (SMD 0.96, 95% CI [0.29-1.63], I2 = 10%, Z = 2.82, p = 0.005). Music can be used as either background music during rehabilitation (dual-task) or during rest (single-task) and musical preferences seem to play a major role in the observed treatment effect. Conclusions. Although music listening is able to induce muscle relaxation, several gaps in the available literature were acknowledged. Future research is in need of an accurate and objective assessment of hypertonia.}
}
@inproceedings{Amiriparian2019,
  author = {Amiriparian, Shahin and Gerczuk, Maurice and Coutinho, Eduardo and Baird, Alice and Ottl, Sandra and Milling, Manuel and Schuller, Björn},
  title = {Emotion and themes recognition in music utilising convolutional and recurrent neural networks},
  booktitle = {CEUR Workshop Proceedings},
  year = {2019},
  volume = {2670},
  pages = {26-28},
  address = {Sophia Antipolis, France},
  abstract = {Emotion is an inherent aspect of music, and associations to music can be made via both life experience and specific musical techniques applied by the composer. Computational approaches for music recognition have been well-established in the research community; however, deep approaches have been limited and not yet comparable to conventional approaches. In this study, we present our fusion system of end-to-end convolutional recurrent neural networks (CRNN) and pre-trained convolutional feature extractors for music emotion and theme recognition. We train 9 models and conduct various late fusion experiments. Our best performing model (team name: AugLi) achieves 74.2 % ROC-AUC on the test partition which is 1.6 percentage points over the baseline system of the MediaEval 2019 Emotion & Themes in Music task.}
}
@inbook{Coutinho2014,
  author = {Hood, Susan},
  editor = {Thompson, W. F.},
  chapter = {Appraisal},
  title = {The Cambridge Handbook of Systemic Functional Linguistics},
  year = {2019},
  pages = {382-409},
  publisher = {SAGE Publications, Inc.},
  address = {Thousand Oaks, CA, United States},
  doi = {10.5422/fordham/9780823252008.003.0017},
  url = {http://sk.sagepub.com/reference/music-in-the-social-and-behavioral-sciences/n25.xml}
}
@inproceedings{houthecaregivers,
  author = {Hou, Xiaoxiao and Brooks, H. and Donnellan, W. and Coutinho, E.},
  title = {The impact of music listening on the quality of life of people with dementia and their caregivers},
  booktitle = {Proceedings of the British Society of Gerontology 48th Annual Conference},
  year = {2019},
  publisher = {British Society of Gerontology},
  address = {Durham},
  abstract = {Dementia is an incurable and fatal brain-damaging disease associated with psychological and behavioural symptoms that may decrease people’s Quality of Life (QoL) (Ravi, 2011). Current pharmacological interventions are costly, entail serious side effects and, most importantly, have limited effects on the QoL of people with dementia (PWD) and their caregivers. In this context, non-pharmacological interventions are being explored as alternative (or supplementary) strategies (Overshott & Burns, 2005), and meaningful music listening is a very promising one. Although academic and clinical evidence shows that exposure to music and musical activities has positive impacts in PWD at a variety of levels (e.g., Clark, Lipe, & Bilbrey, 1998; Gerdner, 2000), less research has been directed towards the QoL outcomes of music listening for both PWD and their caregivers. The current study addresses this void by systematically reviewing primary research studies that assess the impact of music listening on a variety of outcome measures related to PWD (QoL, mood, cognitive function and behavioural symptoms), patient-caregiver relationships, and caregivers (QoL, mood, and burden). The results of this systematic review will provide a clearer picture on the effectiveness of music listening intervention in improving the QoL of PWD and their caregivers, an evaluation of the interventions methodologies, and inform the design of a new empirical study aimed at devising a systematic methodology for the application of meaningful music listening to improve the QoL of PWD and their caregivers.}
}
@inproceedings{xiaoxiaothecaregivers,
  author = {Hou, Xiaoxiao and Brooks, H. and Donnellan, W. and Coutinho, E.},
  title = {The role of music listening in eliciting autobiographical memories and improving the quality of life of people with dementia and their caregivers},
  booktitle = {Proceedings of the Music & lifetime memories: An interdisciplinary conference},
  year = {2019},
  publisher = {University of Durham},
  address = {Durham},
  abstract = {Dementia is an incurable and fatal brain-damaging disease associated with psychological and behavioural symptoms that may decrease people’s Quality of Life (QoL) (Ravi, 2011). Current pharmacological interventions are costly, entail serious side effects and, most importantly, have limited effects on the QoL of people with dementia (PWD) and their caregivers. In this context, non-pharmacological interventions are being explored as alternative (or supplementary) strategies (Overshott & Burns, 2005), and meaningful music listening is a very promising one. Although academic and clinical evidence shows that exposure to music and musical activities has positive impacts in PWD at a variety of levels (e.g., Clark, Lipe, & Bilbrey, 1998; Gerdner, 2000), less research has been directed towards the QoL outcomes of music listening for both PWD and their caregivers. The current study addresses this void by systematically reviewing primary research studies that assess the impact of music listening on a variety of outcome measures related to PWD (QoL, mood, cognitive function and behavioural symptoms), patient-caregiver relationships, and caregivers (QoL, mood, and burden). The results of this systematic review will provide a clearer picture on the effectiveness of music listening intervention in improving the QoL of PWD and their caregivers, an evaluation of the interventions methodologies, and inform the design of a new empirical study aimed at devising a systematic methodology for the application of meaningful music listening to improve the QoL of PWD and their caregivers.}
}
@article{scherer2019comments2019,
  author = {Scherer, Klaus R. and Trznadel, Stéphanie and Fantini, Bernardino and Coutinho, Eduardo},
  title = {Comments on comments by Cupchik (2019) and Jacobsen (2019)},
  journal = {Psychology of Aesthetics, Creativity, and the Arts},
  year = {2019},
  volume = {13},
  number = {3},
  pages = {264-265},
  doi = {10.1037/aca0000246},
  url = {https://psycnet.apa.org/record/2019-45121-004},
  abstract = {In this response to comments by Cupchik (2019) and Jacobsen (2019), we address the points made and extend the discussion to raise a number of issues to consider in the quest for ecologically valid research on aesthetic emotions generated by music performances.}
}
@article{schererassessingsitu,
  author = {Scherer, Klaus R. and Trznadel, Stéphanie and Fantini, Bernardino and Coutinho, Eduardo},
  title = {Assessing emotional experiences of opera spectators in situ},
  journal = {Psychology of Aesthetics, Creativity, and the Arts},
  year = {2019},
  volume = {13},
  number = {3},
  pages = {244-258},
  doi = {10.1037/aca0000163},
  url = {http://doi.apa.org/getdoi.cfm?doi=10.1037/aca0000163},
  abstract = {Opera performances elicit strong emotional reactions in listeners. Yet, empirical demonstrations of these effects in situ are rare. Here we report a series of studies examining the emotional reactions of participants invited to the dress rehearsal of three different operas at the Geneva opera house before large audiences. Using a new affect checklist developed specifically for in situ studies of music performances, we asked participants to record (a) the intensity of 12 different types of affective reactions they experienced during selected scenes or (b) the frequency with which they experienced these emotions during specific acts or the opera as a whole. Results showed a high degree of specificity regarding the emotional impact of the operas as a whole and of individual scenes/acts. For one opera, Verdi's Macbeth, we also asked participants to rate both the emotions they actually felt during the opera scenes and the emotions expressed by the music or the singers' interpretation. Results confirm that spectators are clearly able to separate their own affective responses from what they perceive to be the emotions portrayed by the orchestra or on the stage. In addition, we evaluated the effect of different types of preperformance information sessions (on plot or music), as well as of participant personality and prior mood. Overall, the results demonstrate the feasibility of measuring highly differentiated emotional audience reactions to an opera performance with a brief validated checklist during actual performances in the opera house and the validity of self-reported emotions.}
}
@article{Zhang2019,
  author = {Zhang, Zixing and Han, Jing and Coutinho, Eduardo and Schuller, Björn},
  title = {Dynamic difficulty awareness training for continuous emotion prediction},
  journal = {IEEE Transactions on Multimedia},
  year = {2019},
  volume = {21},
  number = {5},
  pages = {1289-1301},
  doi = {10.1109/TMM.2018.2871949},
  url = {https://ieeexplore.ieee.org/document/8471224/},
  abstract = {Time-continuous emotion prediction has become an increasingly compelling task in machine learning. Considerable efforts have been made to advance the performance of these systems. Nonetheless, the main focus has been the development of more sophisticated models and the incorporation of different expressive modalities (e.g., speech, face, and physiology). In this paper, motivated by the benefit of difficulty awareness in a human learning procedure, we propose a novel machine learning framework, namely, dynamic difficulty awareness training (DDAT), which sheds fresh light on the research - directly exploiting the difficulties in learning to boost the machine learning process. The DDAT framework consists of two stages: information retrieval and information exploitation. In the first stage, we make use of the reconstruction error of input features or the annotation uncertainty to estimate the difficulty of learning specific information. The obtained difficulty level is then used in tandem with original features to update the model input in a second learning stage with the expectation that the model can learn to focus on high difficulty regions of the learning process. We perform extensive experiments on the REmote COLlaborative and Affective (RECOLA) benchmark database to evaluate the effectiveness of the proposed framework. The experimental results show that our approach outperforms related baselines as well as other well-established time-continuous emotion prediction systems, which suggests that dynamically integrating the difficulty information for neural networks can help enhance the learning process.}
}
@inproceedings{bairdsincerityresults,
  author = {Baird, Alice and Coutinho, Eduardo and Hirschberg, Julia and Schuller, Björn},
  title = {Sincerity in acted speech: Presenting the sincere apology corpus and results},
  booktitle = {Proceedings of the Annual Conference of the International Speech Communication Association, INTERSPEECH},
  year = {2019},
  pages = {539-543},
  publisher = {ISCA},
  address = {Graz, Austria},
  doi = {10.21437/Interspeech.2019-1349},
  url = {http://www.isca-speech.org/archive/Interspeech_2019/abstracts/1349.html},
  abstract = {The ability to discern an individual's level of sincerity varies from person to person and across cultures. Sincerity is typically a key indication of personality traits such as trustworthiness, and portraying sincerity can be integral to an abundance of scenarios, e.g., when apologising. Speech signals are one important factor when discerning sincerity and, with more modern interactions occurring remotely, automatic approaches for the recognition of sincerity from speech are beneficial during both interpersonal and professional scenarios. In this study we present details of the Sincere Apology Corpus (SINA-C). Annotated by 22 individuals for their perception of sincerity, SINA-C is an English acted-speech corpus of 32 speakers, apologising in multiple ways. To provide an updated baseline for the corpus, various machine learning experiments are conducted. We find that extracting deep data representations from the speech signals (utilising the DEEP SPECTRUM toolkit) is best suited. Classification results on the binary (sincere / not sincere) task are at best 79.2 % Unweighted Average Recall and, for regression with regard to the degree of sincerity, a Root Mean Square Error of 0.395 from the standardised range [-1.51; 1.72] is obtained.}
}
@inbook{coutinho2014singingemotion,
  author = {Coutinho, Eduardo and Scherer, Klaus R. and Dibben, Nicola},
  editor = {Welch, Graham F. and Howard, David M. and Nix, John},
  chapter = {Singing and Emotion},
  title = {The Oxford Handbook of Singing},
  year = {2019},
  pages = {296-314},
  publisher = {Oxford University Press},
  series = {Scholarly Research Reviews},
  doi = {10.1093/oxfordhb/9780199660773.013.006},
  url = {http://oxfordhandbooks.com/view/10.1093/oxfordhb/9780199660773.001.0001/oxfordhb-9780199660773-e-006},
  abstract = {In this chapter the authors discuss the emotional power of the singing voice. The chapter begins by providing an overview of the process of externalization of emotions by the human voice. Then, the authors discuss some fundamental determinants of emotional expression in singing, namely the ‘emotional script’, the artistic interpretation, and the singer’s affective state. Next, they describe the manner in which expressed emotions are encoded in the voice by singers and recognized by listeners, and compare it with vocal expression in everyday life. Finally, they identify various methodologies that can enhance understanding of the physiology of vocal production and the acoustic cues fundamental to perception and production of expressive sung performance. The authors propose that the knowledge gained from application of these methodologies can inform singing practice, and that interdisciplinary approaches and cooperation are central aspects of a fruitful and sustainable study of the expressive powers of the singing voice.}
}
@misc{baird2019thesinac,
  author = {Baird, A. and Coutinho, E.},
  title = {The Sincere Apology Corpus (SinA-C)},
  year = {2019},
  doi = {10.5281/zenodo.3241253},
  url = {http://doi.org/10.5281/zenodo.3241253},
  abstract = {This repository contains the Sincere Apology Corpus (SinA-C). SinA-C is an English speech corpus of acted apologies in various prosodic styles created with the purpose of investigating the attributes of the human voice which convey sincerity.}
}
@article{VanCriekinge2019a,
  author = {Van Criekinge, Tamaya and D'Août, Kristiaan and O'Brien, Jonathon and Coutinho, Eduardo},
  title = {The Influence of Sound-Based Interventions on Motor Behavior After Stroke: A Systematic Review},
  journal = {Frontiers in Neurology},
  year = {2019},
  volume = {10},
  number = {1141},
  doi = {10.3389/fneur.2019.01141},
  url = {https://www.frontiersin.org/articles/10.3389/fneur.2019.01141/full},
  keywords = {biomechanics, music, sound, sound-based interventions, stroke rehabilitation, stroke diagnosis, therapy},
  abstract = {Objective: To investigate the effects of sound-based interventions (SBIs) on biomechanical parameters in stroke patients. Methods: PubMed/Medline, Web of Science, the Physiotherapy Evidence Database (PEDro), and the Cochrane Library were searched until September 2019. Studies examining the effect of SBIs on kinematic, kinetic, and electromyographic outcome measures were included. Two independent reviewers performed the screening, and data extraction and risk-of-bias assessment were conducted with the PEDro and Newcastle–Ottawa scale. Disagreements were resolved by a third independent reviewer. Results: Of the 858 studies obtained from all databases, 12 studies and 240 participants met the inclusion and exclusion criteria. Six studies investigated the effect of SBI on upper limb motor tasks, while six examined walking. Concerning quality assessment (Newcastle–Ottawa Quality Assessment Scale and PEDro), the nine cross-sectional studies had a median score of seven, while the randomized controlled trials had a median score of five (fair to good quality). In relation to upper limb motor tasks, only one study found improvements in cortical reorganization and increased central excitability and motor control during reaching after SBI (results of the other five studies were too diverse and lacked quality to substantiate their findings). In relation to walking, results were clearer: SBI led to improvements in knee flexion and gastrocnemius muscle activity. Conclusion: Despite of the heterogeneity of the included studies, evidence was found demonstrating that SBI can induce biomechanical changes in motor behavior during walking in stroke patients. No conclusions could be formulated regarding reaching tasks. Additionally, directions for future research for understanding the underlying mechanism of the clinical improvements after SBI are: (1) using actual music pieces instead of rhythmic sound sequences and (2) examining sub-acute stroke rather than chronic stroke patients.}
}
@article{xu2019connectingrecognition,
  author = {Xu, Xinzhou and Deng, Jun and Coutinho, Eduardo and Wu, Chen and Zhao, Li and Schuller, Björn W.},
  title = {Connecting subspace learning and extreme learning machine in speech emotion recognition},
  journal = {IEEE Transactions on Multimedia},
  year = {2019},
  volume = {21},
  number = {3},
  pages = {795-808},
  doi = {10.1109/TMM.2018.2865834},
  abstract = {Speech emotion recognition (SER) is a powerful tool for endowing computers with the capacity to process information about the affective states of users in human–machine interactions. Recent research has shown the effectiveness of graph embedding-based subspace learning and extreme learning machine applied to SER, but there are still various drawbacks in these two techniques that limit their application. Regarding subspace learning, the change from linearity to nonlinearity is usually achieved through kernelization, whereas extreme learning machines only take label information into consideration at the output layer. In order to overcome these drawbacks, this paper leverages extreme learning machines for dimensionality reduction and proposes a novel framework to combine spectral regression-based subspace learning and extreme learning machines. The proposed framework contains three stages—data mapping, graph decomposition, and regression. At the data mapping stage, various mapping strategies provide different views of the samples. At the graph decomposition stage, specifically designed embedding graphs provide a possibility to better represent the structure of data through generating virtual coordinates. Finally, at the regression stage, dimension-reduced mappings are achieved by connecting the virtual coordinates and data mapping. Using this framework, we propose several novel dimensionality reduction algorithms, apply them to SER tasks, and compare their performance to relevant state-of-the-art methods. Our results on several paralinguistic corpora show that our proposed techniques lead to significant improvements.}
}
@article{ title = {MUSEBAQ: A modular tool for music research to assess musicianship, musical capacity, music preferences, and motivations for music use}, type = {article}, year = {2018}, keywords = {article,journal}, pages = {376-399}, volume = {35}, websites = {http://mp.ucpress.edu/lookup/doi/10.1525/mp.2018.35.3.376}, month = {2}, publisher = {University of California Press Journals}, day = {12}, id = {1777eeae-cddb-3be2-8dc4-12fb3090c33f}, created = {2018-03-29T13:11:33.343Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-05-15T08:14:21.037Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {chin2018musebaquse}, source_type = {article}, folder_uuids = {116db2f1-e6ac-4780-bccf-a977325250cd,99880aa7-55df-4b45-bfce-0ffc00b23ced}, private_publication = {false}, abstract = {Music engagement is complex and is influenced by music training, capacity, preferences, and motivations. A multi-modular self-report instrument (the Music Use and Background Questionnaire, or MUSEBAQ) was developed to measure a diverse set of music engagement constructs. Based on earlier work, a hybrid approach of exploratory and confirmatory analyses was conducted across a series of three independent studies to establish reliability and validity of the modular tool. Module 1 (Musicianship) provides a brief assessment of formal and informal music knowledge and practice. Module 2 (Musical capacity) measures emotional sensitivity to music, listening sophistication, music memory and imagery, and personal commitment to music. Module 3 (Music preferences) captures preferences from six broad genres and utilizes adaptive reasoning to selectively expand subgenres when administered online. Module 4 (Motivations for music use) assesses musical transcendence, emotion regulation, social, and musical identity and expression. The MUSEBAQ offers researchers and practitioners a comprehensive, modular instrument that can be used in whole, or by module as required to capture an individual's level of engagement with music and to serve as a background questionnaire to measure and interpret the effects of dispositional differences in emotional reactions to music.}, bibtype = {article}, author = {Chin, Tan Chyuan and Coutinho, Eduardo and Scherer, Klaus R. and Rickard, Nikki S.}, doi = {10.1525/MP.2018.35.3.376}, journal = {Music Perception}, number = {3} }
@article{ title = {Do individual differences influence moment-by-moment reports of emotion perceived in music and speech prosody?}, type = {article}, year = {2018}, keywords = {article,journal}, pages = {184}, volume = {12}, websites = {http://www.ncbi.nlm.nih.gov/pubmed/30210316,http://www.pubmedcentral.nih.gov/articlerender.fcgi?artid=PMC6119718,http://www.ncbi.nlm.nih.gov/pubmed/30210316 http://www.pubmedcentral.nih.gov/articlerender.fcgi?artid=PMC6119718,https://www.frontiersin.org/a}, month = {8}, day = {27}, id = {31aec067-4e19-3835-8a72-9d8f6e5d84dc}, created = {2020-05-29T11:51:38.782Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-05-15T08:14:21.900Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {Dibben2018}, source_type = {JOUR}, folder_uuids = {116db2f1-e6ac-4780-bccf-a977325250cd,99880aa7-55df-4b45-bfce-0ffc00b23ced}, private_publication = {false}, abstract = {Comparison of emotion perception in music and prosody has the potential to contribute to an understanding of their speculated shared evolutionary origin. Previous research suggests shared sensitivity to and processing of music and speech, but less is known about how emotion perception in the auditory domain might be influenced by individual differences. Personality, emotional intelligence, gender, musical training and age exert some influence on discrete, summative judgments of perceived emotion in music and speech stimuli. However, music and speech are temporal phenomena, and little is known about whether individual differences influence moment-by-moment perception of emotion in these domains. A behavioral study collected two main types of data: continuous ratings of perceived emotion while listening to extracts of music and speech, using a computer interface which modeled emotion on two dimensions (arousal and valence), and demographic information including measures of personality (TIPI) and emotional intelligence (TEIQue-SF). Functional analysis of variance on the time series data revealed a small number of statistically significant differences associated with Emotional Stability, Agreeableness, musical training and age. The results indicate that individual differences exert limited influence on continuous judgments of dynamic, naturalistic expressions. We suggest that this reflects a reliance on acoustic cues to emotion in moment-by-moment judgments of perceived emotions and is further evidence of the shared sensitivity to and processing of music and speech.}, bibtype = {article}, author = {Dibben, Nicola and Coutinho, Eduardo and Vilar, José A. and Estévez-Pérez, Graciela}, doi = {10.3389/fnbeh.2018.00184}, journal = {Frontiers in Behavioral Neuroscience} }
@article{ title = {Evidence of emotion-antecedent appraisal checks in electroencephalography and facial electromyography}, type = {article}, year = {2018}, keywords = {article,journal}, pages = {e0189367}, volume = {13}, websites = {http://gateway.webofknowledge.com/gateway/Gateway.cgi?GWVersion=2%5C&SrcApp=PARTNER_APP%5C&SrcAuth=LinksAMR%5C&KeyUT=WOS:000419101600016%5C&DestLinkType=FullRecord%5C&DestApp=ALL_WOS%5C&UsrCustomerID=f3ec48df247ee1138ccd8d3ba59bacc2 https://dx.plos.org/10}, month = {1}, day = {2}, id = {9336c657-e759-31c9-86c7-fd4d16d0d18c}, created = {2020-05-29T11:51:38.987Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-05-15T08:14:21.853Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2018evidenceelectromyography}, source_type = {JOUR}, folder_uuids = {116db2f1-e6ac-4780-bccf-a977325250cd,99880aa7-55df-4b45-bfce-0ffc00b23ced}, private_publication = {false}, abstract = {In the present study, we applied Machine Learning (ML) methods to identify psychobiological markers of cognitive processes involved in the process of emotion elicitation as postulated by the Component Process Model (CPM). In particular, we focused on the automatic detection of five appraisal checks—novelty, intrinsic pleasantness, goal conduciveness, control, and power—in electroencephalography (EEG) and facial electromyography (EMG) signals. We also evaluated the effects on classification accuracy of averaging the raw physiological signals over different numbers of trials, and whether the use of minimal sets of EEG channels localized over specific scalp regions of interest are sufficient to discriminate between appraisal checks. We demonstrated the effectiveness of our approach on two data sets obtained from previous studies. Our results show that novelty and power appraisal checks can be consistently detected in EEG signals above chance level (binary tasks). For novelty, the best classification performance in terms of accuracy was achieved using features extracted from the whole scalp, and by averaging across 20 individual trials in the same experimental condition (UAR = 83.5 ± 4.2; N = 25). For power, the best performance was obtained by using the signals from four pre-selected EEG channels averaged across all trials available for each participant (UAR = 70.6 ± 5.3; N = 24). Together, our results indicate that accurate classification can be achieved with a relatively small number of trials and channels, but that averaging across a larger number of individual trials is beneficial for the classification for both appraisal checks. We were not able to detect any evidence of the appraisal checks under study in the EMG data. The proposed methodology is a promising tool for the study of the psychophysiological mechanisms underlying emotional episodes, and their application to the development of computerized tools (e.g., Brain-Computer Interface) for the study of cognitive processes involved in emotions.}, bibtype = {article}, author = {Coutinho, Eduardo and Gentsch, Kornelia and Van Peer, Jacobien and Scherer, Klaus R. and Schuller, Björn W.}, editor = {Valenza, Gaetano}, doi = {10.1371/journal.pone.0189367}, journal = {PLoS ONE}, number = {1} }
@inproceedings{ title = {Deep recurrent music writer: Memory-enhanced variational autoencoder-based musical score composition and an objective measure}, type = {inproceedings}, year = {2017}, pages = {3467-3474}, volume = {2017-May}, websites = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85031004981&doi=10.1109%2FIJCNN.2017.7966292&partnerID=40&md5=773c59463fe8c1985666a5d8ee739954,http://ieeexplore.ieee.org/document/7966292/}, month = {5}, publisher = {IEEE}, id = {159c3cf8-fc75-3ad3-9351-d5d1c4bd98b6}, created = {2020-05-27T15:19:59.533Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-05-15T08:14:21.519Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {Sabathe2017}, source_type = {CONF}, notes = {cited By 4}, private_publication = {false}, abstract = {In recent years, there has been an increasing interest in music generation using machine learning techniques typically used for classification or regression tasks. This is a field still in its infancy, and most attempts are still characterized by the imposition of many restrictions to the music composition process in order to favor the creation of 'interesting' outputs. Furthermore, and most importantly, none of the past attempts has focused on developing objective measures to evaluate the music composed, which would allow to evaluate the pieces composed against a predetermined standard as well as permitting to fine-tune models for better 'performance' and music composition goals. In this work, we intend to advance state-of-the-art in this area by introducing and evaluating a new metric for an objective assessment of the quality of the generated pieces. We will use this measure to evaluate the outputs of a truly generative model based on Variational Autoencoders that we apply here to automated music composition. Using our metric, we demonstrate that our model can generate music pieces that follow general stylistic characteristics of a given composer or musical genre. Additionally, we use this measure to investigate the impact of various parameters and model architectures on the compositional process and output.}, bibtype = {inproceedings}, author = {Sabathe, Romain and Coutinho, Eduardo and Schuller, Bjorn}, doi = {10.1109/IJCNN.2017.7966292}, booktitle = {Proceedings of the International Joint Conference on Neural Networks} }
@misc{ title = {Shared Acoustic Codes Underlie Emotional Communication in Music and Speech - Evidence from Deep Transfer Learning (Datasets)}, type = {misc}, year = {2017}, source = {Zenodo}, keywords = {arousal,dataset,emotion,music,time-continuous,valence}, issue = {1}, websites = {https://zenodo.org/record/345944#.WTZdgl2qNFQ}, month = {3}, publisher = {Zenodo}, day = {6}, id = {a036a5c3-6770-37fc-8e0b-9b8ab8fca30e}, created = {2020-05-29T10:17:30.772Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2021-05-14T09:05:35.698Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {Coutinho2017}, source_type = {DATASET}, private_publication = {false}, abstract = {This repository contains the datasets used in the article "Shared Acoustic Codes Underlie Emotional Communication in Music and Speech - Evidence from Deep Transfer Learning" (Coutinho & Schuller, 2017). In that article four different data sets were used: SEMAINE, RECOLA, ME14 and MP (acronyms and datasets described below). The SEMAINE (speech) and ME14 (music) corpora were used for the unsupervised training of the Denoising Auto-encoders (domain adaptation stage) - only the audio features extracted from the audio files in these corpora were used and are provided in this repository. The RECOLA (speech) and MP (music) corpora were used for the supervised training phase - both the audio features extracted from the audio files and the Arousal and Valence annotations were used. In this repository, we provide the audio features extracted from the audio files for both corpora, and Arousal and Valence annotations for some of the music datasets (those that the author of this repository is the data curator).}, bibtype = {misc}, author = {Coutinho, E}, doi = {10.5281/zenodo.600657} }
@misc{ title = {Emotion-Antecedent Appraisal Checks: EEG and EMG datasets for Novelty and Pleasantness}, type = {misc}, year = {2017}, keywords = {dataset}, pages = {1-4}, websites = {https://doi.org/10.5281/zenodo.197404}, month = {12}, publisher = {Zenodo}, id = {c992033c-a9f0-37e8-b6d9-52ec697f3543}, created = {2020-05-29T11:51:37.170Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-06-08T17:31:31.815Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2017emotionantecedentset}, source_type = {DATASET}, folder_uuids = {d67f8010-76e6-4bba-9ed2-6cfd0416d87b,116db2f1-e6ac-4780-bccf-a977325250cd}, private_publication = {false}, abstract = {This document describes the full details of the first data set (Study 1) used in Coutinho et al., to appear. The Electroencephalography (EEG) and facial Electromyography (EMG) signals included in this dataset, and now made public, were collected in the context of a previous study by Peer, Grandjean, and Scherer, 2014 that addressed three fundamental questions regarding the mechanisms underlying the appraisal process: Whether appraisal criteria are processed (a) in a fixed sequence, (b) independent of each other, and (c) by different neural structures or circuits. In that study, an oddball paradigm with affective pictures was used to experimentally manipulate novelty and intrinsic pleasantness appraisals. EEG was recorded during task performance, together with facial EMG, to measure, respectively, cognitive processing and efferent responses stemming from the appraisal manipulations.}, bibtype = {misc}, author = {van Peer, J. and Coutinho, E. and Grandjean, D. and Scherer, K. R.}, doi = {10.5281/zenodo.197404} }
@article{ title = {The effect of context and audio-visual modality on emotions elicited by a musical performance}, type = {article}, year = {2017}, keywords = {article,journal}, pages = {550-569}, volume = {45}, websites = {http://dx.doi.org/10.1177/0305735616670496 http://journals.sagepub.com/doi/10.1177/0305735616670496,http://dx.doi.org/10.1177/0305735616670496,http://journals.sagepub.com/doi/10.1177/0305735616670496}, month = {7}, day = {26}, id = {afc391cf-b15a-3422-b5d4-fa0c6522d298}, created = {2020-05-29T11:51:37.246Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-05-15T08:14:21.220Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {doi:10.1177/0305735616670496}, source_type = {JOUR}, folder_uuids = {116db2f1-e6ac-4780-bccf-a977325250cd,99880aa7-55df-4b45-bfce-0ffc00b23ced}, private_publication = {false}, abstract = {In this work, we compared emotions induced by the same performance of Schubert Lieder during a live concert and in a laboratory viewing/listening setting to determine the extent to which laboratory research on affective reactions to music approximates real listening conditions in dedicated performances. We measured emotions experienced by volunteer members of an audience that attended a Lieder recital in a church (Context 1) and emotional reactions to an audio-video-recording of the same performance in a university lecture hall (Context 2). Three groups of participants were exposed to three presentation versions in Context 2: (1) an audio-visual recording, (2) an audio-only recording, and (3) a video-only recording. Participants achieved statistically higher levels of emotional convergence in the live performance than in the laboratory context, and the experience of particular emotions was determined by complex interactions between auditory and visual cues in the performance. This study demonstrates the contribution of the performance setting and the performers' appearance and nonverbal expression to emotion induction by music, encouraging further systematic research into the factors involved.}, bibtype = {article}, author = {Coutinho, Eduardo and Scherer, Klaus R.}, doi = {10.1177/0305735616670496}, journal = {Psychology of Music}, number = {4} }
@misc{ title = {Emotion-Antecedent Appraisal Checks: EEG and EMG datasets for Goal Conduciveness, Control and Power}, type = {misc}, year = {2017}, keywords = {dataset}, pages = {1-4}, websites = {http://doi.org/10.5281/zenodo.222615}, month = {12}, publisher = {Zenodo}, id = {921f0eb1-b115-3b70-8f13-16b31a419a9b}, created = {2020-05-29T11:51:37.289Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-06-08T17:31:32.436Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2017emotionantecedentpower}, source_type = {DATASET}, folder_uuids = {d67f8010-76e6-4bba-9ed2-6cfd0416d87b,116db2f1-e6ac-4780-bccf-a977325250cd}, private_publication = {false}, abstract = {This document describes the full details of the second data set (Study 2) used in Coutinho et al., to appear. The Electroencephalography (EEG) and facial Electromyography (EMG) signals included in this data set, and now made public, were collected in the context of a previous study by Gentsch, Grandjean, and Scherer, 2013 that addressed three fundamental questions regarding the mechanisms underlying the appraisal process: Whether appraisal criteria are processed (1) in a fixed sequence, (2) independent of each other, and (3) by different neural structures or circuits. In this study, a gambling task was applied in which feedback stimuli manipulated simultaneously the information about goal conduciveness, control, and power appraisals. EEG was recorded during task performance, together with facial EMG, to measure, respectively, cognitive processing and efferent responses stemming from the appraisal manipulations.}, bibtype = {misc}, author = {Gentsch, K and Coutinho, E and Grandjean, D and Scherer, K R}, doi = {10.5281/zenodo.222615} }
@article{ title = {Shared acoustic codes underlie emotional communication in music and speech—evidence from deep transfer learning}, type = {article}, year = {2017}, keywords = {article,journal}, pages = {e0179289}, volume = {12}, websites = {http://dx.plos.org/10.1371/journal.pone.0179289,http://gateway.webofknowledge.com/gateway/Gateway.cgi?GWVersion=2%5C&SrcApp=PARTNER_APP%5C&SrcAuth=LinksAMR%5C&KeyUT=WOS:000404607900019%5C&DestLinkType=FullRecord%5C&DestApp=ALL_WOS%5C&UsrCustomerID=f3ec48d}, month = {6}, publisher = {Public Library of Science (PLoS)}, day = {28}, id = {8b0218eb-eaaa-36aa-9a6d-870b794ede57}, created = {2020-05-29T11:51:38.591Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-06-08T17:31:31.970Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2017sharedlearning}, source_type = {JOUR}, folder_uuids = {116db2f1-e6ac-4780-bccf-a977325250cd,99880aa7-55df-4b45-bfce-0ffc00b23ced}, private_publication = {false}, abstract = {Music and speech exhibit striking similarities in the communication of emotions in the acoustic domain, in such a way that the communication of specific emotions is achieved, at least to a certain extent, by means of shared acoustic patterns. From an Affective Sciences points of view, determining the degree of overlap between both domains is fundamental to understand the shared mechanisms underlying such phenomenon. From a Machine learning perspective, the overlap between acoustic codes for emotional expression in music and speech opens new possibilities to enlarge the amount of data available to develop music and speech emotion recognition systems. In this article, we investigate time-continuous predictions of emotion (Arousal and Valence) in music and speech, and the Transfer Learning between these domains. We establish a comparative framework including intra- (i.e., models trained and tested on the same modality, either music or speech) and cross-domain experiments (i.e., models trained in one modality and tested on the other). In the cross-domain context, we evaluated two strategies—the direct transfer between domains, and the contribution of Transfer Learning techniques (feature-representation-transfer based on Denoising Auto Encoders) for reducing the gap in the feature space distributions. Our results demonstrate an excellent cross-domain generalisation performance with and without feature representation transfer in both directions. In the case of music, cross-domain approaches outperformed intra-domain models for Valence estimation, whereas for Speech intra-domain models achieve the best performance. This is the first demonstration of shared acoustic codes for emotional expression in music and speech in the time-continuous domain.}, bibtype = {article}, author = {Coutinho, Eduardo and Schuller, Björn}, editor = {Zhang, Yudong}, doi = {10.1371/journal.pone.0179289}, journal = {PLoS ONE}, number = {6} }
@article{ title = {Introducing the Geneva music-induced affect checklist (GEMIAC): A brief instrument for the rapid assessment of musically induced emotions}, type = {article}, year = {2017}, keywords = {Checklist,Emotion,Feeling,Measurement,Music}, pages = {371-386}, volume = {34}, websites = {https://online.ucpress.edu/mp/article/34/4/371/62796/Introducing-the-GEneva-MusicInduced-Affect}, month = {4}, day = {1}, id = {b67e6804-7446-3dca-938f-507d3cf631d8}, created = {2021-09-17T10:31:01.529Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-05-15T08:14:21.680Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, private_publication = {false}, abstract = {The systematic study of music-induced emotions requires standardized measurement instruments to reliably assess the nature of affective reactions to music, which tend to go beyond garden-variety basic emotions. We describe the development and conceptual validation of a checklist for rapid assessment of music-induced affect, designed to extend and complement the Geneva Emotional Music Scale. The checklist contains a selection of affect and emotion categories that are frequently used in the literature to refer to emotional reactions to music. The development of the checklist focused on an empirical investigation of the semantic structure of the relevant terms, combined with fuzzy classes based on a series of hierarchical cluster analyses. Two versions of the checklist for assessing the intensity and frequency of affective responses to music are proposed.}, bibtype = {article}, author = {Coutinho, Eduardo and Scherer, Klaus R.}, doi = {10.1525/MP.2017.34.4.371}, journal = {Music Perception}, number = {4} }
@inproceedings{ title = {The INTERSPEECH 2016 computational paralinguistics challenge: Deception, sincerity & native language}, type = {inproceedings}, year = {2016}, keywords = {article,conference}, pages = {2001-2005}, volume = {08-12-Sept}, websites = {http://www.isca-speech.org/archive/Interspeech_2016/abstracts/0129.html http://gateway.webofknowledge.com/gateway/Gateway.cgi?GWVersion=2%255C&SrcApp=PARTNER_APP%255C&SrcAuth=LinksAMR%255C&KeyUT=WOS:000409394401102%255C&DestLinkType=FullRecord%255C&DestAp}, month = {9}, day = {8}, id = {68bb5f48-7268-3ea7-b41f-deb9e24ed29a}, created = {2020-05-29T11:51:36.895Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-07-03T09:46:08.675Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {schuller2016thelanguage}, source_type = {CONF}, folder_uuids = {aac08d0d-38e7-4f4e-a381-5271c5c099ce}, private_publication = {false}, abstract = {The INTERSPEECH 2016 Computational Paralinguistics Challenge addresses three different problems for the first time in research competition under well-defined conditions: classification of deceptive vs. non-deceptive speech, the estimation of the degree of sincerity, and the identification of the native language out of eleven L1 classes of English L2 speakers. In this paper, we describe these sub-challenges, their conditions, the baseline feature extraction and classifiers, and the resulting baselines, as provided to the participants.}, bibtype = {inproceedings}, author = {Schuller, Björn and Steidl, Stefan and Batliner, Anton and Hirschberg, Julia and Burgoon, Judee K. and Baird, Alice and Elkins, Aaron and Zhang, Yue and Coutinho, Eduardo and Evanini, Keelan}, doi = {10.21437/Interspeech.2016-129}, booktitle = {Proceedings of the Annual Conference of the International Speech Communication Association, INTERSPEECH} }
@inproceedings{ title = {MUSEBAQ: A psychometrically robust questionnaire for capturing the many voices of music engagement}, type = {inproceedings}, year = {2016}, keywords = {Conference,abstract}, month = {7}, publisher = {San Francisco, CA}, institution = {San Francisco, CA}, id = {cd02abac-1938-3fc5-a0d5-5631c96f5ca5}, created = {2020-05-29T11:51:37.064Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:17:27.721Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {rickard2016musebaqengagement}, source_type = {inproceedings}, folder_uuids = {a2a583e8-b0a3-48f9-900f-27e15c9a7f71}, private_publication = {false}, bibtype = {inproceedings}, author = {Rickard, Nikki Sue and Chin, T and Coutinho, E and Scherer, K R}, booktitle = {Proceedings of the 14th International Conference on Music Perception and Cognition} }
@inproceedings{ title = {Ask Alice: An artificial retrieval of information agent}, type = {inproceedings}, year = {2016}, keywords = {article,conference}, pages = {419-420}, websites = {http://dl.acm.org/citation.cfm?doid=2993148.2998535}, month = {11}, publisher = {ACM Press}, city = {New York, New York, USA}, institution = {Tokyo, Japan}, id = {dce1e39d-d5f4-3e49-96f8-c4bad9f59b0e}, created = {2020-05-29T11:51:38.700Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-05-15T08:14:21.989Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {valstar2016askagent}, source_type = {inproceedings}, folder_uuids = {aac08d0d-38e7-4f4e-a381-5271c5c099ce}, private_publication = {false}, abstract = {We present a demonstration of the ARIA framework, a modular approach for rapid development of virtual humans for information retrieval that have linguistic, emotional, and social skills and a strong personality. We demonstrate the framework's capabilities in a scenario where 'Alice in Wonderland', a popular English literature book, is embodied by a virtual human representing Alice. The user can engage in an information exchange dialogue, where Alice acts as the expert on the book, and the user as an interested novice. Besides speech recognition, sophisticated audio-visual behaviour analysis is used to inform the core agent dialogue module about the user's state and intentions, so that it can go beyond simple chat-bot dialogue. The behaviour generation module features a unique new capability of being able to deal gracefully with interruptions of the agent.}, bibtype = {inproceedings}, author = {Valstar, Michel and Ghitulescu, Alexandru and Baur, Tobias and Potard, Blaise and Cafaro, Angelo and Wagner, Johannes and André, Elisabeth and Durieu, Laurent and Aylett, Matthew and Dermouche, Soumia and Pelachaud, Catherine and Coutinho, Eduardo and Schuller, Björn and Zhang, Yue and Heylen, Dirk and Theune, Mariët and van Waterschoot, Jelte}, doi = {10.1145/2993148.2998535}, booktitle = {ICMI 2016 - Proceedings of the 18th ACM International Conference on Multimodal Interaction} }
@inproceedings{ title = {Enhanced semi-supervised learning for multimodal emotion recognition}, type = {inproceedings}, year = {2016}, keywords = {article,conference}, pages = {5185-5189}, volume = {2016-May}, websites = {http://ieeexplore.ieee.org/document/7472666/}, month = {3}, publisher = {IEEE}, id = {8f1f3221-0c83-30dd-84a1-4992535dbafb}, created = {2020-05-29T11:51:38.718Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-05-15T08:14:21.986Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {zhang2016enhancedrecognition}, source_type = {inproceedings}, folder_uuids = {aac08d0d-38e7-4f4e-a381-5271c5c099ce}, private_publication = {false}, abstract = {Semi-Supervised Learning (SSL) techniques have found many applications where labeled data is scarce and/or expensive to obtain. However, SSL suffers from various inherent limitations that limit its performance in practical applications. A central problem is that the low performance that a classifier can deliver on challenging recognition tasks reduces the trustability of the automatically labeled data. Another related issue is the noise accumulation problem - instances that are misclassified by the system are still used to train it in future iterations. In this paper, we propose to address both issues in the context of emotion recognition. Initially, we exploit the complementarity between audio-visual features to improve the performance of the classifier during the supervised phase. Then, we iteratively re-evaluate the automatically labeled instances to correct possibly mislabeled data and this enhances the overall confidence of the system's predictions. Experimental results performed on the RECOLA database demonstrate that our methodology delivers a strong performance in the classification of high/low emotional arousal (UAR = 76.5%), and significantly outperforms traditional SSL methods by at least 5.0% (absolute gain).}, bibtype = {inproceedings}, author = {Zhang, Zixing and Ringeval, Fabien and Dong, Bin and Coutinho, Eduardo and Marchi, Erik and Schuller, Bjorn}, doi = {10.1109/ICASSP.2016.7472666}, booktitle = {ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings} }
@inproceedings{ title = {Assessing the prosody of non-native speakers of English: Measures and feature sets}, type = {inproceedings}, year = {2016}, keywords = {article,conference}, pages = {1328-1332}, volume = {645378}, issue = {645378}, month = {1}, publisher = {European Language Resources Association (ELRA)}, institution = {Paris, France}, id = {2fec392e-1f05-3f48-b89b-b26c1456a278}, created = {2020-05-29T11:51:39.102Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:16:39.657Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2016assessingsets}, source_type = {CONF}, folder_uuids = {aac08d0d-38e7-4f4e-a381-5271c5c099ce}, private_publication = {false}, abstract = {In this paper, we describe a new database with audio recordings of non-native (L2) speakers of English, and the perceptual evaluation experiment conducted with native English speakers for assessing the prosody of each recording. These annotations are then used to compute the gold standard using different methods, and a series of regression experiments is conducted to evaluate their impact on the performance of a regression model predicting the degree of naturalness of L2 speech. Further, we compare the relevance of different feature groups modelling prosody in general (without speech tempo), speech rate and pauses modelling speech tempo (fluency), voice quality, and a variety of spectral features. We also discuss the impact of various fusion strategies on performance. Overall, our results demonstrate that the prosody of non-native speakers of English as L2 can be reliably assessed using supra-segmental audio features; prosodic features seem to be the most important ones.}, bibtype = {inproceedings}, author = {Coutinho, Eduardo and Hönig, Florian and Zhang, Yue and Hantke, Simone and Batliner, Anton and Nöth, Elmar and Schuller, Björn}, editor = {Calzolari, N and Choukri, K and Declerck, T and Goggi, S and Grobelnik, M and Maegaard, B and Mariani, J and Mazo, H and Moreno, A and Odijk, J and Piperidis, S}, booktitle = {Proceedings of the 10th International Conference on Language Resources and Evaluation, LREC 2016} }
@article{ title = {Semi-supervised active learning for sound classification in hybrid learning environments}, type = {article}, year = {2016}, keywords = {article,journal}, pages = {e0162075}, volume = {11}, websites = {http://gateway.webofknowledge.com/gateway/Gateway.cgi?GWVersion=2&SrcApp=PARTNER_APP&SrcAuth=LinksAMR&KeyUT=WOS:000383680600017&DestLinkType=FullRecord&DestApp=ALL_WOS&UsrCustomerID=f3ec48df247ee1138ccd8d3ba59bacc2 http://dx.plos.org/10.1371/journal.pone.}, month = {9}, day = {14}, id = {2fb19fb0-efc7-3ae7-bd2c-40d1948d933b}, created = {2020-05-29T11:51:39.251Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-05-15T08:14:21.423Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {han2016semisupervisedenvironments}, source_type = {article}, folder_uuids = {99880aa7-55df-4b45-bfce-0ffc00b23ced}, private_publication = {false}, abstract = {Coping with scarcity of labeled data is a common problem in sound classification tasks. Approaches for classifying sounds are commonly based on supervised learning algorithms, which require labeled data which is often scarce and leads to models that do not generalize well. In this paper, we make an efficient combination of confidence-based Active Learning and Self-Training with the aim of minimizing the need for human annotation for sound classification model training. The proposed method pre-processes the instances that are ready for labeling by calculating their classifier confidence scores, and then delivers the candidates with lower scores to human annotators, and those with high scores are automatically labeled by the machine. We demonstrate the feasibility and efficacy of this method in two practical scenarios: pool-based and stream-based processing. Extensive experimental results indicate that our approach requires significantly less labeled instances to reach the same performance in both scenarios compared to Passive Learning, Active Learning and Self-Training. A reduction of 52.2% in human labeled instances is achieved in both of the pool-based and stream-based scenarios on a sound classification task considering 16,930 sound instances.}, bibtype = {article}, author = {Han, Wenjing and Coutinho, Eduardo and Ruan, Huabin and Li, Haifeng and Schuller, Björn and Yu, Xiaojie and Zhu, Xuan}, editor = {Schwenker, Friedhelm}, doi = {10.1371/journal.pone.0162075}, journal = {PLoS ONE}, number = {9} }
@article{ title = {Automatic Estimation of Biosignals From the Human Voice}, type = {article}, year = {2015}, keywords = {article,invited,journal}, pages = {114:48--50}, volume = {350}, websites = {http://science.sciencemag.org/content/350/6256/114.3}, month = {10}, day = {2}, id = {7d00c805-b7f1-3183-b2da-2258809dd8fe}, created = {2018-03-29T13:11:33.538Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-05-15T08:14:21.110Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2015automaticvoice}, source_type = {article}, notes = {invited contribution}, private_publication = {false}, abstract = {Computational paralinguistics (CP) is a relatively new area of research that provides new methods, tools, and techniques to automatically recognize the states, traits, and qualities embedded in the nonsemantic aspects of human speech (1). In recent years, CP has reached a level of maturity that has permitted the development of a myriad of applications in everyday life, such as the automatic estimation of a speaker’s age, gender, height, emotional state, cognitive load, personality traits, likability, intelligibility, and medical condition (2). Here, we provide an overview of one particular application of CP that offers new solutions for health care—the recognition of physiological parameters (biosignals) from the voice alone.}, bibtype = {article}, author = {Coutinho, E and Schuller, Björn W.}, journal = {Science}, number = {6256} }
@inproceedings{ title = {Does my Speech Rock? Automatic Assessment of Public Speaking Skills}, type = {inproceedings}, year = {2015}, keywords = {article,conference}, pages = {2519-2523}, volume = {1}, websites = {http://www.isca-speech.org/archive/interspeech_2015/papers/i15_2519.pdf}, publisher = {ISCA}, city = {Dresden, Germany}, id = {c074b917-846e-3d0c-872d-00c4df3d3ca4}, created = {2020-05-29T11:51:37.001Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-06-08T17:31:31.714Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {azais2015doesskills}, source_type = {inproceedings}, folder_uuids = {aac08d0d-38e7-4f4e-a381-5271c5c099ce}, private_publication = {false}, abstract = {In this paper, we introduce results for the task of Automatic Public Speech Assessment (APSA). Given the comparably sparse work carried out on this task up to this point, a novel database was required for training and evaluation of machine learning models. As a basis, the freely available oral presentations of the ICASSP conference in 2011 were selected due to their transcription including non-verbal vocalisations. The data was specifically labelled in terms of the perceived oratory ability of the speakers by five raters according to a 5-point Public Speaking Skill Rating Likert scale. We investigate the feasibility of speaker-independent APSA using different standardised acoustic feature sets computed per fixed chunk of an oral presentation in a series of ternary classification and continuous regression experiments. Further, we compare the relevance of different feature groups related to fluency (speech/hesitation rate), prosody, voice quality and a variety of spectral features. Our results demonstrate that oratory speaking skills can be reliably assessed using supra-segmental audio features, with prosodic ones being particularly suited.}, bibtype = {inproceedings}, author = {Payan, Adrien and Sun, Tianjiao and Vidal, Guillaume and Zhang, Tina and Coutinho, Eduardo and Eyben, Florian}, booktitle = {Proceedings of the Annual Conference of the International Speech Communication Association, INTERSPEECH} }
@inproceedings{ title = {The MUSEBAQ: a Comprehensive and Modular Instrument for Assessing Musical Engagement}, type = {inproceedings}, year = {2015}, keywords = {abstract,conference}, pages = {1}, city = {Geneva, Switzerland}, id = {72fb3c65-7a58-31b9-a2e4-cbe3721548bc}, created = {2020-05-29T11:51:37.111Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:17:28.286Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {rickard2015theengagement}, source_type = {inproceedings}, folder_uuids = {a2a583e8-b0a3-48f9-900f-27e15c9a7f71}, private_publication = {false}, bibtype = {inproceedings}, author = {Rickard, Nikki Sue and Chin, T-C and Coutinho, E and Scherer, K R}, booktitle = {Proceedings of the 4th International Conference on Music and Emotion (ICME’4)} }
@inproceedings{ title = {On rater reliability and agreement based dynamic active learning}, type = {inproceedings}, year = {2015}, keywords = {article,conference}, pages = {70-76}, websites = {http://gateway.webofknowledge.com/gateway/Gateway.cgi?GWVersion=2&SrcApp=PARTNER_APP&SrcAuth=LinksAMR&KeyUT=WOS:000377887000011&DestLinkType=FullRecord&DestApp=ALL_WOS&UsrCustomerID=f3ec48df247ee1138ccd8d3ba59bacc2,http://ieeexplore.ieee.org/document/7344}, month = {9}, publisher = {IEEE}, id = {38dc393a-f322-3f71-9db6-0bf17a81191b}, created = {2020-05-29T11:51:37.237Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-06-08T17:31:31.875Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {zhang2015onlearning}, source_type = {inproceedings}, folder_uuids = {aac08d0d-38e7-4f4e-a381-5271c5c099ce}, private_publication = {false}, abstract = {In this paper, we propose two novel Dynamic Active Learning (DAL) methods with the aim of ultimately reducing the costly human labelling work for subjective tasks such as speech emotion recognition. Compared to conventional Active Learning (AL) algorithms, the proposed DAL approaches employ a highly efficient adaptive query strategy that minimises the number of annotations through three advancements. First, we shift from the standard majority voting procedure, in which unlabelled instances are annotated by a fixed number of raters, to an agreement-based annotation technique that dynamically determines how many human annotators are required to label a selected instance. Second, we introduce the concept of the order-based DAL algorithm by considering rater reliability and inter-rater agreement. Third, a highly dynamic development trend is successfully implemented by upgrading the agreement levels depending on the prediction uncertainty. In extensive experiments on standardised test-beds, we show that the new dynamic methods significantly improve the efficiency of the existing AL algorithms by reducing human labelling effort up to 85.41%, while achieving the same classification accuracy. Thus, the enhanced DAL derivations opens up high-potential research directions for the utmost exploitation of unlabelled data.}, bibtype = {inproceedings}, author = {Zhang, Yue and Coutinho, Eduardo and Schuller, Bjorn and Zhang, Zixing and Adam, Michael}, doi = {10.1109/ACII.2015.7344553}, booktitle = {2015 International Conference on Affective Computing and Intelligent Interaction, ACII 2015} }
@inproceedings{ title = {Dynamic Active Learning based on agreement and applied to emotion recognition in spoken interactions}, type = {inproceedings}, year = {2015}, keywords = {article,conference}, pages = {275-278}, websites = {http://dl.acm.org/citation.cfm?doid=2818346.2820774}, publisher = {ACM Press}, city = {New York, New York, USA}, id = {b81a6392-0597-30a6-a8ba-10abc421d190}, created = {2020-05-29T11:51:38.588Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:16:24.065Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {zhang2015dynamicinteractions}, source_type = {inproceedings}, folder_uuids = {aac08d0d-38e7-4f4e-a381-5271c5c099ce}, private_publication = {false}, abstract = {In this contribution, we propose a novel method for Active Learning (AL) - Dynamic Active Learning (DAL) - which targets the reduction of the costly human labelling work necessary for modelling subjective tasks such as emotion recognition in spoken interactions. The method implements an adaptive query strategy that minimises the amount of human labelling work by deciding for each instance whether it should automatically be labelled by machine or manually by human, as well as how many human annotators are required. Extensive experiments on standardised test-beds show that DAL significantly improves the efficiency of conventional AL. In particular, DAL achieves the same classification accuracy obtained with AL with up to 79.17 % less human annotation effort.}, bibtype = {inproceedings}, author = {Zhang, Yue and Coutinho, Eduardo and Zhang, Zixing and Quan, Caijiao and Schuller, Björn}, doi = {10.1145/2818346.2820774}, booktitle = {ICMI 2015 - Proceedings of the 2015 ACM International Conference on Multimodal Interaction} }
@article{ title = {Cooperative learning and its application to emotion recognition from speech}, type = {article}, year = {2015}, keywords = {article,journal}, pages = {115-126}, volume = {23}, websites = {http://gateway.webofknowledge.com/gateway/Gateway.cgi?GWVersion=2&SrcApp=PARTNER_APP&SrcAuth=LinksAMR&KeyUT=WOS:000348070700011&DestLinkType=FullRecord&DestApp=ALL_WOS&UsrCustomerID=f3ec48df247ee1138ccd8d3ba59bacc2 http://ieeexplore.ieee.org/document/6971}, month = {1}, id = {b9377466-8ba0-3199-97bb-ca60b014716a}, created = {2020-05-29T11:51:38.695Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-06-08T17:31:31.997Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {zhang2015cooperativespeech}, source_type = {JOUR}, folder_uuids = {116db2f1-e6ac-4780-bccf-a977325250cd,99880aa7-55df-4b45-bfce-0ffc00b23ced}, private_publication = {false}, abstract = {In this paper, we propose a novel method for highly efficient exploitation of unlabeled data-Cooperative Learning. Our approach consists of combining Active Learning and Semi-Supervised Learning techniques, with the aim of reducing the costly effects of human annotation. The core underlying idea of Cooperative Learning is to share the labeling work between human and machine efficiently in such a way that instances predicted with insufficient confidence value are subject to human labeling, and those with high confidence values are machine labeled. We conducted various test runs on two emotion recognition tasks with a variable number of initial supervised training instances and two different feature sets. The results show that Cooperative Learning consistently outperforms individual Active and Semi-Supervised Learning techniques in all test cases. In particular, we show that our method based on the combination of Active Learning and Co-Training leads to the same performance of a model trained on the whole training set, but using 75% fewer labeled instances. Therefore, our method efficiently and robustly reduces the need for human annotations.}, bibtype = {article}, author = {Zhang, Zixing and Coutinho, Eduardo and Deng, Jun and Schuller, Björn}, doi = {10.1109/TASLP.2014.2375558}, journal = {IEEE/ACM Transactions on Audio Speech and Language Processing}, number = {1} }
@inproceedings{ title = {Automatic recognition of emotional dimensions in singing}, type = {inproceedings}, year = {2015}, keywords = {abstract,conference}, pages = {1}, publisher = {University of Geneva}, city = {Geneva, Switzerland}, institution = {University of Geneva}, id = {03abea09-2867-3c3f-a387-224018afece2}, created = {2020-05-29T11:51:38.859Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-06-08T17:36:24.317Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {eyben2015automaticsinging}, source_type = {inproceedings}, folder_uuids = {a2a583e8-b0a3-48f9-900f-27e15c9a7f71}, private_publication = {false}, bibtype = {inproceedings}, author = {Eyben, F and Coutinho, E and Schuller, Björn W.}, booktitle = {Proceedings of the 4th International Conference on Music and Emotion (ICME’4)} }
@inproceedings{ title = {Agreement-Based Dynamic Active Learning with Least and Medium Certainty Query Strategy}, type = {inproceedings}, year = {2015}, keywords = {article,conference}, pages = {1-5}, publisher = {International Machine Learning Society (IMLS)}, city = {Lille, France}, id = {ca15255b-57b8-3b51-9a22-035b3d36b816}, created = {2020-05-29T11:51:38.863Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:16:56.561Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {zhang2015agreementbasedstrategy}, source_type = {inproceedings}, folder_uuids = {aac08d0d-38e7-4f4e-a381-5271c5c099ce}, private_publication = {false}, abstract = {In this contribution, we propose a novel method for active learning termed ‘dynamic active learning’ or DAL for short, with the aim of ultimately reducing the costly human labelling work for subjective tasks such as speech emotion recognition. Through an adaptive query strategy, the amount of manual labelling work is minimised by deciding for each instance not only whether or not it should be annotated, but also dynamically on how many human annotators’ opinions are needed. Through extensive experiments on standardised test-beds, we show that DAL achieves the same classification accuracy of ‘traditional’ AL with a cost reduction of up to 79.17%. Thus, the DAL method significantly improves the efficiency of existing algorithms, setting a new benchmark for the utmost exploitation of unlabelled data.}, bibtype = {inproceedings}, author = {Zhang, Yue and Coutinho, Eduardo and Zhang, Zixing and Quan, Caijiao and Schuller, Björn}, editor = {Krishnamurthy, A and Ramdas, A and Balcan, N and Singh, A}, booktitle = {Proceedings of the 32nd International Conference on Machine Learning (ICML 2015)} }
@inproceedings{ title = {Classifying Emotion-Antecedent Appraisal in Brain Activity Using Machine Learning Methods}, type = {inproceedings}, year = {2015}, keywords = {Conference,abstract}, pages = {1}, city = {Geneva, Switzerland}, id = {283b5af8-4929-3a4e-aff8-298ed0c6612a}, created = {2020-05-29T11:51:38.924Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:16:59.306Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {gentsch2015classifyingmethods}, source_type = {inproceedings}, notes = {1 page}, folder_uuids = {a2a583e8-b0a3-48f9-900f-27e15c9a7f71}, private_publication = {false}, bibtype = {inproceedings}, author = {Gentsch, Kornelia and Coutinho, Eduardo and Eyben, Florian and Schuller, Björn W. and Scherer, Klaus R.}, booktitle = {Proceedings of the International Society for Research on Emotions Conference (ISRE 2015)} }
@inproceedings{ title = {Exploring the importance of individual differences to the automatic estimation of emotions induced by music}, type = {inproceedings}, year = {2015}, keywords = {abstract,conference}, pages = {57-63}, websites = {http://dl.acm.org/citation.cfm?doid=2808196.2811643}, month = {10}, publisher = {ACM Press}, city = {New York, New York, USA}, id = {497e5bf2-b45b-3385-bf8f-85674f8d836e}, created = {2020-05-29T11:51:38.946Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:16:58.644Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {sagha2015exploringmusic}, source_type = {inproceedings}, folder_uuids = {a2a583e8-b0a3-48f9-900f-27e15c9a7f71}, private_publication = {false}, abstract = {The goal of this study was to evaluate the impact of the inclusion of listener-related factors (individual differences) on the prediction of music induced affect. A group of 24 subjects listened to a set of music excerpts previously demonstrated to express specific emotional characteristics (in terms of Arousal and Valence), and we collected information related to listeners' stable (personality, emotional intelligence, attentiveness, music preferences) and transient (mood, and physiological activity) states. Through a series of regression analysis we identified those factors which have a significant explanatory power over the affective states induced in the listeners. Our results show that incorporating information related to individual differences permits to identify more accurately the affective states induced in the listeners, which differ from those expressed by the music.}, bibtype = {inproceedings}, author = {Sagha, Hesam and Coutinho, Eduardo and Schuller, Björn}, doi = {10.1145/2808196.2811643}, booktitle = {AVEC 2015 - Proceedings of the 5th International Workshop on Audio/Visual Emotion Challenge, co-Located with MM 2015} }
@inproceedings{ title = {A Comparison of Undergraduates' Music Listening Habits in Everyday Life and While Studying}, type = {inproceedings}, year = {2015}, keywords = {abstract,conference}, pages = {1}, publisher = {University of Geneva}, city = {Geneva, Switzerland}, institution = {University of Geneva}, id = {194a8cd6-1a6b-3ba9-85f9-56ba013a761e}, created = {2020-05-29T11:51:39.049Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:16:39.046Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2015astudying}, source_type = {inproceedings}, folder_uuids = {a2a583e8-b0a3-48f9-900f-27e15c9a7f71}, private_publication = {false}, bibtype = {inproceedings}, author = {Coutinho, E and Lisser, A}, booktitle = {Proceedings of the 4th International Conference on Music and Emotion (ICME’4)} }
@inbook{ type = {inbook}, year = {2015}, keywords = {edition,journal}, volume = {7}, websites = {http://journal.frontiersin.org/researchtopic/3083/music-cognition}, publisher = {Frontiers Media}, id = {4d1fb4b4-b3ab-3b47-a92a-8b652b80d484}, created = {2020-05-29T11:51:39.262Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:16:25.432Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {perlovsky2016frontierspsychology}, source_type = {CHAP}, folder_uuids = {22cecb78-7b06-4839-9375-3735f65ff563}, private_publication = {false}, bibtype = {inbook}, author = {}, editor = {Perlovsky, L and Coutinho, E and Wilkins, R W}, chapter = {Music Cognition [Research Topic]}, title = {Frontiers in Psychology} }
@inproceedings{ title = {Predicting Musical Emotions From Low-level Acoustics and Physiological Measurements: Music and Speech}, type = {inproceedings}, year = {2015}, keywords = {abstract,conference}, pages = {1}, city = {Geneva, Switzerland}, id = {aef43df1-84ed-355c-bcfd-8ffd1b005903}, created = {2020-05-29T11:51:39.350Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:16:32.978Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2015predictingspeech}, source_type = {inproceedings}, folder_uuids = {a2a583e8-b0a3-48f9-900f-27e15c9a7f71}, private_publication = {false}, bibtype = {inproceedings}, author = {Coutinho, E}, booktitle = {Proceedings of the 4th International Conference on Music and Emotion (ICME’4)} }
@inproceedings{ title = {The ICL-TUM-PASSAU approach for the MediaEval 2015 "affective impact of movies" task}, type = {inproceedings}, year = {2015}, volume = {1436}, month = {1}, publisher = {CEUR}, city = {Wurzen, Germany}, id = {b264e3e7-0921-3c0c-bd3c-e33747025430}, created = {2020-05-30T14:51:24.442Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:17:37.690Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {trigeorgis2015}, source_type = {inproceedings}, folder_uuids = {aac08d0d-38e7-4f4e-a381-5271c5c099ce}, private_publication = {false}, abstract = {In this paper we describe the Imperial College London, Technische Universitat München and University of Passau (ICL+TUM+PASSAU) team approach to the MediaEval's "Affective Impact of Movies" challenge, which consists in the automatic detection of affective (arousal and valence) and violent content in movie excerpts. In addition to the baseline features, we computed spectral and energy related acoustic features, and the probability of various objects being present in the video. Random Forests, AdaBoost and Support Vector Machines were used as classification methods. Best results show that the dataset is highly challenging for both affect and violence detection tasks, mainly because of issues in inter-rater agreement and data scarcity.}, bibtype = {inproceedings}, author = {Trigeorgis, George and Coutinho, Eduardo and Ringeval, Fabien and Marchi, Erik and Zafeiriou, Stefanos and Schuller, Björn}, editor = {Larson, Martha and Ionescu, Bogdan and Sjöberg, Mats and Anguera, Xavier and Poignant, Johann and Riegler, Michael and Eskevich, Maria and Hauff, Claudia and Sutcliffe, Richard and Jones, Gareth J.F. and Yang, Yi-Hsuan and Soleymani, Mohammad and Papadopoulos, Symeon}, booktitle = {CEUR Workshop Proceedings}, keywords = {article,conference} }
@inproceedings{ title = {Automatically estimating emotion in music with deep long-short term memory recurrent neural networks}, type = {inproceedings}, year = {2015}, pages = {1-3}, volume = {1436}, websites = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-84989923198&partnerID=40&md5=f0d407c8ffb96c19f299c78435558371,http://ceur-ws.org/Vol-1436/Paper64.pdf}, month = {9}, publisher = {CEUR}, city = {Wurzen, Germany}, id = {dfa7431b-f2ff-3228-adca-a768df6d0581}, created = {2020-05-30T17:34:32.702Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2021-06-17T15:16:03.160Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2015automaticallynetworks}, source_type = {inproceedings}, notes = {cited By 7}, folder_uuids = {aac08d0d-38e7-4f4e-a381-5271c5c099ce}, private_publication = {false}, abstract = {In this paper we describe our approach for the MediaEval's "Emotion in Music" task. Our method consists of deep Long-Short Term Memory Recurrent Neural Networks (LSTM-RNN) for dynamic Arousal and Valence regression, using acoustic and psychoacoustic features extracted from the songs that have been previously proven as effective for emotion prediction in music. Results on the challenge test demonstrate an excellent performance for Arousal estimation (r = 0.613 ± 0.278), but not for Valence (r = 0.026 ± 0.500). Issues regarding the quality of the test set annotations' reliability and distributions are indicated as plausible justifications for these results. By using a subset of the development set that was left out for performance estimation, we could determine that the performance of our approach may be underestimated for Valence (Arousal: r = 0.596 ± 0.386; Valence: r = 0.458 ± 0.551).}, bibtype = {inproceedings}, author = {Coutinho, Eduardo and Trigeorgis, George and Zafeiriou, Stefanos and Schuller, Björn}, editor = {Larson, Martha and Ionescu, Bogdan and Sjöberg, Mats and Anguera, Xavier and Poignant, Johann and Riegler, Michael and Eskevich, Maria and Hauff, Claudia and Sutcliffe, Richard and Jones, Gareth J.F. and Yang, Yi-Hsuan and Soleymani, Mohammad and Papadopoulos, Symeon}, booktitle = {CEUR Workshop Proceedings}, keywords = {article,conference} }
@inproceedings{ title = {The Munich LSTM-RNN approach to the MediaEval 2014 "Emotion in Music" Task}, type = {inproceedings}, year = {2014}, volume = {1263}, websites = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-84909953530&partnerID=40&md5=96b8657503c52119dd83867ccbdc3264}, id = {87114ac2-214b-3813-b485-ba0f7153d1fd}, created = {2020-05-27T15:09:41.796Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2021-06-18T09:04:34.619Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {Coutinho2014a}, source_type = {CONF}, notes = {cited By 11}, private_publication = {false}, abstract = {In this paper we describe TUM's approach for the MediaEval's "Emotion in Music" task. The goal of this task is to automatically estimate the emotions expressed by music (in terms of Arousal and Valence) in a time-continuous fashion. Our system consists of Long-Short Term Memory Recurrent Neural Networks (LSTM-RNN) for dynamic Arousal and Valence regression. We used two different sets of acoustic and psychoacoustic features that have been previously proven as effective for emotion prediction in music and speech. The best model yielded an average Pearson's correlation coefficient of 0.354 (Arousal) and 0.198 (Valence), and an average Root Mean Squared Error of 0.102 (Arousal) and 0.079 (Valence).}, bibtype = {inproceedings}, author = {Coutinho, Eduardo and Weninger, Felix and Schuller, Björn and Scherer, Klaus R.}, booktitle = {CEUR Workshop Proceedings} }
@article{ title = {The effects of expert musical training on the perception of emotions in Bach’s Sonata for Unaccompanied Violin No. 1 in G Minor (BWV 1001).}, type = {article}, year = {2014}, keywords = {article,journal}, pages = {35-57}, volume = {24}, websites = {http://doi.apa.org/getdoi.cfm?doi=10.1037/pmu0000036}, id = {441486d4-3671-36e5-be8e-b13c2909e431}, created = {2020-05-29T11:51:38.590Z}, accessed = {2014-04-22}, file_attached = {false}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-06-08T17:31:54.615Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {spitzer2014the1001}, source_type = {article}, folder_uuids = {116db2f1-e6ac-4780-bccf-a977325250cd,99880aa7-55df-4b45-bfce-0ffc00b23ced,ba331422-1c6a-4d1c-a682-9282f58b3182}, private_publication = {false}, abstract = {: The focus of this article is the relationship between musical emotion, as expressed by the composer and perceived by the listener, and the structural features of a work of art-music. First, we analyzed a work by J. S. Bach for solo violin (Sonata for Unaccompanied Violin, No. 1 in G Minor, BWV 1001), from the standpoint of how its structural features were associated with the expression of different emotional categories from the perspective of the composer and through the eyes and ears of the music analyst. We then constructed 2 empirical experiments to test whether contemporary listeners could identify the same emotions identified by the analysis, targeted at 2 groups of subjects: relatively inexperienced popular music students; and musicians, composers, and music academics (including some of the world's leading Bach scholars). Our results suggest that-emotional attributions by low-level experts are led by surface acoustic features; those by high-expert listeners are led by both acoustic and formal features; that this applied much more to the emotions of Sadness and Tenderness rather than to Anger or Fear; and that despite the common confusion between Anger and Fear in real life, listeners were capable of differentiating these emotions in the music supporting analytical findings in the score., (C) 2014 by the American Psychological Association}, bibtype = {article}, author = {Spitzer, Michael and Coutinho, Eduardo}, doi = {10.1037/pmu0000036}, journal = {Psychomusicology: Music, Mind, and Brain}, number = {1} }
@article{ title = {Special Issue on Interactions Between Emotion and Cognition in Music}, type = {article}, year = {2014}, keywords = {edition,journal}, pages = {1-115}, volume = {24}, month = {3}, publisher = {American Psychological Association}, id = {f0842552-3d88-343e-b5f0-2d58bf18663a}, created = {2020-05-29T11:51:38.797Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:17:11.103Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2014psychomusicologycognition}, source_type = {CHAP}, folder_uuids = {22cecb78-7b06-4839-9375-3735f65ff563}, private_publication = {false}, abstract = {Welcome to this special issue on interactions between emotion and cognition in music. The combined investigation of emotion and cognition and their interactions has been prominent in general psychology for some years. Nonetheless, we felt that within music research, this area of research has received less systematic attention. With a call for papers related to this theme, our intention was to stimulate more research activity in this area and to develop further our understanding of the ways in which emotions influence music cognition, as well as the ways in which our cognitive appraisal of events, persons and/or objects influence music related emotions. The very good response to our call from authors from a range of countries demonstrated that the theme taps into current developments in music research. A collection of submissions can be found in this issue, while publication of several others can be expected in upcoming issues. From the submissions to this special issue, it became clear that the topic has many ramifications and can be addressed from various perspectives. Together the submissions deepen and broaden our understanding of ways in which cognition and emotion are intertwined in the context of music. The first two articles investigate emotional associations of tonal modulation (Korsakova-Kreyn and Dowling) and emotional associations of musical sequences presented in different tonal modes (Straehley and Loebach), exploring the influence of our tonal knowledge on emotion perception in music. The influence of musical knowledge is also central to the paper by Spitzer and Coutinho who combine music analysis and psychological methods to compare the perception of emotion in Bach’s violin solo sonatas in highly trained experts and regular music connoisseurs. These laboratory based studies on perception of emotion are complemented by an exploration of listeners’ emotional experiences in ecological contexts: Balteş and Miu provide evidence on the importance of empathy and imagery mechanisms for the experience of musical emotions. Using a large-scale online questionnaire, Perdomo-Guevera investigates emotions experienced during music performance and highlights different profiles in performers depending on the context of emotional peak experiences which occur during practice, performance, and/or daily life. Taking an exploratory neuroscientific approach, Leslei, Ojeda and Makeig examine the behavior and brain dynamics related to musical engagement, and demonstrate that musical feelings can be effectively communicated through rhythmic gestures. 
From a theoretical perspective, Habibi and Damasio explore the link between music and feelings, and suggest the existence of a close tie between music and basic processes of life regulations, which have an impact at the individual level but are also significant promoters of socio-cultural organization. They consider that such a link is responsible for the pervasiveness of music-related experiences and activities. In a short report, Dean and Bailes use time series analysis to show that music-analytical large-scale segmentation can be discriminated in non-musicians' continuous perception of change in music, and suggest ways in which musical structure and agency (such as soloist vs. orchestra, singer vs. accompaniment) may influence those perceived changes. The special issue is complemented by a short report on an international summer school held in Sheffield during 2013, communicating new developments and ongoing activities in this psychology of music hub in the UK. Finally, we are pleased to highlight recently completed doctoral theses that directly or indirectly are related to the topic of the special issue, and which further illustrate the volume and breadth of current research efforts in this area and suggest that the future of the field is in good hands. We hope that the issue will foster further interest and research in this area and show that there is considerable scope for follow up issues on related topics. In particular, influences of emotional responses on the perception and cognition of music is an issue still mostly unexplored. Moreover, current models of emotion and cognition in music are still too often segregated. Renee Timmers & Eduardo Coutinho}, bibtype = {article}, author = {}, editor = {Coutinho, E and Timmers, R}, journal = {Psychomusicology: a journal of research in music cognition}, number = {1} }
@inproceedings{ title = {Transfer learning emotion manifestation across music and speech}, type = {inproceedings}, year = {2014}, keywords = {article,conference}, pages = {3592-3598}, websites = {http://ieeexplore.ieee.org/lpdocs/epic03/wrapper.htm?arnumber=6889814}, month = {7}, publisher = {IEEE}, id = {dec34897-c5c4-365c-97fd-741efea93123}, created = {2020-05-29T11:51:38.964Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-05-15T08:14:21.832Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2014transferspeech}, source_type = {inproceedings}, folder_uuids = {aac08d0d-38e7-4f4e-a381-5271c5c099ce}, private_publication = {false}, abstract = {In this article, we focus on time-continuous predictions of emotion in music and speech, and the transfer of learning from one domain to the other. First, we compare the use of Recurrent Neural Networks (RNN) with standard hidden units (Simple Recurrent Network SRN) and Long-Short Term Memory (LSTM) blocks for intra-domain acoustic emotion recognition. We show that LSTM networks outperform SRN, and we explain, in average, 74%/59% (music) and 42%/29% (speech) of the variance in Arousal/Valence. Next, we evaluate whether cross-domain predictions of emotion are a viable option for acoustic emotion recognition, and we test the use of Transfer Learning (TL) for feature space adaptation. In average, our models are able to explain 70%/43% (music) and 28%/11% (speech) of the variance in Arousal/Valence. Overall, results indicate a good cross-domain generalization performance, particularly for the model trained on speech and tested on music without pre-encoding of the input features. To our best knowledge, this is the first demonstration of cross-modal time-continuous predictions of emotion in the acoustic domain.}, bibtype = {inproceedings}, author = {Coutinho, Eduardo and Deng, Jun and Schuller, Björn}, doi = {10.1109/IJCNN.2014.6889814}, booktitle = {Proceedings of the International Joint Conference on Neural Networks} }
@article{ title = {Distributing recognition in computational paralinguistics}, type = {article}, year = {2014}, keywords = {article,journal}, pages = {406-417}, volume = {5}, websites = {http://gateway.webofknowledge.com/gateway/Gateway.cgi?GWVersion=2&SrcApp=PARTNER_APP&SrcAuth=LinksAMR&KeyUT=WOS:000346043900005&DestLinkType=FullRecord&DestApp=ALL_WOS&UsrCustomerID=f3ec48df247ee1138ccd8d3ba59bacc2,http://ieeexplore.ieee.org/document/6906}, month = {10}, day = {1}, id = {debe3fe6-0ca9-3a53-8af5-1c235385b724}, created = {2020-05-29T11:51:39.067Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:16:40.774Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {zhang2014distributingparalinguistics}, source_type = {article}, folder_uuids = {116db2f1-e6ac-4780-bccf-a977325250cd,99880aa7-55df-4b45-bfce-0ffc00b23ced}, private_publication = {false}, abstract = {In this paper, we propose and evaluate a distributed system for multiple Computational Paralinguistics tasks in a client-server architecture. The client side deals with feature extraction, compression, and bit-stream formatting, while the server side performs the reverse process, plus model training, and classification. The proposed architecture favors large-scale data collection and continuous model updating, personal information protection, and transmission bandwidth optimization. In order to preliminarily investigate the feasibility and reliability of the proposed system, we focus on the trade-off between transmission bandwidth and recognition accuracy. We conduct large-scale evaluations of some key functions, namely, feature compression/decompression, model training and classification, on five common paralinguistic tasks related to emotion, intoxication, pathology, age and gender. We show that, for most tasks, with compression ratios up to 40 (bandwidth savings up to 97.5 percent), the recognition accuracies are very close to the baselines. Our results encourage future exploitation of the system proposed in this paper, and demonstrate that we are not far from the creation of robust distributed multi-task paralinguistic recognition systems which can be applied to a myriad of everyday life scenarios.}, bibtype = {article}, author = {Zhang, Zixing and Coutinho, Eduardo and Deng, Jun and Schuller, Björn}, doi = {10.1109/TAFFC.2014.2359655}, journal = {IEEE Transactions on Affective Computing}, number = {4} }
@techreport{ title = {Geneva Music Background Questionnaire (GEMUBAQ)}, type = {techreport}, year = {2014}, keywords = {report}, month = {5}, publisher = {Swiss Center for Affective Sciences}, city = {Geneva, Switzerland}, institution = {Swiss Center for Affective Sciences}, id = {3f508823-4546-3f27-853e-5bf36958112f}, created = {2020-05-29T11:51:39.233Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:16:32.320Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2014genevagemubaq}, source_type = {RPRT}, folder_uuids = {116db2f1-e6ac-4780-bccf-a977325250cd,8c7cc370-0269-4fc3-b738-15ea2990ae1e}, private_publication = {false}, abstract = {This report describes work carried out by the authors in preparation for the development of a Music Background Questionnaire intended to serve as a standard instrument to measure important background variables such as music activities, music abilities and attitudes, and frequent music listening experiences. In the course of development we decided to join forces with Tan-Chyuan Chin and Nikki Rickard who had been working on individual differences in music engagements. The result of the joint work is published as The MUSEBAQ: A Modular Tool for Measuring Multiple Dimensions of Music Engagement. The purpose of this brief report is to document the work performed in the context of the Music and Emotion project of the Swiss Center of Affective Sciences in 2014.}, bibtype = {techreport}, author = {Coutinho, E and Scherer, K R} }
@article{ title = {Music, Voice and Emotion (Special Issue)}, type = {article}, year = {2013}, volume = {7}, websites = {http://musicstudies.org/all-issues/volume-7-2013/}, id = {e29bacd0-33ff-38ab-a3cd-edff9b1bc43f}, created = {2018-12-10T11:57:57.002Z}, file_attached = {false}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2021-09-17T10:31:01.908Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {Coutinho2013}, private_publication = {false}, bibtype = {article}, author = {Coutinho, Eduardo and Fantini, Bernardino and Scherer, Klaus R.}, journal = {International Journal of Interdisciplinary Music Studies}, number = {1&2} }
@inproceedings{ title = {The influence of individual differences on emotion perception in music and speech prosody}, type = {inproceedings}, year = {2013}, pages = {1}, id = {b3384201-e12a-3046-835d-e48fb480ff8e}, created = {2019-09-18T08:06:23.629Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-29T12:00:31.731Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {dibben2013individualprosody}, source_type = {inproceedings}, folder_uuids = {a2a583e8-b0a3-48f9-900f-27e15c9a7f71}, private_publication = {false}, abstract = {The study reported here investigates the influence of individual differences on perception of emotion in music and speech: specifically we tested the mediating influence of personality, emotional intelligence, gender and musical training. A behavioural study collected two main types of data: continuous ratings of emotion perceived while listening to extracts of music and speech, using a computer interface which modelled emotion on two dimensions (arousal and valence), and demographic information including measures of personality (TIPI) and emotional intelligence (TEIQue-SF). We employed the novel statistical method of functional analysis of variance on the time series data which revealed a small number of statistically significant differences according to gender, emotional intelligence, emotional stability and musical training. This is the first time to our knowledge that effects of individual differences on continuous measures of emotion have been tested. \n}, bibtype = {inproceedings}, author = {Dibben, N J and Coutinho, E}, booktitle = {Proceedings of the 3rd International Conference on Music and Emotion (ICME’3), Jyväskylä, Finland, June 11-15}, keywords = {abstract,conference} }
@article{ title = {Psychoacoustic cues to emotion in speech prosody and music}, type = {article}, year = {2013}, keywords = {article,journal}, pages = {658-684}, volume = {27}, websites = {http://gateway.webofknowledge.com/gateway/Gateway.cgi?GWVersion=2%5C&SrcApp=PARTNER_APP%5C&SrcAuth=LinksAMR%5C&KeyUT=WOS:000319106500006%5C&DestLinkType=FullRecord%5C&DestApp=ALL_WOS%5C&UsrCustomerID=f3ec48df247ee1138ccd8d3ba59bacc2}, month = {6}, id = {2a5a8467-79ff-3480-9ca8-9521b2d9c322}, created = {2020-05-29T11:51:38.754Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-05-15T08:14:21.967Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2013psychoacousticmusic}, source_type = {article}, folder_uuids = {99880aa7-55df-4b45-bfce-0ffc00b23ced}, private_publication = {false}, abstract = {There is strong evidence of shared acoustic profiles common to the expression of emotions in music and speech, yet relatively limited understanding of the specific psychoacoustic features involved. This study combined a controlled experiment and computational modelling to investigate the perceptual codes associated with the expression of emotion in the acoustic domain. The empirical stage of the study provided continuous human ratings of emotions perceived in excerpts of film music and natural speech samples. The computational stage created a computer model that retrieves the relevant information from the acoustic stimuli and makes predictions about the emotional expressiveness of speech and music close to the responses of human subjects. We show that a significant part of the listeners' second-by-second reported emotions to music and speech prosody can be predicted from a set of seven psychoacoustic features: loudness, tempo/speech rate, melody/prosody contour, spectral centroid, spectral flux, sharpness, and roughness. The implications of these results are discussed in the context of cross-modal similarities in the communication of emotion in the acoustic domain. © 2013 Copyright Taylor and Francis Group, LLC.}, bibtype = {article}, author = {Coutinho, Eduardo and Dibben, Nicola}, doi = {10.1080/02699931.2012.732559}, journal = {Cognition and Emotion}, number = {4} }
@inbook{ type = {inbook}, year = {2013}, keywords = {edition,journal}, volume = {7}, issue = {1&2}, websites = {http://musicstudies.org/all-issues/volume-7-2013/}, id = {f5220d83-9f39-3dfa-9ff1-501dc0bcae1c}, created = {2020-05-29T11:51:38.857Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-07-03T09:46:08.601Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2013internationalstudies}, source_type = {CHAP}, folder_uuids = {22cecb78-7b06-4839-9375-3735f65ff563}, private_publication = {false}, bibtype = {inbook}, author = {Coutinho, Eduardo and Fantini, Bernardino and Scherer, Klaus R.}, editor = {Coutinho, E and Fantini, B and Scherer, K R}, chapter = {Special Issue on Music, Voice and Emotion}, title = {International Journal of Interdisciplinary Music Studies} }
@inproceedings{ title = {Emotions Induced by Music: the Role of the Listening Context and Modality of Presentation}, type = {inproceedings}, year = {2013}, keywords = {abstract,conference}, pages = {1}, publisher = {University of Jyväskylä, Department of Music.}, city = {Jyväskylä, Finland}, id = {18d5e4d4-ba40-3886-90a2-b27308da6bea}, created = {2020-05-29T11:51:39.028Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:17:02.217Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2013emotionspresentation}, source_type = {inproceedings}, folder_uuids = {a2a583e8-b0a3-48f9-900f-27e15c9a7f71}, private_publication = {false}, bibtype = {inproceedings}, author = {Coutinho, E and Scherer, K R}, editor = {Luck, Geoff and Brabant, Olivier}, booktitle = {Proceedings of the 3rd International Conference on Music and Emotion (ICME’3)} }
@inproceedings{ title = {Emotions perceived in music and speech: relationships between psychoacoustic features, second-by-second subjective feelings of emotion and physiological responses}, type = {inproceedings}, year = {2013}, keywords = {Conference,abstract}, pages = {1}, publisher = {University of Jyväskylä, Department of Music.}, city = {Jyväskylä, Finland}, id = {cfd4d04b-de5e-3c66-9849-40abaf5e3378}, created = {2020-05-29T11:51:39.123Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:16:42.124Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2013emotionsresponses}, source_type = {inproceedings}, folder_uuids = {a2a583e8-b0a3-48f9-900f-27e15c9a7f71}, private_publication = {false}, abstract = {There is strong evidence that the structure of affective responses to auditory stimuli is largely dependent on dynamic temporal patterns in low-level music structural parameters. Previous studies have shown that spatiotemporal dynamics in a small set of psychoacoustic features can predict two fundamental psychological dimensions of emotion: valence and arousal. The study reported here aims to determine the extent to which specific physiological responses can be used in tandem with psychoacoustic cues to predict emotional responses to music as well as to speech. In a behavioural study we collected two main types of data: continuous ratings of emotion perceived while listening to extracts of music and speech, using a computer interface which modelled emotion on two dimensions (arousal and valence), and physiological measures (respiration, heart rate, skin conductance, skin temperature, and blood pressure) taken while listening to each stimulus. Then we analysed the existence of linear and non-linear correlations and associations between psychoacoustic features extracted from music and speech, physiological activity, and self-reported arousal and valence. For both domains, we found very strong correlations showing that physiological measures and psychoacoustic cues account for a large proportion of the variance in the reported arousal and valence. Strong correlations also emerged between psychoacoustic cues and physiological responses, suggesting a possible route for the elicitation of subjective feelings. When comparing music and speech directly we found that while the significant changes to physiological measures for speech stimuli are confined to a small number of features, the physiological responses for music are much more diffuse across the various measures.}, bibtype = {inproceedings}, author = {Coutinho, Eduardo and Dibben, Nicola}, editor = {Luck, Geoff and Brabant, Olivier}, booktitle = {3rd International Conference on Music & Emotion} }
@inbook{ type = {inbook}, year = {2013}, pages = {121-145}, issue = {10}, websites = {http://www.oxfordscholarship.com/view/10.1093/acprof:oso/9780199654888.001.0001/acprof-9780199654888-chapter-10,https://liverpool.idm.oclc.org/login?url=https://search.ebscohost.com/login.aspx?direct=true&db=psyh&AN=2013-32821-010&site=ehost-live&scope=si}, publisher = {Oxford University Press}, series = {Series in affective science}, id = {659327c3-1d17-3477-a52f-777bd3c7ddeb}, created = {2020-05-30T17:34:32.953Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2022-02-02T13:58:44.809Z}, read = {true}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {scherer2013howapproach}, source_type = {CHAP}, folder_uuids = {5db95977-632e-457e-b1b5-8ad03c3d17c4}, private_publication = {false}, abstract = {- In this chapter we propose an integrated framework that links the perception and cognition of music to the production of emotion by means of psychobiological pathways recruiting various subsystems of the central and autonomous nervous systems. These pathways (which we call routes) are Appraisal, Memory, Entrainment, Empathy, and Contagion, and they permit to describe the nature and substrate of a wide variety of emotional responses to music. We focus on music characteristics, more precisely the musical structure and performance variables, as the determinant factors of emotional indication, while considering a variety of possible modulatory effects related to listener characteristics and states, the performer, and the listening context.}, bibtype = {inbook}, author = {Scherer, Klaus R. and Coutinho, Eduardo}, editor = {Cochrane, T and Fantini, B and Scherer, K R}, doi = {10.1093/acprof:oso/9780199654888.003.0010}, chapter = {How music creates emotion}, title = {The Emotional Power of Music}, keywords = {book,chapter} }
@inproceedings{ title = {Towards a Brief Domain-specific Self-report Scale for the Rapid Assessment of Musically Induced Emotions}, type = {inproceedings}, year = {2012}, keywords = {Conference,abstract}, pages = {229}, id = {e7500ca5-1c4e-3c2a-a137-4377ea35f715}, created = {2020-05-29T11:51:38.897Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:16:55.584Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2012towardsemotions}, source_type = {inproceedings}, folder_uuids = {a2a583e8-b0a3-48f9-900f-27e15c9a7f71}, private_publication = {false}, abstract = {The Geneva Emotional Music Scale (GEMS; Zentner, Grandjean, & Scherer, 2008) is the first domain-specific model of emotion specifically developed to measure musically evoked subjective feelings of emotion (particularly in live performances). The scale consists of a list of 45 emotion terms pertaining to nine emotion factors or categories, describing a pervasive universe of feelings of emotion frequently experienced while listening to music (particularly in live performances). In this paper, we highlight and address two potential limitations of the GEMS. The first one is related to the fact that the GEMS comprises a high number of elements to be rated, an aspect that creates many difficulties in fieldwork studies where a rapid assessment is often necessary. The second, is the extent to which the GEMS may be consistently used to discern the emotions experienced while listening to music genres differing significantly from those that led to its development (especially due to an overrepresentation of classical music performances).}, bibtype = {inproceedings}, author = {Coutinho, E and Scherer, K R}, editor = {Cambouropoulos, E and Tsougras, C and Mavromatis, P and Pastiadis, C}, booktitle = {Proceedings of the 12th International Conference of Music Perception and Cognition (ICMPC12)} }
@article{ title = {Musical Emotions: Predicting Second-by-Second Subjective Feelings of Emotion From Low-Level Psychoacoustic Features and Physiological Measurements}, type = {article}, year = {2011}, keywords = {article,journal}, pages = {921-937}, volume = {11}, websites = {http://gateway.webofknowledge.com/gateway/Gateway.cgi?GWVersion=2&SrcApp=PARTNER_APP&SrcAuth=LinksAMR&KeyUT=WOS:000294594400021&DestLinkType=FullRecord&DestApp=ALL_WOS&UsrCustomerID=f3ec48df247ee1138ccd8d3ba59bacc2,http://doi.apa.org/getdoi.cfm?doi=10.103}, month = {8}, id = {b6765f38-d386-3dd2-900c-061d0d93556e}, created = {2020-05-29T11:51:38.748Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:17:09.709Z}, read = {true}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {Coutinho2011a}, source_type = {article}, folder_uuids = {3f6fce84-0b1d-41cd-9582-3954eada97d3,031e3fe6-33ba-42b4-a8d9-8583f8e1fd89,116db2f1-e6ac-4780-bccf-a977325250cd,99880aa7-55df-4b45-bfce-0ffc00b23ced,d3bdd308-08b1-4b78-a4c1-464ca9763e8d}, private_publication = {false}, abstract = {We sustain that the structure of affect elicited by music is largely dependent on dynamic temporal patterns in low-level music structural parameters. In support of this claim, we have previously provided evidence that spatiotemporal dynamics in psychoacoustic features resonate with two psychological dimensions of affect underlying judgments of subjective feelings: arousal and valence. In this article we extend our previous investigations in two aspects. First, we focus on the emotions experienced rather than perceived while listening to music. Second, we evaluate the extent to which peripheral feedback in music can account for the predicted emotional responses, that is, the role of physiological arousal in determining the intensity and valence of musical emotions. Akin to our previous findings, we will show that a significant part of the listeners' reported emotions can be predicted from a set of six psychoacoustic features-loudness, pitch level, pitch contour, tempo, texture, and sharpness. Furthermore, the accuracy of those predictions is improved with the inclusion of physiological cues-skin conductance and heart rate. The interdisciplinary work presented here provides a new methodology to the field of music and emotion research based on the combination of computational and experimental work, which aid the analysis of the emotional responses to music, while offering a platform for the abstract representation of those complex relationships. Future developments may aid specific areas, such as, psychology and music therapy, by providing coherent descriptions of the emotional effects of specific music stimuli. © 2011 American Psychological Association.}, bibtype = {article}, author = {Coutinho, Eduardo and Cangelosi, Angelo}, doi = {10.1037/a0024700}, journal = {Emotion}, number = {4} }
@inproceedings{ title = {Music, Speech and Emotion: psycho-physiological and computational investigations}, type = {inproceedings}, year = {2010}, keywords = {Conference,abstract}, pages = {47-48}, publisher = {University of Sheffield}, city = {Sheffield}, id = {02c4ccfa-1c7e-372d-89b8-654d934c9a6f}, created = {2020-05-29T11:51:38.645Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:17:25.713Z}, read = {true}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {Coutinho2010}, source_type = {inproceedings}, notes = {Proceedings of the International Conference on Interdisciplinary Musicology (CIM10): "Nature versus Culture", 23-24 July 2010, Sheffield, UK}, folder_uuids = {a2a583e8-b0a3-48f9-900f-27e15c9a7f71,3f6fce84-0b1d-41cd-9582-3954eada97d3,031e3fe6-33ba-42b4-a8d9-8583f8e1fd89,b6ff42e6-ef84-4735-ac6e-3ae5287032d9}, private_publication = {false}, bibtype = {inproceedings}, author = {Coutinho, Eduardo and Dibben, Nicola}, editor = {Timmers, Renee and Dibben, Nicola}, booktitle = {Proceedings of the International Conference on Interdisciplinary Musicology: Nature versus Culture (CIM'10)} }
@inbook{ type = {inbook}, year = {2010}, keywords = {book,chapter}, pages = {333-370}, issue = {12}, websites = {https://digital-library.theiet.org/content/books/10.1049/pbce071e_ch12}, month = {1}, publisher = {IET}, city = {The Institution of Engineering and Technology, Michael Faraday House, Six Hills Way, Stevenage SG1 2AY, UK}, id = {94f0b320-f5cd-367e-bf2c-83ed792c106e}, created = {2020-05-29T11:51:39.178Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:16:43.662Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2010aemotions}, source_type = {incollection}, folder_uuids = {5db95977-632e-457e-b1b5-8ad03c3d17c4}, private_publication = {false}, abstract = {This chapter presents a novel methodology to analyse the dynamics of emotional responses to music in terms of computational representations of perceptual processes (psychoacoustic features) and self-perception of physiological activation (peripheral feedback). The approach consists of a computational investigation of musical emotions based on spatio-temporal neural networks sensitive to structural aspects of music. We present two computational studies based on connectionist network models that predict human subjective feelings of emotion. The first study uses six basic psychoacoustic dimensions extracted from the music pieces as predictors of the emotional response. The second computational study evaluates the additional contribution of physiological arousal to the subjective feeling of emotion. Both studies are backed up by experimental data. A detailed analysis of the simulation models’ results demonstrates that a significant part of the listener’s affective response can be predicted from a set of psychoacoustic features of sound tempo, loudness, multiplicity (texture), power spectrum centroid (mean pitch), sharpness (timbre) and mean STFT flux (pitch variation) and one physiological cue, heart rate. This work provides a new methodology to the field of music and emotion research based on combinations of computational and experimental work, which aid the analysis of emotional responses to music, while offering a platform for the abstract representation of those complex relationships.}, bibtype = {inbook}, author = {Coutinho, Eduardo and Cangelosi, Angelo}, editor = {Nefti-Meziani, S and Gray, J}, doi = {10.1049/PBCE071E_ch12}, chapter = {A neural network model for the prediction of musical emotions}, title = {Advances in Cognitive Systems} }
@inproceedings{ title = {Modeling Psycho-physiological Measurements of Emotional Responses to Multiple Music Genres}, type = {inproceedings}, year = {2010}, keywords = {Conference,abstract}, pages = {53}, id = {290458b4-4778-3b12-b0e4-eac187fb4f8b}, created = {2020-05-29T11:51:39.400Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:16:36.235Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2010modelinggenres}, source_type = {inproceedings}, folder_uuids = {a2a583e8-b0a3-48f9-900f-27e15c9a7f71}, private_publication = {false}, bibtype = {inproceedings}, author = {Coutinho, E}, editor = {Demorest, S M and Morrison, S J and Campbell, P S}, booktitle = {Proceedings of the 11th International Conference of Music Perception and Cognition (ICMPC11)} }
@article{ title = {Cognitive dissonance, knowledge instinct and musical emotions}, type = {article}, year = {2010}, keywords = {article,journal}, pages = {30-32}, volume = {7}, websites = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-77349096866&doi=10.1016%2Fj.plrev.2009.12.005&partnerID=40&md5=6ebe1ce514cf4fed7188ffff8fde7478,http://gateway.webofknowledge.com/gateway/Gateway.cgi?GWVersion=2&SrcApp=PARTNER_APP&SrcAuth=LinksAMR&KeyUT}, month = {3}, publisher = {Elsevier B.V.}, id = {2725a2b3-e3f7-340d-84f0-74544dbc06e6}, created = {2020-05-30T17:34:32.815Z}, accessed = {2012-03-15}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2021-06-17T15:16:16.758Z}, read = {true}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {Coutinho2010a}, source_type = {article}, notes = {cited By 2}, folder_uuids = {116db2f1-e6ac-4780-bccf-a977325250cd,99880aa7-55df-4b45-bfce-0ffc00b23ced,813ed798-f952-404b-9427-9475822f127a,db78b332-cabb-4a66-a735-a51b0746de51}, private_publication = {false}, bibtype = {article}, author = {Coutinho, Eduardo}, doi = {10.1016/j.plrev.2009.12.005}, journal = {Physics of Life Reviews}, number = {1} }
@article{ title = {The use of spatio-temporal connectionist models in psychological studies of musical emotions}, type = {article}, year = {2009}, keywords = {article,journal,thesis}, pages = {1-15}, volume = {27}, websites = {http://caliber.ucpress.net/doi/abs/10.1525/mp.2009.27.1.1,http://www.jstor.org/stable/40286139,http://mp.ucpress.edu/cgi/doi/10.1525/mp.2009.27.1.1}, month = {9}, city = {Plymouth, UK}, institution = {University of Plymouth}, department = {School of Computing and Mathematics}, id = {6d87fd6f-7923-3030-87d8-b46565c14aeb}, created = {2020-05-30T17:34:32.696Z}, accessed = {2012-03-15}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-05-15T08:14:21.322Z}, read = {true}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {Coutinho2009}, source_type = {phdthesis}, folder_uuids = {031e3fe6-33ba-42b4-a8d9-8583f8e1fd89,58f2988f-d929-444e-8c41-5db314c765aa,116db2f1-e6ac-4780-bccf-a977325250cd,99880aa7-55df-4b45-bfce-0ffc00b23ced}, private_publication = {false}, abstract = {This article presents a novel methodology to analyze the dynamics of emotional responses to music. It consists of a computational investigation based on spatiotemporal neural networks, which "mimic" human affective responses to music and predict the responses to novel music sequences. The results provide evidence suggesting that spatiotemporal patterns of sound resonate with affective features underlying judgments of subjective feelings (arousal and valence). A significant part of the listener's affective response is predicted from a set of six psychoacoustic features of sound-loudness, tempo, texture, mean pitch, pitch variation, and sharpness. A detailed analysis of the network parameters and dynamics also allows us to identify the role of specific psychoacoustic variables (e.g., tempo and loudness) in music emotional appraisal. This work contributes new evidence and insights to the study of musical emotions, with particular relevance to the music perception and cognition research community. © 2009 By the Regents of the University of California.}, bibtype = {article}, author = {Coutinho, Eduardo and Cangelosi, Angelo}, doi = {10.1525/mp.2009.27.1.1}, journal = {Music Perception}, number = {1} }
@inproceedings{ title = {Psycho-physiological Patterns of Musical Emotions and Their Relation with Music Structure}, type = {inproceedings}, year = {2008}, pages = {94}, id = {3d4b087b-3d1d-3f02-8667-2432bbd5a3be}, created = {2018-03-29T13:11:33.525Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2021-05-14T08:53:58.900Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2008psychophysiologicalstructure}, source_type = {inproceedings}, folder_uuids = {a2a583e8-b0a3-48f9-900f-27e15c9a7f71}, private_publication = {false}, bibtype = {inproceedings}, author = {Coutinho, E and Cangelosi, A}, editor = {Miyazaki, K and Hiraga, Y and Adachi, M and Nakajima, Y and Tsuzaki, M}, booktitle = {Proceedings of the 10th International Conference on Music Perception and Cognition (ICMPC10)}, keywords = {Conference,abstract} }
@inproceedings{ title = {Towards a Model for Embodied Emotions}, type = {inproceedings}, year = {2007}, keywords = {article,conference}, pages = {54-63}, websites = {http://ieeexplore.ieee.org/document/4145923/}, month = {12}, publisher = {IEEE}, id = {fcefc664-af4b-3332-95c2-9a1e95c186dc}, created = {2020-05-29T11:51:39.182Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:16:53.929Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2005towardsemotions}, source_type = {inproceedings}, folder_uuids = {aac08d0d-38e7-4f4e-a381-5271c5c099ce}, private_publication = {false}, abstract = {We are interested in developing A-Life-like models to study the evolution of emotional systems in artificial worlds inhabited by autonomous agents. This paper focuses on the emotional component of an agent at its very basic physical level. We adopt an evolutionary perspective by modelling the agent based on biologically plausible principles, whereby emotions emerge from homeostatic mechanisms. We suggest that the agent should be embodied so as to allow its behaviour to be affected by low-level physical tasks. By embodiment we mean that the agent has a virtual physical body whose states can be sensed by the agent itself. The simulations show the emergence of a stable emotional system with emotional contexts resulting from dynamical categorization of objects in the world. This proved to be effective and versatile enough to allow the agent to adapt itself to unknown world configurations. The results are coherent with Antonio Damasio's theory of background emotional system (2000). We demonstrate that body/world categorizations and body maps can evolve from a simple rule: self-survival}, bibtype = {inproceedings}, author = {Coutinho, Eduardo and Miranda, Eduardo R. and Cangelosi, Angelo}, doi = {10.1109/epia.2005.341264}, booktitle = {2005 Portuguese Conference on Artificial Intelligence} }
@inproceedings{ title = {Emotion and embodiment in cognitive Agents: From instincts to music}, type = {inproceedings}, year = {2007}, pages = {133-138}, websites = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-34548721619&doi=10.1109%2FKIMAS.2007.369798&partnerID=40&md5=f8f98e2614bad5c5d0c6ede9aa095954,http://ieeexplore.ieee.org/document/4227537/}, month = {4}, publisher = {IEEE}, id = {54950cb4-26b9-3782-b3e3-509a6065443d}, created = {2020-05-30T17:34:32.700Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-05-15T08:14:21.365Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {Coutinho2007}, source_type = {CONF}, notes = {cited By 5; International Conference on Integration of Knowledge Intensive Multi-Agent Systems, Waltham, MA, APR 30-MAY 03, 2007}, private_publication = {false}, abstract = {This paper suggests the use of modeling techniques to tap into the emotion-cognition paradigm. We presented two possible frameworks focusing on the embodiment basis of emotions. The first one explores the emergence of emotion mechanisms, by establishing the primary conditions of survival and exploring the basic roots of emotional systems. These simulations show the emergence of a stable motivational system with emotional contexts resulting from dynamical categorization of objects in the environment, in answer to survival pressures and homeostatic processes. The second framework uses music as a source of information about the mechanism of emotion and we propose a model based on recurrent connectionist architectures for the prediction of emotional states in response to music experience. Results demonstrate that there are strong relationships between arousal reports and music psychoacoustics, such as tempo and dynamics. Finally we discuss future directions of research on emotions based on cognitive agents and mathematical models. © 2007 IEEE.}, bibtype = {inproceedings}, author = {Coutinho, Eduardo and Cangelosi, Angelo}, doi = {10.1109/KIMAS.2007.369798}, booktitle = {2007 International Conference on Integration of Knowledge Intensive Multi-Agent Systems, KIMAS 2007} }
@inproceedings{ title = {Computational Musicology: An Artificial Life Approach}, type = {inproceedings}, year = {2007}, pages = {85-93}, websites = {http://ieeexplore.ieee.org/document/4145929/}, month = {12}, publisher = {IEEE}, id = {5f4215c0-dcb3-3296-b43e-b065239b721e}, created = {2020-05-30T17:34:32.958Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2021-06-17T15:16:17.710Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2005computationalapproach}, source_type = {CONF}, notes = {Portuguese Conference on Artificial Intelligence, Univ Beira Interior, Covilha, PORTUGAL, 2005}, folder_uuids = {aac08d0d-38e7-4f4e-a381-5271c5c099ce}, private_publication = {false}, abstract = {Artificial Life (A-Life) and Evolutionary Algorithms (EA) provide a variety of new techniques for making and studying music. EA have been used in different musical applications, ranging from new systems for composition and performance, to models for studying musical evolution in artificial societies. This paper starts with a brief introduction to three main fields of application of EA in Music, namely sound design, creativity and computational musicology. Then it presents our work in the field of computational musicology. Computational musicology is broadly defined as the study of Music with computational modelling and simulation. We are interested in developing A-Life-based models to study the evolution of musical cognition in an artificial society of agents. In this paper we present the main components of a model that we are developing to study the evolution of musical ontogenies, focusing on the evolution of rhythms and emotional systems. The paper concludes by suggesting that A-Life and EA provide a powerful paradigm for computational musicology.}, bibtype = {inproceedings}, author = {Coutinho, Eduardo and Gimenes, Marcelo and Martins, Joao M. and Miranda, Eduardo R.}, editor = {Bento, C and Cardoso, A and Dias, G}, doi = {10.1109/epia.2005.341270}, booktitle = {2005 Portuguese Conference on Artificial Intelligence}, keywords = {article,conference} }
@inproceedings{ title = {The dynamics of music perception and emotional experience: a connectionist model}, type = {inproceedings}, year = {2006}, keywords = {Conference,abstract}, pages = {1096-1104}, id = {f4e1a72d-0af3-38a0-8298-97ef5d2ea3a0}, created = {2018-03-29T13:11:33.082Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2021-05-14T08:53:57.309Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2006themodel}, source_type = {inproceedings}, folder_uuids = {a2a583e8-b0a3-48f9-900f-27e15c9a7f71}, private_publication = {false}, abstract = {In this paper we present a methodological framework for the study of musical emotions, incorporating psycho-physiological experiments and modelling techniques for data analysis. Our focus is restricted to the body implications as a possible source of information about the emotional experience, and responsible to certain levels of emotional engagement in music. We present and apply the use of spatiotemporal connectionist models, as a modelling technique. Simulation results using a simple recurrent network demonstrate that our connectionist approach leads to a better fit of the simulated process, compared with previous models. We demonstrate that a spatiotemporal connectionist model trained on music and emotional rating data is capable of generalizing the level of arousal in response to novel music input. The model is also capable of identifying the main variables responsible for such an emotional rating behaviour.}, bibtype = {inproceedings}, author = {Coutinho, Eduardo and Cangelosi, Angelo}, editor = {Baroni, M and Addessi, A R and Caterina, R and Costa, M}, booktitle = {9th International Conference on Music Perception and Cognition} }
@inbook{ type = {inbook}, year = {2005}, pages = {497}, volume = {3661 LNAI}, websites = {http://link.springer.com/10.1007/11550617_48}, id = {108d0ade-9c4d-3c62-b7b9-3215a63e04d9}, created = {2018-03-29T13:11:33.519Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2023-05-15T08:14:21.150Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2005evolvingmusic}, source_type = {inproceedings}, private_publication = {false}, abstract = {Today computers can be programmed to compose music automatically, using techniques ranging from rule-based to evolutionary computation (e.g., genetic algorithms and cellular automata). However, we lack good techniques for programming the computer to play or interpret music with expression. Expression in music is largely associated with emotions. Therefore we are looking into the possibility of programming computer music systems with emotions. We are addressing this problem from an A-Life perspective combined with recent discoveries in the neurosciences with respect to emotion. Antonio Damasio refers to the importance of emotions in assisting an individual to maintain survival, as they seem to be an important mechanism for adaptation and decision-making. Specifically, environmental events of value should be susceptible to preferential perceptual processing according to their pleasant or unpleasant nature. This approach assumes the existence of neural pathways that facilitate survival. Stable emotional systems should then emerge from self-regulatory homeostatic processes. We implemented a system consisting of an agent that inhabits an environment containing a number of different objects. These objects cause different physiological reactions in the agent. The internal body state of the agent is defined by a set of internal drives and a set of physiological variables that vary as the agent interacts with the objects it encounters in the environment. The agent is controlled by a feed-forward neural network that integrates visual input with information about its internal states. The network learns through a reinforcement-learning algorithm, with the reinforcement signal derived from the different body states caused by pleasant or unpleasant stimuli. The playback of musical recordings in MIDI format is steered by the physiological variables of the agent in different phases of the adaptation process. The behaviour of the system is coherent with Damasio's notion of a background emotional system. It demonstrates that specific phenomena, such as body/world categorization and the existence of a body map, can evolve from a simple rule: self-survival in the environment. Currently, we are in the process of defining a system of higher-level emotional states (or foreground system) that will operate in social contexts; i.e., with several agents in the environment reacting to objects and interacting with each other.}, bibtype = {inbook}, author = {Coutinho, Eduardo and Miranda, Eduardo Reck and Da Silva, Patricio}, editor = {Panayiotopoulos, T and Gratch, J and Aylett, R and Ballin, D and Olivier, P and Rist, T}, doi = {10.1007/11550617_48}, chapter = {Evolving emotional behaviour for expressive performance of music}, title = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)} }
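The entry above describes an agent whose controller learns from reinforcement derived from changes in its body state, with physiological variables steering MIDI playback. The sketch below is an illustration only, not the published system: the object set, drive definitions, learning rule and tempo mapping are hypothetical, and real MIDI output is omitted.

```python
# Illustrative sketch only (not the authors' system): a homeostatic agent whose
# controller learns, from reward derived from changes in its body state, whether
# to approach or avoid encountered objects. All objects, drive equations and the
# physiology-to-playback mapping are hypothetical placeholders.
import numpy as np

rng = np.random.default_rng(1)

# Hypothetical objects: (feature vector, effect on [energy, integrity] if approached).
objects = {
    "food":   (np.array([1.0, 0.0]), np.array([+0.3, 0.0])),
    "hazard": (np.array([0.0, 1.0]), np.array([0.0, -0.4])),
}
setpoint = np.array([1.0, 1.0])     # ideal internal state (homeostatic set-points)
body = setpoint.copy()              # current physiological variables

def drives(state):
    # Drives are deviations of the body state from its set-points.
    return setpoint - state

# One-layer controller: [object features, drives] -> probability of approaching.
w = np.zeros(4)
lr = 0.5

for step in range(2000):
    name = rng.choice(list(objects))
    feat, effect = objects[name]
    x = np.concatenate([feat, drives(body)])
    p_approach = 1.0 / (1.0 + np.exp(-x @ w))
    approach = rng.random() < p_approach

    # The body decays slowly and is altered by the object only if approached.
    old_drive = np.abs(drives(body)).sum()
    body = body - 0.01
    if approach:
        body = np.clip(body + effect, 0.0, 2.0)
    reward = old_drive - np.abs(drives(body)).sum()   # drive reduction = pleasant

    # REINFORCE-style update of the approach/avoid policy.
    grad = (1.0 if approach else 0.0) - p_approach
    w += lr * reward * grad * x

# Physiology steers playback parameters, e.g. higher energy -> faster tempo
# (actual MIDI handling left out to keep the sketch self-contained).
tempo = 60 + 60 * body[0] / 2.0
print(f"final body state {body.round(2)}, suggested playback tempo {tempo:.0f} BPM")
```

In this toy setting, a stable policy (approach food, avoid hazards) emerges purely from the self-regulatory reward, which is the general idea the abstract attributes to the homeostatic agent.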
@inproceedings{ title = {Artificial Emotion - Simulating Affective Behaviour}, type = {inproceedings}, year = {2005}, keywords = {Conference,abstract}, pages = {7}, publisher = {Glasgow, Scotland}, institution = {Glasgow, Scotland}, id = {17be4876-5dd7-3c79-a145-610a02526735}, created = {2020-05-29T11:51:39.418Z}, file_attached = {true}, profile_id = {ffa9027c-806a-3827-93a1-02c42eb146a1}, last_modified = {2020-05-30T17:16:35.716Z}, read = {false}, starred = {false}, authored = {true}, confirmed = {true}, hidden = {false}, citation_key = {coutinho2005artificialbehaviour}, source_type = {inproceedings}, folder_uuids = {a2a583e8-b0a3-48f9-900f-27e15c9a7f71}, private_publication = {false}, bibtype = {inproceedings}, author = {Coutinho, E and Miranda, E R and Cangelosi, A}, booktitle = {Proceedings of the Post-cognitivist Psychology Conference} }