\n\n \n\n \n\n \n \n\n \n\n \n \n\n \n\n \n

\n generated by\n \n $\"bibbase.org\"\n$ \n \n

\n \n\n

\n\n

\n \n Group by\n \n \n
- \n Year\n
- \n Author\n
- \n Type\n
- \n Keyword\n
- \n Downloads\n
\n
\n \n \n \n \n
- \n \n Expand/Collapse All\n \n
- \n \n Download BibTeX\n \n
- \n \n RSS Feed\n \n
\n

\n\n\n

\n\n Excellent! Next you can\n create a new website with this list, or\n embed it in an existing web page by copying & pasting\n any of the following snippets.\n\n

\n JavaScript\n (easiest)\n

\n            <script src=\"https://bibbase.org/show?authorFirst=1&bib=AnneBeyer.github.io%2Fassets%2Fbib%2Fmine.bib&jsonp=1&jsonp=1\"></script>\n

\n\n PHP\n

\n            <?php\n            $contents = file_get_contents(\"https://bibbase.org/show?authorFirst=1&bib=AnneBeyer.github.io%2Fassets%2Fbib%2Fmine.bib&jsonp=1\");\n            print_r($contents);\n            ?>\n

\n\n iFrame\n (not recommended)\n

\n            <iframe src=\"https://bibbase.org/show?authorFirst=1&bib=AnneBeyer.github.io%2Fassets%2Fbib%2Fmine.bib&jsonp=1\"></iframe>\n

\n\n

\n For more details see the documentation.\n

\n\n

\n\n This is a preview! To use this list on your own web site\n or create a new web site from it,\n create a free account. The file will be added\n and you will be able to edit it in the File Manager.\n We will show you instructions once you've created your account.\n

\n\n

To the site owner:

\n\n

Action required! Mendeley is changing its\n API. In order to keep using Mendeley with BibBase past April\n 14th, you need to:\n

renew the authorization for BibBase on Mendeley, and
update the BibBase URL\n in your page the same way you did when you initially set up\n this page.\n

\n\n

\n \n \n Fix it now\n

\n\n

\n\n\n

\n \n \n

\n \n 2025\n \n \n (1)\n \n \n

\n \n \n

\n \n\n \n \n Hakimov, S.; Abdullayeva, Y.; Koshti, K.; Schmidt, A.; Weiser, Y.; Beyer, A.; and Schlangen, D.\n\n\n \n \n \n \n \n Using Game Play to Investigate Multimodal and Conversational Grounding in Large Multimodal Models.\n \n \n \n \n\n\n \n\n\n\n In Rambow, O.; Wanner, L.; Apidianaki, M.; Al-Khalifa, H.; Eugenio, B. D.; and Schockaert, S., editor(s), Proceedings of the 31st International Conference on Computational Linguistics, pages 5686–5718, Abu Dhabi, UAE, January 2025. Association for Computational Linguistics\n \n\n\n\n
\n\n\n\n \n \n $\"Using$ Paper\n \n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n

% Conference paper in the COLING 2025 proceedings.
% The surname of editor Barbara Di Eugenio is the two-word "Di Eugenio",
% so both words are written before the comma.
@inproceedings{Hakimov-2025,
  title     = {Using Game Play to Investigate Multimodal and Conversational Grounding in Large Multimodal Models},
  author    = {Hakimov, Sherzod and Abdullayeva, Yerkezhan and Koshti, Kushal and Schmidt, Antonia and Weiser, Yan and Beyer, Anne and Schlangen, David},
  editor    = {Rambow, Owen and Wanner, Leo and Apidianaki, Marianna and Al-Khalifa, Hend and Di Eugenio, Barbara and Schockaert, Steven},
  booktitle = {Proceedings of the 31st International Conference on Computational Linguistics},
  month     = jan,
  year      = {2025},
  address   = {Abu Dhabi, UAE},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2025.coling-main.381/},
  pages     = {5686--5718}
}

\n\n\n\n

\n\n\n\n\n\n

\n\n

\n \n 2024\n \n \n (1)\n \n \n

\n \n \n

\n \n\n \n \n Beyer, A.; Chalamalasetti, K.; Hakimov, S.; Madureira, B.; Sadler, P.; and Schlangen, D.\n\n\n \n \n \n \n clembench-2024: A Challenging, Dynamic, Complementary, Multilingual Benchmark and Underlying Flexible Framework for LLMs as Multi-Action Agents.\n \n \n \n\n\n \n\n\n\n 2024.\n \n\n\n\n
\n\n\n\n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n

% arXiv preprint (identifier 2405.20859, class cs.CL).
% The acronym LLMs is braced so sentence-casing styles do not lowercase it;
% the url is the arXiv abstract page for the eprint identifier.
@misc{Beyer-2024,
  title         = {clembench-2024: A Challenging, Dynamic, Complementary, Multilingual Benchmark and Underlying Flexible Framework for {LLMs} as Multi-Action Agents},
  author        = {Beyer, Anne and Chalamalasetti, Kranti and Hakimov, Sherzod and Madureira, Brielen and Sadler, Philipp and Schlangen, David},
  year          = {2024},
  eprint        = {2405.20859},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CL},
  url           = {https://arxiv.org/abs/2405.20859}
}

\n\n\n\n

\n\n\n\n\n\n

\n\n

\n \n 2023\n \n \n (1)\n \n \n

\n \n \n

\n \n\n \n \n Galetzka, F.; Beyer, A.; and Schlangen, D.\n\n\n \n \n \n \n \n Neural Conversation Models and How to Rein Them in: A Survey of Failures and Fixes.\n \n \n \n \n\n\n \n\n\n\n 2023.\n \n\n\n\n
\n\n\n\n \n \n $\"Neural$ Paper\n \n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n \n \n abstract \n \n\n \n \n \n 1 download\n \n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n

% arXiv survey preprint (identifier 2308.06095, class cs.CL).
@misc{galetzka2023neuralconversationmodelsrein,
  author        = {Galetzka, Fabian and Beyer, Anne and Schlangen, David},
  title         = {Neural Conversation Models and How to Rein Them in: A Survey of Failures and Fixes},
  year          = {2023},
  eprint        = {2308.06095},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2308.06095},
  abstract      = {Recent conditional language models are able to continue any kind of text source in an often seemingly fluent way. This fact encouraged research in the area of open-domain conversational systems that are based on powerful language models and aim to imitate an interlocutor by generating appropriate contributions to a written dialogue. From a linguistic perspective, however, the complexity of contributing to a conversation is high. In this survey, we interpret Grice's maxims of cooperative conversation from the perspective of this specific research area and systematize the literature under the aspect of what makes a contribution appropriate: A neural conversation model has to be fluent, informative, consistent, coherent, and follow social norms. In order to ensure these qualities, recent approaches try to tame the underlying language models at various intervention points, such as data, training regime or decoding. Sorted by these categories and intervention points, we discuss promising attempts and suggest novel ways for future research.}
}

\n\n\n\n\n\n

\n\n

\n \n 2022\n \n \n (1)\n \n \n

\n \n \n

\n \n\n \n \n Loáiciga, S.; Beyer, A.; and Schlangen, D.\n\n\n \n \n \n \n \n New or Old? Exploring How Pre-Trained Language Models Represent Discourse Entities.\n \n \n \n \n\n\n \n\n\n\n In Proceedings of the 29th International Conference on Computational Linguistics, pages 875–886, Gyeongju, Republic of Korea, October 2022. International Committee on Computational Linguistics\n \n\n\n\n
\n\n\n\n \n \n $\"New$ Paper\n \n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n \n \n abstract \n \n\n \n \n \n 2 downloads\n \n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n

% Conference paper in the COLING 2022 proceedings.
@inproceedings{loaiciga-etal-2022-new,
  author    = {Lo{\'a}iciga, Sharid and Beyer, Anne and Schlangen, David},
  title     = {New or Old? Exploring How Pre-Trained Language Models Represent Discourse Entities},
  booktitle = {Proceedings of the 29th International Conference on Computational Linguistics},
  month     = oct,
  year      = {2022},
  address   = {Gyeongju, Republic of Korea},
  publisher = {International Committee on Computational Linguistics},
  pages     = {875--886},
  url       = {https://aclanthology.org/2022.coling-1.73},
  abstract  = {Recent research shows that pre-trained language models, built to generate text conditioned on some context, learn to encode syntactic knowledge to a certain degree. This has motivated researchers to move beyond the sentence-level and look into their ability to encode less studied discourse-level phenomena. In this paper, we add to the body of probing research by investigating discourse entity representations in large pre-trained language models in English. Motivated by early theories of discourse and key pieces of previous work, we focus on the information-status of entities as discourse-new or discourse-old. We present two probing models, one based on binary classification and another one on sequence labeling. The results of our experiments show that pre-trained language models do encode information on whether an entity has been introduced before or not in the discourse. However, this information alone is not sufficient to find the entities in a discourse, opening up interesting questions about the definition of entities for future work.}
}

\n\n\n\n\n\n

\n\n

\n \n 2021\n \n \n (1)\n \n \n

\n \n \n

\n \n\n \n \n Beyer, A.; Loáiciga, S.; and Schlangen, D.\n\n\n \n \n \n \n \n Is Incoherence Surprising? Targeted Evaluation of Coherence Prediction from Language Models.\n \n \n \n \n\n\n \n\n\n\n In Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Online, 2021. Association for Computational Linguistics\n \n\n\n\n
\n\n\n\n \n \n $\"Is$ paper\n \n \n \n $\"Is$ video\n \n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n \n \n abstract \n \n\n \n \n \n 3 downloads\n \n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n

% Conference paper in the NAACL-HLT 2021 proceedings.
% The accented letter is written as a brace group starting with the accent
% command so BibTeX treats it as one letter when sorting and labelling.
% In the title only "Targeted" is braced: it opens a new sentence after the
% question mark and must keep its capital under sentence-casing styles.
% url_Paper and url_Video are non-standard fields, kept exactly as named.
@inproceedings{beyer_incoherence_2021,
  author    = {Beyer, Anne and Lo{\'a}iciga, Sharid and Schlangen, David},
  title     = {Is Incoherence Surprising? {Targeted} Evaluation of Coherence Prediction from Language Models},
  booktitle = {Proceedings of the 2021 {Conference} of the {North} {American} {Chapter} of the {Association} for {Computational} {Linguistics}: {Human} {Language} {Technologies}},
  year      = {2021},
  address   = {Online},
  publisher = {Association for Computational Linguistics},
  url_Paper = {https://aclanthology.org/2021.naacl-main.328/},
  url_Video = {https://screencast-o-matic.com/watch/crhXrYVfqo7},
  abstract  = {Coherent discourse is distinguished from a mere collection of utterances by the satisfaction of a diverse set of constraints, for example choice of expression, logical relation between denoted events, and implicit compatibility with world-knowledge. Do neural language models encode such constraints? We design an extendable set of test suites addressing different aspects of discourse and dialogue coherence. Unlike most previous coherence evaluation studies, we address specific linguistic devices beyond sentence order perturbations, allowing for a more fine-grained analysis of what constitutes coherence and what neural models trained on a language modelling objective do encode. Extending the targeted evaluation paradigm for neural language models (Marvin and Linzen, 2018) to phenomena beyond syntax, we show that this paradigm is equally suited to evaluate linguistic qualities that contribute to the notion of coherence.}
}

\n\n\n\n\n\n

\n\n

\n \n 2020\n \n \n (1)\n \n \n

\n \n \n

\n \n\n \n \n Beyer, A.; Kauermann, G.; and Schütze, H.\n\n\n \n \n \n \n \n Embedding Space Correlation as a Measure of Domain Similarity.\n \n \n \n \n\n\n \n\n\n\n In Proceedings of The 12th Language Resources and Evaluation Conference, pages 2431–2439, Marseille, France, 2020. \n \n\n\n\n
\n\n\n\n \n \n $\"Embedding$ paper\n \n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n \n \n abstract \n \n\n \n \n \n 6 downloads\n \n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n

% Conference paper in the LREC 2020 proceedings.
% Umlauts in the author names are written as LaTeX accent groups so the entry
% also works with classic 8-bit BibTeX and matches the escaped accents used in
% the other entries of this list.
% url_Paper is a non-standard field, kept exactly as named.
@inproceedings{beyer_embedding_2020,
  author    = {Beyer, Anne and Kauermann, G{\"o}ran and Sch{\"u}tze, Hinrich},
  title     = {Embedding Space Correlation as a Measure of Domain Similarity},
  booktitle = {Proceedings of The 12th Language Resources and Evaluation Conference},
  year      = {2020},
  address   = {Marseille, France},
  pages     = {2431--2439},
  abstract  = {Prior work has determined domain similarity using text-based features of a corpus. However, when using pre-trained word embeddings, the underlying text corpus might not be accessible anymore. Therefore, we propose the CCA measure, a new measure of domain similarity based directly on the dimension-wise correlations between corresponding embedding spaces. Our results suggest that an inherent notion of domain can be captured this way, as we are able to reproduce our findings for different domain comparisons for English, German, Spanish and Czech as well as in cross-lingual comparisons. We further find a threshold at which the CCA measure indicates that two corpora come from the same domain in a monolingual setting by applying permutation tests. By evaluating the usability of the CCA measure in a domain adaptation application, we also show that it can be used to determine which corpora are more similar to each other in a cross-domain sentiment detection task.},
  url_Paper = {https://www.aclweb.org/anthology/2020.lrec-1.296.pdf}
}

\n\n\n\n\n\n

\n\n

\n \n 2017\n \n \n (1)\n \n \n

\n \n \n

\n \n\n \n \n Beyer, A.; Macketanz, V.; Burchardt, A.; and Williams, P.\n\n\n \n \n \n \n \n Can Out-of-the-box NMT Beat a Domain-trained Moses on Technical Data?\n \n \n \n \n\n\n \n\n\n\n In Proceedings for EAMT 2017 User Studies and Project/Product Descriptions, pages 41–46, Prague, Czech Republic, 2017. \n \n\n\n\n
\n\n\n\n \n \n $\"Can$ paper\n \n \n\n \n\n \n link\n \n \n\n bibtex\n \n\n \n \n \n abstract \n \n\n \n \n \n 4 downloads\n \n \n\n \n \n \n \n \n \n \n\n \n \n \n\n\n\n

% Conference paper in the EAMT 2017 user-studies proceedings.
% Only the acronym NMT and the system name Moses are braced in the title;
% sentence-casing styles may lowercase the remaining words.
% Two words in the abstract had lost a hyphen ("state-of-the-art",
% "domain-trained") and are restored here.
% url_Paper is a non-standard field, kept exactly as named.
@inproceedings{beyer_can_2017,
  author    = {Beyer, Anne and Macketanz, Vivien and Burchardt, Aljoscha and Williams, Philip},
  title     = {Can Out-of-the-box {NMT} Beat a Domain-trained {Moses} on Technical Data?},
  booktitle = {Proceedings for {EAMT} 2017 {User} {Studies} and {Project}/{Product} {Descriptions}},
  year      = {2017},
  address   = {Prague, Czech Republic},
  pages     = {41--46},
  language  = {en},
  url_Paper = {https://ufal.mff.cuni.cz/eamt2017/user-project-product-papers/papers/user/EAMT2017_paper_32.pdf},
  abstract  = {In the last year, we have seen a lot of evidence about the superiority of neural machine translation approaches (NMT) over phrase-based statistical approaches (PBMT). This trend has shown for the general domain at public competitions such as the WMT challenges as well as in the obvious quality increase in online translation services that have changed their technology. In this paper, we take the perspective of an LSP. The questions we want to answer with this study is if now is already the time to invest in the new technology. To answer this question, we have collected evidence as to whether an existing state-of-the-art NMT system for the general domain can already compete with a domain-trained and optimised Moses (PBMT) system or if it is maybe already better. As it is well known that automatic quality measures are not reliable for comparing the performance of different system types, we have performed a detailed manual evaluation based on a test suite of domain segments.}
}

\n\n\n\n\n\n

\n\n\n\n\n

\n\n\n \n\n \n \n \n \n\n