BERT Rediscovers the Classical NLP Pipeline. Tenney, I., Das, D., & Pavlick, E. August 2019. arXiv:1905.05950 [cs]. Paper | doi | abstract | bibtex. Pre-trained text encoders have rapidly advanced the state of the art on many NLP tasks. We focus on one such model, BERT, and aim to quantify where linguistic information is captured within the network. We find that the model represents the steps of the traditional NLP pipeline in an interpretable and localizable way, and that the regions responsible for each step appear in the expected sequence: POS tagging, parsing, NER, semantic roles, then coreference. Qualitative analysis reveals that the model can and often does adjust this pipeline dynamically, revising lower-level decisions on the basis of disambiguating information from higher-level representations.
@misc{tenney_bert_2019,
title = {{BERT} {Rediscovers} the {Classical} {NLP} {Pipeline}},
url = {http://arxiv.org/abs/1905.05950},
doi = {10.48550/arXiv.1905.05950},
abstract = {Pre-trained text encoders have rapidly advanced the state of the art on many NLP tasks. We focus on one such model, BERT, and aim to quantify where linguistic information is captured within the network. We find that the model represents the steps of the traditional NLP pipeline in an interpretable and localizable way, and that the regions responsible for each step appear in the expected sequence: POS tagging, parsing, NER, semantic roles, then coreference. Qualitative analysis reveals that the model can and often does adjust this pipeline dynamically, revising lower-level decisions on the basis of disambiguating information from higher-level representations.},
urldate = {2024-06-14},
publisher = {arXiv},
author = {Tenney, Ian and Das, Dipanjan and Pavlick, Ellie},
month = aug,
year = {2019},
note = {arXiv:1905.05950 [cs]},
keywords = {Computer Science - Computation and Language},
}
Downloads: 0
{"_id":"CKxiRuwuydJNxopzJ","bibbaseid":"tenney-das-pavlick-bertrediscoverstheclassicalnlppipeline-2019","authorIDs":[],"author_short":["Tenney, I.","Das, D.","Pavlick, E."],"bibdata":{"bibtype":"misc","type":"misc","title":"BERT Rediscovers the Classical NLP Pipeline","url":"http://arxiv.org/abs/1905.05950","doi":"10.48550/arXiv.1905.05950","abstract":"Pre-trained text encoders have rapidly advanced the state of the art on many NLP tasks. We focus on one such model, BERT, and aim to quantify where linguistic information is captured within the network. We find that the model represents the steps of the traditional NLP pipeline in an interpretable and localizable way, and that the regions responsible for each step appear in the expected sequence: POS tagging, parsing, NER, semantic roles, then coreference. Qualitative analysis reveals that the model can and often does adjust this pipeline dynamically, revising lower-level decisions on the basis of disambiguating information from higher-level representations.","urldate":"2024-06-14","publisher":"arXiv","author":[{"propositions":[],"lastnames":["Tenney"],"firstnames":["Ian"],"suffixes":[]},{"propositions":[],"lastnames":["Das"],"firstnames":["Dipanjan"],"suffixes":[]},{"propositions":[],"lastnames":["Pavlick"],"firstnames":["Ellie"],"suffixes":[]}],"month":"August","year":"2019","note":"arXiv:1905.05950 [cs]","keywords":"Computer Science - Computation and Language","bibtex":"@misc{tenney_bert_2019,\n\ttitle = {{BERT} {Rediscovers} the {Classical} {NLP} {Pipeline}},\n\turl = {http://arxiv.org/abs/1905.05950},\n\tdoi = {10.48550/arXiv.1905.05950},\n\tabstract = {Pre-trained text encoders have rapidly advanced the state of the art on many NLP tasks. We focus on one such model, BERT, and aim to quantify where linguistic information is captured within the network. We find that the model represents the steps of the traditional NLP pipeline in an interpretable and localizable way, and that the regions responsible for each step appear in the expected sequence: POS tagging, parsing, NER, semantic roles, then coreference. Qualitative analysis reveals that the model can and often does adjust this pipeline dynamically, revising lower-level decisions on the basis of disambiguating information from higher-level representations.},\n\turldate = {2024-06-14},\n\tpublisher = {arXiv},\n\tauthor = {Tenney, Ian and Das, Dipanjan and Pavlick, Ellie},\n\tmonth = aug,\n\tyear = {2019},\n\tnote = {arXiv:1905.05950 [cs]},\n\tkeywords = {Computer Science - Computation and Language},\n}\n\n\n\n\n\n\n\n","author_short":["Tenney, I.","Das, D.","Pavlick, E."],"key":"tenney_bert_2019","id":"tenney_bert_2019","bibbaseid":"tenney-das-pavlick-bertrediscoverstheclassicalnlppipeline-2019","role":"author","urls":{"Paper":"http://arxiv.org/abs/1905.05950"},"keyword":["Computer Science - Computation and Language"],"metadata":{"authorlinks":{}},"downloads":0,"html":""},"bibtype":"misc","biburl":"https://bibbase.org/zotero/abhishek-p","creationDate":"2020-01-05T22:03:38.529Z","downloads":0,"keywords":["computer science - computation and language"],"search_terms":["bert","rediscovers","classical","nlp","pipeline","tenney","das","pavlick"],"title":"BERT Rediscovers the Classical NLP Pipeline","year":2019,"dataSources":["okYcdTpf4JJ2zkj7A","SBafiCSLPjNDAPHQn","znj7izS5PeehdLR3G","h7kKWXpJh2iaX92T5"]}