Incorporating non-local information into information extraction systems by Gibbs sampling. Finkel, J. R., Grenager, T., & Manning, C. D. Proceedings of the 43rd Annual Meeting of the Association for Computational Linguistics (ACL '05), pages 363-370, Association for Computational Linguistics, 2005.
Most current statistical natural language processing models use only local features so as to permit dynamic programming in inference, but this makes them unable to fully account for the long distance structure that is prevalent in language use. We show how to solve this dilemma with Gibbs sampling, a simple Monte Carlo method used to perform approximate inference in factored probabilistic models. By using simulated annealing in place of Viterbi decoding in sequence models such as HMMs, CMMs, and CRFs, it is possible to incorporate non-local structure while preserving tractable inference. We use this technique to augment an existing CRF-based information extraction system with long-distance dependency models, enforcing label consistency and extraction template consistency constraints. This technique results in an error reduction of up to 9% over state-of-the-art systems on two established information extraction tasks.
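The abstract describes replacing Viterbi decoding with annealed Gibbs sampling so that non-local factors can be scored during inference. The sketch below illustrates that idea only in outline: `LABELS`, `conditional_scores`, and `annealed_gibbs` are illustrative names invented here, and the placeholder scoring function stands in for the paper's combination of local CRF potentials and document-level consistency factors. It is not the authors' implementation.

```python
# Minimal sketch of Gibbs sampling with simulated annealing for sequence
# labeling, assuming a hypothetical conditional_scores() that returns an
# unnormalized score for every candidate label at position i given the rest
# of the sequence (local factors plus any non-local consistency factors).
import math
import random

LABELS = ["O", "PER", "LOC", "ORG"]  # hypothetical tag set

def conditional_scores(labels, i, tokens):
    """Placeholder: uniform scores. A real model would combine CRF-style
    local potentials with long-distance label-consistency factors here."""
    return {y: 1.0 for y in LABELS}

def annealed_gibbs(tokens, n_sweeps=50, t_start=2.0, t_end=0.05):
    labels = [random.choice(LABELS) for _ in tokens]  # random initialization
    for sweep in range(n_sweeps):
        # geometric cooling schedule from t_start down toward t_end
        temp = t_start * (t_end / t_start) ** (sweep / max(1, n_sweeps - 1))
        for i in range(len(tokens)):
            scores = conditional_scores(labels, i, tokens)
            # sharpen the conditional by 1/temp; as temp -> 0 the update
            # approaches a greedy argmax, approximating MAP inference
            weights = {y: s ** (1.0 / temp) for y, s in scores.items()}
            total = sum(weights.values())
            r = random.uniform(0.0, total)
            acc = 0.0
            for y, w in weights.items():
                acc += w
                if r <= acc:
                    labels[i] = y
                    break
    return labels

if __name__ == "__main__":
    print(annealed_gibbs(["John", "lives", "in", "Paris", "."]))
```

Because each resampling step conditions on the full current label sequence, non-local constraints (e.g., that repeated mentions of the same token string receive consistent labels) can be folded into the scoring function without breaking tractability, which is the dilemma the paper resolves.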
