BERT: Pre-training of deep bidirectional transformers for language understanding. Devlin, J., Chang, M.-W., Lee, K., and Toutanova, K. arXiv preprint arXiv:1810.04805, 2018.
bibtex   
% BERT arXiv preprint (Devlin et al., 2018). The arXiv identifier is stored in
% the eprint fields rather than in a journal field; the citation key is unchanged.
@misc{devlin2018bert,
  author        = {Devlin, Jacob and Chang, Ming-Wei and Lee, Kenton and Toutanova, Kristina},
  title         = {{BERT}: Pre-training of Deep Bidirectional Transformers for Language Understanding},
  year          = {2018},
  eprint        = {1810.04805},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CL},
  url           = {https://arxiv.org/abs/1810.04805},
}

Downloads: 0