Multimodal Compact Bilinear Pooling for Visual Question Answering and Visual Grounding. Fukui, A., Park, D. H., Yang, D., Rohrbach, A., Darrell, T., & Rohrbach, M. CoRR, 2016.
Multimodal Compact Bilinear Pooling for Visual Question Answering and Visual Grounding. [link] Paper | bibtex
@comment{
  Fukui et al. (2016), arXiv preprint 1606.01847, as exported from DBLP.
  The citation key is kept exactly as exported so existing citations resolve.
  journal/volume keep the CoRR form for styles that ignore eprint fields;
  eprint/eprinttype carry the arXiv identifier for styles that support them.
  bibsource, biburl and timestamp are DBLP provenance fields; unknown fields
  are ignored by the standard styles.
}
@article{DBLP:journals/corr/FukuiPYRDR16,
  author     = {Fukui, Akira and Park, Dong Huk and Yang, Daylen and Rohrbach, Anna and Darrell, Trevor and Rohrbach, Marcus},
  title      = {Multimodal Compact Bilinear Pooling for Visual Question Answering and Visual Grounding},
  journal    = {CoRR},
  volume     = {abs/1606.01847},
  year       = {2016},
  eprint     = {1606.01847},
  eprinttype = {arXiv},
  url        = {https://arxiv.org/abs/1606.01847},
  bibsource  = {dblp computer science bibliography, http://dblp.org},
  biburl     = {http://dblp.uni-trier.de/rec/bib/journals/corr/FukuiPYRDR16},
  timestamp  = {Fri, 01 Jul 2016 17:39:49 +0200},
}

Downloads: 0