Explicit Sparse Transformer: Concentrated Attention Through Explicit Selection.
http://arxiv.org/abs/1912.11637
@comment{arXiv preprint catalogued under CoRR; record exported from the dblp
  computer science bibliography (see the biburl and bibsource fields).
  Authors are stored in unambiguous "Last, First" form, and the model name in
  the title is brace-protected so sentence-casing styles keep its capitals.}
@article{DBLP:journals/corr/abs-1912-11637,
  author        = {Zhao, Guangxiang and
                   Lin, Junyang and
                   Zhang, Zhiyuan and
                   Ren, Xuancheng and
                   Su, Qi and
                   Sun, Xu},
  title         = {{Explicit Sparse Transformer}: Concentrated Attention Through Explicit Selection},
  journal       = {CoRR},
  volume        = {abs/1912.11637},
  year          = {2019},
  url           = {http://arxiv.org/abs/1912.11637},
  archivePrefix = {arXiv},
  eprint        = {1912.11637},
  timestamp     = {Fri, 03 Jan 2020 16:10:45 +0100},
  biburl        = {https://dblp.org/rec/journals/corr/abs-1912-11637.bib},
  bibsource     = {dblp computer science bibliography, https://dblp.org}
}
本页面没有标签