BibTeX records: Furu Wei

download as .bib file

@article{DBLP:journals/mlc/BaoDWYPW24,
  author       = {Bao, Hangbo and
                  Dong, Li and
                  Wang, Wenhui and
                  Yang, Nan and
                  Piao, Songhao and
                  Wei, Furu},
  title        = {Fine-tuning pretrained transformer encoders for sequence-to-sequence
                  learning},
  journal      = {Int. J. Mach. Learn. Cybern.},
  volume       = {15},
  number       = {5},
  pages        = {1711--1728},
  year         = {2024},
  url          = {https://doi.org/10.1007/s13042-023-01992-6},
  doi          = {10.1007/S13042-023-01992-6},
  timestamp    = {Sat, 04 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/mlc/BaoDWYPW24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/00010WWL24,
  author       = {Li, Yongqi and
                  Yang, Nan and
                  Wang, Liang and
                  Wei, Furu and
                  Li, Wenjie},
  editor       = {Wooldridge, Michael J. and
                  Dy, Jennifer G. and
                  Natarajan, Sriraam},
  title        = {Learning to Rank in Generative Retrieval},
  booktitle    = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2024, Thirty-Sixth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver,
                  Canada},
  pages        = {8716--8723},
  publisher    = {{AAAI} Press},
  year         = {2024},
  url          = {https://doi.org/10.1609/aaai.v38i8.28717},
  doi          = {10.1609/AAAI.V38I8.28717},
  timestamp    = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/00010WWL24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/LiuYHZHWDSZ24,
  author       = {Liu, Yuxuan and
                  Yang, Tianchi and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi},
  editor       = {Wooldridge, Michael J. and
                  Dy, Jennifer G. and
                  Natarajan, Sriraam},
  title        = {Text Diffusion with Reinforced Conditioning},
  booktitle    = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2024, Thirty-Sixth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver,
                  Canada},
  pages        = {14069--14077},
  publisher    = {{AAAI} Press},
  year         = {2024},
  url          = {https://doi.org/10.1609/aaai.v38i12.29316},
  doi          = {10.1609/AAAI.V38I12.29316},
  timestamp    = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/LiuYHZHWDSZ24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/eacl/YangDDCCLGW24,
  author       = {Yang, Zonglin and
                  Dong, Li and
                  Du, Xinya and
                  Cheng, Hao and
                  Cambria, Erik and
                  Liu, Xiaodong and
                  Gao, Jianfeng and
                  Wei, Furu},
  editor       = {Graham, Yvette and
                  Purver, Matthew},
  title        = {Language Models as Inductive Reasoners},
  booktitle    = {Proceedings of the 18th Conference of the European Chapter of the
                  Association for Computational Linguistics, {EACL} 2024 - Volume 1:
                  Long Papers, St. Julian's, Malta, March 17-22, 2024},
  pages        = {209--225},
  publisher    = {Association for Computational Linguistics},
  year         = {2024},
  url          = {https://aclanthology.org/2024.eacl-long.13},
  timestamp    = {Thu, 11 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eacl/YangDDCCLGW24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/eacl/LuHZWL24,
  author       = {Lu, Hongyuan and
                  Huang, Haoyang and
                  Zhang, Dongdong and
                  Wei, Furu and
                  Lam, Wai},
  editor       = {Graham, Yvette and
                  Purver, Matthew},
  title        = {Revamping Multilingual Agreement Bidirectionally via Switched Back-translation
                  for Multilingual Neural Machine Translation},
  booktitle    = {Findings of the Association for Computational Linguistics: {EACL}
                  2024, St. Julian's, Malta, March 17-22, 2024},
  pages        = {264--275},
  publisher    = {Association for Computational Linguistics},
  year         = {2024},
  url          = {https://aclanthology.org/2024.findings-eacl.19},
  timestamp    = {Tue, 02 Apr 2024 16:32:10 +0200},
  biburl       = {https://dblp.org/rec/conf/eacl/LuHZWL24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/eacl/WangYW24,
  author       = {Wang, Liang and
                  Yang, Nan and
                  Wei, Furu},
  editor       = {Graham, Yvette and
                  Purver, Matthew},
  title        = {Learning to Retrieve In-Context Examples for Large Language Models},
  booktitle    = {Proceedings of the 18th Conference of the European Chapter of the
                  Association for Computational Linguistics, {EACL} 2024 - Volume 1:
                  Long Papers, St. Julian's, Malta, March 17-22, 2024},
  pages        = {1752--1767},
  publisher    = {Association for Computational Linguistics},
  year         = {2024},
  url          = {https://aclanthology.org/2024.eacl-long.105},
  timestamp    = {Mon, 25 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eacl/WangYW24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2401-00246,
  author       = {Hao, Hongkun and
                  Zhou, Long and
                  Liu, Shujie and
                  Li, Jinyu and
                  Hu, Shujie and
                  Wang, Rui and
                  Wei, Furu},
  title        = {Boosting Large Language Model for Speech Synthesis: An Empirical Study},
  journal      = {CoRR},
  volume       = {abs/2401.00246},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2401.00246},
  doi          = {10.48550/ARXIV.2401.00246},
  eprinttype   = {arXiv},
  eprint       = {2401.00246},
  timestamp    = {Mon, 15 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2401-00246.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2401-00368,
  author       = {Wang, Liang and
                  Yang, Nan and
                  Huang, Xiaolong and
                  Yang, Linjun and
                  Majumder, Rangan and
                  Wei, Furu},
  title        = {Improving Text Embeddings with Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2401.00368},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2401.00368},
  doi          = {10.48550/ARXIV.2401.00368},
  eprinttype   = {arXiv},
  eprint       = {2401.00368},
  timestamp    = {Fri, 23 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2401-00368.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2401-07284,
  author       = {Jiang, Ting and
                  Huang, Shaohan and
                  Luo, Shengyue and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi and
                  Wang, Deqing and
                  Zhuang, Fuzhen},
  title        = {Improving Domain Adaptation through Extended-Text Reading Comprehension},
  journal      = {CoRR},
  volume       = {abs/2401.07284},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2401.07284},
  doi          = {10.48550/ARXIV.2401.07284},
  eprinttype   = {arXiv},
  eprint       = {2401.07284},
  timestamp    = {Thu, 01 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2401-07284.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2402-01521,
  author       = {Zhang, Yadong and
                  Mao, Shaoguang and
                  Ge, Tao and
                  Wang, Xun and
                  Xia, Yan and
                  Lan, Man and
                  Wei, Furu},
  title        = {K-Level Reasoning with Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2402.01521},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.01521},
  doi          = {10.48550/ARXIV.2402.01521},
  eprinttype   = {arXiv},
  eprint       = {2402.01521},
  timestamp    = {Fri, 09 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-01521.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2402-05672,
  author       = {Wang, Liang and
                  Yang, Nan and
                  Huang, Xiaolong and
                  Yang, Linjun and
                  Majumder, Rangan and
                  Wei, Furu},
  title        = {Multilingual {E5} Text Embeddings: {A} Technical Report},
  journal      = {CoRR},
  volume       = {abs/2402.05672},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.05672},
  doi          = {10.48550/ARXIV.2402.05672},
  eprinttype   = {arXiv},
  eprint       = {2402.05672},
  timestamp    = {Fri, 23 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-05672.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2402-09906,
  author       = {Muennighoff, Niklas and
                  Su, Hongjin and
                  Wang, Liang and
                  Yang, Nan and
                  Wei, Furu and
                  Yu, Tao and
                  Singh, Amanpreet and
                  Kiela, Douwe},
  title        = {Generative Representational Instruction Tuning},
  journal      = {CoRR},
  volume       = {abs/2402.09906},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.09906},
  doi          = {10.48550/ARXIV.2402.09906},
  eprinttype   = {arXiv},
  eprint       = {2402.09906},
  timestamp    = {Fri, 23 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-09906.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2402-13064,
  author       = {Li, Haoran and
                  Dong, Qingxiu and
                  Tang, Zhengyang and
                  Wang, Chaojun and
                  Zhang, Xingxing and
                  Huang, Haoyang and
                  Huang, Shaohan and
                  Huang, Xiaolong and
                  Huang, Zeqiang and
                  Zhang, Dongdong and
                  Gu, Yuxian and
                  Cheng, Xin and
                  Wang, Xun and
                  Chen, Si{-}Qing and
                  Dong, Li and
                  Lu, Wei and
                  Sui, Zhifang and
                  Wang, Benyou and
                  Lam, Wai and
                  Wei, Furu},
  title        = {Synthetic Data (Almost) from Scratch: Generalized Instruction Tuning
                  for Language Models},
  journal      = {CoRR},
  volume       = {abs/2402.13064},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.13064},
  doi          = {10.48550/ARXIV.2402.13064},
  eprinttype   = {arXiv},
  eprint       = {2402.13064},
  timestamp    = {Tue, 07 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-13064.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2402-13874,
  author       = {Liu, Haoyu and
                  Liu, Jianfeng and
                  Huang, Shaohan and
                  Zhan, Yuefeng and
                  Sun, Hao and
                  Deng, Weiwei and
                  Wei, Furu and
                  Zhang, Qi},
  title        = {Se\({}^{\mbox{2}}\): Sequential Example Selection for In-Context Learning},
  journal      = {CoRR},
  volume       = {abs/2402.13874},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.13874},
  doi          = {10.48550/ARXIV.2402.13874},
  eprinttype   = {arXiv},
  eprint       = {2402.13874},
  timestamp    = {Fri, 22 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-13874.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2402-14843,
  author       = {Liu, Yuxuan and
                  Yang, Tianchi and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi},
  title        = {Text Diffusion with Reinforced Conditioning},
  journal      = {CoRR},
  volume       = {abs/2402.14843},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.14843},
  doi          = {10.48550/ARXIV.2402.14843},
  eprinttype   = {arXiv},
  eprint       = {2402.14843},
  timestamp    = {Fri, 22 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-14843.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2402-15754,
  author       = {Liu, Yuxuan and
                  Yang, Tianchi and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi},
  title        = {{HD-Eval}: Aligning Large Language Model Evaluators Through Hierarchical
                  Criteria Decomposition},
  journal      = {CoRR},
  volume       = {abs/2402.15754},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.15754},
  doi          = {10.48550/ARXIV.2402.15754},
  eprinttype   = {arXiv},
  eprint       = {2402.15754},
  timestamp    = {Mon, 25 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-15754.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2402-16438,
  author       = {Tang, Tianyi and
                  Luo, Wenyang and
                  Huang, Haoyang and
                  Zhang, Dongdong and
                  Wang, Xiaolei and
                  Zhao, Xin and
                  Wei, Furu and
                  Wen, Ji{-}Rong},
  title        = {Language-Specific Neurons: The Key to Multilingual Capabilities in
                  Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2402.16438},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.16438},
  doi          = {10.48550/ARXIV.2402.16438},
  eprinttype   = {arXiv},
  eprint       = {2402.16438},
  timestamp    = {Mon, 25 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-16438.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2402-17759,
  author       = {Gu, Yuxian and
                  Dong, Li and
                  Hao, Yaru and
                  Dong, Qingxiu and
                  Huang, Minlie and
                  Wei, Furu},
  title        = {Towards Optimal Learning of Language Models},
  journal      = {CoRR},
  volume       = {abs/2402.17759},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.17759},
  doi          = {10.48550/ARXIV.2402.17759},
  eprinttype   = {arXiv},
  eprint       = {2402.17759},
  timestamp    = {Mon, 25 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-17759.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2402-17764,
  author       = {Ma, Shuming and
                  Wang, Hongyu and
                  Ma, Lingxiao and
                  Wang, Lei and
                  Wang, Wenhui and
                  Huang, Shaohan and
                  Dong, Li and
                  Wang, Ruiping and
                  Xue, Jilong and
                  Wei, Furu},
  title        = {The Era of 1-bit {LLMs}: All Large Language Models are in 1.58 Bits},
  journal      = {CoRR},
  volume       = {abs/2402.17764},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.17764},
  doi          = {10.48550/ARXIV.2402.17764},
  eprinttype   = {arXiv},
  eprint       = {2402.17764},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-17764.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2402-18039,
  author       = {Shi, Shuhua and
                  Huang, Shaohan and
                  Song, Minghui and
                  Li, Zhoujun and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi},
  title        = {{ResLoRA}: Identity Residual Mapping in Low-Rank Adaption},
  journal      = {CoRR},
  volume       = {abs/2402.18039},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.18039},
  doi          = {10.48550/ARXIV.2402.18039},
  eprinttype   = {arXiv},
  eprint       = {2402.18039},
  timestamp    = {Tue, 26 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-18039.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2403-02884,
  author       = {Tang, Zhengyang and
                  Zhang, Xingxing and
                  Wang, Benyou and
                  Wei, Furu},
  title        = {{MathScale}: Scaling Instruction Tuning for Mathematical Reasoning},
  journal      = {CoRR},
  volume       = {abs/2403.02884},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2403.02884},
  doi          = {10.48550/ARXIV.2403.02884},
  eprinttype   = {arXiv},
  eprint       = {2403.02884},
  timestamp    = {Wed, 03 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2403-02884.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2404-00656,
  author       = {Hu, Shujie and
                  Zhou, Long and
                  Liu, Shujie and
                  Chen, Sanyuan and
                  Hao, Hongkun and
                  Pan, Jing and
                  Liu, Xunying and
                  Li, Jinyu and
                  Sivasankaran, Sunit and
                  Liu, Linquan and
                  Wei, Furu},
  title        = {{WavLLM}: Towards Robust and Adaptive Speech Large Language Model},
  journal      = {CoRR},
  volume       = {abs/2404.00656},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2404.00656},
  doi          = {10.48550/ARXIV.2404.00656},
  eprinttype   = {arXiv},
  eprint       = {2404.00656},
  timestamp    = {Wed, 08 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2404-00656.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2404-01230,
  author       = {Zhang, Yadong and
                  Mao, Shaoguang and
                  Ge, Tao and
                  Wang, Xun and
                  de Wynter, Adrian and
                  Xia, Yan and
                  Wu, Wenshan and
                  Song, Ting and
                  Lan, Man and
                  Wei, Furu},
  title        = {{LLM} as a Mastermind: {A} Survey of Strategic Reasoning with Large
                  Language Models},
  journal      = {CoRR},
  volume       = {abs/2404.01230},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2404.01230},
  doi          = {10.48550/ARXIV.2404.01230},
  eprinttype   = {arXiv},
  eprint       = {2404.01230},
  timestamp    = {Wed, 08 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2404-01230.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ipm/LiYWWL23,
  author       = {Li, Yongqi and
                  Yang, Nan and
                  Wang, Liang and
                  Wei, Furu and
                  Li, Wenjie},
  title        = {Generative retrieval for conversational question answering},
  journal      = {Inf. Process. Manag.},
  volume       = {60},
  number       = {5},
  pages        = {103475},
  year         = {2023},
  url          = {https://doi.org/10.1016/j.ipm.2023.103475},
  doi          = {10.1016/J.IPM.2023.103475},
  timestamp    = {Fri, 23 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ipm/LiYWWL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/sigir/WangYHYMW23,
  author       = {Wang, Liang and
                  Yang, Nan and
                  Huang, Xiaolong and
                  Yang, Linjun and
                  Majumder, Rangan and
                  Wei, Furu},
  title        = {Large Search Model: Redefining Search Stack in the Era of {LLMs}},
  journal      = {{SIGIR} Forum},
  volume       = {57},
  number       = {2},
  pages        = {23:1--23:16},
  year         = {2023},
  url          = {https://doi.org/10.1145/3642979.3643006},
  doi          = {10.1145/3642979.3643006},
  timestamp    = {Fri, 23 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/sigir/WangYHYMW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/taslp/YangYYMHZWL23,
  author       = {Yang, Jian and
                  Yin, Yuwei and
                  Yang, Liqun and
                  Ma, Shuming and
                  Huang, Haoyang and
                  Zhang, Dongdong and
                  Wei, Furu and
                  Li, Zhoujun},
  title        = {{GTrans}: Grouping and Fusing Transformer Layers for Neural Machine
                  Translation},
  journal      = {{IEEE/ACM} Trans. Audio Speech Lang. Process.},
  volume       = {31},
  pages        = {1489--1498},
  year         = {2023},
  url          = {https://doi.org/10.1109/TASLP.2022.3221040},
  doi          = {10.1109/TASLP.2022.3221040},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/YangYYMHZWL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/tmlr/PengDBWY23,
  author       = {Peng, Zhiliang and
                  Dong, Li and
                  Bao, Hangbo and
                  Wei, Furu and
                  Ye, Qixiang},
  title        = {A Unified View of Masked Image Modeling},
  journal      = {Trans. Mach. Learn. Res.},
  volume       = {2023},
  year         = {2023},
  url          = {https://openreview.net/forum?id=wmGlMhaBe0},
  timestamp    = {Thu, 18 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tmlr/PengDBWY23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/LiLC0LFZ0W23,
  author       = {Li, Minghao and
                  Lv, Tengchao and
                  Chen, Jingye and
                  Cui, Lei and
                  Lu, Yijuan and
                  Flor{\^{e}}ncio, Dinei A. F. and
                  Zhang, Cha and
                  Li, Zhoujun and
                  Wei, Furu},
  editor       = {Williams, Brian and
                  Chen, Yiling and
                  Neville, Jennifer},
  title        = {{TrOCR}: Transformer-Based Optical Character Recognition with Pre-trained
                  Models},
  booktitle    = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2023, Thirty-Fifth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2023, Thirteenth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2023, Washington, DC, USA, February
                  7-14, 2023},
  pages        = {13094--13102},
  publisher    = {{AAAI} Press},
  year         = {2023},
  url          = {https://doi.org/10.1609/aaai.v37i11.26538},
  doi          = {10.1609/AAAI.V37I11.26538},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/LiLC0LFZ0W23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/XieHCW23,
  author       = {Xie, Yuan and
                  Huang, Shaohan and
                  Chen, Tianyu and
                  Wei, Furu},
  editor       = {Williams, Brian and
                  Chen, Yiling and
                  Neville, Jennifer},
  title        = {{MoEC}: Mixture of Expert Clusters},
  booktitle    = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2023, Thirty-Fifth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2023, Thirteenth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2023, Washington, DC, USA, February
                  7-14, 2023},
  pages        = {13807--13815},
  publisher    = {{AAAI} Press},
  year         = {2023},
  url          = {https://doi.org/10.1609/aaai.v37i11.26617},
  doi          = {10.1609/AAAI.V37I11.26617},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/XieHCW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/acl/ChenHZGLHWDZ23,
  author       = {Chen, Beiduo and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Guo, Wu and
                  Ling, Zhenhua and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Zhang, Qi},
  editor       = {Rogers, Anna and
                  Boyd{-}Graber, Jordan L. and
                  Okazaki, Naoaki},
  title        = {Pre-training Language Model as a Multi-perspective Course Learner},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL} 2023,
                  Toronto, Canada, July 9-14, 2023},
  pages        = {114--128},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.findings-acl.9},
  doi          = {10.18653/V1/2023.FINDINGS-ACL.9},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/ChenHZGLHWDZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/acl/WangYHJYJMW23,
  author       = {Wang, Liang and
                  Yang, Nan and
                  Huang, Xiaolong and
                  Jiao, Binxing and
                  Yang, Linjun and
                  Jiang, Daxin and
                  Majumder, Rangan and
                  Wei, Furu},
  editor       = {Rogers, Anna and
                  Boyd{-}Graber, Jordan L. and
                  Okazaki, Naoaki},
  title        = {{SimLM}: Pre-training with Representation Bottleneck for Dense Passage
                  Retrieval},
  booktitle    = {Proceedings of the 61st Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada,
                  July 9-14, 2023},
  pages        = {2244--2258},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-long.125},
  doi          = {10.18653/V1/2023.ACL-LONG.125},
  timestamp    = {Sat, 10 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/WangYHJYJMW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/acl/LiHZDLHJWDZ23,
  author       = {Li, Ziheng and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Deng, Zhi{-}Hong and
                  Lou, Qiang and
                  Huang, Haizhen and
                  Jiao, Jian and
                  Wei, Furu and
                  Deng, Weiwei and
                  Zhang, Qi},
  editor       = {Rogers, Anna and
                  Boyd{-}Graber, Jordan L. and
                  Okazaki, Naoaki},
  title        = {Dual-Alignment Pre-training for Cross-lingual Sentence Embedding},
  booktitle    = {Proceedings of the 61st Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada,
                  July 9-14, 2023},
  pages        = {3466--3478},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-long.191},
  doi          = {10.18653/V1/2023.ACL-LONG.191},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/LiHZDLHJWDZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/acl/DaiS0HMSW23,
  author       = {Dai, Damai and
                  Sun, Yutao and
                  Dong, Li and
                  Hao, Yaru and
                  Ma, Shuming and
                  Sui, Zhifang and
                  Wei, Furu},
  editor       = {Rogers, Anna and
                  Boyd{-}Graber, Jordan L. and
                  Okazaki, Naoaki},
  title        = {Why Can {GPT} Learn In-Context? Language Models Secretly Perform Gradient
                  Descent as Meta-Optimizers},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL} 2023,
                  Toronto, Canada, July 9-14, 2023},
  pages        = {4005--4019},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.findings-acl.247},
  doi          = {10.18653/V1/2023.FINDINGS-ACL.247},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/DaiS0HMSW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/acl/Gu0WH23,
  author       = {Gu, Yuxian and
                  Dong, Li and
                  Wei, Furu and
                  Huang, Minlie},
  editor       = {Rogers, Anna and
                  Boyd{-}Graber, Jordan L. and
                  Okazaki, Naoaki},
  title        = {Pre-Training to Learn in Context},
  booktitle    = {Proceedings of the 61st Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada,
                  July 9-14, 2023},
  pages        = {4849--4870},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-long.267},
  doi          = {10.18653/V1/2023.ACL-LONG.267},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/Gu0WH23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/acl/0001YWWL23,
  author       = {Li, Yongqi and
                  Yang, Nan and
                  Wang, Liang and
                  Wei, Furu and
                  Li, Wenjie},
  editor       = {Rogers, Anna and
                  Boyd{-}Graber, Jordan L. and
                  Okazaki, Naoaki},
  title        = {Multiview Identifiers Enhanced Generative Retrieval},
  booktitle    = {Proceedings of the 61st Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada,
                  July 9-14, 2023},
  pages        = {6636--6648},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-long.366},
  doi          = {10.18653/V1/2023.ACL-LONG.366},
  timestamp    = {Fri, 23 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/0001YWWL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/YangM0HHYZYWL23,
  author       = {Yang, Jian and
                  Ma, Shuming and
                  Dong, Li and
                  Huang, Shaohan and
                  Huang, Haoyang and
                  Yin, Yuwei and
                  Zhang, Dongdong and
                  Yang, Liqun and
                  Wei, Furu and
                  Li, Zhoujun},
  editor       = {Rogers, Anna and
                  Boyd{-}Graber, Jordan L. and
                  Okazaki, Naoaki},
  title        = {{GanLM}: Encoder-Decoder Pre-training with an Auxiliary Discriminator},
  booktitle    = {Proceedings of the 61st Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada,
                  July 9-14, 2023},
  pages        = {9394--9412},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-long.522},
  doi          = {10.18653/V1/2023.ACL-LONG.522},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/YangM0HHYZYWL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ChenMZWC23,
  author       = {Chen, Liang and
                  Ma, Shuming and
                  Zhang, Dongdong and
                  Wei, Furu and
                  Chang, Baobao},
  editor       = {Rogers, Anna and
                  Boyd{-}Graber, Jordan L. and
                  Okazaki, Naoaki},
  title        = {On the Off-Target Problem of Zero-Shot Multilingual Neural Machine
                  Translation},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL} 2023,
                  Toronto, Canada, July 9-14, 2023},
  pages        = {9542--9558},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.findings-acl.608},
  doi          = {10.18653/V1/2023.FINDINGS-ACL.608},
  timestamp    = {Thu, 08 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/ChenMZWC23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/SunDPMHBCSW23,
  author       = {Sun, Yutao and
                  Dong, Li and
                  Patra, Barun and
                  Ma, Shuming and
                  Huang, Shaohan and
                  Benhaim, Alon and
                  Chaudhary, Vishrav and
                  Song, Xia and
                  Wei, Furu},
  editor       = {Rogers, Anna and
                  Boyd{-}Graber, Jordan L. and
                  Okazaki, Naoaki},
  title        = {A Length-Extrapolatable Transformer},
  booktitle    = {Proceedings of the 61st Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada,
                  July 9-14, 2023},
  pages        = {14590--14604},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-long.816},
  doi          = {10.18653/V1/2023.ACL-LONG.816},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/SunDPMHBCSW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/PatraSHC0WCS23,
  author       = {Patra, Barun and
                  Singhal, Saksham and
                  Huang, Shaohan and
                  Chi, Zewen and
                  Dong, Li and
                  Wei, Furu and
                  Chaudhary, Vishrav and
                  Song, Xia},
  editor       = {Rogers, Anna and
                  Boyd{-}Graber, Jordan L. and
                  Okazaki, Naoaki},
  title        = {Beyond {English}-Centric Bitexts for Better Multilingual Language Representation
                  Learning},
  booktitle    = {Proceedings of the 61st Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada,
                  July 9-14, 2023},
  pages        = {15354--15373},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-long.856},
  doi          = {10.18653/V1/2023.ACL-LONG.856},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/PatraSHC0WCS23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/Zhou0GWW23,
  author       = {Zhou, Jinghao and
                  Dong, Li and
                  Gan, Zhe and
                  Wang, Lijuan and
                  Wei, Furu},
  title        = {Non-Contrastive Learning Meets Language-Image Pre-Training},
  booktitle    = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2023, Vancouver, BC, Canada, June 17-24, 2023},
  pages        = {11028--11038},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/CVPR52729.2023.01061},
  doi          = {10.1109/CVPR52729.2023.01061},
  timestamp    = {Tue, 29 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/Zhou0GWW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/HuangP0WJY23,
  author       = {Huang, Wei and
                  Peng, Zhiliang and
                  Dong, Li and
                  Wei, Furu and
                  Jiao, Jianbin and
                  Ye, Qixiang},
  title        = {Generic-to-Specific Distillation of Masked Autoencoders},
  booktitle    = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2023, Vancouver, BC, Canada, June 17-24, 2023},
  pages        = {15996--16005},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/CVPR52729.2023.01535},
  doi          = {10.1109/CVPR52729.2023.01535},
  timestamp    = {Tue, 29 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/HuangP0WJY23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/WangBDBPLAMSSW23,
  author       = {Wang, Wenhui and
                  Bao, Hangbo and
                  Dong, Li and
                  Bjorck, Johan and
                  Peng, Zhiliang and
                  Liu, Qiang and
                  Aggarwal, Kriti and
                  Mohammed, Owais Khan and
                  Singhal, Saksham and
                  Som, Subhojit and
                  Wei, Furu},
  title        = {Image as a Foreign Language: {BEIT} Pretraining for Vision and Vision-Language
                  Tasks},
  booktitle    = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2023, Vancouver, BC, Canada, June 17-24, 2023},
  pages        = {19175--19186},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/CVPR52729.2023.01838},
  doi          = {10.1109/CVPR52729.2023.01838},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/WangBDBPLAMSSW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/dasfaa/YangYMYGHZZLW23,
  author       = {Yang, Jian and
                  Yin, Yuwei and
                  Ma, Shuming and
                  Yang, Liqun and
                  Guo, Hongcheng and
                  Huang, Haoyang and
                  Zhang, Dongdong and
                  Zeng, Yutao and
                  Li, Zhoujun and
                  Wei, Furu},
  editor       = {Wang, Xin and
                  Sapino, Maria Luisa and
                  Han, Wook{-}Shin and
                  El Abbadi, Amr and
                  Dobbie, Gill and
                  Feng, Zhiyong and
                  Shao, Yingxiao and
                  Yin, Hongzhi},
  title        = {{HanoiT}: Enhancing Context-aware Translation via Selective Context},
  booktitle    = {Database Systems for Advanced Applications - 28th International Conference,
                  {DASFAA} 2023, Tianjin, China, April 17-20, 2023, Proceedings, Part
                  {III}},
  series       = {Lecture Notes in Computer Science},
  volume       = {13945},
  pages        = {471--486},
  publisher    = {Springer},
  year         = {2023},
  url          = {https://doi.org/10.1007/978-3-031-30675-4\_34},
  doi          = {10.1007/978-3-031-30675-4\_34},
  timestamp    = {Tue, 07 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/dasfaa/YangYMYGHZZLW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/WangHLWSZHWDSZ23,
  author       = {Wang, Zhaoyang and
                  Huang, Shaohan and
                  Liu, Yuxuan and
                  Wang, Jiahai and
                  Song, Minghui and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi},
  editor       = {Bouamor, Houda and
                  Pino, Juan and
                  Bali, Kalika},
  title        = {Democratizing Reasoning Ability: Tailored Learning from Large Language
                  Model},
  booktitle    = {Proceedings of the 2023 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages        = {1948--1966},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.emnlp-main.120},
  doi          = {10.18653/V1/2023.EMNLP-MAIN.120},
  timestamp    = {Fri, 12 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/WangHLWSZHWDSZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/Xia0WCWS23,
  author       = {Xia, Heming and
                  Ge, Tao and
                  Wang, Peiyi and
                  Chen, Si{-}Qing and
                  Wei, Furu and
                  Sui, Zhifang},
  editor       = {Bouamor, Houda and
                  Pino, Juan and
                  Bali, Kalika},
  title        = {Speculative Decoding: Exploiting Speculative Execution for Accelerating
                  Seq2seq Generation},
  booktitle    = {Findings of the Association for Computational Linguistics: {EMNLP}
                  2023, Singapore, December 6-10, 2023},
  pages        = {3909--3925},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.findings-emnlp.257},
  doi          = {10.18653/V1/2023.FINDINGS-EMNLP.257},
  timestamp    = {Fri, 12 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/Xia0WCWS23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/LuHMZLGAMW23,
  author       = {Lu, Hongyuan and
                  Huang, Haoyang and
                  Ma, Shuming and
                  Zhang, Dongdong and
                  Lam, Wai and
                  Gao, Zhaochuan and
                  Aue, Anthony and
                  Menezes, Arul and
                  Wei, Furu},
  editor       = {Bouamor, Houda and
                  Pino, Juan and
                  Bali, Kalika},
  title        = {{TRIP:} Accelerating Document-level Multilingual Pre-training via
                  Triangular Document-level Pre-training on Parallel Data Triplets},
  booktitle    = {Findings of the Association for Computational Linguistics: {EMNLP}
                  2023, Singapore, December 6-10, 2023},
  pages        = {7845--7858},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.findings-emnlp.526},
  doi          = {10.18653/V1/2023.FINDINGS-EMNLP.526},
  timestamp    = {Fri, 12 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/LuHMZLGAMW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/WangYW23,
  author       = {Wang, Liang and
                  Yang, Nan and
                  Wei, Furu},
  editor       = {Bouamor, Houda and
                  Pino, Juan and
                  Bali, Kalika},
  title        = {Query2doc: Query Expansion with Large Language Models},
  booktitle    = {Proceedings of the 2023 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages        = {9414--9423},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.emnlp-main.585},
  doi          = {10.18653/V1/2023.EMNLP-MAIN.585},
  timestamp    = {Fri, 12 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/WangYW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ChengHBZLW0WDZ23,
  author       = {Cheng, Daixuan and
                  Huang, Shaohan and
                  Bi, Junyu and
                  Zhan, Yuefeng and
                  Liu, Jianfeng and
                  Wang, Yujing and
                  Sun, Hao and
                  Wei, Furu and
                  Deng, Weiwei and
                  Zhang, Qi},
  editor       = {Bouamor, Houda and
                  Pino, Juan and
                  Bali, Kalika},
  title        = {{UPRISE:} Universal Prompt Retrieval for Improving Zero-Shot Evaluation},
  booktitle    = {Proceedings of the 2023 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages        = {12318--12337},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.emnlp-main.758},
  doi          = {10.18653/V1/2023.EMNLP-MAIN.758},
  timestamp    = {Fri, 12 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/ChengHBZLW0WDZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/HuangTZZSXW23,
  author       = {Huang, Haoyang and
                  Tang, Tianyi and
                  Zhang, Dongdong and
                  Zhao, Xin and
                  Song, Ting and
                  Xia, Yan and
                  Wei, Furu},
  editor       = {Bouamor, Houda and
                  Pino, Juan and
                  Bali, Kalika},
  title        = {Not All Languages Are Created Equal in {LLMs}: Improving Multilingual
                  Capability by Cross-Lingual-Thought Prompting},
  booktitle    = {Findings of the Association for Computational Linguistics: {EMNLP}
                  2023, Singapore, December 6-10, 2023},
  pages        = {12365--12394},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.findings-emnlp.826},
  doi          = {10.18653/V1/2023.FINDINGS-EMNLP.826},
  timestamp    = {Fri, 12 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/HuangTZZSXW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/DengPKCWLRCR23,
  author       = {Deng, Wentao and
                  Pei, Jiahuan and
                  Kong, Keyi and
                  Chen, Zhe and
                  Wei, Furu and
                  Li, Yujun and
                  Ren, Zhaochun and
                  Chen, Zhumin and
                  Ren, Pengjie},
  editor       = {Bouamor, Houda and
                  Pino, Juan and
                  Bali, Kalika},
  title        = {Syllogistic Reasoning for Legal Judgment Analysis},
  booktitle    = {Proceedings of the 2023 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages        = {13997--14009},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.emnlp-main.864},
  doi          = {10.18653/V1/2023.EMNLP-MAIN.864},
  timestamp    = {Fri, 12 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/DengPKCWLRCR23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/LiLZLW23,
  author       = {Li, Haoran and
                  Liu, Yiran and
                  Zhang, Xingxing and
                  Lu, Wei and
                  Wei, Furu},
  editor       = {Bouamor, Houda and
                  Pino, Juan and
                  Bali, Kalika},
  title        = {Tuna: Instruction Tuning using Feedback from Large Language Models},
  booktitle    = {Findings of the Association for Computational Linguistics: {EMNLP}
                  2023, Singapore, December 6-10, 2023},
  pages        = {15146--15163},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.findings-emnlp.1011},
  doi          = {10.18653/V1/2023.FINDINGS-EMNLP.1011},
  timestamp    = {Fri, 12 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/LiLZLW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/WeiZZCLHLW23,
  author       = {Wei, Kun and
                  Zhou, Long and
                  Zhang, Ziqiang and
                  Chen, Liping and
                  Liu, Shujie and
                  He, Lei and
                  Li, Jinyu and
                  Wei, Furu},
  title        = {Joint Pre-Training with Speech and Bilingual Text for Direct Speech
                  to Speech Translation},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing
                  {ICASSP} 2023, Rhodes Island, Greece, June 4-10, 2023},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/ICASSP49357.2023.10095616},
  doi          = {10.1109/ICASSP49357.2023.10095616},
  timestamp    = {Sun, 05 Nov 2023 16:51:21 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/WeiZZCLHLW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/Fang0BWW23,
  author       = {Fang, Yuxin and
                  Dong, Li and
                  Bao, Hangbo and
                  Wang, Xinggang and
                  Wei, Furu},
  title        = {Corrupted Image Modeling for Self-Supervised Visual Pre-Training},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=09hVcSDkea},
  timestamp    = {Fri, 30 Jun 2023 14:38:38 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/Fang0BWW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/HanH0SW23,
  author       = {Han, Zhixiong and
                  Hao, Yaru and
                  Dong, Li and
                  Sun, Yutao and
                  Wei, Furu},
  title        = {Prototypical Calibration for Few-shot Learning of Language Models},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=nUsP9lFADUF},
  timestamp    = {Fri, 30 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/HanH0SW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/Wang0000YGW23,
  author       = {Wang, Weizhi and
                  Dong, Li and
                  Cheng, Hao and
                  Song, Haoyu and
                  Liu, Xiaodong and
                  Yan, Xifeng and
                  Gao, Jianfeng and
                  Wei, Furu},
  title        = {Visually-Augmented Language Modeling},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=8IN-qLkl215},
  timestamp    = {Thu, 11 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/Wang0000YGW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/ZhaoM0DW23,
  author       = {Zhao, Haiteng and
                  Ma, Shuming and
                  Zhang, Dongdong and
                  Deng, Zhi{-}Hong and
                  Wei, Furu},
  title        = {Are More Layers Beneficial to Graph Transformers?},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=uagC-X9XMi8},
  timestamp    = {Fri, 30 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ZhaoM0DW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/ChenW00T0CYW23,
  author       = {Chen, Sanyuan and
                  Wu, Yu and
                  Wang, Chengyi and
                  Liu, Shujie and
                  Tompkins, Daniel and
                  Chen, Zhuo and
                  Che, Wanxiang and
                  Yu, Xiangzhan and
                  Wei, Furu},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {{BEATs}: Audio Pre-Training with Acoustic Tokenizers},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {5178--5193},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/chen23ag.html},
  timestamp    = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/ChenW00T0CYW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/WangMH0WPWBSBPL23,
  author       = {Wang, Hongyu and
                  Ma, Shuming and
                  Huang, Shaohan and
                  Dong, Li and
                  Wang, Wenhui and
                  Peng, Zhiliang and
                  Wu, Yu and
                  Bajaj, Payal and
                  Singhal, Saksham and
                  Benhaim, Alon and
                  Patra, Barun and
                  Liu, Zhun and
                  Chaudhary, Vishrav and
                  Song, Xia and
                  Wei, Furu},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {Magneto: {A} Foundation Transformer},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {36077--36092},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/wang23u.html},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/WangMH0WPWBSBPL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/000100M0WCW23,
  author       = {Ge, Tao and
                  Hu, Jing and
                  Dong, Li and
                  Mao, Shaoguang and
                  Xia, Yan and
                  Wang, Xun and
                  Chen, Si{-}Qing and
                  Wei, Furu},
  editor       = {Oh, Alice and
                  Naumann, Tristan and
                  Globerson, Amir and
                  Saenko, Kate and
                  Hardt, Moritz and
                  Levine, Sergey},
  title        = {Extensible Prompts for Language Models on Zero-shot Language Style
                  Customization},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, {NeurIPS} 2023, New Orleans,
                  LA, {USA}, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/6fcbfb3721c1781728b10c6685cc2f6c-Abstract-Conference.html},
  timestamp    = {Tue, 05 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/000100M0WCW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/ChenHL0CW23,
  author       = {Chen, Jingye and
                  Huang, Yupan and
                  Lv, Tengchao and
                  Cui, Lei and
                  Chen, Qifeng and
                  Wei, Furu},
  editor       = {Oh, Alice and
                  Naumann, Tristan and
                  Globerson, Amir and
                  Saenko, Kate and
                  Hardt, Moritz and
                  Levine, Sergey},
  title        = {{TextDiffuser}: Diffusion Models as Text Painters},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, {NeurIPS} 2023, New Orleans,
                  LA, {USA}, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/1df4afb0b4ebf492a41218ce16b6d8df-Abstract-Conference.html},
  timestamp    = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/ChenHL0CW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/ChenMZWC23,
  author       = {Chen, Liang and
                  Ma, Shuming and
                  Zhang, Dongdong and
                  Wei, Furu and
                  Chang, Baobao},
  editor       = {Oh, Alice and
                  Naumann, Tristan and
                  Globerson, Amir and
                  Saenko, Kate and
                  Hardt, Moritz and
                  Levine, Sergey},
  title        = {On the {Pareto} Front of Multilingual Neural Machine Translation},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, {NeurIPS} 2023, New Orleans,
                  LA, {USA}, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/690eb240baf1180b69dac48fc905c918-Abstract-Conference.html},
  timestamp    = {Fri, 15 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/ChenMZWC23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/HaoC0W23,
  author       = {Hao, Yaru and
                  Chi, Zewen and
                  Dong, Li and
                  Wei, Furu},
  editor       = {Oh, Alice and
                  Naumann, Tristan and
                  Globerson, Amir and
                  Saenko, Kate and
                  Hardt, Moritz and
                  Levine, Sergey},
  title        = {Optimizing Prompts for Text-to-Image Generation},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, {NeurIPS} 2023, New Orleans,
                  LA, {USA}, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/d346d91999074dd8d6073d4c3b13733b-Abstract-Conference.html},
  timestamp    = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/HaoC0W23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/Huang0WHSML0MPL23,
  author       = {Huang, Shaohan and
                  Dong, Li and
                  Wang, Wenhui and
                  Hao, Yaru and
                  Singhal, Saksham and
                  Ma, Shuming and
                  Lv, Tengchao and
                  Cui, Lei and
                  Mohammed, Owais Khan and
                  Patra, Barun and
                  Liu, Qiang and
                  Aggarwal, Kriti and
                  Chi, Zewen and
                  Bjorck, Nils Johan Bertil and
                  Chaudhary, Vishrav and
                  Som, Subhojit and
                  Song, Xia and
                  Wei, Furu},
  editor       = {Oh, Alice and
                  Naumann, Tristan and
                  Globerson, Amir and
                  Saenko, Kate and
                  Hardt, Moritz and
                  Levine, Sergey},
  title        = {Language Is Not All You Need: Aligning Perception with Language Models},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, {NeurIPS} 2023, New Orleans,
                  LA, {USA}, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/e425b75bac5742a008d643826428787c-Abstract-Conference.html},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/Huang0WHSML0MPL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/Wang0CLYGW23,
  author       = {Wang, Weizhi and
                  Dong, Li and
                  Cheng, Hao and
                  Liu, Xiaodong and
                  Yan, Xifeng and
                  Gao, Jianfeng and
                  Wei, Furu},
  editor       = {Oh, Alice and
                  Naumann, Tristan and
                  Globerson, Amir and
                  Saenko, Kate and
                  Hardt, Moritz and
                  Levine, Sergey},
  title        = {Augmenting Language Models with Long-Term Memory},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, {NeurIPS} 2023, New Orleans,
                  LA, {USA}, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/ebd82705f44793b6f9ade5a669d0f0bf-Abstract-Conference.html},
  timestamp    = {Thu, 11 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/Wang0CLYGW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2301-02111,
  author       = {Chengyi Wang and
                  Sanyuan Chen and
                  Yu Wu and
                  Ziqiang Zhang and
                  Long Zhou and
                  Shujie Liu and
                  Zhuo Chen and
                  Yanqing Liu and
                  Huaming Wang and
                  Jinyu Li and
                  Lei He and
                  Sheng Zhao and
                  Furu Wei},
  title        = {Neural Codec Language Models are Zero-Shot Text to Speech Synthesizers},
  journal      = {CoRR},
  volume       = {abs/2301.02111},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2301.02111},
  doi          = {10.48550/ARXIV.2301.02111},
  eprinttype   = {arXiv},
  eprint       = {2301.02111},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2301-02111.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2301-06825,
  author       = {Jian Yang and
                  Yuwei Yin and
                  Shuming Ma and
                  Liqun Yang and
                  Hongcheng Guo and
                  Haoyang Huang and
                  Dongdong Zhang and
                  Yutao Zeng and
                  Zhoujun Li and
                  Furu Wei},
  title        = {{HanoiT}: Enhancing Context-aware Translation via Selective Context},
  journal      = {CoRR},
  volume       = {abs/2301.06825},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2301.06825},
  doi          = {10.48550/ARXIV.2301.06825},
  eprinttype   = {arXiv},
  eprint       = {2301.06825},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2301-06825.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2302-14045,
  author       = {Shaohan Huang and
                  Li Dong and
                  Wenhui Wang and
                  Yaru Hao and
                  Saksham Singhal and
                  Shuming Ma and
                  Tengchao Lv and
                  Lei Cui and
                  Owais Khan Mohammed and
                  Barun Patra and
                  Qiang Liu and
                  Kriti Aggarwal and
                  Zewen Chi and
                  Johan Bjorck and
                  Vishrav Chaudhary and
                  Subhojit Som and
                  Xia Song and
                  Furu Wei},
  title        = {Language Is Not All You Need: Aligning Perception with Language Models},
  journal      = {CoRR},
  volume       = {abs/2302.14045},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2302.14045},
  doi          = {10.48550/ARXIV.2302.14045},
  eprinttype   = {arXiv},
  eprint       = {2302.14045},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2302-14045.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2302-14771,
  author       = {Wei Huang and
                  Zhiliang Peng and
                  Li Dong and
                  Furu Wei and
                  Jianbin Jiao and
                  Qixiang Ye},
  title        = {Generic-to-Specific Distillation of Masked Autoencoders},
  journal      = {CoRR},
  volume       = {abs/2302.14771},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2302.14771},
  doi          = {10.48550/ARXIV.2302.14771},
  eprinttype   = {arXiv},
  eprint       = {2302.14771},
  timestamp    = {Thu, 02 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2302-14771.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2303-00579,
  author       = {Haiteng Zhao and
                  Shuming Ma and
                  Dongdong Zhang and
                  Zhi{-}Hong Deng and
                  Furu Wei},
  title        = {Are More Layers Beneficial to Graph Transformers?},
  journal      = {CoRR},
  volume       = {abs/2303.00579},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2303.00579},
  doi          = {10.48550/ARXIV.2303.00579},
  eprinttype   = {arXiv},
  eprint       = {2303.00579},
  timestamp    = {Tue, 07 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2303-00579.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2303-01421,
  author       = {Guangyue Peng and
                  Tao Ge and
                  Si{-}Qing Chen and
                  Furu Wei and
                  Houfeng Wang},
  title        = {Semiparametric Language Models Are Scalable Continual Learners},
  journal      = {CoRR},
  volume       = {abs/2303.01421},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2303.01421},
  doi          = {10.48550/ARXIV.2303.01421},
  eprinttype   = {arXiv},
  eprint       = {2303.01421},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2303-01421.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2303-03926,
  author       = {Ziqiang Zhang and
                  Long Zhou and
                  Chengyi Wang and
                  Sanyuan Chen and
                  Yu Wu and
                  Shujie Liu and
                  Zhuo Chen and
                  Yanqing Liu and
                  Huaming Wang and
                  Jinyu Li and
                  Lei He and
                  Sheng Zhao and
                  Furu Wei},
  title        = {Speak Foreign Languages with Your Own Voice: Cross-Lingual Neural
                  Codec Language Modeling},
  journal      = {CoRR},
  volume       = {abs/2303.03926},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2303.03926},
  doi          = {10.48550/ARXIV.2303.03926},
  eprinttype   = {arXiv},
  eprint       = {2303.03926},
  timestamp    = {Thu, 11 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2303-03926.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2303-07678,
  author       = {Liang Wang and
                  Nan Yang and
                  Furu Wei},
  title        = {Query2doc: Query Expansion with Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2303.07678},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2303.07678},
  doi          = {10.48550/ARXIV.2303.07678},
  eprinttype   = {arXiv},
  eprint       = {2303.07678},
  timestamp    = {Fri, 23 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2303-07678.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2303-08518,
  author       = {Daixuan Cheng and
                  Shaohan Huang and
                  Junyu Bi and
                  Yuefeng Zhan and
                  Jianfeng Liu and
                  Yujing Wang and
                  Hao Sun and
                  Furu Wei and
                  Denvy Deng and
                  Qi Zhang},
  title        = {{UPRISE:} Universal Prompt Retrieval for Improving Zero-Shot Evaluation},
  journal      = {CoRR},
  volume       = {abs/2303.08518},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2303.08518},
  doi          = {10.48550/ARXIV.2303.08518},
  eprinttype   = {arXiv},
  eprint       = {2303.08518},
  timestamp    = {Fri, 05 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2303-08518.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2304-03216,
  author       = {Liang Chen and
                  Shuming Ma and
                  Dongdong Zhang and
                  Furu Wei and
                  Baobao Chang},
  title        = {On the {Pareto} Front of Multilingual Neural Machine Translation},
  journal      = {CoRR},
  volume       = {abs/2304.03216},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2304.03216},
  doi          = {10.48550/ARXIV.2304.03216},
  eprinttype   = {arXiv},
  eprint       = {2304.03216},
  timestamp    = {Tue, 19 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2304-03216.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2304-04487,
  author       = {Nan Yang and
                  Tao Ge and
                  Liang Wang and
                  Binxing Jiao and
                  Daxin Jiang and
                  Linjun Yang and
                  Rangan Majumder and
                  Furu Wei},
  title        = {Inference with Reference: Lossless Acceleration of Large Language
                  Models},
  journal      = {CoRR},
  volume       = {abs/2304.04487},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2304.04487},
  doi          = {10.48550/ARXIV.2304.04487},
  eprinttype   = {arXiv},
  eprint       = {2304.04487},
  timestamp    = {Fri, 23 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2304-04487.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-03981,
  author       = {Beiduo Chen and
                  Shaohan Huang and
                  Zihan Zhang and
                  Wu Guo and
                  Zhenhua Ling and
                  Haizhen Huang and
                  Furu Wei and
                  Weiwei Deng and
                  Qi Zhang},
  title        = {Pre-training Language Model as a Multi-perspective Course Learner},
  journal      = {CoRR},
  volume       = {abs/2305.03981},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.03981},
  doi          = {10.48550/ARXIV.2305.03981},
  eprinttype   = {arXiv},
  eprint       = {2305.03981},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-03981.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-06575,
  author       = {Hongyuan Lu and
                  Haoyang Huang and
                  Dongdong Zhang and
                  Haoran Yang and
                  Wai Lam and
                  Furu Wei},
  title        = {Chain-of-Dictionary Prompting Elicits Translation in Large Language
                  Models},
  journal      = {CoRR},
  volume       = {abs/2305.06575},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.06575},
  doi          = {10.48550/ARXIV.2305.06575},
  eprinttype   = {arXiv},
  eprint       = {2305.06575},
  timestamp    = {Sat, 23 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-06575.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-07004,
  author       = {Haoyang Huang and
                  Tianyi Tang and
                  Dongdong Zhang and
                  Wayne Xin Zhao and
                  Ting Song and
                  Yan Xia and
                  Furu Wei},
  title        = {Not All Languages Are Created Equal in {LLMs}: Improving Multilingual
                  Capability by Cross-Lingual-Thought Prompting},
  journal      = {CoRR},
  volume       = {abs/2305.07004},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.07004},
  doi          = {10.48550/ARXIV.2305.07004},
  eprinttype   = {arXiv},
  eprint       = {2305.07004},
  timestamp    = {Wed, 17 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-07004.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-09137,
  author       = {Yuxian Gu and
                  Li Dong and
                  Furu Wei and
                  Minlie Huang},
  title        = {Pre-Training to Learn in Context},
  journal      = {CoRR},
  volume       = {abs/2305.09137},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.09137},
  doi          = {10.48550/ARXIV.2305.09137},
  eprinttype   = {arXiv},
  eprint       = {2305.09137},
  timestamp    = {Wed, 24 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-09137.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-09148,
  author       = {Ziheng Li and
                  Shaohan Huang and
                  Zihan Zhang and
                  Zhi{-}Hong Deng and
                  Qiang Lou and
                  Haizhen Huang and
                  Jian Jiao and
                  Furu Wei and
                  Weiwei Deng and
                  Qi Zhang},
  title        = {Dual-Alignment Pre-training for Cross-lingual Sentence Embedding},
  journal      = {CoRR},
  volume       = {abs/2305.09148},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.09148},
  doi          = {10.48550/ARXIV.2305.09148},
  eprinttype   = {arXiv},
  eprint       = {2305.09148},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-09148.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-10855,
  author       = {Jingye Chen and
                  Yupan Huang and
                  Tengchao Lv and
                  Lei Cui and
                  Qifeng Chen and
                  Furu Wei},
  title        = {{TextDiffuser}: Diffusion Models as Text Painters},
  journal      = {CoRR},
  volume       = {abs/2305.10855},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.10855},
  doi          = {10.48550/ARXIV.2305.10855},
  eprinttype   = {arXiv},
  eprint       = {2305.10855},
  timestamp    = {Thu, 25 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-10855.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-10930,
  author       = {Liang Chen and
                  Shuming Ma and
                  Dongdong Zhang and
                  Furu Wei and
                  Baobao Chang},
  title        = {On the Off-Target Problem of Zero-Shot Multilingual Neural Machine
                  Translation},
  journal      = {CoRR},
  volume       = {abs/2305.10930},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.10930},
  doi          = {10.48550/ARXIV.2305.10930},
  eprinttype   = {arXiv},
  eprint       = {2305.10930},
  timestamp    = {Tue, 19 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-10930.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-14066,
  author       = {Lan Jiang and
                  Haoyang Huang and
                  Dongdong Zhang and
                  Rui Jiang and
                  Furu Wei},
  title        = {One-stop Training of Multiple Capacity Models},
  journal      = {CoRR},
  volume       = {abs/2305.14066},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.14066},
  doi          = {10.48550/ARXIV.2305.14066},
  eprinttype   = {arXiv},
  eprint       = {2305.14066},
  timestamp    = {Tue, 06 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-14066.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-15067,
  author       = {Tianyi Tang and
                  Hongyuan Lu and
                  Yuchen Eleanor Jiang and
                  Haoyang Huang and
                  Dongdong Zhang and
                  Wayne Xin Zhao and
                  Furu Wei},
  title        = {Not All Metrics Are Guilty: Improving {NLG} Evaluation with {LLM}
                  Paraphrasing},
  journal      = {CoRR},
  volume       = {abs/2305.15067},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.15067},
  doi          = {10.48550/ARXIV.2305.15067},
  eprinttype   = {arXiv},
  eprint       = {2305.15067},
  timestamp    = {Thu, 13 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-15067.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-16107,
  author       = {Tianrui Wang and
                  Long Zhou and
                  Ziqiang Zhang and
                  Yu Wu and
                  Shujie Liu and
                  Yashesh Gaur and
                  Zhuo Chen and
                  Jinyu Li and
                  Furu Wei},
  title        = {{VioLA}: Unified Codec Language Models for Speech Recognition, Synthesis,
                  and Translation},
  journal      = {CoRR},
  volume       = {abs/2305.16107},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.16107},
  doi          = {10.48550/ARXIV.2305.16107},
  eprinttype   = {arXiv},
  eprint       = {2305.16107},
  timestamp    = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-16107.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-16675,
  author       = {Yongqi Li and
                  Nan Yang and
                  Liang Wang and
                  Furu Wei and
                  Wenjie Li},
  title        = {Multiview Identifiers Enhanced Generative Retrieval},
  journal      = {CoRR},
  volume       = {abs/2305.16675},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.16675},
  doi          = {10.48550/ARXIV.2305.16675},
  eprinttype   = {arXiv},
  eprint       = {2305.16675},
  timestamp    = {Fri, 23 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-16675.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-07174,
  author       = {Weizhi Wang and
                  Li Dong and
                  Hao Cheng and
                  Xiaodong Liu and
                  Xifeng Yan and
                  Jianfeng Gao and
                  Furu Wei},
  title        = {Augmenting Language Models with Long-Term Memory},
  journal      = {CoRR},
  volume       = {abs/2306.07174},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.07174},
  doi          = {10.48550/ARXIV.2306.07174},
  eprinttype   = {arXiv},
  eprint       = {2306.07174},
  timestamp    = {Thu, 11 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-07174.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-08543,
  author       = {Yuxian Gu and
                  Li Dong and
                  Furu Wei and
                  Minlie Huang},
  title        = {Knowledge Distillation of Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2306.08543},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.08543},
  doi          = {10.48550/ARXIV.2306.08543},
  eprinttype   = {arXiv},
  eprint       = {2306.08543},
  timestamp    = {Sun, 18 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-08543.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-14824,
  author       = {Zhiliang Peng and
                  Wenhui Wang and
                  Li Dong and
                  Yaru Hao and
                  Shaohan Huang and
                  Shuming Ma and
                  Furu Wei},
  title        = {Kosmos-2: Grounding Multimodal Large Language Models to the World},
  journal      = {CoRR},
  volume       = {abs/2306.14824},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.14824},
  doi          = {10.48550/ARXIV.2306.14824},
  eprinttype   = {arXiv},
  eprint       = {2306.14824},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-14824.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-15222,
  author       = {Yongqi Li and
                  Nan Yang and
                  Liang Wang and
                  Furu Wei and
                  Wenjie Li},
  title        = {Learning to Rank in Generative Retrieval},
  journal      = {CoRR},
  volume       = {abs/2306.15222},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.15222},
  doi          = {10.48550/ARXIV.2306.15222},
  eprinttype   = {arXiv},
  eprint       = {2306.15222},
  timestamp    = {Fri, 23 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-15222.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2307-02486,
  author       = {Jiayu Ding and
                  Shuming Ma and
                  Li Dong and
                  Xingxing Zhang and
                  Shaohan Huang and
                  Wenhui Wang and
                  Nanning Zheng and
                  Furu Wei},
  title        = {{LongNet}: Scaling Transformers to 1,000,000,000 Tokens},
  journal      = {CoRR},
  volume       = {abs/2307.02486},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2307.02486},
  doi          = {10.48550/ARXIV.2307.02486},
  eprinttype   = {arXiv},
  eprint       = {2307.02486},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2307-02486.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2307-05300,
  author       = {Zhenhailong Wang and
                  Shaoguang Mao and
                  Wenshan Wu and
                  Tao Ge and
                  Furu Wei and
                  Heng Ji},
  title        = {Unleashing Cognitive Synergy in Large Language Models: {A} Task-Solving
                  Agent through Multi-Persona Self-Collaboration},
  journal      = {CoRR},
  volume       = {abs/2307.05300},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2307.05300},
  doi          = {10.48550/ARXIV.2307.05300},
  eprinttype   = {arXiv},
  eprint       = {2307.05300},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2307-05300.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2307-06945,
  author       = {Tao Ge and
                  Jing Hu and
                  Xun Wang and
                  Si{-}Qing Chen and
                  Furu Wei},
  title        = {In-context Autoencoder for Context Compression in a Large Language
                  Model},
  journal      = {CoRR},
  volume       = {abs/2307.06945},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2307.06945},
  doi          = {10.48550/ARXIV.2307.06945},
  eprinttype   = {arXiv},
  eprint       = {2307.06945},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2307-06945.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2307-07164,
  author       = {Liang Wang and
                  Nan Yang and
                  Furu Wei},
  title        = {Learning to Retrieve In-Context Examples for Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2307.07164},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2307.07164},
  doi          = {10.48550/ARXIV.2307.07164},
  eprinttype   = {arXiv},
  eprint       = {2307.07164},
  timestamp    = {Fri, 23 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2307-07164.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2307-08621,
  author       = {Yutao Sun and
                  Li Dong and
                  Shaohan Huang and
                  Shuming Ma and
                  Yuqing Xia and
                  Jilong Xue and
                  Jianyong Wang and
                  Furu Wei},
  title        = {Retentive Network: {A} Successor to Transformer for Large Language
                  Models},
  journal      = {CoRR},
  volume       = {abs/2307.08621},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2307.08621},
  doi          = {10.48550/ARXIV.2307.08621},
  eprinttype   = {arXiv},
  eprint       = {2307.08621},
  timestamp    = {Tue, 25 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2307-08621.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2308-12770,
  author       = {Guangyu Chen and
                  Yu Wu and
                  Shujie Liu and
                  Tao Liu and
                  Xiaoyong Du and
                  Furu Wei},
  title        = {{WavMark}: Watermarking for Audio Generation},
  journal      = {CoRR},
  volume       = {abs/2308.12770},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.12770},
  doi          = {10.48550/ARXIV.2308.12770},
  eprinttype   = {arXiv},
  eprint       = {2308.12770},
  timestamp    = {Wed, 30 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-12770.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-05689,
  author       = {Qingxiu Dong and
                  Li Dong and
                  Ke Xu and
                  Guangyan Zhou and
                  Yaru Hao and
                  Zhifang Sui and
                  Furu Wei},
  title        = {Large Language Model for Science: {A} Study on {P} vs. {NP}},
  journal      = {CoRR},
  volume       = {abs/2309.05689},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.05689},
  doi          = {10.48550/ARXIV.2309.05689},
  eprinttype   = {arXiv},
  eprint       = {2309.05689},
  timestamp    = {Fri, 15 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-05689.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-09530,
  author       = {Daixuan Cheng and
                  Shaohan Huang and
                  Furu Wei},
  title        = {Adapting Large Language Models via Reading Comprehension},
  journal      = {CoRR},
  volume       = {abs/2309.09530},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.09530},
  doi          = {10.48550/ARXIV.2309.09530},
  eprinttype   = {arXiv},
  eprint       = {2309.09530},
  timestamp    = {Fri, 22 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-09530.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-10400,
  author       = {Dawei Zhu and
                  Nan Yang and
                  Liang Wang and
                  Yifan Song and
                  Wenhao Wu and
                  Furu Wei and
                  Sujian Li},
  title        = {{PoSE}: Efficient Context Window Extension of {LLMs} via Positional Skip-wise
                  Training},
  journal      = {CoRR},
  volume       = {abs/2309.10400},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.10400},
  doi          = {10.48550/ARXIV.2309.10400},
  eprinttype   = {arXiv},
  eprint       = {2309.10400},
  timestamp    = {Fri, 23 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-10400.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-11419,
  author       = {Tengchao Lv and
                  Yupan Huang and
                  Jingye Chen and
                  Lei Cui and
                  Shuming Ma and
                  Yaoyao Chang and
                  Shaohan Huang and
                  Wenhui Wang and
                  Li Dong and
                  Weiyao Luo and
                  Shaoxiang Wu and
                  Guoxin Wang and
                  Cha Zhang and
                  Furu Wei},
  title        = {Kosmos-2.5: {A} Multimodal Literate Model},
  journal      = {CoRR},
  volume       = {abs/2309.11419},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.11419},
  doi          = {10.48550/ARXIV.2309.11419},
  eprinttype   = {arXiv},
  eprint       = {2309.11419},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-11419.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-13308,
  author       = {Yuxuan Liu and
                  Tianchi Yang and
                  Shaohan Huang and
                  Zihan Zhang and
                  Haizhen Huang and
                  Furu Wei and
                  Weiwei Deng and
                  Feng Sun and
                  Qi Zhang},
  title        = {Calibrating {LLM}-Based Evaluator},
  journal      = {CoRR},
  volume       = {abs/2309.13308},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.13308},
  doi          = {10.48550/ARXIV.2309.13308},
  eprinttype   = {arXiv},
  eprint       = {2309.13308},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-13308.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-17061,
  author       = {Xin Cheng and
                  Xun Wang and
                  Tao Ge and
                  Si{-}Qing Chen and
                  Furu Wei and
                  Dongyan Zhao and
                  Rui Yan},
  title        = {{SCALE:} Synergized Collaboration of Asymmetric Language Translation
                  Engines},
  journal      = {CoRR},
  volume       = {abs/2309.17061},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.17061},
  doi          = {10.48550/ARXIV.2309.17061},
  eprinttype   = {arXiv},
  eprint       = {2309.17061},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-17061.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-02992,
  author       = {Xichen Pan and
                  Li Dong and
                  Shaohan Huang and
                  Zhiliang Peng and
                  Wenhu Chen and
                  Furu Wei},
  title        = {{Kosmos-G}: Generating Images in Context with Multimodal Large Language
                  Models},
  journal      = {CoRR},
  volume       = {abs/2310.02992},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.02992},
  doi          = {10.48550/ARXIV.2310.02992},
  eprinttype   = {arXiv},
  eprint       = {2310.02992},
  timestamp    = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-02992.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-08185,
  author       = {You, Wang and
                  Wu, Wenshan and
                  Liang, Yaobo and
                  Mao, Shaoguang and
                  Wu, Chenfei and
                  Cao, Maosong and
                  Cai, Yuzhe and
                  Guo, Yiduo and
                  Xia, Yan and
                  Wei, Furu and
                  Duan, Nan},
  title        = {{EIPE-text}: Evaluation-Guided Iterative Plan Extraction for Long-Form
                  Narrative Text Generation},
  journal      = {CoRR},
  volume       = {abs/2310.08185},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.08185},
  doi          = {10.48550/ARXIV.2310.08185},
  eprinttype   = {arXiv},
  eprint       = {2310.08185},
  timestamp    = {Tue, 24 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-08185.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-08319,
  author       = {Ma, Xueguang and
                  Wang, Liang and
                  Yang, Nan and
                  Wei, Furu and
                  Lin, Jimmy},
  title        = {Fine-Tuning {LLaMA} for Multi-Stage Text Retrieval},
  journal      = {CoRR},
  volume       = {abs/2310.08319},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.08319},
  doi          = {10.48550/ARXIV.2310.08319},
  eprinttype   = {arXiv},
  eprint       = {2310.08319},
  timestamp    = {Fri, 23 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-08319.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-11453,
  author       = {Wang, Hongyu and
                  Ma, Shuming and
                  Dong, Li and
                  Huang, Shaohan and
                  Wang, Huaijie and
                  Ma, Lingxiao and
                  Yang, Fan and
                  Wang, Ruiping and
                  Wu, Yi and
                  Wei, Furu},
  title        = {{BitNet}: Scaling 1-bit Transformers for Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2310.11453},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.11453},
  doi          = {10.48550/ARXIV.2310.11453},
  eprinttype   = {arXiv},
  eprint       = {2310.11453},
  timestamp    = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-11453.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-13332,
  author       = {Wang, Zhaoyang and
                  Huang, Shaohan and
                  Liu, Yuxuan and
                  Wang, Jiahai and
                  Song, Minghui and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi},
  title        = {Democratizing Reasoning Ability: Tailored Learning from Large
                  Language Model},
  journal      = {CoRR},
  volume       = {abs/2310.13332},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.13332},
  doi          = {10.48550/ARXIV.2310.13332},
  eprinttype   = {arXiv},
  eprint       = {2310.13332},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-13332.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-13385,
  author       = {Li, Haoran and
                  Liu, Yiran and
                  Zhang, Xingxing and
                  Lu, Wei and
                  Wei, Furu},
  title        = {Tuna: Instruction Tuning using Feedback from Large Language
                  Models},
  journal      = {CoRR},
  volume       = {abs/2310.13385},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.13385},
  doi          = {10.48550/ARXIV.2310.13385},
  eprinttype   = {arXiv},
  eprint       = {2310.13385},
  timestamp    = {Fri, 27 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-13385.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-14587,
  author       = {Wang, Liang and
                  Yang, Nan and
                  Huang, Xiaolong and
                  Yang, Linjun and
                  Majumder, Rangan and
                  Wei, Furu},
  title        = {Large Search Model: Redefining Search Stack in the Era of {LLMs}},
  journal      = {CoRR},
  volume       = {abs/2310.14587},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.14587},
  doi          = {10.48550/ARXIV.2310.14587},
  eprinttype   = {arXiv},
  eprint       = {2310.14587},
  timestamp    = {Fri, 23 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-14587.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2311-03220,
  author       = {Mao, Shaoguang and
                  Cai, Yuzhe and
                  Xia, Yan and
                  Wu, Wenshan and
                  Wang, Xun and
                  Wang, Fengyi and
                  Ge, Tao and
                  Wei, Furu},
  title        = {{ALYMPICS}: Language Agents Meet Game Theory},
  journal      = {CoRR},
  volume       = {abs/2311.03220},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2311.03220},
  doi          = {10.48550/ARXIV.2311.03220},
  eprinttype   = {arXiv},
  eprint       = {2311.03220},
  timestamp    = {Wed, 08 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2311-03220.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2311-09263,
  author       = {Yang, Jinghan and
                  Ma, Shuming and
                  Wei, Furu},
  title        = {{Auto-ICL}: In-Context Learning without Human Supervision},
  journal      = {CoRR},
  volume       = {abs/2311.09263},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2311.09263},
  doi          = {10.48550/ARXIV.2311.09263},
  eprinttype   = {arXiv},
  eprint       = {2311.09263},
  timestamp    = {Tue, 21 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2311-09263.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2311-16465,
  author       = {Chen, Jingye and
                  Huang, Yupan and
                  Lv, Tengchao and
                  Cui, Lei and
                  Chen, Qifeng and
                  Wei, Furu},
  title        = {{TextDiffuser-2}: Unleashing the Power of Language Models for Text
                  Rendering},
  journal      = {CoRR},
  volume       = {abs/2311.16465},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2311.16465},
  doi          = {10.48550/ARXIV.2311.16465},
  eprinttype   = {arXiv},
  eprint       = {2311.16465},
  timestamp    = {Mon, 04 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2311-16465.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2312-03558,
  author       = {Wang, Wenhui and
                  Ma, Shuming and
                  Xu, Hanwen and
                  Usuyama, Naoto and
                  Ding, Jiayu and
                  Poon, Hoifung and
                  Wei, Furu},
  title        = {When an Image is Worth 1,024 x 1,024 Words: {A} Case Study in Computational
                  Pathology},
  journal      = {CoRR},
  volume       = {abs/2312.03558},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2312.03558},
  doi          = {10.48550/ARXIV.2312.03558},
  eprinttype   = {arXiv},
  eprint       = {2312.03558},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2312-03558.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NOTE(review): "Wu, Jian" is listed twice below, exactly as in the export.
% Presumably these are two distinct co-authors whose DBLP homonym suffixes
% were stripped; confirm against the paper before deduplicating.
@article{DBLP:journals/jstsp/ChenWCWLCLKYXWZ22,
  author       = {Chen, Sanyuan and
                  Wang, Chengyi and
                  Chen, Zhengyang and
                  Wu, Yu and
                  Liu, Shujie and
                  Chen, Zhuo and
                  Li, Jinyu and
                  Kanda, Naoyuki and
                  Yoshioka, Takuya and
                  Xiao, Xiong and
                  Wu, Jian and
                  Zhou, Long and
                  Ren, Shuo and
                  Qian, Yanmin and
                  Qian, Yao and
                  Wu, Jian and
                  Zeng, Michael and
                  Yu, Xiangzhan and
                  Wei, Furu},
  title        = {{WavLM}: Large-Scale Self-Supervised Pre-Training for Full Stack Speech
                  Processing},
  journal      = {{IEEE} J. Sel. Top. Signal Process.},
  volume       = {16},
  number       = {6},
  pages        = {1505--1518},
  year         = {2022},
  url          = {https://doi.org/10.1109/JSTSP.2022.3188113},
  doi          = {10.1109/JSTSP.2022.3188113},
  timestamp    = {Sun, 13 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jstsp/ChenWCWLCLKYXWZ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/ZhuDWQL22,
  author       = {Zhu, Haichao and
                  Dong, Li and
                  Wei, Furu and
                  Qin, Bing and
                  Liu, Ting},
  title        = {Transforming {Wikipedia} Into Augmented Data for Query-Focused
                  Summarization},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {30},
  pages        = {2357--2367},
  year         = {2022},
  url          = {https://doi.org/10.1109/taslp.2022.3171963},
  doi          = {10.1109/TASLP.2022.3171963},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/taslp/ZhuDWQL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/XuZWW22a,
  author       = {Xu, Shusheng and
                  Zhang, Xingxing and
                  Wu, Yi and
                  Wei, Furu},
  title        = {Sequence Level Contrastive Learning for Text Summarization},
  booktitle    = {Thirty-Sixth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2022, Thirty-Fourth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2022, The Twelfth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2022, Virtual Event, February 22
                  - March 1, 2022},
  pages        = {11556--11565},
  publisher    = {{AAAI} Press},
  year         = {2022},
  url          = {https://doi.org/10.1609/aaai.v36i10.21409},
  doi          = {10.1609/AAAI.V36I10.21409},
  timestamp    = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/XuZWW22a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ZhangZBW22,
  author       = {Zhang, Shengqiang and
                  Zhang, Xingxing and
                  Bao, Hangbo and
                  Wei, Furu},
  editor       = {Muresan, Smaranda and
                  Nakov, Preslav and
                  Villavicencio, Aline},
  title        = {Attention Temperature Matters in Abstractive Summarization
                  Distillation},
  booktitle    = {Proceedings of the 60th Annual Meeting of the Association for
                  Computational Linguistics (Volume 1: Long Papers), {ACL} 2022,
                  Dublin, Ireland, May 22-27, 2022},
  pages        = {127--141},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.acl-long.11},
  doi          = {10.18653/V1/2022.ACL-LONG.11},
  timestamp    = {Mon, 01 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ZhangZBW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ChenMC0PWW22,
  author       = {Chen, Guanhua and
                  Ma, Shuming and
                  Chen, Yun and
                  Zhang, Dongdong and
                  Pan, Jia and
                  Wang, Wenping and
                  Wei, Furu},
  editor       = {Muresan, Smaranda and
                  Nakov, Preslav and
                  Villavicencio, Aline},
  title        = {Towards Making the Most of Cross-Lingual Transfer for Zero-Shot
                  Neural Machine Translation},
  booktitle    = {Proceedings of the 60th Annual Meeting of the Association for
                  Computational Linguistics (Volume 1: Long Papers), {ACL} 2022,
                  Dublin, Ireland, May 22-27, 2022},
  pages        = {142--157},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.acl-long.12},
  doi          = {10.18653/V1/2022.ACL-LONG.12},
  timestamp    = {Thu, 25 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ChenMC0PWW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/JiaZC0WW22,
  author       = {Jia, Ruipeng and
                  Zhang, Xingxing and
                  Cao, Yanan and
                  Lin, Zheng and
                  Wang, Shi and
                  Wei, Furu},
  editor       = {Muresan, Smaranda and
                  Nakov, Preslav and
                  Villavicencio, Aline},
  title        = {Neural Label Search for Zero-Shot Multi-Lingual Extractive
                  Summarization},
  booktitle    = {Proceedings of the 60th Annual Meeting of the Association for
                  Computational Linguistics (Volume 1: Long Papers), {ACL} 2022,
                  Dublin, Ireland, May 22-27, 2022},
  pages        = {561--570},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.acl-long.42},
  doi          = {10.18653/V1/2022.ACL-LONG.42},
  timestamp    = {Mon, 01 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/JiaZC0WW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/Qian0SWC22,
  author       = {Qian, Jing and
                  Dong, Li and
                  Shen, Yelong and
                  Wei, Furu and
                  Chen, Weizhu},
  editor       = {Muresan, Smaranda and
                  Nakov, Preslav and
                  Villavicencio, Aline},
  title        = {Controllable Natural Language Generation with Contrastive
                  Prefixes},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL}
                  2022, Dublin, Ireland, May 22-27, 2022},
  pages        = {2912--2924},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.findings-acl.229},
  doi          = {10.18653/V1/2022.FINDINGS-ACL.229},
  timestamp    = {Mon, 01 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/Qian0SWC22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/XuL0WLFZW22,
  author       = {Xu, Yiheng and
                  Lv, Tengchao and
                  Cui, Lei and
                  Wang, Guoxin and
                  Lu, Yijuan and
                  Flor{\^{e}}ncio, Dinei A. F. and
                  Zhang, Cha and
                  Wei, Furu},
  editor       = {Muresan, Smaranda and
                  Nakov, Preslav and
                  Villavicencio, Aline},
  title        = {{XFUND}: {A} Benchmark Dataset for Multilingual Visually Rich Form
                  Understanding},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL} 2022,
                  Dublin, Ireland, May 22-27, 2022},
  pages        = {3214--3224},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.findings-acl.253},
  doi          = {10.18653/V1/2022.FINDINGS-ACL.253},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/XuL0WLFZW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ChenBHDJJZLW22,
  author       = {Chen, Tianyu and
                  Bao, Hangbo and
                  Huang, Shaohan and
                  Dong, Li and
                  Jiao, Binxing and
                  Jiang, Daxin and
                  Zhou, Haoyi and
                  Li, Jianxin and
                  Wei, Furu},
  editor       = {Muresan, Smaranda and
                  Nakov, Preslav and
                  Villavicencio, Aline},
  title        = {{THE-X}: Privacy-Preserving Transformer Inference with Homomorphic
                  Encryption},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL} 2022,
                  Dublin, Ireland, May 22-27, 2022},
  pages        = {3510--3520},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.findings-acl.277},
  doi          = {10.18653/V1/2022.FINDINGS-ACL.277},
  timestamp    = {Thu, 06 Apr 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ChenBHDJJZLW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/AoWZ0RW0KLZWQ0W22,
  author       = {Ao, Junyi and
                  Wang, Rui and
                  Zhou, Long and
                  Wang, Chengyi and
                  Ren, Shuo and
                  Wu, Yu and
                  Liu, Shujie and
                  Ko, Tom and
                  Li, Qing and
                  Zhang, Yu and
                  Wei, Zhihua and
                  Qian, Yao and
                  Li, Jinyu and
                  Wei, Furu},
  editor       = {Muresan, Smaranda and
                  Nakov, Preslav and
                  Villavicencio, Aline},
  title        = {{SpeechT5}: Unified-Modal Encoder-Decoder Pre-Training for Spoken Language
                  Processing},
  booktitle    = {Proceedings of the 60th Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2022, Dublin, Ireland,
                  May 22-27, 2022},
  pages        = {5723--5738},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.acl-long.393},
  doi          = {10.18653/V1/2022.ACL-LONG.393},
  timestamp    = {Mon, 01 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/AoWZ0RW0KLZWQ0W22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/LiX0W22,
  author       = {Li, Junlong and
                  Xu, Yiheng and
                  Cui, Lei and
                  Wei, Furu},
  editor       = {Muresan, Smaranda and
                  Nakov, Preslav and
                  Villavicencio, Aline},
  title        = {{MarkupLM}: Pre-training of Text and Markup Language for Visually Rich
                  Document Understanding},
  booktitle    = {Proceedings of the 60th Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2022, Dublin, Ireland,
                  May 22-27, 2022},
  pages        = {6078--6087},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.acl-long.420},
  doi          = {10.18653/V1/2022.ACL-LONG.420},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LiX0W22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/0002000W22,
  author       = {Song, Haoyu and
                  Dong, Li and
                  Zhang, Weinan and
                  Liu, Ting and
                  Wei, Furu},
  editor       = {Muresan, Smaranda and
                  Nakov, Preslav and
                  Villavicencio, Aline},
  title        = {{CLIP} Models are Few-Shot Learners: Empirical Studies on {VQA}
                  and Visual Entailment},
  booktitle    = {Proceedings of the 60th Annual Meeting of the Association for
                  Computational Linguistics (Volume 1: Long Papers), {ACL} 2022,
                  Dublin, Ireland, May 22-27, 2022},
  pages        = {6088--6100},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.acl-long.421},
  doi          = {10.18653/V1/2022.ACL-LONG.421},
  timestamp    = {Mon, 01 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/0002000W22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ChiH0MZSBSMHW22,
  author       = {Chi, Zewen and
                  Huang, Shaohan and
                  Dong, Li and
                  Ma, Shuming and
                  Zheng, Bo and
                  Singhal, Saksham and
                  Bajaj, Payal and
                  Song, Xia and
                  Mao, Xian{-}Ling and
                  Huang, Heyan and
                  Wei, Furu},
  editor       = {Muresan, Smaranda and
                  Nakov, Preslav and
                  Villavicencio, Aline},
  title        = {{XLM-E}: Cross-lingual Language Model Pre-training via {ELECTRA}},
  booktitle    = {Proceedings of the 60th Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2022, Dublin, Ireland,
                  May 22-27, 2022},
  pages        = {6170--6182},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.acl-long.427},
  doi          = {10.18653/V1/2022.ACL-LONG.427},
  timestamp    = {Mon, 01 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ChiH0MZSBSMHW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/Dai0MZSCW22,
  author       = {Dai, Damai and
                  Dong, Li and
                  Ma, Shuming and
                  Zheng, Bo and
                  Sui, Zhifang and
                  Chang, Baobao and
                  Wei, Furu},
  editor       = {Muresan, Smaranda and
                  Nakov, Preslav and
                  Villavicencio, Aline},
  title        = {{StableMoE}: Stable Routing Strategy for Mixture of Experts},
  booktitle    = {Proceedings of the 60th Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2022, Dublin, Ireland,
                  May 22-27, 2022},
  pages        = {7085--7095},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.acl-long.489},
  doi          = {10.18653/V1/2022.ACL-LONG.489},
  timestamp    = {Mon, 01 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/Dai0MZSCW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/DaiDHSCW22,
  author       = {Dai, Damai and
                  Dong, Li and
                  Hao, Yaru and
                  Sui, Zhifang and
                  Chang, Baobao and
                  Wei, Furu},
  editor       = {Muresan, Smaranda and
                  Nakov, Preslav and
                  Villavicencio, Aline},
  title        = {Knowledge Neurons in Pretrained Transformers},
  booktitle    = {Proceedings of the 60th Annual Meeting of the Association for
                  Computational Linguistics (Volume 1: Long Papers), {ACL} 2022,
                  Dublin, Ireland, May 22-27, 2022},
  pages        = {8493--8502},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.acl-long.581},
  doi          = {10.18653/V1/2022.ACL-LONG.581},
  timestamp    = {Mon, 01 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/DaiDHSCW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/Liu0LYXWN000WG22,
  author       = {Liu, Ze and
                  Hu, Han and
                  Lin, Yutong and
                  Yao, Zhuliang and
                  Xie, Zhenda and
                  Wei, Yixuan and
                  Ning, Jia and
                  Cao, Yue and
                  Zhang, Zheng and
                  Dong, Li and
                  Wei, Furu and
                  Guo, Baining},
  title        = {{Swin Transformer V2}: Scaling Up Capacity and Resolution},
  booktitle    = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2022, New Orleans, LA, USA, June 18-24, 2022},
  pages        = {11999--12009},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/CVPR52688.2022.01170},
  doi          = {10.1109/CVPR52688.2022.01170},
  timestamp    = {Mon, 05 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/Liu0LYXWN000WG22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/YangHMY0ZGLW22,
  author       = {Yang, Jian and
                  Huang, Shaohan and
                  Ma, Shuming and
                  Yin, Yuwei and
                  Dong, Li and
                  Zhang, Dongdong and
                  Guo, Hongcheng and
                  Li, Zhoujun and
                  Wei, Furu},
  editor       = {Goldberg, Yoav and
                  Kozareva, Zornitsa and
                  Zhang, Yue},
  title        = {{CROP}: Zero-shot Cross-lingual Named Entity Recognition with Multilingual
                  Labeled Sequence Translation},
  booktitle    = {Findings of the Association for Computational Linguistics: {EMNLP}
                  2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022},
  pages        = {486--496},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.findings-emnlp.34},
  doi          = {10.18653/V1/2022.FINDINGS-EMNLP.34},
  timestamp    = {Tue, 07 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/YangHMY0ZGLW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ChenL0ZW22,
  author       = {Chen, Jingye and
                  Lv, Tengchao and
                  Cui, Lei and
                  Zhang, Cha and
                  Wei, Furu},
  editor       = {Goldberg, Yoav and
                  Kozareva, Zornitsa and
                  Zhang, Yue},
  title        = {{XDoc}: Unified Pre-training for Cross-Format Document Understanding},
  booktitle    = {Findings of the Association for Computational Linguistics: {EMNLP}
                  2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022},
  pages        = {1006--1016},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.findings-emnlp.71},
  doi          = {10.18653/V1/2022.FINDINGS-EMNLP.71},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/ChenL0ZW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ZhangZA0D0W22,
  author       = {Zhang, Ziqiang and
                  Zhou, Long and
                  Ao, Junyi and
                  Liu, Shujie and
                  Dai, Lirong and
                  Li, Jinyu and
                  Wei, Furu},
  editor       = {Goldberg, Yoav and
                  Kozareva, Zornitsa and
                  Zhang, Yue},
  title        = {{SpeechUT}: Bridging Speech and Text with Hidden-Unit for Encoder-Decoder
                  Based Speech-Text Pre-training},
  booktitle    = {Proceedings of the 2022 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2022, Abu Dhabi, United Arab Emirates,
                  December 7-11, 2022},
  pages        = {1663--1676},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.emnlp-main.108},
  doi          = {10.18653/V1/2022.EMNLP-MAIN.108},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/ZhangZA0D0W22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ChengHLZ0WDZ22,
  author       = {Cheng, Daixuan and
                  Huang, Shaohan and
                  Liu, Jianfeng and
                  Zhan, Yuefeng and
                  Sun, Hao and
                  Wei, Furu and
                  Deng, Denvy and
                  Zhang, Qi},
  editor       = {Goldberg, Yoav and
                  Kozareva, Zornitsa and
                  Zhang, Yue},
  title        = {Snapshot-Guided Domain Adaptation for {ELECTRA}},
  booktitle    = {Findings of the Association for Computational Linguistics:
                  {EMNLP} 2022, Abu Dhabi, United Arab Emirates, December 7-11,
                  2022},
  pages        = {2226--2232},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.findings-emnlp.163},
  doi          = {10.18653/V1/2022.FINDINGS-EMNLP.163},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/ChengHLZ0WDZ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/JiangJHZWZWHDZ22,
  author       = {Jiang, Ting and
                  Jiao, Jian and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Wang, Deqing and
                  Zhuang, Fuzhen and
                  Wei, Furu and
                  Huang, Haizhen and
                  Deng, Denvy and
                  Zhang, Qi},
  editor       = {Goldberg, Yoav and
                  Kozareva, Zornitsa and
                  Zhang, Yue},
  title        = {{PromptBERT}: Improving {BERT} Sentence Embeddings with Prompts},
  booktitle    = {Proceedings of the 2022 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2022, Abu Dhabi, United Arab Emirates,
                  December 7-11, 2022},
  pages        = {8826--8837},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.emnlp-main.603},
  doi          = {10.18653/V1/2022.EMNLP-MAIN.603},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/JiangJHZWZWHDZ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/WangWZL0W22,
  author       = {Wang, Zekun and
                  Wang, Wenhui and
                  Zhu, Haichao and
                  Liu, Ming and
                  Qin, Bing and
                  Wei, Furu},
  editor       = {Goldberg, Yoav and
                  Kozareva, Zornitsa and
                  Zhang, Yue},
  title        = {Distilled Dual-Encoder Model for Vision-Language Understanding},
  booktitle    = {Proceedings of the 2022 Conference on Empirical Methods in
                  Natural Language Processing, {EMNLP} 2022, Abu Dhabi, United
                  Arab Emirates, December 7-11, 2022},
  pages        = {8901--8913},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.emnlp-main.608},
  doi          = {10.18653/V1/2022.EMNLP-MAIN.608},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/WangWZL0W22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/GeCW22,
  author       = {Tao Ge and
                  Si{-}Qing Chen and
                  Furu Wei},
  editor       = {Yoav Goldberg and
                  Zornitsa Kozareva and
                  Yue Zhang},
  title        = {{EdgeFormer}: {A} Parameter-Efficient Transformer for On-Device Seq2seq
                  Generation},
  booktitle    = {Proceedings of the 2022 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2022, Abu Dhabi, United Arab Emirates,
                  December 7-11, 2022},
  pages        = {10786--10798},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.emnlp-main.741},
  doi          = {10.18653/V1/2022.EMNLP-MAIN.741},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/GeCW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/HuangM0WW22,
  author       = {Lianzhe Huang and
                  Shuming Ma and
                  Dongdong Zhang and
                  Furu Wei and
                  Houfeng Wang},
  editor       = {Yoav Goldberg and
                  Zornitsa Kozareva and
                  Yue Zhang},
  title        = {Zero-shot Cross-lingual Transfer of Prompt-based Tuning with a Unified
                  Multilingual Prompt},
  booktitle    = {Proceedings of the 2022 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2022, Abu Dhabi, United Arab Emirates,
                  December 7-11, 2022},
  pages        = {11488--11497},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.emnlp-main.790},
  doi          = {10.18653/V1/2022.EMNLP-MAIN.790},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/HuangM0WW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ChenWWCCLWQWLY22,
  author       = {Sanyuan Chen and
                  Yu Wu and
                  Chengyi Wang and
                  Zhengyang Chen and
                  Zhuo Chen and
                  Shujie Liu and
                  Jian Wu and
                  Yao Qian and
                  Furu Wei and
                  Jinyu Li and
                  Xiangzhan Yu},
  title        = {{UniSpeech-SAT}: Universal Speech Representation Learning With Speaker
                  Aware Pre-Training},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2022, Virtual and Singapore, 23-27 May 2022},
  pages        = {6152--6156},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/ICASSP43922.2022.9747077},
  doi          = {10.1109/ICASSP43922.2022.9747077},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/ChenWWCCLWQWLY22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/Bao0PW22,
  author       = {Hangbo Bao and
                  Li Dong and
                  Songhao Piao and
                  Furu Wei},
  title        = {{BEiT}: {BERT} Pre-Training of Image Transformers},
  booktitle    = {The Tenth International Conference on Learning Representations, {ICLR}
                  2022, Virtual Event, April 25-29, 2022},
  publisher    = {OpenReview.net},
  year         = {2022},
  url          = {https://openreview.net/forum?id=p-BhZSz59o4},
  timestamp    = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/Bao0PW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/0013GM0WW22,
  author       = {Xin Sun and
                  Tao Ge and
                  Shuming Ma and
                  Jingjing Li and
                  Furu Wei and
                  Houfeng Wang},
  editor       = {Luc De Raedt},
  title        = {A Unified Strategy for Multilingual Grammatical Error Correction with
                  Pre-trained Cross-Lingual Language Model},
  booktitle    = {Proceedings of the Thirty-First International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2022, Vienna, Austria, 23-29 July
                  2022},
  pages        = {4367--4374},
  publisher    = {ijcai.org},
  year         = {2022},
  url          = {https://doi.org/10.24963/ijcai.2022/606},
  doi          = {10.24963/IJCAI.2022/606},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ijcai/0013GM0WW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/YangYM0WG0W22,
  author       = {Jian Yang and
                  Yuwei Yin and
                  Shuming Ma and
                  Dongdong Zhang and
                  Shuangzhi Wu and
                  Hongcheng Guo and
                  Zhoujun Li and
                  Furu Wei},
  editor       = {Luc De Raedt},
  title        = {{UM4:} Unified Multilingual Multiple Teacher-Student Model for Zero-Resource
                  Neural Machine Translation},
  booktitle    = {Proceedings of the Thirty-First International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2022, Vienna, Austria, 23-29 July
                  2022},
  pages        = {4454--4460},
  publisher    = {ijcai.org},
  year         = {2022},
  url          = {https://doi.org/10.24963/ijcai.2022/618},
  doi          = {10.24963/IJCAI.2022/618},
  timestamp    = {Fri, 22 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ijcai/YangYM0WG0W22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/YangYM00W22,
  author       = {Jian Yang and
                  Yuwei Yin and
                  Shuming Ma and
                  Dongdong Zhang and
                  Zhoujun Li and
                  Furu Wei},
  editor       = {Luc De Raedt},
  title        = {High-resource Language-specific Training for Multilingual Neural Machine
                  Translation},
  booktitle    = {Proceedings of the Thirty-First International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2022, Vienna, Austria, 23-29 July
                  2022},
  pages        = {4461--4467},
  publisher    = {ijcai.org},
  year         = {2022},
  url          = {https://doi.org/10.24963/ijcai.2022/619},
  doi          = {10.24963/IJCAI.2022/619},
  timestamp    = {Fri, 22 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ijcai/YangYM00W22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcnlp/JinGW22,
  author       = {Xuyang Jin and
                  Tao Ge and
                  Furu Wei},
  editor       = {Yulan He and
                  Heng Ji and
                  Yang Liu and
                  Sujian Li and
                  Chia{-}Hui Chang and
                  Soujanya Poria and
                  Chenghua Lin and
                  Wray L. Buntine and
                  Maria Liakata and
                  Hanqi Yan and
                  Zonghan Yan and
                  Sebastian Ruder and
                  Xiaojun Wan and
                  Miguel Arana{-}Catania and
                  Zhongyu Wei and
                  Hen{-}Hsen Huang and
                  Jheng{-}Long Wu and
                  Min{-}Yuh Day and
                  Pengfei Liu and
                  Ruifeng Xu},
  title        = {Plug and Play Knowledge Distillation for {kNN-LM} with External Logits},
  booktitle    = {Proceedings of the 2nd Conference of the Asia-Pacific Chapter of the
                  Association for Computational Linguistics and the 12th International
                  Joint Conference on Natural Language Processing, {AACL/IJCNLP} 2022
                  - Volume 2: Short Papers, Online only, November 20-23, 2022},
  pages        = {463--469},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://aclanthology.org/2022.aacl-short.57},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ijcnlp/JinGW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/WangWWC00W22,
  author       = {Chengyi Wang and
                  Yiming Wang and
                  Yu Wu and
                  Sanyuan Chen and
                  Jinyu Li and
                  Shujie Liu and
                  Furu Wei},
  editor       = {Hanseok Ko and
                  John H. L. Hansen},
  title        = {Supervision-Guided Codebooks for Masked Prediction in Speech Pre-training},
  booktitle    = {Interspeech 2022, 23rd Annual Conference of the International Speech
                  Communication Association, Incheon, Korea, 18-22 September 2022},
  pages        = {2643--2647},
  publisher    = {{ISCA}},
  year         = {2022},
  url          = {https://doi.org/10.21437/Interspeech.2022-936},
  doi          = {10.21437/INTERSPEECH.2022-936},
  timestamp    = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/WangWWC00W22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/Ren00ZW22,
  author       = {Shuo Ren and
                  Shujie Liu and
                  Yu Wu and
                  Long Zhou and
                  Furu Wei},
  editor       = {Hanseok Ko and
                  John H. L. Hansen},
  title        = {Speech Pre-training with Acoustic Piece},
  booktitle    = {Interspeech 2022, 23rd Annual Conference of the International Speech
                  Communication Association, Incheon, Korea, 18-22 September 2022},
  pages        = {2648--2652},
  publisher    = {{ISCA}},
  year         = {2022},
  url          = {https://doi.org/10.21437/Interspeech.2022-981},
  doi          = {10.21437/INTERSPEECH.2022-981},
  timestamp    = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/Ren00ZW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/AoZZ00K00QW22,
  author       = {Junyi Ao and
                  Ziqiang Zhang and
                  Long Zhou and
                  Shujie Liu and
                  Haizhou Li and
                  Tom Ko and
                  Lirong Dai and
                  Jinyu Li and
                  Yao Qian and
                  Furu Wei},
  editor       = {Hanseok Ko and
                  John H. L. Hansen},
  title        = {Pre-Training Transformer Decoder for End-to-End {ASR} Model with Unpaired
                  Speech Data},
  booktitle    = {Interspeech 2022, 23rd Annual Conference of the International Speech
                  Communication Association, Incheon, Korea, 18-22 September 2022},
  pages        = {2658--2662},
  publisher    = {{ISCA}},
  year         = {2022},
  url          = {https://doi.org/10.21437/Interspeech.2022-10368},
  doi          = {10.21437/INTERSPEECH.2022-10368},
  timestamp    = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/AoZZ00K00QW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/Chen0000WL00YW22,
  author       = {Sanyuan Chen and
                  Yu Wu and
                  Chengyi Wang and
                  Shujie Liu and
                  Zhuo Chen and
                  Peidong Wang and
                  Gang Liu and
                  Jinyu Li and
                  Jian Wu and
                  Xiangzhan Yu and
                  Furu Wei},
  editor       = {Hanseok Ko and
                  John H. L. Hansen},
  title        = {Why does Self-Supervised Learning for Speech Recognition Benefit Speaker
                  Recognition?},
  booktitle    = {Interspeech 2022, 23rd Annual Conference of the International Speech
                  Communication Association, Incheon, Korea, 18-22 September 2022},
  pages        = {3699--3703},
  publisher    = {{ISCA}},
  year         = {2022},
  url          = {https://doi.org/10.21437/Interspeech.2022-10019},
  doi          = {10.21437/INTERSPEECH.2022-10019},
  timestamp    = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/Chen0000WL00YW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/Zhang0K00EYXMQW22,
  author       = {Wangyou Zhang and
                  Zhuo Chen and
                  Naoyuki Kanda and
                  Shujie Liu and
                  Jinyu Li and
                  Sefik Emre Eskimez and
                  Takuya Yoshioka and
                  Xiong Xiao and
                  Zhong Meng and
                  Yanmin Qian and
                  Furu Wei},
  editor       = {Hanseok Ko and
                  John H. L. Hansen},
  title        = {Separating Long-Form Speech with Group-wise Permutation Invariant
                  Training},
  booktitle    = {Interspeech 2022, 23rd Annual Conference of the International Speech
                  Communication Association, Incheon, Korea, 18-22 September 2022},
  pages        = {5383--5387},
  publisher    = {{ISCA}},
  year         = {2022},
  url          = {https://doi.org/10.21437/Interspeech.2022-10362},
  doi          = {10.21437/INTERSPEECH.2022-10362},
  timestamp    = {Wed, 21 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/Zhang0K00EYXMQW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/mm/LiXL0ZW22,
  author       = {Junlong Li and
                  Yiheng Xu and
                  Tengchao Lv and
                  Lei Cui and
                  Cha Zhang and
                  Furu Wei},
  editor       = {Jo{\~{a}}o Magalh{\~{a}}es and
                  Alberto Del Bimbo and
                  Shin'ichi Satoh and
                  Nicu Sebe and
                  Xavier Alameda{-}Pineda and
                  Qin Jin and
                  Vincent Oria and
                  Laura Toni},
  title        = {{DiT}: Self-supervised Pre-training for Document Image Transformer},
  booktitle    = {{MM} '22: The 30th {ACM} International Conference on Multimedia, Lisboa,
                  Portugal, October 10 - 14, 2022},
  pages        = {3530--3539},
  publisher    = {{ACM}},
  year         = {2022},
  url          = {https://doi.org/10.1145/3503161.3547911},
  doi          = {10.1145/3503161.3547911},
  timestamp    = {Fri, 14 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/mm/LiXL0ZW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/mm/HuangL0LW22,
  author       = {Yupan Huang and
                  Tengchao Lv and
                  Lei Cui and
                  Yutong Lu and
                  Furu Wei},
  editor       = {Jo{\~{a}}o Magalh{\~{a}}es and
                  Alberto Del Bimbo and
                  Shin'ichi Satoh and
                  Nicu Sebe and
                  Xavier Alameda{-}Pineda and
                  Qin Jin and
                  Vincent Oria and
                  Laura Toni},
  title        = {{LayoutLMv3}: Pre-training for Document {AI} with Unified Text and Image
                  Masking},
  booktitle    = {{MM} '22: The 30th {ACM} International Conference on Multimedia, Lisboa,
                  Portugal, October 10 - 14, 2022},
  pages        = {4083--4091},
  publisher    = {{ACM}},
  year         = {2022},
  url          = {https://doi.org/10.1145/3503161.3548112},
  doi          = {10.1145/3503161.3548112},
  timestamp    = {Fri, 14 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/mm/HuangL0LW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BaoW0LMASPW22,
  author       = {Hangbo Bao and
                  Wenhui Wang and
                  Li Dong and
                  Qiang Liu and
                  Owais Khan Mohammed and
                  Kriti Aggarwal and
                  Subhojit Som and
                  Songhao Piao and
                  Furu Wei},
  editor       = {Sanmi Koyejo and
                  S. Mohamed and
                  A. Agarwal and
                  Danielle Belgrave and
                  K. Cho and
                  A. Oh},
  title        = {{VLMo}: Unified Vision-Language Pre-Training with Mixture-of-Modality-Experts},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/d46662aa53e78a62afd980a29e0c37ed-Abstract-Conference.html},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BaoW0LMASPW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/Chi0HDMPSBSMHW22,
  author       = {Zewen Chi and
                  Li Dong and
                  Shaohan Huang and
                  Damai Dai and
                  Shuming Ma and
                  Barun Patra and
                  Saksham Singhal and
                  Payal Bajaj and
                  Xia Song and
                  Xian{-}Ling Mao and
                  Heyan Huang and
                  Furu Wei},
  editor       = {Sanmi Koyejo and
                  S. Mohamed and
                  A. Agarwal and
                  Danielle Belgrave and
                  K. Cho and
                  A. Oh},
  title        = {On the Representation Collapse of Sparse Mixture of Experts},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/df4f371f1f89ec8ba5014b3310578048-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/Chi0HDMPSBSMHW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nlpcc/YaoHDWCZ22,
  author       = {Yunzhi Yao and
                  Shaohan Huang and
                  Li Dong and
                  Furu Wei and
                  Huajun Chen and
                  Ningyu Zhang},
  editor       = {Wei Lu and
                  Shujian Huang and
                  Yu Hong and
                  Xiabing Zhou},
  title        = {Kformer: Knowledge Injection in Transformer Feed-Forward Layers},
  booktitle    = {Natural Language Processing and Chinese Computing - 11th {CCF} International
                  Conference, {NLPCC} 2022, Guilin, China, September 24-25, 2022, Proceedings,
                  Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {13551},
  pages        = {131--143},
  publisher    = {Springer},
  year         = {2022},
  url          = {https://doi.org/10.1007/978-3-031-17120-8\_11},
  doi          = {10.1007/978-3-031-17120-8\_11},
  timestamp    = {Tue, 27 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nlpcc/YaoHDWCZ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2201-01631,
  author       = {Xu Zhang and
                  Jian Yang and
                  Haoyang Huang and
                  Shuming Ma and
                  Dongdong Zhang and
                  Jinlong Li and
                  Furu Wei},
  title        = {{SMDT:} Selective Memory-Augmented Neural Document Translation},
  journal      = {CoRR},
  volume       = {abs/2201.01631},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.01631},
  eprinttype    = {arXiv},
  eprint       = {2201.01631},
  timestamp    = {Wed, 07 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-01631.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2201-02009,
  author       = {Juncheng Wan and
                  Jian Yang and
                  Shuming Ma and
                  Dongdong Zhang and
                  Weinan Zhang and
                  Yong Yu and
                  Furu Wei},
  title        = {Phrase-level Adversarial Example Generation for Neural Machine Translation},
  journal      = {CoRR},
  volume       = {abs/2201.02009},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.02009},
  eprinttype    = {arXiv},
  eprint       = {2201.02009},
  timestamp    = {Wed, 07 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-02009.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2201-04337,
  author       = {Ting Jiang and
                  Shaohan Huang and
                  Zihan Zhang and
                  Deqing Wang and
                  Fuzhen Zhuang and
                  Furu Wei and
                  Haizhen Huang and
                  Liangjie Zhang and
                  Qi Zhang},
  title        = {{PromptBERT}: Improving {BERT} Sentence Embeddings with Prompts},
  journal      = {CoRR},
  volume       = {abs/2201.04337},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.04337},
  eprinttype    = {arXiv},
  eprint       = {2201.04337},
  timestamp    = {Thu, 20 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-04337.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2201-05742,
  author       = {Yunzhi Yao and
                  Shaohan Huang and
                  Ningyu Zhang and
                  Li Dong and
                  Furu Wei and
                  Huajun Chen},
  title        = {Kformer: Knowledge Injection in Transformer Feed-Forward Layers},
  journal      = {CoRR},
  volume       = {abs/2201.05742},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.05742},
  eprinttype    = {arXiv},
  eprint       = {2201.05742},
  timestamp    = {Tue, 27 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-05742.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2201-10707,
  author       = {Xin Sun and
                  Tao Ge and
                  Shuming Ma and
                  Jingjing Li and
                  Furu Wei and
                  Houfeng Wang},
  title        = {A Unified Strategy for Multilingual Grammatical Error Correction with
                  Pre-trained Cross-Lingual Language Model},
  journal      = {CoRR},
  volume       = {abs/2201.10707},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.10707},
  eprinttype    = {arXiv},
  eprint       = {2201.10707},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-10707.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2202-03382,
  author       = {Yuxin Fang and
                  Li Dong and
                  Hangbo Bao and
                  Xinggang Wang and
                  Furu Wei},
  title        = {Corrupted Image Modeling for Self-Supervised Visual Pre-Training},
  journal      = {CoRR},
  volume       = {abs/2202.03382},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.03382},
  eprinttype    = {arXiv},
  eprint       = {2202.03382},
  timestamp    = {Wed, 09 Feb 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-03382.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2202-07959,
  author       = {Tao Ge and
                  Furu Wei},
  title        = {{EdgeFormer}: {A} Parameter-Efficient Transformer for On-Device Seq2seq
                  Generation},
  journal      = {CoRR},
  volume       = {abs/2202.07959},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.07959},
  eprinttype    = {arXiv},
  eprint       = {2202.07959},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-07959.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2202-08772,
  author       = {Da Yin and
                  Li Dong and
                  Hao Cheng and
                  Xiaodong Liu and
                  Kai{-}Wei Chang and
                  Furu Wei and
                  Jianfeng Gao},
  title        = {A Survey of Knowledge-Intensive {NLP} with Pre-Trained Language Models},
  journal      = {CoRR},
  volume       = {abs/2202.08772},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.08772},
  eprinttype    = {arXiv},
  eprint       = {2202.08772},
  timestamp    = {Thu, 11 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-08772.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2202-11451,
  author       = {Lianzhe Huang and
                  Shuming Ma and
                  Dongdong Zhang and
                  Furu Wei and
                  Houfeng Wang},
  title        = {Zero-shot Cross-lingual Transfer of Prompt-based Tuning with a Unified
                  Multilingual Prompt},
  journal      = {CoRR},
  volume       = {abs/2202.11451},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.11451},
  eprinttype    = {arXiv},
  eprint       = {2202.11451},
  timestamp    = {Wed, 02 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-11451.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2202-13257,
  author       = {Jing Qian and
                  Li Dong and
                  Yelong Shen and
                  Furu Wei and
                  Weizhu Chen},
  title        = {Controllable Natural Language Generation with Contrastive Prefixes},
  journal      = {CoRR},
  volume       = {abs/2202.13257},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.13257},
  eprinttype    = {arXiv},
  eprint       = {2202.13257},
  timestamp    = {Wed, 02 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-13257.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2203-00555,
  author       = {Hongyu Wang and
                  Shuming Ma and
                  Li Dong and
                  Shaohan Huang and
                  Dongdong Zhang and
                  Furu Wei},
  title        = {{DeepNet}: Scaling Transformers to 1,000 Layers},
  journal      = {CoRR},
  volume       = {abs/2203.00555},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.00555},
  doi          = {10.48550/ARXIV.2203.00555},
  eprinttype    = {arXiv},
  eprint       = {2203.00555},
  timestamp    = {Tue, 20 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-00555.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2203-02378,
  author       = {Junlong Li and
                  Yiheng Xu and
                  Tengchao Lv and
                  Lei Cui and
                  Cha Zhang and
                  Furu Wei},
  title        = {{DiT}: Self-supervised Pre-training for Document Image Transformer},
  journal      = {CoRR},
  volume       = {abs/2203.02378},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.02378},
  doi          = {10.48550/ARXIV.2203.02378},
  eprinttype    = {arXiv},
  eprint       = {2203.02378},
  timestamp    = {Wed, 16 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-02378.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2203-07190,
  author       = {Haoyu Song and
                  Li Dong and
                  Wei{-}Nan Zhang and
                  Ting Liu and
                  Furu Wei},
  title        = {{CLIP} Models are Few-shot Learners: Empirical Studies on {VQA} and
                  Visual Entailment},
  journal      = {CoRR},
  volume       = {abs/2203.07190},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.07190},
  doi          = {10.48550/ARXIV.2203.07190},
  eprinttype    = {arXiv},
  eprint       = {2203.07190},
  timestamp    = {Fri, 18 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-07190.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2203-16487,
  author       = {Heming Xia and
                  Tao Ge and
                  Furu Wei and
                  Zhifang Sui},
  title        = {Lossless Speedup of Autoregressive Translation with Generalized Aggressive
                  Decoding},
  journal      = {CoRR},
  volume       = {abs/2203.16487},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.16487},
  doi          = {10.48550/ARXIV.2203.16487},
  eprinttype    = {arXiv},
  eprint       = {2203.16487},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-16487.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2203-17113,
  author       = {Junyi Ao and
                  Ziqiang Zhang and
                  Long Zhou and
                  Shujie Liu and
                  Haizhou Li and
                  Tom Ko and
                  Lirong Dai and
                  Jinyu Li and
                  Yao Qian and
                  Furu Wei},
  title        = {Pre-Training Transformer Decoder for End-to-End {ASR} Model with Unpaired
                  Speech Data},
  journal      = {CoRR},
  volume       = {abs/2203.17113},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.17113},
  doi          = {10.48550/ARXIV.2203.17113},
  eprinttype    = {arXiv},
  eprint       = {2203.17113},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-17113.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2204-03240,
  author       = {Shuo Ren and
                  Shujie Liu and
                  Yu Wu and
                  Long Zhou and
                  Furu Wei},
  title        = {Speech Pre-training with Acoustic Piece},
  journal      = {CoRR},
  volume       = {abs/2204.03240},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2204.03240},
  doi          = {10.48550/ARXIV.2204.03240},
  eprinttype    = {arXiv},
  eprint       = {2204.03240},
  timestamp    = {Mon, 30 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2204-03240.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2204-08387,
  author     = {Yupan Huang and
                Tengchao Lv and
                Lei Cui and
                Yutong Lu and
                Furu Wei},
  title      = {{LayoutLMv3}: Pre-training for Document {AI} with Unified Text and Image Masking},
  journal    = {CoRR},
  volume     = {abs/2204.08387},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2204.08387},
  doi        = {10.48550/ARXIV.2204.08387},
  eprinttype = {arXiv},
  eprint     = {2204.08387},
  timestamp  = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-08387.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2204-08396,
  author     = {Damai Dai and
                Li Dong and
                Shuming Ma and
                Bo Zheng and
                Zhifang Sui and
                Baobao Chang and
                Furu Wei},
  title      = {{StableMoE}: Stable Routing Strategy for Mixture of Experts},
  journal    = {CoRR},
  volume     = {abs/2204.08396},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2204.08396},
  doi        = {10.48550/ARXIV.2204.08396},
  eprinttype = {arXiv},
  eprint     = {2204.08396},
  timestamp  = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-08396.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2204-09179,
  author     = {Zewen Chi and
                Li Dong and
                Shaohan Huang and
                Damai Dai and
                Shuming Ma and
                Barun Patra and
                Saksham Singhal and
                Payal Bajaj and
                Xia Song and
                Furu Wei},
  title      = {On the Representation Collapse of Sparse Mixture of Experts},
  journal    = {CoRR},
  volume     = {abs/2204.09179},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2204.09179},
  doi        = {10.48550/ARXIV.2204.09179},
  eprinttype = {arXiv},
  eprint     = {2204.09179},
  timestamp  = {Mon, 25 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-09179.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2204-12765,
  author     = {Sanyuan Chen and
                Yu Wu and
                Chengyi Wang and
                Shujie Liu and
                Zhuo Chen and
                Peidong Wang and
                Gang Liu and
                Jinyu Li and
                Jian Wu and
                Xiangzhan Yu and
                Furu Wei},
  title      = {Why does Self-Supervised Learning for Speech Recognition Benefit Speaker Recognition?},
  journal    = {CoRR},
  volume     = {abs/2204.12765},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2204.12765},
  doi        = {10.48550/ARXIV.2204.12765},
  eprinttype = {arXiv},
  eprint     = {2204.12765},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-12765.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2204-13512,
  author     = {Ruipeng Jia and
                Xingxing Zhang and
                Yanan Cao and
                Shi Wang and
                Zheng Lin and
                Furu Wei},
  title      = {Neural Label Search for Zero-Shot Multi-Lingual Extractive Summarization},
  journal    = {CoRR},
  volume     = {abs/2204.13512},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2204.13512},
  doi        = {10.48550/ARXIV.2204.13512},
  eprinttype = {arXiv},
  eprint     = {2204.13512},
  timestamp  = {Mon, 02 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-13512.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2205-10178,
  author     = {Weizhi Wang and
                Li Dong and
                Hao Cheng and
                Haoyu Song and
                Xiaodong Liu and
                Xifeng Yan and
                Jianfeng Gao and
                Furu Wei},
  title      = {Visually-Augmented Language Modeling},
  journal    = {CoRR},
  volume     = {abs/2205.10178},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2205.10178},
  doi        = {10.48550/ARXIV.2205.10178},
  eprinttype = {arXiv},
  eprint     = {2205.10178},
  timestamp  = {Thu, 11 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-10178.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2205-10183,
  author     = {Zhixiong Han and
                Yaru Hao and
                Li Dong and
                Furu Wei},
  title      = {Prototypical Calibration for Few-shot Learning of Language Models},
  journal    = {CoRR},
  volume     = {abs/2205.10183},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2205.10183},
  doi        = {10.48550/ARXIV.2205.10183},
  eprinttype = {arXiv},
  eprint     = {2205.10183},
  timestamp  = {Tue, 31 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-10183.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2205-10350,
  author     = {Tao Ge and
                Heming Xia and
                Xin Sun and
                Si{-}Qing Chen and
                Furu Wei},
  title      = {Lossless Acceleration for Seq2seq Generation with Aggressive Decoding},
  journal    = {CoRR},
  volume     = {abs/2205.10350},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2205.10350},
  doi        = {10.48550/ARXIV.2205.10350},
  eprinttype = {arXiv},
  eprint     = {2205.10350},
  timestamp  = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-10350.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2206-00216,
  author     = {Tianyu Chen and
                Hangbo Bao and
                Shaohan Huang and
                Li Dong and
                Binxing Jiao and
                Daxin Jiang and
                Haoyi Zhou and
                Jianxin Li and
                Furu Wei},
  title      = {{THE-X:} Privacy-Preserving Transformer Inference with Homomorphic Encryption},
  journal    = {CoRR},
  volume     = {abs/2206.00216},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.00216},
  doi        = {10.48550/ARXIV.2206.00216},
  eprinttype = {arXiv},
  eprint     = {2206.00216},
  timestamp  = {Mon, 01 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-00216.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2206-00277,
  author     = {Tianyu Chen and
                Shaohan Huang and
                Yuan Xie and
                Binxing Jiao and
                Daxin Jiang and
                Haoyi Zhou and
                Jianxin Li and
                Furu Wei},
  title      = {Task-Specific Expert Pruning for Sparse Mixture-of-Experts},
  journal    = {CoRR},
  volume     = {abs/2206.00277},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.00277},
  doi        = {10.48550/ARXIV.2206.00277},
  eprinttype = {arXiv},
  eprint     = {2206.00277},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-00277.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2206-01127,
  author     = {Hangbo Bao and
                Wenhui Wang and
                Li Dong and
                Furu Wei},
  title      = {{VL-BEiT}: Generative Vision-Language Pretraining},
  journal    = {CoRR},
  volume     = {abs/2206.01127},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.01127},
  doi        = {10.48550/ARXIV.2206.01127},
  eprinttype = {arXiv},
  eprint     = {2206.01127},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-01127.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2206-05777,
  author     = {Ziqiang Zhang and
                Junyi Ao and
                Long Zhou and
                Shujie Liu and
                Furu Wei and
                Jinyu Li},
  title      = {The {YiTrans} End-to-End Speech Translation System for {IWSLT} 2022 Offline Shared Task},
  journal    = {CoRR},
  volume     = {abs/2206.05777},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.05777},
  doi        = {10.48550/ARXIV.2206.05777},
  eprinttype = {arXiv},
  eprint     = {2206.05777},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-05777.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2206-06336,
  author     = {Yaru Hao and
                Haoyu Song and
                Li Dong and
                Shaohan Huang and
                Zewen Chi and
                Wenhui Wang and
                Shuming Ma and
                Furu Wei},
  title      = {Language Models are General-Purpose Interfaces},
  journal    = {CoRR},
  volume     = {abs/2206.06336},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.06336},
  doi        = {10.48550/ARXIV.2206.06336},
  eprinttype = {arXiv},
  eprint     = {2206.06336},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-06336.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2206-10125,
  author     = {Chengyi Wang and
                Yiming Wang and
                Yu Wu and
                Sanyuan Chen and
                Jinyu Li and
                Shujie Liu and
                Furu Wei},
  title      = {Supervision-Guided Codebooks for Masked Prediction in Speech Pre-training},
  journal    = {CoRR},
  volume     = {abs/2206.10125},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.10125},
  doi        = {10.48550/ARXIV.2206.10125},
  eprinttype = {arXiv},
  eprint     = {2206.10125},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-10125.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2207-02578,
  author     = {Liang Wang and
                Nan Yang and
                Xiaolong Huang and
                Binxing Jiao and
                Linjun Yang and
                Daxin Jiang and
                Rangan Majumder and
                Furu Wei},
  title      = {{SimLM}: Pre-training with Representation Bottleneck for Dense Passage Retrieval},
  journal    = {CoRR},
  volume     = {abs/2207.02578},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2207.02578},
  doi        = {10.48550/ARXIV.2207.02578},
  eprinttype = {arXiv},
  eprint     = {2207.02578},
  timestamp  = {Mon, 01 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2207-02578.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2207-04900,
  author     = {Jian Yang and
                Yuwei Yin and
                Shuming Ma and
                Dongdong Zhang and
                Shuangzhi Wu and
                Hongcheng Guo and
                Zhoujun Li and
                Furu Wei},
  title      = {{UM4:} Unified Multilingual Multiple Teacher-Student Model for Zero-Resource Neural Machine Translation},
  journal    = {CoRR},
  volume     = {abs/2207.04900},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2207.04900},
  doi        = {10.48550/ARXIV.2207.04900},
  eprinttype = {arXiv},
  eprint     = {2207.04900},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2207-04900.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2207-04906,
  author     = {Jian Yang and
                Yuwei Yin and
                Shuming Ma and
                Dongdong Zhang and
                Zhoujun Li and
                Furu Wei},
  title      = {{HLT-MT:} High-resource Language-specific Training for Multilingual Neural Machine Translation},
  journal    = {CoRR},
  volume     = {abs/2207.04906},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2207.04906},
  doi        = {10.48550/ARXIV.2207.04906},
  eprinttype = {arXiv},
  eprint     = {2207.04906},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2207-04906.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2207-09094,
  author     = {Yuan Xie and
                Shaohan Huang and
                Tianyu Chen and
                Furu Wei},
  title      = {{MoEC}: Mixture of Expert Clusters},
  journal    = {CoRR},
  volume     = {abs/2207.09094},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2207.09094},
  doi        = {10.48550/ARXIV.2207.09094},
  eprinttype = {arXiv},
  eprint     = {2207.09094},
  timestamp  = {Mon, 25 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2207-09094.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2207-14467,
  author     = {Jian Yang and
                Yuwei Yin and
                Shuming Ma and
                Haoyang Huang and
                Dongdong Zhang and
                Furu Wei and
                Zhoujun Li},
  title      = {{GTrans}: Grouping and Fusing Transformer Layers for Neural Machine Translation},
  journal    = {CoRR},
  volume     = {abs/2207.14467},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2207.14467},
  doi        = {10.48550/ARXIV.2207.14467},
  eprinttype = {arXiv},
  eprint     = {2207.14467},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2207-14467.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2208-04232,
  author     = {Zehan Li and
                Nan Yang and
                Liang Wang and
                Furu Wei},
  title      = {Learning Diverse Document Representations with Deep Query Interactions for Dense Retrieval},
  journal    = {CoRR},
  volume     = {abs/2208.04232},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2208.04232},
  doi        = {10.48550/ARXIV.2208.04232},
  eprinttype = {arXiv},
  eprint     = {2208.04232},
  timestamp  = {Wed, 10 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2208-04232.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2208-06366,
  author     = {Zhiliang Peng and
                Li Dong and
                Hangbo Bao and
                Qixiang Ye and
                Furu Wei},
  title      = {{BEiT} v2: Masked Image Modeling with Vector-Quantized Visual Tokenizers},
  journal    = {CoRR},
  volume     = {abs/2208.06366},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2208.06366},
  doi        = {10.48550/ARXIV.2208.06366},
  eprinttype = {arXiv},
  eprint     = {2208.06366},
  timestamp  = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2208-06366.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2208-10442,
  author     = {Wenhui Wang and
                Hangbo Bao and
                Li Dong and
                Johan Bjorck and
                Zhiliang Peng and
                Qiang Liu and
                Kriti Aggarwal and
                Owais Khan Mohammed and
                Saksham Singhal and
                Subhojit Som and
                Furu Wei},
  title      = {Image as a Foreign Language: {BEiT} Pretraining for All Vision and Vision-Language Tasks},
  journal    = {CoRR},
  volume     = {abs/2208.10442},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2208.10442},
  doi        = {10.48550/ARXIV.2208.10442},
  eprinttype = {arXiv},
  eprint     = {2208.10442},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2208-10442.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2209-13940,
  author     = {Hongyuan Lu and
                Haoyang Huang and
                Shuming Ma and
                Dongdong Zhang and
                Furu Wei and
                Wai Lam},
  title      = {Towards Multilingual Transitivity and Bidirectional Multilingual Agreement for Multilingual Document-level Machine Translation},
  journal    = {CoRR},
  volume     = {abs/2209.13940},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2209.13940},
  doi        = {10.48550/ARXIV.2209.13940},
  eprinttype = {arXiv},
  eprint     = {2209.13940},
  timestamp  = {Thu, 06 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2209-13940.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2210-02849,
  author     = {Jingye Chen and
                Tengchao Lv and
                Lei Cui and
                Cha Zhang and
                Furu Wei},
  title      = {{XDoc}: Unified Pre-training for Cross-Format Document Understanding},
  journal    = {CoRR},
  volume     = {abs/2210.02849},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.02849},
  doi        = {10.48550/ARXIV.2210.02849},
  eprinttype = {arXiv},
  eprint     = {2210.02849},
  timestamp  = {Fri, 07 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-02849.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2210-03730,
  author     = {Ziqiang Zhang and
                Long Zhou and
                Junyi Ao and
                Shujie Liu and
                Lirong Dai and
                Jinyu Li and
                Furu Wei},
  title      = {{SpeechUT}: Bridging Speech and Text with Hidden-Unit for Encoder-Decoder Based Speech-Text Pre-training},
  journal    = {CoRR},
  volume     = {abs/2210.03730},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.03730},
  doi        = {10.48550/ARXIV.2210.03730},
  eprinttype = {arXiv},
  eprint     = {2210.03730},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-03730.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2210-06423,
  author     = {Hongyu Wang and
                Shuming Ma and
                Shaohan Huang and
                Li Dong and
                Wenhui Wang and
                Zhiliang Peng and
                Yu Wu and
                Payal Bajaj and
                Saksham Singhal and
                Alon Benhaim and
                Barun Patra and
                Zhun Liu and
                Vishrav Chaudhary and
                Xia Song and
                Furu Wei},
  title      = {Foundation Transformers},
  journal    = {CoRR},
  volume     = {abs/2210.06423},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.06423},
  doi        = {10.48550/ARXIV.2210.06423},
  eprinttype = {arXiv},
  eprint     = {2210.06423},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-06423.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2210-07022,
  author     = {Jian Yang and
                Shaohan Huang and
                Shuming Ma and
                Yuwei Yin and
                Li Dong and
                Dongdong Zhang and
                Hongcheng Guo and
                Zhoujun Li and
                Furu Wei},
  title      = {{CROP:} Zero-shot Cross-lingual Named Entity Recognition with Multilingual Labeled Sequence Translation},
  journal    = {CoRR},
  volume     = {abs/2210.07022},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.07022},
  doi        = {10.48550/ARXIV.2210.07022},
  eprinttype = {arXiv},
  eprint     = {2210.07022},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-07022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2210-09304,
  author     = {Jinghao Zhou and
                Li Dong and
                Zhe Gan and
                Lijuan Wang and
                Furu Wei},
  title      = {Non-Contrastive Learning Meets Language-Image Pre-Training},
  journal    = {CoRR},
  volume     = {abs/2210.09304},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.09304},
  doi        = {10.48550/ARXIV.2210.09304},
  eprinttype = {arXiv},
  eprint     = {2210.09304},
  timestamp  = {Wed, 19 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-09304.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2210-10615,
  author     = {Zhiliang Peng and
                Li Dong and
                Hangbo Bao and
                Qixiang Ye and
                Furu Wei},
  title      = {A Unified View of Masked Image Modeling},
  journal    = {CoRR},
  volume     = {abs/2210.10615},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.10615},
  doi        = {10.48550/ARXIV.2210.10615},
  eprinttype = {arXiv},
  eprint     = {2210.10615},
  timestamp  = {Tue, 25 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-10615.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2210-14867,
  author     = {Barun Patra and
                Saksham Singhal and
                Shaohan Huang and
                Zewen Chi and
                Li Dong and
                Furu Wei and
                Vishrav Chaudhary and
                Xia Song},
  title      = {Beyond {English}-Centric Bitexts for Better Multilingual Language Representation Learning},
  journal    = {CoRR},
  volume     = {abs/2210.14867},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.14867},
  doi        = {10.48550/ARXIV.2210.14867},
  eprinttype = {arXiv},
  eprint     = {2210.14867},
  timestamp  = {Wed, 02 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-14867.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2210-15461,
  author     = {Hongcheng Guo and
                Jiaheng Liu and
                Haoyang Huang and
                Jian Yang and
                Zhoujun Li and
                Dongdong Zhang and
                Furu Wei},
  title      = {{LVP-M3:} Language-aware Visual Prompt for Multilingual Multimodal Machine Translation},
  journal    = {CoRR},
  volume     = {abs/2210.15461},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.15461},
  doi        = {10.48550/ARXIV.2210.15461},
  eprinttype = {arXiv},
  eprint     = {2210.15461},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-15461.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2210-17027,
  author     = {Kun Wei and
                Long Zhou and
                Ziqiang Zhang and
                Liping Chen and
                Shujie Liu and
                Lei He and
                Jinyu Li and
                Furu Wei},
  title      = {Joint Pre-Training with Speech and Bilingual Text for Direct Speech to Speech Translation},
  journal    = {CoRR},
  volume     = {abs/2210.17027},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.17027},
  doi        = {10.48550/ARXIV.2210.17027},
  eprinttype = {arXiv},
  eprint     = {2210.17027},
  timestamp  = {Thu, 11 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-17027.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2211-01837,
  author     = {Yubo Zhang and
                Xingxing Zhang and
                Xun Wang and
                Si{-}qing Chen and
                Furu Wei},
  title      = {Latent Prompt Tuning for Text Summarization},
  journal    = {CoRR},
  volume     = {abs/2211.01837},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.01837},
  doi        = {10.48550/ARXIV.2211.01837},
  eprinttype = {arXiv},
  eprint     = {2211.01837},
  timestamp  = {Fri, 04 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-01837.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2211-11275,
  author     = {Qiu{-}Shi Zhu and
                Long Zhou and
                Ziqiang Zhang and
                Shujie Liu and
                Binxing Jiao and
                Jie Zhang and
                Lirong Dai and
                Daxin Jiang and
                Jinyu Li and
                Furu Wei},
  title      = {{VATLM:} Visual-Audio-Text Pre-Training with Unified Masked Prediction for Speech Representation Learning},
  journal    = {CoRR},
  volume     = {abs/2211.11275},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.11275},
  doi        = {10.48550/ARXIV.2211.11275},
  eprinttype = {arXiv},
  eprint     = {2211.11275},
  timestamp  = {Tue, 23 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-11275.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2211-13184,
  author     = {Shuming Ma and
                Hongyu Wang and
                Shaohan Huang and
                Wenhui Wang and
                Zewen Chi and
                Li Dong and
                Alon Benhaim and
                Barun Patra and
                Vishrav Chaudhary and
                Xia Song and
                Furu Wei},
  title      = {{TorchScale}: Transformers at Scale},
  journal    = {CoRR},
  volume     = {abs/2211.13184},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.13184},
  doi        = {10.48550/ARXIV.2211.13184},
  eprinttype = {arXiv},
  eprint     = {2211.13184},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-13184.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2212-00616,
  author     = {Tao Ge and
                Jing Hu and
                Li Dong and
                Shaoguang Mao and
                Yan Xia and
                Xun Wang and
                Si{-}Qing Chen and
                Furu Wei},
  title      = {Extensible Prompts for Language Models},
  journal    = {CoRR},
  volume     = {abs/2212.00616},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.00616},
  doi        = {10.48550/ARXIV.2212.00616},
  eprinttype = {arXiv},
  eprint     = {2212.00616},
  timestamp  = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-00616.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2212-03533,
  author     = {Liang Wang and
                Nan Yang and
                Xiaolong Huang and
                Binxing Jiao and
                Linjun Yang and
                Daxin Jiang and
                Rangan Majumder and
                Furu Wei},
  title      = {Text Embeddings by Weakly-Supervised Contrastive Pre-training},
  journal    = {CoRR},
  volume     = {abs/2212.03533},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.03533},
  doi        = {10.48550/ARXIV.2212.03533},
  eprinttype = {arXiv},
  eprint     = {2212.03533},
  timestamp  = {Fri, 23 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-03533.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2212-04257,
  author     = {Xingxing Zhang and
                Yiran Liu and
                Xun Wang and
                Pengcheng He and
                Yang Yu and
                Si{-}Qing Chen and
                Wayne Xiong and
                Furu Wei},
  title      = {Momentum Calibration for Text Generation},
  journal    = {CoRR},
  volume     = {abs/2212.04257},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.04257},
  doi        = {10.48550/ARXIV.2212.04257},
  eprinttype = {arXiv},
  eprint     = {2212.04257},
  timestamp  = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-04257.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2212-06713,
  author     = {Yaru Hao and
                Yutao Sun and
                Li Dong and
                Zhixiong Han and
                Yuxian Gu and
                Furu Wei},
  title      = {Structured Prompting: Scaling In-Context Learning to 1,000 Examples},
  journal    = {CoRR},
  volume     = {abs/2212.06713},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.06713},
  doi        = {10.48550/ARXIV.2212.06713},
  eprinttype = {arXiv},
  eprint     = {2212.06713},
  timestamp  = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-06713.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2212-07752,
  author       = {Lu, Hongyuan and
                  Huang, Haoyang and
                  Ma, Shuming and
                  Zhang, Dongdong and
                  Lam, Wai and
                  Wei, Furu},
  title        = {{TRIP}: Triangular Document-level Pre-training for Multilingual Language
                  Models},
  journal      = {CoRR},
  volume       = {abs/2212.07752},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2212.07752},
  doi          = {10.48550/ARXIV.2212.07752},
  url          = {https://doi.org/10.48550/arXiv.2212.07752},
  timestamp    = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-07752.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2212-09058,
  author       = {Chen, Sanyuan and
                  Wu, Yu and
                  Wang, Chengyi and
                  Liu, Shujie and
                  Tompkins, Daniel and
                  Chen, Zhuo and
                  Wei, Furu},
  title        = {{BEATs}: Audio Pre-Training with Acoustic Tokenizers},
  journal      = {CoRR},
  volume       = {abs/2212.09058},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2212.09058},
  doi          = {10.48550/ARXIV.2212.09058},
  url          = {https://doi.org/10.48550/arXiv.2212.09058},
  timestamp    = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-09058.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2212-09611,
  author       = {Hao, Yaru and
                  Chi, Zewen and
                  Dong, Li and
                  Wei, Furu},
  title        = {Optimizing Prompts for Text-to-Image Generation},
  journal      = {CoRR},
  volume       = {abs/2212.09611},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2212.09611},
  doi          = {10.48550/ARXIV.2212.09611},
  url          = {https://doi.org/10.48550/arXiv.2212.09611},
  timestamp    = {Tue, 03 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-09611.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2212-10190,
  author       = {Wang, Xun and
                  Ge, Tao and
                  Mao, Allen and
                  Li, Yuki and
                  Wei, Furu and
                  Chen, Si{-}Qing},
  title        = {Pay Attention to Your Tone: Introducing a New Dataset for Polite Language
                  Rewrite},
  journal      = {CoRR},
  volume       = {abs/2212.10190},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2212.10190},
  doi          = {10.48550/ARXIV.2212.10190},
  url          = {https://doi.org/10.48550/arXiv.2212.10190},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-10190.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2212-10218,
  author       = {Yang, Jian and
                  Ma, Shuming and
                  Dong, Li and
                  Huang, Shaohan and
                  Huang, Haoyang and
                  Yin, Yuwei and
                  Zhang, Dongdong and
                  Yang, Liqun and
                  Li, Zhoujun and
                  Wei, Furu},
  title        = {{GanLM}: Encoder-Decoder Pre-training with an Auxiliary Discriminator},
  journal      = {CoRR},
  volume       = {abs/2212.10218},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2212.10218},
  doi          = {10.48550/ARXIV.2212.10218},
  url          = {https://doi.org/10.48550/arXiv.2212.10218},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-10218.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2212-10554,
  author       = {Sun, Yutao and
                  Dong, Li and
                  Patra, Barun and
                  Ma, Shuming and
                  Huang, Shaohan and
                  Benhaim, Alon and
                  Chaudhary, Vishrav and
                  Song, Xia and
                  Wei, Furu},
  title        = {A Length-Extrapolatable Transformer},
  journal      = {CoRR},
  volume       = {abs/2212.10554},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2212.10554},
  doi          = {10.48550/ARXIV.2212.10554},
  url          = {https://doi.org/10.48550/arXiv.2212.10554},
  timestamp    = {Wed, 04 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-10554.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2212-10559,
  author       = {Dai, Damai and
                  Sun, Yutao and
                  Dong, Li and
                  Hao, Yaru and
                  Sui, Zhifang and
                  Wei, Furu},
  title        = {Why Can {GPT} Learn In-Context? Language Models Secretly Perform Gradient
                  Descent as Meta-Optimizers},
  journal      = {CoRR},
  volume       = {abs/2212.10559},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2212.10559},
  doi          = {10.48550/ARXIV.2212.10559},
  url          = {https://doi.org/10.48550/arXiv.2212.10559},
  timestamp    = {Wed, 04 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-10559.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2212-10923,
  author       = {Yang, Zonglin and
                  Dong, Li and
                  Du, Xinya and
                  Cheng, Hao and
                  Cambria, Erik and
                  Liu, Xiaodong and
                  Gao, Jianfeng and
                  Wei, Furu},
  title        = {Language Models as Inductive Reasoners},
  journal      = {CoRR},
  volume       = {abs/2212.10923},
  year         = {2022},
  eprinttype   = {arXiv},
  eprint       = {2212.10923},
  doi          = {10.48550/ARXIV.2212.10923},
  url          = {https://doi.org/10.48550/arXiv.2212.10923},
  timestamp    = {Thu, 11 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-10923.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/Hao0W021,
  author       = {Hao, Yaru and
                  Dong, Li and
                  Wei, Furu and
                  Xu, Ke},
  title        = {Self-Attention Attribution: Interpreting Information Interactions
                  Inside Transformer},
  booktitle    = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2021, Thirty-Third Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2021, The Eleventh Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2021, Virtual Event, February 2-9,
                  2021},
  pages        = {12963--12971},
  publisher    = {{AAAI} Press},
  year         = {2021},
  doi          = {10.1609/AAAI.V35I14.17533},
  url          = {https://doi.org/10.1609/aaai.v35i14.17533},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/Hao0W021.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/YangYMHZLW20,
  author       = {Yang, Jian and
                  Yin, Yuwei and
                  Ma, Shuming and
                  Huang, Haoyang and
                  Zhang, Dongdong and
                  Li, Zhoujun and
                  Wei, Furu},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {Multilingual Agreement for Multilingual Neural Machine Translation},
  booktitle    = {Proceedings of the 59th Annual Meeting of the Association for Computational
                  Linguistics and the 11th International Joint Conference on Natural
                  Language Processing, {ACL/IJCNLP} 2021, (Volume 2: Short Papers),
                  Virtual Event, August 1-6, 2021},
  pages        = {233--239},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.ACL-SHORT.31},
  url          = {https://doi.org/10.18653/v1/2021.acl-short.31},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/YangYMHZLW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/YaoHWDW21,
  author       = {Yao, Yunzhi and
                  Huang, Shaohan and
                  Wang, Wenhui and
                  Dong, Li and
                  Wei, Furu},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {Adapt-and-Distill: Developing Small, Fast and Effective Pretrained
                  Language Models for Domains},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL/IJCNLP}
                  2021, Online Event, August 1-6, 2021},
  series       = {Findings of {ACL}},
  volume       = {{ACL/IJCNLP} 2021},
  pages        = {460--470},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.FINDINGS-ACL.40},
  url          = {https://doi.org/10.18653/v1/2021.findings-acl.40},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/YaoHWDW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/TangZBLWZY21,
  author       = {Tang, Yu and
                  Zhou, Long and
                  Blanco, Ambrosio and
                  Liu, Shujie and
                  Wei, Furu and
                  Zhou, Ming and
                  Yang, Muyun},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {Grammar-Based Patches Generation for Automated Program Repair},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL/IJCNLP}
                  2021, Online Event, August 1-6, 2021},
  series       = {Findings of {ACL}},
  volume       = {{ACL/IJCNLP} 2021},
  pages        = {1300--1305},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.FINDINGS-ACL.111},
  url          = {https://doi.org/10.18653/v1/2021.findings-acl.111},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/TangZBLWZY21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/WangBHDW21,
  author       = {Wang, Wenhui and
                  Bao, Hangbo and
                  Huang, Shaohan and
                  Dong, Li and
                  Wei, Furu},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {{MiniLMv2}: Multi-Head Self-Attention Relation Distillation for Compressing
                  Pretrained Transformers},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL/IJCNLP}
                  2021, Online Event, August 1-6, 2021},
  series       = {Findings of {ACL}},
  volume       = {{ACL/IJCNLP} 2021},
  pages        = {2140--2151},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.FINDINGS-ACL.188},
  url          = {https://doi.org/10.18653/v1/2021.findings-acl.188},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/WangBHDW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/XuXL0WWLFZCZZ20,
  author       = {Xu, Yang and
                  Xu, Yiheng and
                  Lv, Tengchao and
                  Cui, Lei and
                  Wei, Furu and
                  Wang, Guoxin and
                  Lu, Yijuan and
                  Flor{\^{e}}ncio, Dinei A. F. and
                  Zhang, Cha and
                  Che, Wanxiang and
                  Zhang, Min and
                  Zhou, Lidong},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {{LayoutLMv2}: Multi-modal Pre-training for Visually-rich Document Understanding},
  booktitle    = {Proceedings of the 59th Annual Meeting of the Association for Computational
                  Linguistics and the 11th International Joint Conference on Natural
                  Language Processing, {ACL/IJCNLP} 2021, (Volume 1: Long Papers), Virtual
                  Event, August 1-6, 2021},
  pages        = {2579--2591},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.ACL-LONG.201},
  url          = {https://doi.org/10.18653/v1/2021.acl-long.201},
  timestamp    = {Wed, 31 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/XuXL0WWLFZCZZ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/Zheng0HWCSC0SW20,
  author       = {Zheng, Bo and
                  Dong, Li and
                  Huang, Shaohan and
                  Wang, Wenhui and
                  Chi, Zewen and
                  Singhal, Saksham and
                  Che, Wanxiang and
                  Liu, Ting and
                  Song, Xia and
                  Wei, Furu},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {Consistency Regularization for Cross-Lingual Fine-Tuning},
  booktitle    = {Proceedings of the 59th Annual Meeting of the Association for Computational
                  Linguistics and the 11th International Joint Conference on Natural
                  Language Processing, {ACL/IJCNLP} 2021, (Volume 1: Long Papers), Virtual
                  Event, August 1-6, 2021},
  pages        = {3403--3417},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.ACL-LONG.264},
  url          = {https://doi.org/10.18653/v1/2021.acl-long.264},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/Zheng0HWCSC0SW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/Chi0ZHMHW20,
  author       = {Chi, Zewen and
                  Dong, Li and
                  Zheng, Bo and
                  Huang, Shaohan and
                  Mao, Xian{-}Ling and
                  Huang, Heyan and
                  Wei, Furu},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {Improving Pretrained Cross-Lingual Language Models via Self-Labeled
                  Word Alignment},
  booktitle    = {Proceedings of the 59th Annual Meeting of the Association for Computational
                  Linguistics and the 11th International Joint Conference on Natural
                  Language Processing, {ACL/IJCNLP} 2021, (Volume 1: Long Papers), Virtual
                  Event, August 1-6, 2021},
  pages        = {3418--3430},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.ACL-LONG.265},
  url          = {https://doi.org/10.18653/v1/2021.acl-long.265},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/Chi0ZHMHW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ZhaoDSZWC21,
  author       = {Zhao, Yuekai and
                  Dong, Li and
                  Shen, Yelong and
                  Zhang, Zhihua and
                  Wei, Furu and
                  Chen, Weizhu},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {Memory-Efficient Differentiable Transformer Architecture Search},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL/IJCNLP}
                  2021, Online Event, August 1-6, 2021},
  series       = {Findings of {ACL}},
  volume       = {{ACL/IJCNLP} 2021},
  pages        = {4254--4264},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.FINDINGS-ACL.372},
  url          = {https://doi.org/10.18653/v1/2021.findings-acl.372},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ZhaoDSZWC21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/HaoDBXW21,
  author       = {Hao, Yaru and
                  Dong, Li and
                  Bao, Hangbo and
                  Xu, Ke and
                  Wei, Furu},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {Learning to Sample Replacements for {ELECTRA} Pre-Training},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL/IJCNLP}
                  2021, Online Event, August 1-6, 2021},
  series       = {Findings of {ACL}},
  volume       = {{ACL/IJCNLP} 2021},
  pages        = {4495--4506},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.FINDINGS-ACL.394},
  url          = {https://doi.org/10.18653/v1/2021.findings-acl.394},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/HaoDBXW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/RenZ0W0020,
  author       = {Ren, Shuo and
                  Zhou, Long and
                  Liu, Shujie and
                  Wei, Furu and
                  Zhou, Ming and
                  Ma, Shuai},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {{SemFace}: Pre-training Encoder and Decoder with a Semantic Interface
                  for Neural Machine Translation},
  booktitle    = {Proceedings of the 59th Annual Meeting of the Association for Computational
                  Linguistics and the 11th International Joint Conference on Natural
                  Language Processing, {ACL/IJCNLP} 2021, (Volume 1: Long Papers), Virtual
                  Event, August 1-6, 2021},
  pages        = {4518--4527},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.ACL-LONG.348},
  url          = {https://doi.org/10.18653/v1/2021.acl-long.348},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/RenZ0W0020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/SunGWW20,
  author       = {Sun, Xin and
                  Ge, Tao and
                  Wei, Furu and
                  Wang, Houfeng},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {Instantaneous Grammatical Error Correction with Shallow Aggressive
                  Decoding},
  booktitle    = {Proceedings of the 59th Annual Meeting of the Association for Computational
                  Linguistics and the 11th International Joint Conference on Natural
                  Language Processing, {ACL/IJCNLP} 2021, (Volume 1: Long Papers), Virtual
                  Event, August 1-6, 2021},
  pages        = {5937--5947},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.ACL-LONG.462},
  url          = {https://doi.org/10.18653/v1/2021.acl-long.462},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/SunGWW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/YangWJJY20,
  author       = {Yang, Nan and
                  Wei, Furu and
                  Jiao, Binxing and
                  Jiang, Daxing and
                  Yang, Linjun},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {{xMoCo}: Cross Momentum Contrastive Learning for Open-Domain Question
                  Answering},
  booktitle    = {Proceedings of the 59th Annual Meeting of the Association for Computational
                  Linguistics and the 11th International Joint Conference on Natural
                  Language Processing, {ACL/IJCNLP} 2021, (Volume 1: Long Papers), Virtual
                  Event, August 1-6, 2021},
  pages        = {6120--6129},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.ACL-LONG.477},
  url          = {https://doi.org/10.18653/v1/2021.acl-long.477},
  timestamp    = {Thu, 28 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/YangWJJY20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ChenMC00PWW21,
  author       = {Chen, Guanhua and
                  Ma, Shuming and
                  Chen, Yun and
                  Dong, Li and
                  Zhang, Dongdong and
                  Pan, Jia and
                  Wang, Wenping and
                  Wei, Furu},
  editor       = {Moens, Marie{-}Francine and
                  Huang, Xuanjing and
                  Specia, Lucia and
                  Yih, Scott Wen{-}tau},
  title        = {Zero-Shot Cross-Lingual Transfer of Neural Machine Translation with
                  Multilingual Pretrained Encoders},
  booktitle    = {Proceedings of the 2021 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2021, Virtual Event / Punta Cana, Dominican
                  Republic, 7-11 November, 2021},
  pages        = {15--26},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.EMNLP-MAIN.2},
  url          = {https://doi.org/10.18653/v1/2021.emnlp-main.2},
  timestamp    = {Fri, 16 Feb 2024 08:27:36 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/ChenMC00PWW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ZhouGX0W21,
  author       = {Zhou, Wangchunshu and
                  Ge, Tao and
                  Xu, Canwen and
                  Xu, Ke and
                  Wei, Furu},
  editor       = {Moens, Marie{-}Francine and
                  Huang, Xuanjing and
                  Specia, Lucia and
                  Yih, Scott Wen{-}tau},
  title        = {Improving Sequence-to-Sequence Pre-training via Sequence Span Rewriting},
  booktitle    = {Proceedings of the 2021 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2021, Virtual Event / Punta Cana, Dominican
                  Republic, 7-11 November, 2021},
  pages        = {571--582},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.EMNLP-MAIN.45},
  url          = {https://doi.org/10.18653/v1/2021.emnlp-main.45},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/ZhouGX0W21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ChiDMHSMHSW21,
  author       = {Chi, Zewen and
                  Dong, Li and
                  Ma, Shuming and
                  Huang, Shaohan and
                  Singhal, Saksham and
                  Mao, Xian{-}Ling and
                  Huang, Heyan and
                  Song, Xia and
                  Wei, Furu},
  editor       = {Moens, Marie{-}Francine and
                  Huang, Xuanjing and
                  Specia, Lucia and
                  Yih, Scott Wen{-}tau},
  title        = {{mT6}: Multilingual Pretrained Text-to-Text Transformer with Translation
                  Pairs},
  booktitle    = {Proceedings of the 2021 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2021, Virtual Event / Punta Cana, Dominican
                  Republic, 7-11 November, 2021},
  pages        = {1671--1683},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.EMNLP-MAIN.125},
  url          = {https://doi.org/10.18653/v1/2021.emnlp-main.125},
  timestamp    = {Thu, 20 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/ChiDMHSMHSW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ZhengDHSCLSW21,
  author       = {Zheng, Bo and
                  Dong, Li and
                  Huang, Shaohan and
                  Singhal, Saksham and
                  Che, Wanxiang and
                  Liu, Ting and
                  Song, Xia and
                  Wei, Furu},
  editor       = {Moens, Marie{-}Francine and
                  Huang, Xuanjing and
                  Specia, Lucia and
                  Yih, Scott Wen{-}tau},
  title        = {Allocating Large Vocabulary Capacity for Cross-Lingual Language Model
                  Pre-Training},
  booktitle    = {Proceedings of the 2021 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2021, Virtual Event / Punta Cana, Dominican
                  Republic, 7-11 November, 2021},
  pages        = {3203--3215},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.EMNLP-MAIN.257},
  url          = {https://doi.org/10.18653/v1/2021.emnlp-main.257},
  timestamp    = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/ZhengDHSCLSW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/WangX0SW21,
  author       = {Wang, Zilong and
                  Xu, Yiheng and
                  Cui, Lei and
                  Shang, Jingbo and
                  Wei, Furu},
  editor       = {Moens, Marie{-}Francine and
                  Huang, Xuanjing and
                  Specia, Lucia and
                  Yih, Scott Wen{-}tau},
  title        = {{LayoutReader}: Pre-training of Text and Layout for Reading Order Detection},
  booktitle    = {Proceedings of the 2021 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2021, Virtual Event / Punta Cana, Dominican
                  Republic, 7-11 November, 2021},
  pages        = {4735--4744},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.EMNLP-MAIN.389},
  url          = {https://doi.org/10.18653/v1/2021.emnlp-main.389},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/WangX0SW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/BaiZB0W0021,
  author       = {Bai, Jiaqi and
                  Zhou, Long and
                  Blanco, Ambrosio and
                  Liu, Shujie and
                  Wei, Furu and
                  Zhou, Ming and
                  Li, Zhoujun},
  editor       = {Moens, Marie{-}Francine and
                  Huang, Xuanjing and
                  Specia, Lucia and
                  Yih, Scott Wen{-}tau},
  title        = {Jointly Learning to Repair Code and Generate Commit Message},
  booktitle    = {Proceedings of the 2021 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2021, Virtual Event / Punta Cana, Dominican
                  Republic, 7-11 November, 2021},
  pages        = {9784--9795},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.EMNLP-MAIN.771},
  url          = {https://doi.org/10.18653/v1/2021.emnlp-main.771},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/BaiZB0W0021.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/XuZG0MW21,
  author       = {Xu, Canwen and
                  Zhou, Wangchunshu and
                  Ge, Tao and
                  Xu, Ke and
                  McAuley, Julian J. and
                  Wei, Furu},
  editor       = {Moens, Marie{-}Francine and
                  Huang, Xuanjing and
                  Specia, Lucia and
                  Yih, Scott Wen{-}tau},
  title        = {Beyond Preserved Accuracy: Evaluating Loyalty and Robustness of {BERT}
                  Compression},
  booktitle    = {Proceedings of the 2021 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2021, Virtual Event / Punta Cana, Dominican
                  Republic, 7-11 November, 2021},
  pages        = {10653--10659},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.EMNLP-MAIN.832},
  url          = {https://doi.org/10.18653/v1/2021.emnlp-main.832},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/XuZG0MW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/0002WQK0WZ021,
  author       = {Wang, Chengyi and
                  Wu, Yu and
                  Qian, Yao and
                  Kumatani, Ken'ichi and
                  Liu, Shujie and
                  Wei, Furu and
                  Zeng, Michael and
                  Huang, Xuedong},
  editor       = {Meila, Marina and
                  Zhang, Tong},
  title        = {{UniSpeech}: Unified Speech Representation Learning with Labeled and
                  Unlabeled Data},
  booktitle    = {Proceedings of the 38th International Conference on Machine Learning,
                  {ICML} 2021, 18-24 July 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {139},
  pages        = {10937--10947},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {http://proceedings.mlr.press/v139/wang21y.html},
  timestamp    = {Thu, 12 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/0002WQK0WZ021.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/naacl/XuZGXMW21,
  author       = {Xu, Canwen and
                  Zhou, Wangchunshu and
                  Ge, Tao and
                  Xu, Ke and
                  McAuley, Julian J. and
                  Wei, Furu},
  editor       = {Toutanova, Kristina and
                  Rumshisky, Anna and
                  Zettlemoyer, Luke and
                  Hakkani{-}T{\"{u}}r, Dilek and
                  Beltagy, Iz and
                  Bethard, Steven and
                  Cotterell, Ryan and
                  Chakraborty, Tanmoy and
                  Zhou, Yichao},
  title        = {Blow the Dog Whistle: {A} {Chinese} Dataset for Cant Understanding with
                  Common Sense and World Knowledge},
  booktitle    = {Proceedings of the 2021 Conference of the North American Chapter of
                  the Association for Computational Linguistics: Human Language Technologies,
                  {NAACL-HLT} 2021, Online, June 6-11, 2021},
  pages        = {2139--2145},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  doi          = {10.18653/V1/2021.NAACL-MAIN.172},
  url          = {https://doi.org/10.18653/v1/2021.naacl-main.172},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/naacl/XuZGXMW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NAACL-HLT 2021 paper. The model name "InfoXLM" is brace-protected so that
% sentence-casing styles keep its mixed capitalisation.
@inproceedings{DBLP:conf/naacl/ChiDWYSWSMHZ21,
  author       = {Zewen Chi and
                  Li Dong and
                  Furu Wei and
                  Nan Yang and
                  Saksham Singhal and
                  Wenhui Wang and
                  Xia Song and
                  Xian{-}Ling Mao and
                  Heyan Huang and
                  Ming Zhou},
  editor       = {Kristina Toutanova and
                  Anna Rumshisky and
                  Luke Zettlemoyer and
                  Dilek Hakkani{-}T{\"{u}}r and
                  Iz Beltagy and
                  Steven Bethard and
                  Ryan Cotterell and
                  Tanmoy Chakraborty and
                  Yichao Zhou},
  title        = {{InfoXLM}: An Information-Theoretic Framework for Cross-Lingual Language
                  Model Pre-Training},
  booktitle    = {Proceedings of the 2021 Conference of the North American Chapter of
                  the Association for Computational Linguistics: Human Language Technologies,
                  {NAACL-HLT} 2021, Online, June 6-11, 2021},
  pages        = {3576--3588},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.naacl-main.280},
  doi          = {10.18653/V1/2021.NAACL-MAIN.280},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/naacl/ChiDWYSWSMHZ21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NLPCC 2021 paper (LNCS volume 13028). Author and editor names are written
% in the explicit Last, First form.
@inproceedings{DBLP:conf/nlpcc/YangWMHZYLW21,
  author       = {Yang, Jian and
                  Wan, Juncheng and
                  Ma, Shuming and
                  Huang, Haoyang and
                  Zhang, Dongdong and
                  Yu, Yong and
                  Li, Zhoujun and
                  Wei, Furu},
  editor       = {Wang, Lu and
                  Feng, Yansong and
                  Hong, Yu and
                  He, Ruifang},
  title        = {Learning to Select Relevant Knowledge for Neural Machine Translation},
  booktitle    = {Natural Language Processing and Chinese Computing - 10th {CCF} International
                  Conference, {NLPCC} 2021, Qingdao, China, October 13-17, 2021, Proceedings,
                  Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {13028},
  pages        = {79--91},
  publisher    = {Springer},
  year         = {2021},
  url          = {https://doi.org/10.1007/978-3-030-88480-2\_7},
  doi          = {10.1007/978-3-030-88480-2\_7},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nlpcc/YangWMHZYLW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% WMT 2021 system paper. The company name "Microsoft" is brace-protected in
% the title so that sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/wmt/YangMH00HMSHSW21,
  author       = {Jian Yang and
                  Shuming Ma and
                  Haoyang Huang and
                  Dongdong Zhang and
                  Li Dong and
                  Shaohan Huang and
                  Alexandre Muzio and
                  Saksham Singhal and
                  Hany Hassan and
                  Xia Song and
                  Furu Wei},
  editor       = {Lo{\"{\i}}c Barrault and
                  Ondrej Bojar and
                  Fethi Bougares and
                  Rajen Chatterjee and
                  Marta R. Costa{-}juss{\`{a}} and
                  Christian Federmann and
                  Mark Fishel and
                  Alexander Fraser and
                  Markus Freitag and
                  Yvette Graham and
                  Roman Grundkiewicz and
                  Paco Guzman and
                  Barry Haddow and
                  Matthias Huck and
                  Antonio Jimeno{-}Yepes and
                  Philipp Koehn and
                  Tom Kocmi and
                  Andr{\'{e}} Martins and
                  Makoto Morishita and
                  Christof Monz},
  title        = {Multilingual Machine Translation Systems from {Microsoft} for {WMT21}
                  Shared Task},
  booktitle    = {Proceedings of the Sixth Conference on Machine Translation, WMT@EMNLP
                  2021, Online Event, November 10-11, 2021},
  pages        = {446--455},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://aclanthology.org/2021.wmt-1.54},
  timestamp    = {Wed, 07 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/wmt/YangMH00HMSHSW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2101.00416). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2101-00416,
  author       = {Zhou, Wangchunshu and
                  Ge, Tao and
                  Xu, Ke and
                  Wei, Furu},
  title        = {Improving Sequence-to-Sequence Pre-training via Sequence Span Rewriting},
  journal      = {CoRR},
  volume       = {abs/2101.00416},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2101.00416},
  url          = {https://arxiv.org/abs/2101.00416},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2101-00416.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2101.07597). The model name "UniSpeech" is
% brace-protected so that sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2101-07597,
  author       = {Chengyi Wang and
                  Yu Wu and
                  Yao Qian and
                  Ken'ichi Kumatani and
                  Shujie Liu and
                  Furu Wei and
                  Michael Zeng and
                  Xuedong Huang},
  title        = {{UniSpeech}: Unified Speech Representation Learning with Labeled and
                  Unlabeled Data},
  journal      = {CoRR},
  volume       = {abs/2101.07597},
  year         = {2021},
  url          = {https://arxiv.org/abs/2101.07597},
  eprinttype   = {arXiv},
  eprint       = {2101.07597},
  timestamp    = {Thu, 12 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2101-07597.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2104.02704); same authors and title as the entry
% DBLP:conf/naacl/XuZGXMW21. "Chinese" is brace-protected so that
% sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-2104-02704,
  author       = {Canwen Xu and
                  Wangchunshu Zhou and
                  Tao Ge and
                  Ke Xu and
                  Julian J. McAuley and
                  Furu Wei},
  title        = {Blow the Dog Whistle: {A} {Chinese} Dataset for Cant Understanding with
                  Common Sense and World Knowledge},
  journal      = {CoRR},
  volume       = {abs/2104.02704},
  year         = {2021},
  url          = {https://arxiv.org/abs/2104.02704},
  eprinttype   = {arXiv},
  eprint       = {2104.02704},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2104-02704.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2104.08692). The model name "mT6" is
% brace-protected; sentence-casing styles would otherwise render it "mt6".
@article{DBLP:journals/corr/abs-2104-08692,
  author       = {Zewen Chi and
                  Li Dong and
                  Shuming Ma and
                  Shaohan Huang and
                  Xian{-}Ling Mao and
                  Heyan Huang and
                  Furu Wei},
  title        = {{mT6}: Multilingual Pretrained Text-to-Text Transformer with Translation
                  Pairs},
  journal      = {CoRR},
  volume       = {abs/2104.08692},
  year         = {2021},
  url          = {https://arxiv.org/abs/2104.08692},
  eprinttype   = {arXiv},
  eprint       = {2104.08692},
  timestamp    = {Mon, 26 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2104-08692.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2104.08696). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2104-08696,
  author       = {Dai, Damai and
                  Dong, Li and
                  Hao, Yaru and
                  Sui, Zhifang and
                  Wei, Furu},
  title        = {Knowledge Neurons in Pretrained Transformers},
  journal      = {CoRR},
  volume       = {abs/2104.08696},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2104.08696},
  url          = {https://arxiv.org/abs/2104.08696},
  timestamp    = {Wed, 02 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2104-08696.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2104.08757). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2104-08757,
  author       = {Chen, Guanhua and
                  Ma, Shuming and
                  Chen, Yun and
                  Dong, Li and
                  Zhang, Dongdong and
                  Pan, Jia and
                  Wang, Wenping and
                  Wei, Furu},
  title        = {Zero-shot Cross-lingual Transfer of Neural Machine Translation with
                  Multilingual Pretrained Encoders},
  journal      = {CoRR},
  volume       = {abs/2104.08757},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2104.08757},
  url          = {https://arxiv.org/abs/2104.08757},
  timestamp    = {Mon, 26 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2104-08757.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2104.08836). The model name "LayoutXLM" is
% brace-protected so that sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2104-08836,
  author       = {Yiheng Xu and
                  Tengchao Lv and
                  Lei Cui and
                  Guoxin Wang and
                  Yijuan Lu and
                  Dinei Flor{\^{e}}ncio and
                  Cha Zhang and
                  Furu Wei},
  title        = {{LayoutXLM}: Multimodal Pre-training for Multilingual Visually-rich
                  Document Understanding},
  journal      = {CoRR},
  volume       = {abs/2104.08836},
  year         = {2021},
  url          = {https://arxiv.org/abs/2104.08836},
  eprinttype   = {arXiv},
  eprint       = {2104.08836},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2104-08836.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2105.14669). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2105-14669,
  author       = {Zhao, Yuekai and
                  Dong, Li and
                  Shen, Yelong and
                  Zhang, Zhihua and
                  Wei, Furu and
                  Chen, Weizhu},
  title        = {Memory-Efficient Differentiable Transformer Architecture Search},
  journal      = {CoRR},
  volume       = {abs/2105.14669},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2105.14669},
  url          = {https://arxiv.org/abs/2105.14669},
  timestamp    = {Wed, 02 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2105-14669.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2106.03441). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2106-03441,
  author       = {Zhang, Shengqiang and
                  Zhang, Xingxing and
                  Bao, Hangbo and
                  Wei, Furu},
  title        = {Attention Temperature Matters in Abstractive Summarization Distillation},
  journal      = {CoRR},
  volume       = {abs/2106.03441},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2106.03441},
  url          = {https://arxiv.org/abs/2106.03441},
  timestamp    = {Thu, 10 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-03441.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2106.04970). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2106-04970,
  author       = {Sun, Xin and
                  Ge, Tao and
                  Wei, Furu and
                  Wang, Houfeng},
  title        = {Instantaneous Grammatical Error Correction with Shallow Aggressive
                  Decoding},
  journal      = {CoRR},
  volume       = {abs/2106.04970},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2106.04970},
  url          = {https://arxiv.org/abs/2106.04970},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-04970.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2106.05606). The dataset name "VT-SSum" is
% brace-protected so that sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2106-05606,
  author       = {Tengchao Lv and
                  Lei Cui and
                  Momcilo Vasilijevic and
                  Furu Wei},
  title        = {{VT-SSum}: {A} Benchmark Dataset for Video Transcript Segmentation and
                  Summarization},
  journal      = {CoRR},
  volume       = {abs/2106.05606},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.05606},
  eprinttype   = {arXiv},
  eprint       = {2106.05606},
  timestamp    = {Tue, 15 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-05606.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2106.06381). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2106-06381,
  author       = {Chi, Zewen and
                  Dong, Li and
                  Zheng, Bo and
                  Huang, Shaohan and
                  Mao, Xian{-}Ling and
                  Huang, Heyan and
                  Wei, Furu},
  title        = {Improving Pretrained Cross-Lingual Language Models via Self-Labeled
                  Word Alignment},
  journal      = {CoRR},
  volume       = {abs/2106.06381},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2106.06381},
  url          = {https://arxiv.org/abs/2106.06381},
  timestamp    = {Tue, 15 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-06381.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2106.08226). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2106-08226,
  author       = {Zheng, Bo and
                  Dong, Li and
                  Huang, Shaohan and
                  Wang, Wenhui and
                  Chi, Zewen and
                  Singhal, Saksham and
                  Che, Wanxiang and
                  Liu, Ting and
                  Song, Xia and
                  Wei, Furu},
  title        = {Consistency Regularization for Cross-Lingual Fine-Tuning},
  journal      = {CoRR},
  volume       = {abs/2106.08226},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2106.08226},
  url          = {https://arxiv.org/abs/2106.08226},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-08226.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2106.08254). The model name "BEiT" is
% brace-protected; sentence-casing styles would otherwise render it "Beit".
@article{DBLP:journals/corr/abs-2106-08254,
  author       = {Hangbo Bao and
                  Li Dong and
                  Furu Wei},
  title        = {{BEiT}: {BERT} Pre-Training of Image Transformers},
  journal      = {CoRR},
  volume       = {abs/2106.08254},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.08254},
  eprinttype   = {arXiv},
  eprint       = {2106.08254},
  timestamp    = {Tue, 29 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-08254.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2106.13474). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2106-13474,
  author       = {Yao, Yunzhi and
                  Huang, Shaohan and
                  Wang, Wenhui and
                  Dong, Li and
                  Wei, Furu},
  title        = {Adapt-and-Distill: Developing Small, Fast and Effective Pretrained
                  Language Models for Domains},
  journal      = {CoRR},
  volume       = {abs/2106.13474},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2106.13474},
  url          = {https://arxiv.org/abs/2106.13474},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-13474.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2106.13715). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2106-13715,
  author       = {Hao, Yaru and
                  Dong, Li and
                  Bao, Hangbo and
                  Xu, Ke and
                  Wei, Furu},
  title        = {Learning to Sample Replacements for {ELECTRA} Pre-Training},
  journal      = {CoRR},
  volume       = {abs/2106.13715},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2106.13715},
  url          = {https://arxiv.org/abs/2106.13715},
  timestamp    = {Wed, 30 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-13715.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2106.13736). The model name "DeltaLM" is
% brace-protected so that sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2106-13736,
  author       = {Shuming Ma and
                  Li Dong and
                  Shaohan Huang and
                  Dongdong Zhang and
                  Alexandre Muzio and
                  Saksham Singhal and
                  Hany Hassan Awadalla and
                  Xia Song and
                  Furu Wei},
  title        = {{DeltaLM}: Encoder-Decoder Pre-training for Language Generation and
                  Translation by Augmenting Pretrained Multilingual Encoders},
  journal      = {CoRR},
  volume       = {abs/2106.13736},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.13736},
  eprinttype   = {arXiv},
  eprint       = {2106.13736},
  timestamp    = {Wed, 30 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-13736.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2106.16138). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2106-16138,
  author       = {Chi, Zewen and
                  Huang, Shaohan and
                  Dong, Li and
                  Ma, Shuming and
                  Singhal, Saksham and
                  Bajaj, Payal and
                  Song, Xia and
                  Wei, Furu},
  title        = {{XLM-E:} Cross-lingual Language Model Pre-training via {ELECTRA}},
  journal      = {CoRR},
  volume       = {abs/2106.16138},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2106.16138},
  url          = {https://arxiv.org/abs/2106.16138},
  timestamp    = {Mon, 05 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-16138.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2108.11591). The model name "LayoutReader" is
% brace-protected so that sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2108-11591,
  author       = {Zilong Wang and
                  Yiheng Xu and
                  Lei Cui and
                  Jingbo Shang and
                  Furu Wei},
  title        = {{LayoutReader}: Pre-training of Text and Layout for Reading Order Detection},
  journal      = {CoRR},
  volume       = {abs/2108.11591},
  year         = {2021},
  url          = {https://arxiv.org/abs/2108.11591},
  eprinttype   = {arXiv},
  eprint       = {2108.11591},
  timestamp    = {Thu, 16 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2108-11591.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2109.03228). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2109-03228,
  author       = {Xu, Canwen and
                  Zhou, Wangchunshu and
                  Ge, Tao and
                  Xu, Ke and
                  McAuley, Julian J. and
                  Wei, Furu},
  title        = {Beyond Preserved Accuracy: Evaluating Loyalty and Robustness of {BERT}
                  Compression},
  journal      = {CoRR},
  volume       = {abs/2109.03228},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2109.03228},
  url          = {https://arxiv.org/abs/2109.03228},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-03228.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2109.03481). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2109-03481,
  author       = {Xu, Shusheng and
                  Zhang, Xingxing and
                  Wu, Yi and
                  Wei, Furu},
  title        = {Sequence Level Contrastive Learning for Text Summarization},
  journal      = {CoRR},
  volume       = {abs/2109.03481},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2109.03481},
  url          = {https://arxiv.org/abs/2109.03481},
  timestamp    = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-03481.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2109.07306). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2109-07306,
  author       = {Zheng, Bo and
                  Dong, Li and
                  Huang, Shaohan and
                  Singhal, Saksham and
                  Che, Wanxiang and
                  Liu, Ting and
                  Song, Xia and
                  Wei, Furu},
  title        = {Allocating Large Vocabulary Capacity for Cross-lingual Language Model
                  Pre-training},
  journal      = {CoRR},
  volume       = {abs/2109.07306},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2109.07306},
  url          = {https://arxiv.org/abs/2109.07306},
  timestamp    = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-07306.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2109.10282). The model name "TrOCR" is
% brace-protected; sentence-casing styles would otherwise render it "Trocr".
@article{DBLP:journals/corr/abs-2109-10282,
  author       = {Minghao Li and
                  Tengchao Lv and
                  Lei Cui and
                  Yijuan Lu and
                  Dinei A. F. Flor{\^{e}}ncio and
                  Cha Zhang and
                  Zhoujun Li and
                  Furu Wei},
  title        = {{TrOCR}: Transformer-based Optical Character Recognition with Pre-trained
                  Models},
  journal      = {CoRR},
  volume       = {abs/2109.10282},
  year         = {2021},
  url          = {https://arxiv.org/abs/2109.10282},
  eprinttype   = {arXiv},
  eprint       = {2109.10282},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-10282.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2109.12296). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2109-12296,
  author       = {Bai, Jiaqi and
                  Zhou, Long and
                  Blanco, Ambrosio and
                  Liu, Shujie and
                  Wei, Furu and
                  Zhou, Ming and
                  Li, Zhoujun},
  title        = {Jointly Learning to Repair Code and Generate Commit Message},
  journal      = {CoRR},
  volume       = {abs/2109.12296},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2109.12296},
  url          = {https://arxiv.org/abs/2109.12296},
  timestamp    = {Mon, 04 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-12296.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2110.05752). The model name "UniSpeech-SAT" is
% brace-protected so that sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2110-05752,
  author       = {Sanyuan Chen and
                  Yu Wu and
                  Chengyi Wang and
                  Zhengyang Chen and
                  Zhuo Chen and
                  Shujie Liu and
                  Jian Wu and
                  Yao Qian and
                  Furu Wei and
                  Jinyu Li and
                  Xiangzhan Yu},
  title        = {{UniSpeech-SAT}: Universal Speech Representation Learning with Speaker
                  Aware Pre-Training},
  journal      = {CoRR},
  volume       = {abs/2110.05752},
  year         = {2021},
  url          = {https://arxiv.org/abs/2110.05752},
  eprinttype   = {arXiv},
  eprint       = {2110.05752},
  timestamp    = {Tue, 17 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-05752.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2110.07205). The model name "SpeechT5" is
% brace-protected so that sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2110-07205,
  author       = {Junyi Ao and
                  Rui Wang and
                  Long Zhou and
                  Shujie Liu and
                  Shuo Ren and
                  Yu Wu and
                  Tom Ko and
                  Qing Li and
                  Yu Zhang and
                  Zhihua Wei and
                  Yao Qian and
                  Jinyu Li and
                  Furu Wei},
  title        = {{SpeechT5}: Unified-Modal Encoder-Decoder Pre-training for Spoken Language
                  Processing},
  journal      = {CoRR},
  volume       = {abs/2110.07205},
  year         = {2021},
  url          = {https://arxiv.org/abs/2110.07205},
  eprinttype   = {arXiv},
  eprint       = {2110.07205},
  timestamp    = {Mon, 01 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-07205.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2110.08518). The model name "MarkupLM" is
% brace-protected so that sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2110-08518,
  author       = {Junlong Li and
                  Yiheng Xu and
                  Lei Cui and
                  Furu Wei},
  title        = {{MarkupLM}: Pre-training of Text and Markup Language for Visually-rich
                  Document Understanding},
  journal      = {CoRR},
  volume       = {abs/2110.08518},
  year         = {2021},
  url          = {https://arxiv.org/abs/2110.08518},
  eprinttype   = {arXiv},
  eprint       = {2110.08518},
  timestamp    = {Fri, 22 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-08518.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2110.08547). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2110-08547,
  author       = {Chen, Guanhua and
                  Ma, Shuming and
                  Chen, Yun and
                  Zhang, Dongdong and
                  Pan, Jia and
                  Wang, Wenping and
                  Wei, Furu},
  title        = {Towards Making the Most of Multilingual Pretraining for Zero-Shot
                  Neural Machine Translation},
  journal      = {CoRR},
  volume       = {abs/2110.08547},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2110.08547},
  url          = {https://arxiv.org/abs/2110.08547},
  timestamp    = {Fri, 22 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-08547.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2110.11115). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2110-11115,
  author       = {Jiang, Ting and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Wang, Deqing and
                  Zhuang, Fuzhen and
                  Wei, Furu and
                  Huang, Haizhen and
                  Zhang, Liangjie and
                  Zhang, Qi},
  title        = {Improving Non-autoregressive Generation with Mixup Training},
  journal      = {CoRR},
  volume       = {abs/2110.11115},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2110.11115},
  url          = {https://arxiv.org/abs/2110.11115},
  timestamp    = {Thu, 28 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-11115.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2110.13640). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2110-13640,
  author       = {Bao, Hangbo and
                  Dong, Li and
                  Wang, Wenhui and
                  Yang, Nan and
                  Wei, Furu},
  title        = {s2s-ft: Fine-Tuning Pretrained Transformer Encoders for Sequence-to-Sequence
                  Learning},
  journal      = {CoRR},
  volume       = {abs/2110.13640},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2110.13640},
  url          = {https://arxiv.org/abs/2110.13640},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-13640.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2110.13900). The model name "WavLM" is
% brace-protected so that sentence-casing styles keep its capitalisation.
% NOTE(review): "Jian Wu" appears twice in the author list; presumably two
% distinct authors sharing a name. Confirm against the paper before deduplicating.
@article{DBLP:journals/corr/abs-2110-13900,
  author       = {Sanyuan Chen and
                  Chengyi Wang and
                  Zhengyang Chen and
                  Yu Wu and
                  Shujie Liu and
                  Zhuo Chen and
                  Jinyu Li and
                  Naoyuki Kanda and
                  Takuya Yoshioka and
                  Xiong Xiao and
                  Jian Wu and
                  Long Zhou and
                  Shuo Ren and
                  Yanmin Qian and
                  Yao Qian and
                  Jian Wu and
                  Michael Zeng and
                  Furu Wei},
  title        = {{WavLM}: Large-Scale Self-Supervised Pre-Training for Full Stack Speech
                  Processing},
  journal      = {CoRR},
  volume       = {abs/2110.13900},
  year         = {2021},
  url          = {https://arxiv.org/abs/2110.13900},
  eprinttype   = {arXiv},
  eprint       = {2110.13900},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-13900.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2110.14142). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2110-14142,
  author       = {Zhang, Wangyou and
                  Chen, Zhuo and
                  Kanda, Naoyuki and
                  Liu, Shujie and
                  Li, Jinyu and
                  Eskimez, Sefik Emre and
                  Yoshioka, Takuya and
                  Xiao, Xiong and
                  Meng, Zhong and
                  Qian, Yanmin and
                  Wei, Furu},
  title        = {Separating Long-Form Speech with Group-Wise Permutation Invariant
                  Training},
  journal      = {CoRR},
  volume       = {abs/2110.14142},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2110.14142},
  url          = {https://arxiv.org/abs/2110.14142},
  timestamp    = {Tue, 10 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-14142.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2111.02086); same title as the entry
% DBLP:conf/wmt/YangMH00HMSHSW21. The company name "Microsoft" is
% brace-protected so that sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-2111-02086,
  author       = {Jian Yang and
                  Shuming Ma and
                  Haoyang Huang and
                  Dongdong Zhang and
                  Li Dong and
                  Shaohan Huang and
                  Alexandre Muzio and
                  Saksham Singhal and
                  Hany Hassan Awadalla and
                  Xia Song and
                  Furu Wei},
  title        = {Multilingual Machine Translation Systems from {Microsoft} for {WMT21}
                  Shared Task},
  journal      = {CoRR},
  volume       = {abs/2111.02086},
  year         = {2021},
  url          = {https://arxiv.org/abs/2111.02086},
  eprinttype   = {arXiv},
  eprint       = {2111.02086},
  timestamp    = {Wed, 07 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2111-02086.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2111.02358). The model name "VLMo" is
% brace-protected; sentence-casing styles would otherwise render it "Vlmo".
@article{DBLP:journals/corr/abs-2111-02358,
  author       = {Wenhui Wang and
                  Hangbo Bao and
                  Li Dong and
                  Furu Wei},
  title        = {{VLMo}: Unified Vision-Language Pre-Training with Mixture-of-Modality-Experts},
  journal      = {CoRR},
  volume       = {abs/2111.02358},
  year         = {2021},
  url          = {https://arxiv.org/abs/2111.02358},
  eprinttype   = {arXiv},
  eprint       = {2111.02358},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2111-02358.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2111.08609). Author names are written in the
% explicit Last, First form.
@article{DBLP:journals/corr/abs-2111-08609,
  author       = {Cui, Lei and
                  Xu, Yiheng and
                  Lv, Tengchao and
                  Wei, Furu},
  title        = {Document {AI:} Benchmarks, Models and Applications},
  journal      = {CoRR},
  volume       = {abs/2111.08609},
  year         = {2021},
  eprinttype   = {arXiv},
  eprint       = {2111.08609},
  url          = {https://arxiv.org/abs/2111.08609},
  timestamp    = {Mon, 22 Nov 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2111-08609.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2111-09883,
  author       = {Liu, Ze and
                  Hu, Han and
                  Lin, Yutong and
                  Yao, Zhuliang and
                  Xie, Zhenda and
                  Wei, Yixuan and
                  Ning, Jia and
                  Cao, Yue and
                  Zhang, Zheng and
                  Dong, Li and
                  Wei, Furu and
                  Guo, Baining},
  title        = {{Swin Transformer V2}: Scaling Up Capacity and Resolution},
  journal      = {CoRR},
  volume       = {abs/2111.09883},
  year         = {2021},
  url          = {https://arxiv.org/abs/2111.09883},
  eprinttype   = {arXiv},
  eprint       = {2111.09883},
  timestamp    = {Mon, 05 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2111-09883.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2112-08723,
  author       = {Wang, Zekun and
                  Wang, Wenhui and
                  Zhu, Haichao and
                  Liu, Ming and
                  Qin, Bing and
                  Wei, Furu},
  title        = {Distilled Dual-Encoder Model for Vision-Language Understanding},
  journal      = {CoRR},
  volume       = {abs/2112.08723},
  year         = {2021},
  url          = {https://arxiv.org/abs/2112.08723},
  eprinttype   = {arXiv},
  eprint       = {2112.08723},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2112-08723.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/ZhouYWHZZ20,
  author       = {Zhou, Qingyu and
                  Yang, Nan and
                  Wei, Furu and
                  Huang, Shaohan and
                  Zhou, Ming and
                  Zhao, Tiejun},
  title        = {A Joint Sentence Scoring and Selection Framework for Neural Extractive
                  Document Summarization},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {28},
  pages        = {671--681},
  year         = {2020},
  url          = {https://doi.org/10.1109/TASLP.2020.2964427},
  doi          = {10.1109/TASLP.2020.2964427},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/ZhouYWHZZ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/Chi0WWMH20,
  author       = {Chi, Zewen and
                  Dong, Li and
                  Wei, Furu and
                  Wang, Wenhui and
                  Mao, Xian{-}Ling and
                  Huang, Heyan},
  title        = {Cross-Lingual Natural Language Generation via Pre-Training},
  booktitle    = {The Thirty-Fourth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2020, The Thirty-Second Innovative Applications of Artificial Intelligence
                  Conference, {IAAI} 2020, The Tenth {AAAI} Symposium on Educational
                  Advances in Artificial Intelligence, {EAAI} 2020, New York, NY, USA,
                  February 7-12, 2020},
  pages        = {7570--7577},
  publisher    = {{AAAI} Press},
  year         = {2020},
  url          = {https://doi.org/10.1609/aaai.v34i05.6256},
  doi          = {10.1609/AAAI.V34I05.6256},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/Chi0WWMH20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/GuoGW20,
  author       = {Guo, Yinuo and
                  Ge, Tao and
                  Wei, Furu},
  title        = {Fact-Aware Sentence Split and Rephrase with Permutation Invariant
                  Training},
  booktitle    = {The Thirty-Fourth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2020, The Thirty-Second Innovative Applications of Artificial Intelligence
                  Conference, {IAAI} 2020, The Tenth {AAAI} Symposium on Educational
                  Advances in Artificial Intelligence, {EAAI} 2020, New York, NY, USA,
                  February 7-12, 2020},
  pages        = {7855--7862},
  publisher    = {{AAAI} Press},
  year         = {2020},
  url          = {https://doi.org/10.1609/aaai.v34i05.6291},
  doi          = {10.1609/AAAI.V34I05.6291},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aaai/GuoGW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/LiWDWX20,
  author       = {Li, Zhongli and
                  Wang, Wenhui and
                  Dong, Li and
                  Wei, Furu and
                  Xu, Ke},
  editor       = {Jurafsky, Dan and
                  Chai, Joyce and
                  Schluter, Natalie and
                  Tetreault, Joel R.},
  title        = {Harvesting and Refining Question-Answer Pairs for Unsupervised {QA}},
  booktitle    = {Proceedings of the 58th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2020, Online, July 5-10, 2020},
  pages        = {6719--6728},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.acl-main.600},
  doi          = {10.18653/V1/2020.ACL-MAIN.600},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LiWDWX20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/coling/LiXCHWLZ20,
  author       = {Li, Minghao and
                  Xu, Yiheng and
                  Cui, Lei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Li, Zhoujun and
                  Zhou, Ming},
  editor       = {Scott, Donia and
                  Bel, N{\'{u}}ria and
                  Zong, Chengqing},
  title        = {{DocBank}: {A} Benchmark Dataset for Document Layout Analysis},
  booktitle    = {Proceedings of the 28th International Conference on Computational
                  Linguistics, {COLING} 2020, Barcelona, Spain (Online), December 8-13,
                  2020},
  pages        = {949--960},
  publisher    = {International Committee on Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.coling-main.82},
  doi          = {10.18653/V1/2020.COLING-MAIN.82},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/coling/LiXCHWLZ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/coling/HuangWCZZ20,
  author       = {Huang, Shaohan and
                  Wei, Furu and
                  Cui, Lei and
                  Zhang, Xingxing and
                  Zhou, Ming},
  editor       = {Scott, Donia and
                  Bel, N{\'{u}}ria and
                  Zong, Chengqing},
  title        = {Unsupervised Fine-tuning for Text Clustering},
  booktitle    = {Proceedings of the 28th International Conference on Computational
                  Linguistics, {COLING} 2020, Barcelona, Spain (Online), December 8-13,
                  2020},
  pages        = {5530--5534},
  publisher    = {International Committee on Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.coling-main.482},
  doi          = {10.18653/V1/2020.COLING-MAIN.482},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/coling/HuangWCZZ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/coling/ZhouWZ20,
  author       = {Zhou, Qingyu and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Scott, Donia and
                  Bel, N{\'{u}}ria and
                  Zong, Chengqing},
  title        = {At Which Level Should We Extract? {An} Empirical Analysis on Extractive
                  Document Summarization},
  booktitle    = {Proceedings of the 28th International Conference on Computational
                  Linguistics, {COLING} 2020, Barcelona, Spain (Online), December 8-13,
                  2020},
  pages        = {5617--5628},
  publisher    = {International Committee on Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.coling-main.492},
  doi          = {10.18653/V1/2020.COLING-MAIN.492},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/coling/ZhouWZ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ecai/Duan0MWZZ20,
  author       = {Duan, Chaoqun and
                  Cui, Lei and
                  Ma, Shuming and
                  Wei, Furu and
                  Zhu, Conghui and
                  Zhao, Tiejun},
  editor       = {De Giacomo, Giuseppe and
                  Catal{\'{a}}, Alejandro and
                  Dilkina, Bistra and
                  Milano, Michela and
                  Barro, Sen{\'{e}}n and
                  Bugar{\'{\i}}n, Alberto and
                  Lang, J{\'{e}}r{\^{o}}me},
  title        = {Multimodal Matching Transformer for Live Commenting},
  booktitle    = {{ECAI} 2020 - 24th European Conference on Artificial Intelligence,
                  Santiago de Compostela, Spain, August 29 - September 8, 2020 -
                  Including 10th Conference on Prestigious Applications of Artificial
                  Intelligence ({PAIS} 2020)},
  series       = {Frontiers in Artificial Intelligence and Applications},
  volume       = {325},
  pages        = {1998--2005},
  publisher    = {{IOS} Press},
  year         = {2020},
  url          = {https://doi.org/10.3233/FAIA200320},
  doi          = {10.3233/FAIA200320},
  timestamp    = {Fri, 09 Apr 2021 18:50:05 +0200},
  biburl       = {https://dblp.org/rec/conf/ecai/Duan0MWZZ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eccv/Li0LZHZWH0WCG20,
  author       = {Li, Xiujun and
                  Yin, Xi and
                  Li, Chunyuan and
                  Zhang, Pengchuan and
                  Hu, Xiaowei and
                  Zhang, Lei and
                  Wang, Lijuan and
                  Hu, Houdong and
                  Dong, Li and
                  Wei, Furu and
                  Choi, Yejin and
                  Gao, Jianfeng},
  editor       = {Vedaldi, Andrea and
                  Bischof, Horst and
                  Brox, Thomas and
                  Frahm, Jan{-}Michael},
  title        = {Oscar: Object-Semantics Aligned Pre-training for Vision-Language Tasks},
  booktitle    = {Computer Vision - {ECCV} 2020 - 16th European Conference, Glasgow,
                  UK, August 23-28, 2020, Proceedings, Part {XXX}},
  series       = {Lecture Notes in Computer Science},
  volume       = {12375},
  pages        = {121--137},
  publisher    = {Springer},
  year         = {2020},
  url          = {https://doi.org/10.1007/978-3-030-58577-8\_8},
  doi          = {10.1007/978-3-030-58577-8\_8},
  timestamp    = {Thu, 11 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eccv/Li0LZHZWH0WCG20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ZhouGM0W020,
  author       = {Zhou, Wangchunshu and
                  Ge, Tao and
                  Mu, Chang and
                  Xu, Ke and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Cohn, Trevor and
                  He, Yulan and
                  Liu, Yang},
  title        = {Improving Grammatical Error Correction with Machine Translation Pairs},
  booktitle    = {Findings of the Association for Computational Linguistics: {EMNLP}
                  2020, Online Event, 16-20 November 2020},
  series       = {Findings of {ACL}},
  volume       = {{EMNLP} 2020},
  pages        = {318--328},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.findings-emnlp.30},
  doi          = {10.18653/V1/2020.FINDINGS-EMNLP.30},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/ZhouGM0W020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/JiKHWZH20,
  author       = {Ji, Haozhe and
                  Ke, Pei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Zhu, Xiaoyan and
                  Huang, Minlie},
  editor       = {Webber, Bonnie and
                  Cohn, Trevor and
                  He, Yulan and
                  Liu, Yang},
  title        = {Language Generation with Multi-Hop Reasoning on Commonsense Knowledge
                  Graph},
  booktitle    = {Proceedings of the 2020 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages        = {725--736},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.emnlp-main.54},
  doi          = {10.18653/V1/2020.EMNLP-MAIN.54},
  timestamp    = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/JiKHWZH20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/XuZWWZ20,
  author       = {Xu, Shusheng and
                  Zhang, Xingxing and
                  Wu, Yi and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Cohn, Trevor and
                  He, Yulan and
                  Liu, Yang},
  title        = {Unsupervised Extractive Summarization by Pre-training Hierarchical
                  Transformers},
  booktitle    = {Findings of the Association for Computational Linguistics: {EMNLP}
                  2020, Online Event, 16-20 November 2020},
  series       = {Findings of {ACL}},
  volume       = {{EMNLP} 2020},
  pages        = {1784--1795},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.findings-emnlp.161},
  doi          = {10.18653/V1/2020.FINDINGS-EMNLP.161},
  timestamp    = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/XuZWWZ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ZhouGW0020,
  author       = {Zhou, Wangchunshu and
                  Ge, Tao and
                  Wei, Furu and
                  Zhou, Ming and
                  Xu, Ke},
  editor       = {Cohn, Trevor and
                  He, Yulan and
                  Liu, Yang},
  title        = {Scheduled {DropHead}: {A} Regularization Method for Transformer Models},
  booktitle    = {Findings of the Association for Computational Linguistics: {EMNLP}
                  2020, Online Event, 16-20 November 2020},
  series       = {Findings of {ACL}},
  volume       = {{EMNLP} 2020},
  pages        = {1971--1980},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.findings-emnlp.178},
  doi          = {10.18653/V1/2020.FINDINGS-EMNLP.178},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/ZhouGW0020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ZouZLWZ20,
  author       = {Zou, Yanyan and
                  Zhang, Xingxing and
                  Lu, Wei and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Webber, Bonnie and
                  Cohn, Trevor and
                  He, Yulan and
                  Liu, Yang},
  title        = {Pre-training for Abstractive Document Summarization by Reinstating
                  Source Text},
  booktitle    = {Proceedings of the 2020 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages        = {3646--3660},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.emnlp-main.297},
  doi          = {10.18653/V1/2020.EMNLP-MAIN.297},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/ZouZLWZ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ChenGZWZ20,
  author       = {Chen, Mengyun and
                  Ge, Tao and
                  Zhang, Xingxing and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Webber, Bonnie and
                  Cohn, Trevor and
                  He, Yulan and
                  Liu, Yang},
  title        = {Improving the Efficiency of Grammatical Error Correction with Erroneous
                  Span Detection and Correction},
  booktitle    = {Proceedings of the 2020 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages        = {7162--7169},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.emnlp-main.581},
  doi          = {10.18653/V1/2020.EMNLP-MAIN.581},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/ChenGZWZ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/XuZGWZ20,
  author       = {Xu, Canwen and
                  Zhou, Wangchunshu and
                  Ge, Tao and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Webber, Bonnie and
                  Cohn, Trevor and
                  He, Yulan and
                  Liu, Yang},
  title        = {{BERT-of-Theseus}: Compressing {BERT} by Progressive Module Replacing},
  booktitle    = {Proceedings of the 2020 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages        = {7859--7869},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.emnlp-main.633},
  doi          = {10.18653/V1/2020.EMNLP-MAIN.633},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/XuZGWZ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/SuZCLLWD20,
  author       = {Su, Weijie and
                  Zhu, Xizhou and
                  Cao, Yue and
                  Li, Bin and
                  Lu, Lewei and
                  Wei, Furu and
                  Dai, Jifeng},
  title        = {{VL-BERT:} Pre-training of Generic Visual-Linguistic Representations},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=SygXPaEYvH},
  timestamp    = {Tue, 12 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/SuZCLLWD20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/ZhouGXW020,
  author       = {Zhou, Wangchunshu and
                  Ge, Tao and
                  Xu, Ke and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {Self-Adversarial Learning with Comparative Discrimination for Text
                  Generation},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=B1l8L6EtDS},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iclr/ZhouGXW020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/Bao0WW0L0GP0H20,
  author       = {Bao, Hangbo and
                  Dong, Li and
                  Wei, Furu and
                  Wang, Wenhui and
                  Yang, Nan and
                  Liu, Xiaodong and
                  Wang, Yu and
                  Gao, Jianfeng and
                  Piao, Songhao and
                  Zhou, Ming and
                  Hon, Hsiao{-}Wuen},
  title        = {{UniLMv2}: Pseudo-Masked Language Models for Unified Language Model
                  Pre-Training},
  booktitle    = {Proceedings of the 37th International Conference on Machine Learning,
                  {ICML} 2020, 13-18 July 2020, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {119},
  pages        = {642--652},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {http://proceedings.mlr.press/v119/bao20a.html},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/Bao0WW0L0GP0H20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcnlp/ChiDWMH20,
  author       = {Chi, Zewen and
                  Dong, Li and
                  Wei, Furu and
                  Mao, Xian{-}Ling and
                  Huang, Heyan},
  editor       = {Wong, Kam{-}Fai and
                  Knight, Kevin and
                  Wu, Hua},
  title        = {Can Monolingual Pretrained Models Help Cross-Lingual Classification?},
  booktitle    = {Proceedings of the 1st Conference of the Asia-Pacific Chapter of the
                  Association for Computational Linguistics and the 10th International
                  Joint Conference on Natural Language Processing, {AACL/IJCNLP} 2020,
                  Suzhou, China, December 4-7, 2020},
  pages        = {12--17},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://aclanthology.org/2020.aacl-main.2/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcnlp/ChiDWMH20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcnlp/HaoDWX20,
  author       = {Hao, Yaru and
                  Dong, Li and
                  Wei, Furu and
                  Xu, Ke},
  editor       = {Wong, Kam{-}Fai and
                  Knight, Kevin and
                  Wu, Hua},
  title        = {Investigating Learning Dynamics of {BERT} Fine-Tuning},
  booktitle    = {Proceedings of the 1st Conference of the Asia-Pacific Chapter of the
                  Association for Computational Linguistics and the 10th International
                  Joint Conference on Natural Language Processing, {AACL/IJCNLP} 2020,
                  Suzhou, China, December 4-7, 2020},
  pages        = {87--92},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://aclanthology.org/2020.aacl-main.11/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcnlp/HaoDWX20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcnlp/XuGLW20,
  author       = {Xu, Canwen and
                  Ge, Tao and
                  Li, Chenliang and
                  Wei, Furu},
  editor       = {Wong, Kam{-}Fai and
                  Knight, Kevin and
                  Wu, Hua},
  title        = {{UnihanLM}: Coarse-to-Fine {Chinese-Japanese} Language Model Pretraining
                  with the {Unihan} Database},
  booktitle    = {Proceedings of the 1st Conference of the Asia-Pacific Chapter of the
                  Association for Computational Linguistics and the 10th International
                  Joint Conference on Natural Language Processing, {AACL/IJCNLP} 2020,
                  Suzhou, China, December 4-7, 2020},
  pages        = {201--211},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://aclanthology.org/2020.aacl-main.24/},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ijcnlp/XuGLW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcnlp/JiKHWH20,
  author       = {Ji, Haozhe and
                  Ke, Pei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Huang, Minlie},
  editor       = {Wong, Kam{-}Fai and
                  Knight, Kevin and
                  Wu, Hua},
  title        = {Generating Commonsense Explanation by Extracting Bridge Concepts from
                  Reasoning Paths},
  booktitle    = {Proceedings of the 1st Conference of the Asia-Pacific Chapter of the
                  Association for Computational Linguistics and the 10th International
                  Joint Conference on Natural Language Processing, {AACL/IJCNLP} 2020,
                  Suzhou, China, December 4-7, 2020},
  pages        = {248--257},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://aclanthology.org/2020.aacl-main.28/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcnlp/JiKHWH20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/kdd/XuL0HW020,
  author       = {Xu, Yiheng and
                  Li, Minghao and
                  Cui, Lei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Gupta, Rajesh and
                  Liu, Yan and
                  Tang, Jiliang and
                  Prakash, B. Aditya},
  title        = {{LayoutLM}: Pre-training of Text and Layout for Document Image Understanding},
  booktitle    = {{KDD} '20: The 26th {ACM} {SIGKDD} Conference on Knowledge Discovery
                  and Data Mining, Virtual Event, CA, USA, August 23-27, 2020},
  pages        = {1192--1200},
  publisher    = {{ACM}},
  year         = {2020},
  url          = {https://doi.org/10.1145/3394486.3403172},
  doi          = {10.1145/3394486.3403172},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/kdd/XuL0HW020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/lrec/LiCHWZL20,
  author       = {Li, Minghao and
                  Cui, Lei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Zhou, Ming and
                  Li, Zhoujun},
  editor       = {Calzolari, Nicoletta and
                  B{\'{e}}chet, Fr{\'{e}}d{\'{e}}ric and
                  Blache, Philippe and
                  Choukri, Khalid and
                  Cieri, Christopher and
                  Declerck, Thierry and
                  Goggi, Sara and
                  Isahara, Hitoshi and
                  Maegaard, Bente and
                  Mariani, Joseph and
                  Mazo, H{\'{e}}l{\`{e}}ne and
                  Moreno, Asunci{\'{o}}n and
                  Odijk, Jan and
                  Piperidis, Stelios},
  title        = {{TableBank}: Table Benchmark for Image-based Table Detection and Recognition},
  booktitle    = {Proceedings of The 12th Language Resources and Evaluation Conference,
                  {LREC} 2020, Marseille, France, May 11-16, 2020},
  pages        = {1918--1925},
  publisher    = {European Language Resources Association},
  year         = {2020},
  url          = {https://aclanthology.org/2020.lrec-1.236/},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/lrec/LiCHWZL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/WangW0B0020,
  author       = {Wang, Wenhui and
                  Wei, Furu and
                  Dong, Li and
                  Bao, Hangbo and
                  Yang, Nan and
                  Zhou, Ming},
  editor       = {Larochelle, Hugo and
                  Ranzato, Marc'Aurelio and
                  Hadsell, Raia and
                  Balcan, Maria{-}Florina and
                  Lin, Hsuan{-}Tien},
  title        = {{MiniLM}: Deep Self-Attention Distillation for Task-Agnostic Compression
                  of Pre-Trained Transformers},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, {NeurIPS} 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/3f5ee243547dee91fbd053c1c4a845aa-Abstract.html},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/WangW0B0020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/ZhouXGM0W20,
  author       = {Zhou, Wangchunshu and
                  Xu, Canwen and
                  Ge, Tao and
                  McAuley, Julian J. and
                  Xu, Ke and
                  Wei, Furu},
  editor       = {Larochelle, Hugo and
                  Ranzato, Marc'Aurelio and
                  Hadsell, Raia and
                  Balcan, Maria{-}Florina and
                  Lin, Hsuan{-}Tien},
  title        = {{BERT} Loses Patience: Fast and Robust Inference with Early Exit},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, {NeurIPS} 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/d4dd111a4fd973394238aca5c05bebe3-Abstract.html},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/ZhouXGM0W20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2001-11383,
  author       = {Guo, Yinuo and
                  Ge, Tao and
                  Wei, Furu},
  title        = {Fact-aware Sentence Split and Rephrase with Permutation Invariant
                  Training},
  journal      = {CoRR},
  volume       = {abs/2001.11383},
  year         = {2020},
  url          = {https://arxiv.org/abs/2001.11383},
  eprinttype   = {arXiv},
  eprint       = {2001.11383},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2001-11383.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2001-11691,
  author       = {Zhou, Wangchunshu and
                  Ge, Tao and
                  Xu, Ke and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {Self-Adversarial Learning with Comparative Discrimination for Text
                  Generation},
  journal      = {CoRR},
  volume       = {abs/2001.11691},
  year         = {2020},
  url          = {https://arxiv.org/abs/2001.11691},
  eprinttype   = {arXiv},
  eprint       = {2001.11691},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2001-11691.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-02649,
  author       = {Duan, Chaoqun and
                  Cui, Lei and
                  Ma, Shuming and
                  Wei, Furu and
                  Zhu, Conghui and
                  Zhao, Tiejun},
  title        = {Multimodal Matching Transformer for Live Commenting},
  journal      = {CoRR},
  volume       = {abs/2002.02649},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.02649},
  eprinttype   = {arXiv},
  eprint       = {2002.02649},
  timestamp    = {Mon, 01 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-02649.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-02925,
  author       = {Xu, Canwen and
                  Zhou, Wangchunshu and
                  Ge, Tao and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {{BERT-of-Theseus}: Compressing {BERT} by Progressive Module Replacing},
  journal      = {CoRR},
  volume       = {abs/2002.02925},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.02925},
  eprinttype   = {arXiv},
  eprint       = {2002.02925},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-02925.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-10957,
  author       = {Wang, Wenhui and
                  Wei, Furu and
                  Dong, Li and
                  Bao, Hangbo and
                  Yang, Nan and
                  Zhou, Ming},
  title        = {{MiniLM}: Deep Self-Attention Distillation for Task-Agnostic Compression
                  of Pre-Trained Transformers},
  journal      = {CoRR},
  volume       = {abs/2002.10957},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.10957},
  eprinttype   = {arXiv},
  eprint       = {2002.10957},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-10957.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-12804,
  author       = {Bao, Hangbo and
                  Dong, Li and
                  Wei, Furu and
                  Wang, Wenhui and
                  Yang, Nan and
                  Liu, Xiaodong and
                  Wang, Yu and
                  Piao, Songhao and
                  Gao, Jianfeng and
                  Zhou, Ming and
                  Hon, Hsiao{-}Wuen},
  title        = {{UniLMv2}: Pseudo-Masked Language Models for Unified Language Model
                  Pre-Training},
  journal      = {CoRR},
  volume       = {abs/2002.12804},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.12804},
  eprinttype   = {arXiv},
  eprint       = {2002.12804},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-12804.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-01853,
  author       = {Zou, Yanyan and
                  Zhang, Xingxing and
                  Lu, Wei and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {{STEP}: Sequence-to-Sequence Transformer Pre-training for Document
                  Summarization},
  journal      = {CoRR},
  volume       = {abs/2004.01853},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.01853},
  eprinttype   = {arXiv},
  eprint       = {2004.01853},
  timestamp    = {Mon, 24 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-01853.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-02592,
  author       = {Zhou, Qingyu and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {Learning to Summarize Passages: Mining Passage-Summary Pairs from
                  {Wikipedia} Revision Histories},
  journal      = {CoRR},
  volume       = {abs/2004.02592},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.02592},
  eprinttype   = {arXiv},
  eprint       = {2004.02592},
  timestamp    = {Wed, 08 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-02592.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-02664,
  author       = {Zhou, Qingyu and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {At Which Level Should We Extract? {An} Empirical Study on Extractive
                  Document Summarization},
  journal      = {CoRR},
  volume       = {abs/2004.02664},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.02664},
  eprinttype   = {arXiv},
  eprint       = {2004.02664},
  timestamp    = {Wed, 08 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-02664.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-06165,
  author       = {Li, Xiujun and
                  Yin, Xi and
                  Li, Chunyuan and
                  Zhang, Pengchuan and
                  Hu, Xiaowei and
                  Zhang, Lei and
                  Wang, Lijuan and
                  Hu, Houdong and
                  Dong, Li and
                  Wei, Furu and
                  Choi, Yejin and
                  Gao, Jianfeng},
  title        = {Oscar: Object-Semantics Aligned Pre-training for Vision-Language Tasks},
  journal      = {CoRR},
  volume       = {abs/2004.06165},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.06165},
  eprinttype   = {arXiv},
  eprint       = {2004.06165},
  timestamp    = {Thu, 11 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-06165.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-11207,
  author       = {Hao, Yaru and
                  Dong, Li and
                  Wei, Furu and
                  Xu, Ke},
  title        = {Self-Attention Attribution: Interpreting Information Interactions
                  Inside Transformer},
  journal      = {CoRR},
  volume       = {abs/2004.11207},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.11207},
  eprinttype   = {arXiv},
  eprint       = {2004.11207},
  timestamp    = {Wed, 29 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-11207.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-13342,
  author       = {Zhou, Wangchunshu and
                  Ge, Tao and
                  Xu, Ke and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {Scheduled {DropHead}: {A} Regularization Method for Transformer Models},
  journal      = {CoRR},
  volume       = {abs/2004.13342},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.13342},
  eprinttype   = {arXiv},
  eprint       = {2004.13342},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-13342.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-02925,
  author       = {Li, Zhongli and
                  Wang, Wenhui and
                  Dong, Li and
                  Wei, Furu and
                  Xu, Ke},
  title        = {Harvesting and Refining Question-Answer Pairs for Unsupervised {QA}},
  journal      = {CoRR},
  volume       = {abs/2005.02925},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.02925},
  eprinttype   = {arXiv},
  eprint       = {2005.02925},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-02925.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-01038,
  author       = {Li, Minghao and
                  Xu, Yiheng and
                  Cui, Lei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Li, Zhoujun and
                  Zhou, Ming},
  title        = {{DocBank}: {A} Benchmark Dataset for Document Layout Analysis},
  journal      = {CoRR},
  volume       = {abs/2006.01038},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.01038},
  eprinttype   = {arXiv},
  eprint       = {2006.01038},
  timestamp    = {Thu, 16 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-01038.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-04152,
  author       = {Zhou, Wangchunshu and
                  Xu, Canwen and
                  Ge, Tao and
                  McAuley, Julian J. and
                  Xu, Ke and
                  Wei, Furu},
  title        = {{BERT} Loses Patience: Fast and Robust Inference with Early Exit},
  journal      = {CoRR},
  volume       = {abs/2006.04152},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.04152},
  eprinttype   = {arXiv},
  eprint       = {2006.04152},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-04152.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-07834,
  author       = {Chi, Zewen and
                  Dong, Li and
                  Wei, Furu and
                  Yang, Nan and
                  Singhal, Saksham and
                  Wang, Wenhui and
                  Song, Xia and
                  Mao, Xian{-}Ling and
                  Huang, Heyan and
                  Zhou, Ming},
  title        = {{InfoXLM}: An Information-Theoretic Framework for Cross-Lingual Language
                  Model Pre-Training},
  journal      = {CoRR},
  volume       = {abs/2007.07834},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.07834},
  eprinttype   = {arXiv},
  eprint       = {2007.07834},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-07834.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2009-11692,
  author       = {Ji, Haozhe and
                  Ke, Pei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Zhu, Xiaoyan and
                  Huang, Minlie},
  title        = {Language Generation with Multi-Hop Reasoning on Commonsense Knowledge
                  Graph},
  journal      = {CoRR},
  volume       = {abs/2009.11692},
  year         = {2020},
  url          = {https://arxiv.org/abs/2009.11692},
  eprinttype   = {arXiv},
  eprint       = {2009.11692},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2009-11692.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2009-11753,
  author       = {Ji, Haozhe and
                  Ke, Pei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Huang, Minlie},
  title        = {Generating Commonsense Explanation by Extracting Bridge Concepts from
                  Reasoning Paths},
  journal      = {CoRR},
  volume       = {abs/2009.11753},
  year         = {2020},
  url          = {https://arxiv.org/abs/2009.11753},
  eprinttype   = {arXiv},
  eprint       = {2009.11753},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2009-11753.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-03260,
  author       = {Chen, Mengyun and
                  Ge, Tao and
                  Zhang, Xingxing and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {Improving the Efficiency of Grammatical Error Correction with Erroneous
                  Span Detection and Correction},
  journal      = {CoRR},
  volume       = {abs/2010.03260},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.03260},
  eprinttype   = {arXiv},
  eprint       = {2010.03260},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-03260.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-08242,
  author       = {Xu, Shusheng and
                  Zhang, Xingxing and
                  Wu, Yi and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {Unsupervised Extractive Summarization by Pre-training Hierarchical
                  Transformers},
  journal      = {CoRR},
  volume       = {abs/2010.08242},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.08242},
  eprinttype   = {arXiv},
  eprint       = {2010.08242},
  timestamp    = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-08242.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2012-14740,
  author       = {Xu, Yang and
                  Xu, Yiheng and
                  Lv, Tengchao and
                  Cui, Lei and
                  Wei, Furu and
                  Wang, Guoxin and
                  Lu, Yijuan and
                  Flor{\^{e}}ncio, Dinei A. F. and
                  Zhang, Cha and
                  Che, Wanxiang and
                  Zhang, Min and
                  Zhou, Lidong},
  title        = {{LayoutLMv2}: Multi-modal Pre-training for Visually-Rich Document Understanding},
  journal      = {CoRR},
  volume       = {abs/2012.14740},
  year         = {2020},
  url          = {https://arxiv.org/abs/2012.14740},
  eprinttype   = {arXiv},
  eprint       = {2012.14740},
  timestamp    = {Wed, 31 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2012-14740.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2012-15547,
  author       = {Ma, Shuming and
                  Yang, Jian and
                  Huang, Haoyang and
                  Chi, Zewen and
                  Dong, Li and
                  Zhang, Dongdong and
                  Awadalla, Hany Hassan and
                  Muzio, Alexandre and
                  Eriguchi, Akiko and
                  Singhal, Saksham and
                  Song, Xia and
                  Menezes, Arul and
                  Wei, Furu},
  title        = {{XLM-T}: Scaling up Multilingual Machine Translation with Pretrained
                  Cross-lingual Transformer Encoders},
  journal      = {CoRR},
  volume       = {abs/2012.15547},
  year         = {2020},
  url          = {https://arxiv.org/abs/2012.15547},
  eprinttype   = {arXiv},
  eprint       = {2012.15547},
  timestamp    = {Wed, 07 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2012-15547.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2012-15828,
  author       = {Wang, Wenhui and
                  Bao, Hangbo and
                  Huang, Shaohan and
                  Dong, Li and
                  Wei, Furu},
  title        = {{MiniLMv2}: Multi-Head Self-Attention Relation Distillation for Compressing
                  Pretrained Transformers},
  journal      = {CoRR},
  volume       = {abs/2012.15828},
  year         = {2020},
  url          = {https://arxiv.org/abs/2012.15828},
  eprinttype   = {arXiv},
  eprint       = {2012.15828},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2012-15828.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/HuWPHYL19,
  author       = {Hu, Minghao and
                  Wei, Furu and
                  Peng, Yuxing and
                  Huang, Zhen and
                  Yang, Nan and
                  Li, Dongsheng},
  title        = {Read + Verify: Machine Reading Comprehension with Unanswerable Questions},
  booktitle    = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2019, The Thirty-First Innovative Applications of Artificial Intelligence
                  Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational
                  Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii,
                  USA, January 27 - February 1, 2019},
  pages        = {6529--6537},
  publisher    = {{AAAI} Press},
  year         = {2019},
  url          = {https://doi.org/10.1609/aaai.v33i01.33016529},
  doi          = {10.1609/AAAI.V33I01.33016529},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/HuWPHYL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/Huang0WL19,
  author       = {Huang, Shaohan and
                  Wu, Yu and
                  Wei, Furu and
                  Luan, Zhongzhi},
  title        = {Dictionary-Guided Editing Networks for Paraphrase Generation},
  booktitle    = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2019, The Thirty-First Innovative Applications of Artificial Intelligence
                  Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational
                  Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii,
                  USA, January 27 - February 1, 2019},
  pages        = {6546--6553},
  publisher    = {{AAAI} Press},
  year         = {2019},
  url          = {https://doi.org/10.1609/aaai.v33i01.33016546},
  doi          = {10.1609/AAAI.V33I01.33016546},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/Huang0WL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/MaCDW019,
  author       = {Ma, Shuming and
                  Cui, Lei and
                  Dai, Damai and
                  Wei, Furu and
                  Sun, Xu},
  title        = {{LiveBot}: Generating Live Video Comments Based on Visual and Textual
                  Contexts},
  booktitle    = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2019, The Thirty-First Innovative Applications of Artificial Intelligence
                  Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational
                  Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii,
                  USA, January 27 - February 1, 2019},
  pages        = {6810--6817},
  publisher    = {{AAAI} Press},
  year         = {2019},
  url          = {https://doi.org/10.1609/aaai.v33i01.33016810},
  doi          = {10.1609/AAAI.V33I01.33016810},
  timestamp    = {Tue, 02 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aaai/MaCDW019.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/0006WHWL019,
  author       = {Wu, Yu and
                  Wei, Furu and
                  Huang, Shaohan and
                  Wang, Yunli and
                  Li, Zhoujun and
                  Zhou, Ming},
  title        = {Response Generation by Context-Aware Prototype Editing},
  booktitle    = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2019, The Thirty-First Innovative Applications of Artificial Intelligence
                  Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational
                  Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii,
                  USA, January 27 - February 1, 2019},
  pages        = {7281--7288},
  publisher    = {{AAAI} Press},
  year         = {2019},
  url          = {https://doi.org/10.1609/aaai.v33i01.33017281},
  doi          = {10.1609/AAAI.V33I01.33017281},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aaai/0006WHWL019.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ZhouGXWZ19,
  author       = {Zhou, Wangchunshu and
                  Ge, Tao and
                  Xu, Ke and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Korhonen, Anna and
                  Traum, David R. and
                  M{\`{a}}rquez, Llu{\'{\i}}s},
  title        = {{BERT}-based Lexical Substitution},
  booktitle    = {Proceedings of the 57th Conference of the Association for Computational
                  Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019,
                  Volume 1: Long Papers},
  pages        = {3368--3373},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/p19-1328},
  doi          = {10.18653/V1/P19-1328},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/ZhouGXWZ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ZhuCZWL19,
  author       = {Zhu, Qingfu and
                  Cui, Lei and
                  Zhang, Weinan and
                  Wei, Furu and
                  Liu, Ting},
  editor       = {Korhonen, Anna and
                  Traum, David R. and
                  M{\`{a}}rquez, Llu{\'{\i}}s},
  title        = {Retrieval-Enhanced Adversarial Training for Neural Response Generation},
  booktitle    = {Proceedings of the 57th Conference of the Association for Computational
                  Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019,
                  Volume 1: Long Papers},
  pages        = {3763--3773},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/p19-1366},
  doi          = {10.18653/V1/P19-1366},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ZhuCZWL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ZhuDWWQL19,
  author       = {Zhu, Haichao and
                  Dong, Li and
                  Wei, Furu and
                  Wang, Wenhui and
                  Qin, Bing and
                  Liu, Ting},
  editor       = {Korhonen, Anna and
                  Traum, David R. and
                  M{\`{a}}rquez, Llu{\'{\i}}s},
  title        = {Learning to Ask Unanswerable Questions for Machine Reading Comprehension},
  booktitle    = {Proceedings of the 57th Conference of the Association for Computational
                  Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019,
                  Volume 1: Long Papers},
  pages        = {4238--4248},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/p19-1415},
  doi          = {10.18653/V1/P19-1415},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ZhuDWWQL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ZhangWZ19,
  author       = {Zhang, Xingxing and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Korhonen, Anna and
                  Traum, David R. and
                  M{\`{a}}rquez, Llu{\'{\i}}s},
  title        = {{HIBERT}: Document Level Pre-training of Hierarchical Bidirectional
                  Transformers for Document Summarization},
  booktitle    = {Proceedings of the 57th Conference of the Association for Computational
                  Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019,
                  Volume 1: Long Papers},
  pages        = {5059--5069},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/p19-1499},
  doi          = {10.18653/V1/P19-1499},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ZhangWZ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/GeZWZ19,
  author       = {Ge, Tao and
                  Zhang, Xingxing and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Korhonen, Anna and
                  Traum, David R. and
                  M{\`{a}}rquez, Llu{\'{\i}}s},
  title        = {Automatic Grammatical Error Correction for Sequence-to-sequence Text
                  Generation: An Empirical Study},
  booktitle    = {Proceedings of the 57th Conference of the Association for Computational
                  Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019,
                  Volume 1: Long Papers},
  pages        = {6059--6064},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/p19-1609},
  doi          = {10.18653/V1/P19-1609},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/GeZWZ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl-mrqa/BaoDWWYCPZ19,
  author       = {Bao, Hangbo and
                  Dong, Li and
                  Wei, Furu and
                  Wang, Wenhui and
                  Yang, Nan and
                  Cui, Lei and
                  Piao, Songhao and
                  Zhou, Ming},
  editor       = {Fisch, Adam and
                  Talmor, Alon and
                  Jia, Robin and
                  Seo, Minjoon and
                  Choi, Eunsol and
                  Chen, Danqi},
  title        = {Inspecting Unification of Encoding and Matching with Transformer:
                  {A} Case Study of Machine Reading Comprehension},
  booktitle    = {Proceedings of the 2nd Workshop on Machine Reading for Question Answering,
                  MRQA@EMNLP 2019, Hong Kong, China, November 4, 2019},
  pages        = {14--18},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/D19-5802},
  doi          = {10.18653/V1/D19-5802},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl-mrqa/BaoDWWYCPZ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/JinZGXWZ19,
  author       = {Jin, Weike and
                  Zhao, Zhou and
                  Gu, Mao and
                  Xiao, Jun and
                  Wei, Furu and
                  Zhuang, Yueting},
  editor       = {Inui, Kentaro and
                  Jiang, Jing and
                  Ng, Vincent and
                  Wan, Xiaojun},
  title        = {Video Dialog via Progressive Inference and Cross-Transformer},
  booktitle    = {Proceedings of the 2019 Conference on Empirical Methods in Natural
                  Language Processing and the 9th International Joint Conference on
                  Natural Language Processing, {EMNLP-IJCNLP} 2019, Hong Kong, China,
                  November 3-7, 2019},
  pages        = {2109--2118},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/D19-1217},
  doi          = {10.18653/V1/D19-1217},
  timestamp    = {Thu, 07 Apr 2022 09:14:07 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/JinZGXWZ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/HaoDWX19,
  author       = {Hao, Yaru and
                  Dong, Li and
                  Wei, Furu and
                  Xu, Ke},
  editor       = {Inui, Kentaro and
                  Jiang, Jing and
                  Ng, Vincent and
                  Wan, Xiaojun},
  title        = {Visualizing and Understanding the Effectiveness of {BERT}},
  booktitle    = {Proceedings of the 2019 Conference on Empirical Methods in Natural
                  Language Processing and the 9th International Joint Conference on
                  Natural Language Processing, {EMNLP-IJCNLP} 2019, Hong Kong, China,
                  November 3-7, 2019},
  pages        = {4141--4150},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/D19-1424},
  doi          = {10.18653/V1/D19-1424},
  timestamp    = {Thu, 12 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/HaoDWX19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/00040WWLWGZH19,
  author       = {Dong, Li and
                  Yang, Nan and
                  Wang, Wenhui and
                  Wei, Furu and
                  Liu, Xiaodong and
                  Wang, Yu and
                  Gao, Jianfeng and
                  Zhou, Ming and
                  Hon, Hsiao{-}Wuen},
  editor       = {Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Beygelzimer, Alina and
                  d'Alch{\'{e}}{-}Buc, Florence and
                  Fox, Emily B. and
                  Garnett, Roman},
  title        = {Unified Language Model Pre-training for Natural Language Understanding
                  and Generation},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, NeurIPS 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {13042--13054},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/c20bb2d9a50d5ac1f713f8b34d9aac5a-Abstract.html},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/00040WWLWGZH19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nlpcc/LiZWW019,
  author       = {Li, Weikang and
                  Zhang, Xingxing and
                  Wu, Yunfang and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Tang, Jie and
                  Kan, Min{-}Yen and
                  Zhao, Dongyan and
                  Li, Sujian and
                  Zan, Hongying},
  title        = {Document-Based Question Answering Improves Query-Focused Multi-document
                  Summarization},
  booktitle    = {Natural Language Processing and Chinese Computing - 8th {CCF} International
                  Conference, {NLPCC} 2019, Dunhuang, China, October 9-14, 2019, Proceedings,
                  Part {II}},
  series       = {Lecture Notes in Computer Science},
  volume       = {11839},
  pages        = {41--52},
  publisher    = {Springer},
  year         = {2019},
  url          = {https://doi.org/10.1007/978-3-030-32236-6\_4},
  doi          = {10.1007/978-3-030-32236-6\_4},
  timestamp    = {Tue, 01 Oct 2019 13:44:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nlpcc/LiZWW019.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nlpcc/BaoHWC0TPZ19,
  author       = {Bao, Hangbo and
                  Huang, Shaohan and
                  Wei, Furu and
                  Cui, Lei and
                  Wu, Yu and
                  Tan, Chuanqi and
                  Piao, Songhao and
                  Zhou, Ming},
  editor       = {Tang, Jie and
                  Kan, Min{-}Yen and
                  Zhao, Dongyan and
                  Li, Sujian and
                  Zan, Hongying},
  title        = {Neural Melody Composition from Lyrics},
  booktitle    = {Natural Language Processing and Chinese Computing - 8th {CCF}
                  International Conference, {NLPCC} 2019, Dunhuang, China,
                  October 9-14, 2019, Proceedings, Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {11838},
  pages        = {499--511},
  publisher    = {Springer},
  year         = {2019},
  url          = {https://doi.org/10.1007/978-3-030-32233-5\_39},
  doi          = {10.1007/978-3-030-32233-5\_39},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nlpcc/BaoHWC0TPZ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. TableBank is brace-protected in the title so that
% sentence-casing styles keep its camel case.
@article{DBLP:journals/corr/abs-1903-01949,
  author       = {Li, Minghao and
                  Cui, Lei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Zhou, Ming and
                  Li, Zhoujun},
  title        = {{TableBank}: Table Benchmark for Image-based Table Detection and
                  Recognition},
  journal      = {CoRR},
  volume       = {abs/1903.01949},
  year         = {2019},
  url          = {http://arxiv.org/abs/1903.01949},
  eprinttype   = {arXiv},
  eprint       = {1903.01949},
  timestamp    = {Thu, 16 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-01949.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1903-06353,
  author       = {Xu, Ruochen and
                  Ge, Tao and
                  Wei, Furu},
  title        = {Formality Style Transfer with Hybrid Textual Annotations},
  journal      = {CoRR},
  volume       = {abs/1903.06353},
  year         = {2019},
  url          = {http://arxiv.org/abs/1903.06353},
  eprinttype   = {arXiv},
  eprint       = {1903.06353},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-06353.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-03197,
  author       = {Dong, Li and
                  Yang, Nan and
                  Wang, Wenhui and
                  Wei, Furu and
                  Liu, Xiaodong and
                  Wang, Yu and
                  Gao, Jianfeng and
                  Zhou, Ming and
                  Hon, Hsiao{-}Wuen},
  title        = {Unified Language Model Pre-training for Natural Language
                  Understanding and Generation},
  journal      = {CoRR},
  volume       = {abs/1905.03197},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.03197},
  eprinttype   = {arXiv},
  eprint       = {1905.03197},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-03197.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-06566,
  author       = {Zhang, Xingxing and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {{HIBERT:} Document Level Pre-training of Hierarchical
                  Bidirectional Transformers for Document Summarization},
  journal      = {CoRR},
  volume       = {abs/1905.06566},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.06566},
  eprinttype   = {arXiv},
  eprint       = {1905.06566},
  timestamp    = {Wed, 19 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-06566.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-06045,
  author       = {Zhu, Haichao and
                  Dong, Li and
                  Wei, Furu and
                  Wang, Wenhui and
                  Qin, Bing and
                  Liu, Ting},
  title        = {Learning to Ask Unanswerable Questions for Machine Reading
                  Comprehension},
  journal      = {CoRR},
  volume       = {abs/1906.06045},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.06045},
  eprinttype   = {arXiv},
  eprint       = {1906.06045},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-06045.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1908-05620,
  author       = {Hao, Yaru and
                  Dong, Li and
                  Wei, Furu and
                  Xu, Ke},
  title        = {Visualizing and Understanding the Effectiveness of {BERT}},
  journal      = {CoRR},
  volume       = {abs/1908.05620},
  year         = {2019},
  url          = {http://arxiv.org/abs/1908.05620},
  eprinttype   = {arXiv},
  eprint       = {1908.05620},
  timestamp    = {Mon, 19 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1908-05620.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1908-08530,
  author       = {Su, Weijie and
                  Zhu, Xizhou and
                  Cao, Yue and
                  Li, Bin and
                  Lu, Lewei and
                  Wei, Furu and
                  Dai, Jifeng},
  title        = {{VL-BERT:} Pre-training of Generic Visual-Linguistic
                  Representations},
  journal      = {CoRR},
  volume       = {abs/1908.08530},
  year         = {2019},
  url          = {http://arxiv.org/abs/1908.08530},
  eprinttype   = {arXiv},
  eprint       = {1908.08530},
  timestamp    = {Tue, 12 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1908-08530.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-06002,
  author       = {Zhang, Yi and
                  Ge, Tao and
                  Wei, Furu and
                  Zhou, Ming and
                  Sun, Xu},
  title        = {Sequence-to-sequence Pre-training with Data Augmentation for
                  Sentence Rewriting},
  journal      = {CoRR},
  volume       = {abs/1909.06002},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.06002},
  eprinttype   = {arXiv},
  eprint       = {1909.06002},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-06002.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-10481,
  author       = {Chi, Zewen and
                  Dong, Li and
                  Wei, Furu and
                  Wang, Wenhui and
                  Mao, Xianling and
                  Huang, Heyan},
  title        = {Cross-Lingual Natural Language Generation via Pre-Training},
  journal      = {CoRR},
  volume       = {abs/1909.10481},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.10481},
  eprinttype   = {arXiv},
  eprint       = {1909.10481},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-10481.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1911-02825,
  author       = {Zhou, Wangchunshu and
                  Ge, Tao and
                  Mu, Chang and
                  Xu, Ke and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {Improving Grammatical Error Correction with Machine Translation
                  Pairs},
  journal      = {CoRR},
  volume       = {abs/1911.02825},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.02825},
  eprinttype   = {arXiv},
  eprint       = {1911.02825},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-02825.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The proper noun Wikipedia is brace-protected in the title
% so that sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-1911-03324,
  author       = {Zhu, Haichao and
                  Dong, Li and
                  Wei, Furu and
                  Qin, Bing and
                  Liu, Ting},
  title        = {Transforming {Wikipedia} into Augmented Data for Query-Focused
                  Summarization},
  journal      = {CoRR},
  volume       = {abs/1911.03324},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.03324},
  eprinttype   = {arXiv},
  eprint       = {1911.03324},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-03324.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1911-03913,
  author       = {Chi, Zewen and
                  Dong, Li and
                  Wei, Furu and
                  Mao, Xianling and
                  Huang, Heyan},
  title        = {Can Monolingual Pretrained Models Help Cross-Lingual
                  Classification?},
  journal      = {CoRR},
  volume       = {abs/1911.03913},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.03913},
  eprinttype   = {arXiv},
  eprint       = {1911.03913},
  timestamp    = {Sun, 01 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-03913.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. LayoutLM is brace-protected in the title so that
% sentence-casing styles keep its camel case.
@article{DBLP:journals/corr/abs-1912-13318,
  author       = {Xu, Yiheng and
                  Li, Minghao and
                  Cui, Lei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {{LayoutLM}: Pre-training of Text and Layout for Document Image
                  Understanding},
  journal      = {CoRR},
  volume       = {abs/1912.13318},
  year         = {2019},
  url          = {http://arxiv.org/abs/1912.13318},
  eprinttype   = {arXiv},
  eprint       = {1912.13318},
  timestamp    = {Mon, 01 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1912-13318.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/TanWZYDLZ18,
  author       = {Tan, Chuanqi and
                  Wei, Furu and
                  Zhou, Qingyu and
                  Yang, Nan and
                  Du, Bowen and
                  Lv, Weifeng and
                  Zhou, Ming},
  title        = {Context-Aware Answer Sentence Selection With Hierarchical Gated
                  Recurrent Neural Networks},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {26},
  number       = {3},
  pages        = {540--549},
  year         = {2018},
  url          = {https://doi.org/10.1109/TASLP.2017.2785283},
  doi          = {10.1109/TASLP.2017.2785283},
  timestamp    = {Tue, 15 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/TanWZYDLZ18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tois/RenCRWNMR18,
  author       = {Ren, Pengjie and
                  Chen, Zhumin and
                  Ren, Zhaochun and
                  Wei, Furu and
                  Nie, Liqiang and
                  Ma, Jun and
                  de Rijke, Maarten},
  title        = {Sentence Relations for Extractive Summarization with Deep Neural
                  Networks},
  journal      = {{ACM} Trans. Inf. Syst.},
  volume       = {36},
  number       = {4},
  pages        = {39:1--39:32},
  year         = {2018},
  url          = {https://doi.org/10.1145/3200864},
  doi          = {10.1145/3200864},
  timestamp    = {Thu, 23 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tois/RenCRWNMR18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI-18 paper. In booktitle, Innovative is capitalised because it is part
% of the IAAI conference name.
@inproceedings{DBLP:conf/aaai/CaoWLL18,
  author       = {Cao, Ziqiang and
                  Wei, Furu and
                  Li, Wenjie and
                  Li, Sujian},
  editor       = {McIlraith, Sheila A. and
                  Weinberger, Kilian Q.},
  title        = {Faithful to the Original: Fact Aware Neural Abstractive Summarization},
  booktitle    = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence,
                  (AAAI-18), the 30th Innovative Applications of Artificial Intelligence
                  (IAAI-18), and the 8th {AAAI} Symposium on Educational Advances in
                  Artificial Intelligence (EAAI-18), New Orleans, Louisiana, USA, February
                  2-7, 2018},
  pages        = {4784--4791},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://doi.org/10.1609/aaai.v32i1.11912},
  doi          = {10.1609/AAAI.V32I1.11912},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/CaoWLL18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI-18 paper. In booktitle, Innovative is capitalised because it is part
% of the IAAI conference name.
@inproceedings{DBLP:conf/aaai/ZhouYWZ18,
  author       = {Zhou, Qingyu and
                  Yang, Nan and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {McIlraith, Sheila A. and
                  Weinberger, Kilian Q.},
  title        = {Sequential Copying Networks},
  booktitle    = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence,
                  (AAAI-18), the 30th Innovative Applications of Artificial Intelligence
                  (IAAI-18), and the 8th {AAAI} Symposium on Educational Advances in
                  Artificial Intelligence (EAAI-18), New Orleans, Louisiana, USA, February
                  2-7, 2018},
  pages        = {4987--4995},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://doi.org/10.1609/aaai.v32i1.11915},
  doi          = {10.1609/AAAI.V32I1.11915},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/ZhouYWZ18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI-18 paper. S-Net is brace-protected in the title so sentence-casing
% styles keep the capital N; in booktitle, Innovative is capitalised because
% it is part of the IAAI conference name.
@inproceedings{DBLP:conf/aaai/TanWYDLZ18,
  author       = {Tan, Chuanqi and
                  Wei, Furu and
                  Yang, Nan and
                  Du, Bowen and
                  Lv, Weifeng and
                  Zhou, Ming},
  editor       = {McIlraith, Sheila A. and
                  Weinberger, Kilian Q.},
  title        = {{S-Net}: From Answer Extraction to Answer Synthesis for Machine Reading
                  Comprehension},
  booktitle    = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence,
                  (AAAI-18), the 30th Innovative Applications of Artificial Intelligence
                  (IAAI-18), and the 8th {AAAI} Symposium on Educational Advances in
                  Artificial Intelligence (EAAI-18), New Orleans, Louisiana, USA, February
                  2-7, 2018},
  pages        = {5940--5947},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://doi.org/10.1609/aaai.v32i1.12035},
  doi          = {10.1609/AAAI.V32I1.12035},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/TanWYDLZ18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI-18 paper. In booktitle, Innovative is capitalised because it is part
% of the IAAI conference name.
@inproceedings{DBLP:conf/aaai/ZhuWQL18,
  author       = {Zhu, Haichao and
                  Wei, Furu and
                  Qin, Bing and
                  Liu, Ting},
  editor       = {McIlraith, Sheila A. and
                  Weinberger, Kilian Q.},
  title        = {Hierarchical Attention Flow for Multiple-Choice Reading Comprehension},
  booktitle    = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence,
                  (AAAI-18), the 30th Innovative Applications of Artificial Intelligence
                  (IAAI-18), and the 8th {AAAI} Symposium on Educational Advances in
                  Artificial Intelligence (EAAI-18), New Orleans, Louisiana, USA, February
                  2-7, 2018},
  pages        = {6077--6085},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://doi.org/10.1609/aaai.v32i1.12040},
  doi          = {10.1609/AAAI.V32I1.12040},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/ZhuWQL18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/LiWLC18,
  author       = {Cao, Ziqiang and
                  Li, Wenjie and
                  Li, Sujian and
                  Wei, Furu},
  editor       = {Gurevych, Iryna and
                  Miyao, Yusuke},
  title        = {Retrieve, Rerank and Rewrite: Soft Template Based Neural Summarization},
  booktitle    = {Proceedings of the 56th Annual Meeting of the Association for
                  Computational Linguistics, {ACL} 2018, Melbourne, Australia,
                  July 15-20, 2018, Volume 1: Long Papers},
  pages        = {152--161},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://aclanthology.org/P18-1015/},
  doi          = {10.18653/V1/P18-1015},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LiWLC18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/CuiWZ18,
  author       = {Cui, Lei and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Gurevych, Iryna and
                  Miyao, Yusuke},
  title        = {Neural Open Information Extraction},
  booktitle    = {Proceedings of the 56th Annual Meeting of the Association for
                  Computational Linguistics, {ACL} 2018, Melbourne, Australia,
                  July 15-20, 2018, Volume 2: Short Papers},
  pages        = {407--413},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://aclanthology.org/P18-2065/},
  doi          = {10.18653/V1/P18-2065},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/CuiWZ18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ZhaoZWYHZ18,
  author       = {Zhou, Qingyu and
                  Yang, Nan and
                  Wei, Furu and
                  Huang, Shaohan and
                  Zhou, Ming and
                  Zhao, Tiejun},
  editor       = {Gurevych, Iryna and
                  Miyao, Yusuke},
  title        = {Neural Document Summarization by Jointly Learning to Score and
                  Select Sentences},
  booktitle    = {Proceedings of the 56th Annual Meeting of the Association for
                  Computational Linguistics, {ACL} 2018, Melbourne, Australia,
                  July 15-20, 2018, Volume 1: Long Papers},
  pages        = {654--663},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://aclanthology.org/P18-1061/},
  doi          = {10.18653/V1/P18-1061},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ZhaoZWYHZ18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ZhouWG18,
  author       = {Ge, Tao and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Gurevych, Iryna and
                  Miyao, Yusuke},
  title        = {Fluency Boost Learning and Inference for Neural Grammatical
                  Error Correction},
  booktitle    = {Proceedings of the 56th Annual Meeting of the Association for
                  Computational Linguistics, {ACL} 2018, Melbourne, Australia,
                  July 15-20, 2018, Volume 1: Long Papers},
  pages        = {1055--1065},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://aclanthology.org/P18-1097/},
  doi          = {10.18653/V1/P18-1097},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/ZhouWG18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ZhangLWZ18,
  author       = {Zhang, Xingxing and
                  Lapata, Mirella and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Riloff, Ellen and
                  Chiang, David and
                  Hockenmaier, Julia and
                  Tsujii, Jun'ichi},
  title        = {Neural Latent Extractive Document Summarization},
  booktitle    = {Proceedings of the 2018 Conference on Empirical Methods in
                  Natural Language Processing, Brussels, Belgium,
                  October 31 - November 4, 2018},
  pages        = {779--784},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://doi.org/10.18653/v1/d18-1088},
  doi          = {10.18653/V1/D18-1088},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/ZhangLWZ18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/HuPWHLYZ18,
  author       = {Hu, Minghao and
                  Peng, Yuxing and
                  Wei, Furu and
                  Huang, Zhen and
                  Li, Dongsheng and
                  Yang, Nan and
                  Zhou, Ming},
  editor       = {Riloff, Ellen and
                  Chiang, David and
                  Hockenmaier, Julia and
                  Tsujii, Jun'ichi},
  title        = {Attention-Guided Answer Distillation for Machine Reading Comprehension},
  booktitle    = {Proceedings of the 2018 Conference on Empirical Methods in
                  Natural Language Processing, Brussels, Belgium,
                  October 31 - November 4, 2018},
  pages        = {2077--2086},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://doi.org/10.18653/v1/d18-1232},
  doi          = {10.18653/V1/D18-1232},
  timestamp    = {Mon, 06 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/HuPWHLYZ18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/GeDJCCSWZ18,
  author       = {Ge, Tao and
                  Dou, Qing and
                  Ji, Heng and
                  Cui, Lei and
                  Chang, Baobao and
                  Sui, Zhifang and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Riloff, Ellen and
                  Chiang, David and
                  Hockenmaier, Julia and
                  Tsujii, Jun'ichi},
  title        = {Fine-grained Coordinated Cross-lingual Text Stream Alignment for
                  Endless Language Knowledge Acquisition},
  booktitle    = {Proceedings of the 2018 Conference on Empirical Methods in
                  Natural Language Processing, Brussels, Belgium,
                  October 31 - November 4, 2018},
  pages        = {2496--2506},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://doi.org/10.18653/v1/d18-1271},
  doi          = {10.18653/V1/D18-1271},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/GeDJCCSWZ18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/DuanCCWZZ18,
  author       = {Duan, Chaoqun and
                  Cui, Lei and
                  Chen, Xinchi and
                  Wei, Furu and
                  Zhu, Conghui and
                  Zhao, Tiejun},
  editor       = {Lang, J{\'{e}}r{\^{o}}me},
  title        = {Attention-Fused Deep Matching Network for Natural Language Inference},
  booktitle    = {Proceedings of the Twenty-Seventh International Joint Conference
                  on Artificial Intelligence, {IJCAI} 2018, July 13-19, 2018,
                  Stockholm, Sweden},
  pages        = {4033--4040},
  publisher    = {ijcai.org},
  year         = {2018},
  url          = {https://doi.org/10.24963/ijcai.2018/561},
  doi          = {10.24963/IJCAI.2018/561},
  timestamp    = {Mon, 01 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/DuanCCWZZ18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/HuPHQW018,
  author       = {Hu, Minghao and
                  Peng, Yuxing and
                  Huang, Zhen and
                  Qiu, Xipeng and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Lang, J{\'{e}}r{\^{o}}me},
  title        = {Reinforced Mnemonic Reader for Machine Reading Comprehension},
  booktitle    = {Proceedings of the Twenty-Seventh International Joint Conference
                  on Artificial Intelligence, {IJCAI} 2018, July 13-19, 2018,
                  Stockholm, Sweden},
  pages        = {4099--4106},
  publisher    = {ijcai.org},
  year         = {2018},
  url          = {https://doi.org/10.24963/ijcai.2018/570},
  doi          = {10.24963/IJCAI.2018/570},
  timestamp    = {Mon, 06 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ijcai/HuPHQW018.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/TanWWLZ18,
  author       = {Tan, Chuanqi and
                  Wei, Furu and
                  Wang, Wenhui and
                  Lv, Weifeng and
                  Zhou, Ming},
  editor       = {Lang, J{\'{e}}r{\^{o}}me},
  title        = {Multiway Attention Networks for Modeling Sentence Pairs},
  booktitle    = {Proceedings of the Twenty-Seventh International Joint Conference
                  on Artificial Intelligence, {IJCAI} 2018, July 13-19, 2018,
                  Stockholm, Sweden},
  pages        = {4411--4417},
  publisher    = {ijcai.org},
  year         = {2018},
  url          = {https://doi.org/10.24963/ijcai.2018/613},
  doi          = {10.24963/IJCAI.2018/613},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/TanWWLZ18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% KDD 2018 paper. The system name XiaoIce Band is brace-protected in the
% title so that sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/kdd/ZhuLYQLZZWXC18,
  author       = {Zhu, Hongyuan and
                  Liu, Qi and
                  Yuan, Nicholas Jing and
                  Qin, Chuan and
                  Li, Jiawei and
                  Zhang, Kun and
                  Zhou, Guang and
                  Wei, Furu and
                  Xu, Yuanchun and
                  Chen, Enhong},
  editor       = {Guo, Yike and
                  Farooq, Faisal},
  title        = {{XiaoIce Band}: {A} Melody and Arrangement Generation Framework for
                  Pop Music},
  booktitle    = {Proceedings of the 24th {ACM} {SIGKDD} International Conference on
                  Knowledge Discovery {\&} Data Mining, {KDD} 2018, London, UK,
                  August 19-23, 2018},
  pages        = {2837--2846},
  publisher    = {{ACM}},
  year         = {2018},
  url          = {https://doi.org/10.1145/3219819.3220105},
  doi          = {10.1145/3219819.3220105},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/kdd/ZhuLYQLZZWXC18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% LREC 2018 paper; the record carries no pages or doi, only a summary URL.
% EventWiki is brace-protected in the title so that sentence-casing styles
% keep its camel case.
@inproceedings{DBLP:conf/lrec/GeCCSW018,
  author       = {Ge, Tao and
                  Cui, Lei and
                  Chang, Baobao and
                  Sui, Zhifang and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Calzolari, Nicoletta and
                  Choukri, Khalid and
                  Cieri, Christopher and
                  Declerck, Thierry and
                  Goggi, Sara and
                  Hasida, K{\^{o}}iti and
                  Isahara, Hitoshi and
                  Maegaard, Bente and
                  Mariani, Joseph and
                  Mazo, H{\'{e}}l{\`{e}}ne and
                  Moreno, Asunci{\'{o}}n and
                  Odijk, Jan and
                  Piperidis, Stelios and
                  Tokunaga, Takenobu},
  title        = {{EventWiki}: {A} Knowledge Base of Major Events},
  booktitle    = {Proceedings of the Eleventh International Conference on Language Resources
                  and Evaluation, {LREC} 2018, Miyazaki, Japan, May 7-12, 2018},
  publisher    = {European Language Resources Association {(ELRA)}},
  year         = {2018},
  url          = {http://www.lrec-conf.org/proceedings/lrec2018/summaries/213.html},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/lrec/GeCCSW018.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nlpcc/TanWZYLZ18,
  author       = {Tan, Chuanqi and
                  Wei, Furu and
                  Zhou, Qingyu and
                  Yang, Nan and
                  Lv, Weifeng and
                  Zhou, Ming},
  editor       = {Zhang, Min and
                  Ng, Vincent and
                  Zhao, Dongyan and
                  Li, Sujian and
                  Zan, Hongying},
  title        = {I Know There Is No Answer: Modeling Answer Validation for
                  Machine Reading Comprehension},
  booktitle    = {Natural Language Processing and Chinese Computing - 7th {CCF}
                  International Conference, {NLPCC} 2018, Hohhot, China,
                  August 26-30, 2018, Proceedings, Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {11108},
  pages        = {85--97},
  publisher    = {Springer},
  year         = {2018},
  url          = {https://doi.org/10.1007/978-3-319-99495-6\_8},
  doi          = {10.1007/978-3-319-99495-6\_8},
  timestamp    = {Thu, 07 Apr 2022 09:14:07 +0200},
  biburl       = {https://dblp.org/rec/conf/nlpcc/TanWZYLZ18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NLPCC 2018 paper. The dataset name SeRI is brace-protected in the title so
% that sentence-casing styles keep its mixed capitalisation.
@inproceedings{DBLP:conf/nlpcc/GeCCSW018,
  author       = {Ge, Tao and
                  Cui, Lei and
                  Chang, Baobao and
                  Sui, Zhifang and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Zhang, Min and
                  Ng, Vincent and
                  Zhao, Dongyan and
                  Li, Sujian and
                  Zan, Hongying},
  title        = {{SeRI}: {A} Dataset for Sub-event Relation Inference from an Encyclopedia},
  booktitle    = {Natural Language Processing and Chinese Computing - 7th {CCF} International
                  Conference, {NLPCC} 2018, Hohhot, China, August 26-30, 2018, Proceedings,
                  Part {II}},
  series       = {Lecture Notes in Computer Science},
  volume       = {11109},
  pages        = {268--277},
  publisher    = {Springer},
  year         = {2018},
  url          = {https://doi.org/10.1007/978-3-319-99501-4\_23},
  doi          = {10.1007/978-3-319-99501-4\_23},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nlpcc/GeCCSW018.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1805-03900,
  author       = {Wei, Furu},
  title        = {Improv Chat: Second Response Generation for Chatbot},
  journal      = {CoRR},
  volume       = {abs/1805.03900},
  year         = {2018},
  url          = {http://arxiv.org/abs/1805.03900},
  eprinttype   = {arXiv},
  eprint       = {1805.03900},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1805-03900.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1805-04270,
  author       = {Cui, Lei and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {Neural Open Information Extraction},
  journal      = {CoRR},
  volume       = {abs/1805.04270},
  year         = {2018},
  url          = {http://arxiv.org/abs/1805.04270},
  eprinttype   = {arXiv},
  eprint       = {1805.04270},
  timestamp    = {Mon, 01 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1805-04270.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-07042,
  author       = {Wu, Yu and
                  Wei, Furu and
                  Huang, Shaohan and
                  Li, Zhoujun and
                  Zhou, Ming},
  title        = {Response Generation by Context-aware Prototype Editing},
  journal      = {CoRR},
  volume       = {abs/1806.07042},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.07042},
  eprinttype   = {arXiv},
  eprint       = {1806.07042},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-07042.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-08077,
  author       = {Huang, Shaohan and
                  Wu, Yu and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {Dictionary-Guided Editing Networks for Paraphrase Generation},
  journal      = {CoRR},
  volume       = {abs/1806.08077},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.08077},
  eprinttype   = {arXiv},
  eprint       = {1806.08077},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-08077.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1807-01270,
  author       = {Ge, Tao and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {Reaching Human-level Performance in Automatic Grammatical Error Correction: An Empirical Study},
  journal      = {CoRR},
  volume       = {abs/1807.01270},
  year         = {2018},
  url          = {http://arxiv.org/abs/1807.01270},
  eprinttype   = {arXiv},
  eprint       = {1807.01270},
  timestamp    = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-01270.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1807-02301,
  author       = {Zhou, Qingyu and
                  Yang, Nan and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {Sequential Copying Networks},
  journal      = {CoRR},
  volume       = {abs/1807.02301},
  year         = {2018},
  url          = {http://arxiv.org/abs/1807.02301},
  eprinttype   = {arXiv},
  eprint       = {1807.02301},
  timestamp    = {Sun, 22 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-02301.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1807-02305,
  author       = {Zhou, Qingyu and
                  Yang, Nan and
                  Wei, Furu and
                  Huang, Shaohan and
                  Zhou, Ming and
                  Zhao, Tiejun},
  title        = {Neural Document Summarization by Jointly Learning to Score and Select Sentences},
  journal      = {CoRR},
  volume       = {abs/1807.02305},
  year         = {2018},
  url          = {http://arxiv.org/abs/1807.02305},
  eprinttype   = {arXiv},
  eprint       = {1807.02305},
  timestamp    = {Wed, 25 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-02305.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1808-05759,
  author       = {Hu, Minghao and
                  Wei, Furu and
                  Peng, Yuxing and
                  Huang, Zhen and
                  Yang, Nan and
                  Zhou, Ming},
  title        = {Read + Verify: Machine Reading Comprehension with Unanswerable Questions},
  journal      = {CoRR},
  volume       = {abs/1808.05759},
  year         = {2018},
  url          = {http://arxiv.org/abs/1808.05759},
  eprinttype   = {arXiv},
  eprint       = {1808.05759},
  timestamp    = {Mon, 06 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1808-05759.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1808-07187,
  author       = {Zhang, Xingxing and
                  Lapata, Mirella and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {Neural Latent Extractive Document Summarization},
  journal      = {CoRR},
  volume       = {abs/1808.07187},
  year         = {2018},
  url          = {http://arxiv.org/abs/1808.07187},
  eprinttype   = {arXiv},
  eprint       = {1808.07187},
  timestamp    = {Wed, 19 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1808-07187.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1808-07644,
  author       = {Hu, Minghao and
                  Peng, Yuxing and
                  Wei, Furu and
                  Huang, Zhen and
                  Li, Dongsheng and
                  Yang, Nan and
                  Zhou, Ming},
  title        = {Attention-Guided Answer Distillation for Machine Reading Comprehension},
  journal      = {CoRR},
  volume       = {abs/1808.07644},
  year         = {2018},
  url          = {http://arxiv.org/abs/1808.07644},
  eprinttype   = {arXiv},
  eprint       = {1808.07644},
  timestamp    = {Mon, 06 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1808-07644.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1809-04276,
  author       = {Zhu, Qingfu and
                  Cui, Lei and
                  Zhang, Weinan and
                  Wei, Furu and
                  Chen, Yining and
                  Liu, Ting},
  title        = {Retrieval-Enhanced Adversarial Training for Neural Response Generation},
  journal      = {CoRR},
  volume       = {abs/1809.04276},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.04276},
  eprinttype   = {arXiv},
  eprint       = {1809.04276},
  timestamp    = {Mon, 01 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-04276.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1809-04318,
  author       = {Bao, Hangbo and
                  Huang, Shaohan and
                  Wei, Furu and
                  Cui, Lei and
                  Wu, Yu and
                  Tan, Chuanqi and
                  Piao, Songhao and
                  Zhou, Ming},
  title        = {Neural Melody Composition from Lyrics},
  journal      = {CoRR},
  volume       = {abs/1809.04318},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.04318},
  eprinttype   = {arXiv},
  eprint       = {1809.04318},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-04318.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "LiveBot" is braced so that sentence-casing bibliography styles keep its camel-case spelling.
@article{DBLP:journals/corr/abs-1809-04938,
  author       = {Ma, Shuming and
                  Cui, Lei and
                  Dai, Damai and
                  Wei, Furu and
                  Sun, Xu},
  title        = {{LiveBot}: Generating Live Video Comments Based on Visual and Textual Contexts},
  journal      = {CoRR},
  volume       = {abs/1809.04938},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.04938},
  eprinttype   = {arXiv},
  eprint       = {1809.04938},
  timestamp    = {Mon, 01 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-04938.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1809-04960,
  author       = {Ma, Shuming and
                  Cui, Lei and
                  Wei, Furu and
                  Sun, Xu},
  title        = {Unsupervised Machine Commenting with Neural Variational Topic Model},
  journal      = {CoRR},
  volume       = {abs/1809.04960},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.04960},
  eprinttype   = {arXiv},
  eprint       = {1809.04960},
  timestamp    = {Mon, 01 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-04960.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1810-00341,
  author       = {Huang, Shaohan and
                  Wu, Yu and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {Text Morphing},
  journal      = {CoRR},
  volume       = {abs/1810.00341},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.00341},
  eprinttype   = {arXiv},
  eprint       = {1810.00341},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-00341.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/CaoLLW17,
  author       = {Cao, Ziqiang and
                  Li, Wenjie and
                  Li, Sujian and
                  Wei, Furu},
  editor       = {Singh, Satinder and
                  Markovitch, Shaul},
  title        = {Improving Multi-Document Summarization via Text Classification},
  booktitle    = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence,
                  February 4-9, 2017, San Francisco, California, {USA}},
  pages        = {3053--3059},
  publisher    = {{AAAI} Press},
  year         = {2017},
  url          = {https://doi.org/10.1609/aaai.v31i1.10955},
  doi          = {10.1609/AAAI.V31I1.10955},
  timestamp    = {Mon, 04 Sep 2023 14:40:32 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/CaoLLW17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "SuperAgent" is braced so that sentence-casing bibliography styles keep its camel-case spelling.
@inproceedings{DBLP:conf/acl/CuiHWTDZ17,
  author       = {Cui, Lei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Tan, Chuanqi and
                  Duan, Chaoqun and
                  Zhou, Ming},
  editor       = {Bansal, Mohit and
                  Ji, Heng},
  title        = {{SuperAgent}: {A} Customer Service Chatbot for E-commerce Websites},
  booktitle    = {Proceedings of the 55th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, System
                  Demonstrations},
  pages        = {97--102},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/P17-4017},
  doi          = {10.18653/V1/P17-4017},
  timestamp    = {Fri, 06 Aug 2021 00:40:50 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/CuiHWTDZ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/WangYWCZ17,
  author       = {Wang, Wenhui and
                  Yang, Nan and
                  Wei, Furu and
                  Chang, Baobao and
                  Zhou, Ming},
  editor       = {Barzilay, Regina and
                  Kan, Min{-}Yen},
  title        = {Gated Self-Matching Networks for Reading Comprehension and Question Answering},
  booktitle    = {Proceedings of the 55th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, Volume
                  1: Long Papers},
  pages        = {189--198},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/P17-1018},
  doi          = {10.18653/V1/P17-1018},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/WangYWCZ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ZhouYWZ17,
  author       = {Zhou, Qingyu and
                  Yang, Nan and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Barzilay, Regina and
                  Kan, Min{-}Yen},
  title        = {Selective Encoding for Abstractive Sentence Summarization},
  booktitle    = {Proceedings of the 55th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, Volume
                  1: Long Papers},
  pages        = {1095--1104},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/P17-1101},
  doi          = {10.18653/V1/P17-1101},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ZhouYWZ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eacl/ZhouLWDHX17,
  author       = {Dong, Li and
                  Huang, Shaohan and
                  Wei, Furu and
                  Lapata, Mirella and
                  Zhou, Ming and
                  Xu, Ke},
  editor       = {Lapata, Mirella and
                  Blunsom, Phil and
                  Koller, Alexander},
  title        = {Learning to Generate Product Reviews from Attributes},
  booktitle    = {Proceedings of the 15th Conference of the European Chapter of the
                  Association for Computational Linguistics, {EACL} 2017, Valencia,
                  Spain, April 3-7, 2017, Volume 1: Long Papers},
  pages        = {623--632},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/e17-1059},
  doi          = {10.18653/V1/E17-1059},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eacl/ZhouLWDHX17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Wikipedia" is braced so that sentence-casing bibliography styles keep the proper noun capitalised.
@inproceedings{DBLP:conf/emnlp/TanWRLZ17,
  author       = {Tan, Chuanqi and
                  Wei, Furu and
                  Ren, Pengjie and
                  Lv, Weifeng and
                  Zhou, Ming},
  editor       = {Palmer, Martha and
                  Hwa, Rebecca and
                  Riedel, Sebastian},
  title        = {Entity Linking for Queries by Searching {Wikipedia} Sentences},
  booktitle    = {Proceedings of the 2017 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2017, Copenhagen, Denmark, September
                  9-11, 2017},
  pages        = {68--77},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/d17-1007},
  doi          = {10.18653/V1/D17-1007},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/TanWRLZ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nlpcc/ZhouYWTBZ17,
  author       = {Zhou, Qingyu and
                  Yang, Nan and
                  Wei, Furu and
                  Tan, Chuanqi and
                  Bao, Hangbo and
                  Zhou, Ming},
  editor       = {Huang, Xuanjing and
                  Jiang, Jing and
                  Zhao, Dongyan and
                  Feng, Yansong and
                  Hong, Yu},
  title        = {Neural Question Generation from Text: {A} Preliminary Study},
  booktitle    = {Natural Language Processing and Chinese Computing - 6th {CCF} International
                  Conference, {NLPCC} 2017, Dalian, China, November 8-12, 2017, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {10619},
  pages        = {662--671},
  publisher    = {Springer},
  year         = {2017},
  url          = {https://doi.org/10.1007/978-3-319-73618-1\_56},
  doi          = {10.1007/978-3-319-73618-1\_56},
  timestamp    = {Fri, 16 Feb 2024 08:27:36 +0100},
  biburl       = {https://dblp.org/rec/conf/nlpcc/ZhouYWTBZ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sigir/RenCRWMR17,
  author       = {Ren, Pengjie and
                  Chen, Zhumin and
                  Ren, Zhaochun and
                  Wei, Furu and
                  Ma, Jun and
                  de Rijke, Maarten},
  editor       = {Kando, Noriko and
                  Sakai, Tetsuya and
                  Joho, Hideo and
                  Li, Hang and
                  de Vries, Arjen P. and
                  White, Ryen W.},
  title        = {Leveraging Contextual Sentence Relations for Extractive Summarization Using a Neural Attention Model},
  booktitle    = {Proceedings of the 40th International {ACM} {SIGIR} Conference on
                  Research and Development in Information Retrieval, Shinjuku, Tokyo,
                  Japan, August 7-11, 2017},
  pages        = {95--104},
  publisher    = {{ACM}},
  year         = {2017},
  url          = {https://doi.org/10.1145/3077136.3080792},
  doi          = {10.1145/3077136.3080792},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sigir/RenCRWMR17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ZhouYWTBZ17,
  author       = {Zhou, Qingyu and
                  Yang, Nan and
                  Wei, Furu and
                  Tan, Chuanqi and
                  Bao, Hangbo and
                  Zhou, Ming},
  title        = {Neural Question Generation from Text: {A} Preliminary Study},
  journal      = {CoRR},
  volume       = {abs/1704.01792},
  year         = {2017},
  url          = {http://arxiv.org/abs/1704.01792},
  eprinttype   = {arXiv},
  eprint       = {1704.01792},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ZhouYWTBZ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Wikipedia" is braced so that sentence-casing bibliography styles keep the proper noun capitalised.
@article{DBLP:journals/corr/TanWRLZ17,
  author       = {Tan, Chuanqi and
                  Wei, Furu and
                  Ren, Pengjie and
                  Lv, Weifeng and
                  Zhou, Ming},
  title        = {Entity Linking for Queries by Searching {Wikipedia} Sentences},
  journal      = {CoRR},
  volume       = {abs/1704.02788},
  year         = {2017},
  url          = {http://arxiv.org/abs/1704.02788},
  eprinttype   = {arXiv},
  eprint       = {1704.02788},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/TanWRLZ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ZhouYWZ17,
  author       = {Zhou, Qingyu and
                  Yang, Nan and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {Selective Encoding for Abstractive Sentence Summarization},
  journal      = {CoRR},
  volume       = {abs/1704.07073},
  year         = {2017},
  url          = {http://arxiv.org/abs/1704.07073},
  eprinttype   = {arXiv},
  eprint       = {1704.07073},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ZhouYWZ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "S-Net" is braced so that sentence-casing bibliography styles do not lowercase the "N".
@article{DBLP:journals/corr/TanWYLZ17,
  author       = {Tan, Chuanqi and
                  Wei, Furu and
                  Yang, Nan and
                  Lv, Weifeng and
                  Zhou, Ming},
  title        = {{S-Net}: From Answer Extraction to Answer Generation for Machine Reading Comprehension},
  journal      = {CoRR},
  volume       = {abs/1706.04815},
  year         = {2017},
  url          = {http://arxiv.org/abs/1706.04815},
  eprinttype   = {arXiv},
  eprint       = {1706.04815},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/TanWYLZ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1711-04434,
  author       = {Cao, Ziqiang and
                  Wei, Furu and
                  Li, Wenjie and
                  Li, Sujian},
  title        = {Faithful to the Original: Fact Aware Neural Abstractive Summarization},
  journal      = {CoRR},
  volume       = {abs/1711.04434},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.04434},
  eprinttype   = {arXiv},
  eprint       = {1711.04434},
  timestamp    = {Fri, 29 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-04434.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/DongWXLZ16,
  author       = {Dong, Li and
                  Wei, Furu and
                  Xu, Ke and
                  Liu, Shixia and
                  Zhou, Ming},
  title        = {Adaptive Multi-Compositionality for Recursive Neural Network Models},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {24},
  number       = {3},
  pages        = {422--431},
  year         = {2016},
  url          = {https://doi.org/10.1109/TASLP.2015.2509257},
  doi          = {10.1109/TASLP.2015.2509257},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/DongWXLZ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/LiuLWJ16,
  author       = {Liu, Yang and
                  Li, Sujian and
                  Wei, Furu and
                  Ji, Heng},
  title        = {Relation Classification Via Modeling Augmented Dependency Paths},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {24},
  number       = {9},
  pages        = {1589--1598},
  year         = {2016},
  url          = {https://doi.org/10.1109/TASLP.2016.2573050},
  doi          = {10.1109/TASLP.2016.2573050},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/LiuLWJ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tkde/TangWQYLZ16,
  author       = {Tang, Duyu and
                  Wei, Furu and
                  Qin, Bing and
                  Yang, Nan and
                  Liu, Ting and
                  Zhou, Ming},
  title        = {Sentiment Embeddings with Applications to Sentiment Analysis},
  journal      = {{IEEE} Trans. Knowl. Data Eng.},
  volume       = {28},
  number       = {2},
  pages        = {496--509},
  year         = {2016},
  url          = {https://doi.org/10.1109/TKDE.2015.2489653},
  doi          = {10.1109/TKDE.2015.2489653},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tkde/TangWQYLZ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tvcg/LiuLZLWP16,
  author       = {Liu, Mengchen and
                  Liu, Shixia and
                  Zhu, Xizhou and
                  Liao, Qinying and
                  Wei, Furu and
                  Pan, Shimei},
  title        = {An Uncertainty-Aware Approach for Exploratory Microblog Retrieval},
  journal      = {{IEEE} Trans. Vis. Comput. Graph.},
  volume       = {22},
  number       = {1},
  pages        = {250--259},
  year         = {2016},
  url          = {https://doi.org/10.1109/TVCG.2015.2467554},
  doi          = {10.1109/TVCG.2015.2467554},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tvcg/LiuLZLWP16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "TGSum" is braced so that sentence-casing bibliography styles keep its mixed-case spelling.
@inproceedings{DBLP:conf/aaai/CaoCLLWZ16,
  author       = {Cao, Ziqiang and
                  Chen, Chengyao and
                  Li, Wenjie and
                  Li, Sujian and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Schuurmans, Dale and
                  Wellman, Michael P.},
  title        = {{TGSum}: Build Tweet Guided Multi-Document Summarization Dataset},
  booktitle    = {Proceedings of the Thirtieth {AAAI} Conference on Artificial Intelligence,
                  February 12-17, 2016, Phoenix, Arizona, {USA}},
  pages        = {2906--2912},
  publisher    = {{AAAI} Press},
  year         = {2016},
  url          = {https://doi.org/10.1609/aaai.v30i1.10376},
  doi          = {10.1609/AAAI.V30I1.10376},
  timestamp    = {Mon, 04 Sep 2023 15:08:28 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/CaoCLLWZ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/coling/RenWCMZ16,
  author       = {Ren, Pengjie and
                  Wei, Furu and
                  Chen, Zhumin and
                  Ma, Jun and
                  Zhou, Ming},
  editor       = {Calzolari, Nicoletta and
                  Matsumoto, Yuji and
                  Prasad, Rashmi},
  title        = {A Redundancy-Aware Sentence Regression Framework for Extractive Summarization},
  booktitle    = {{COLING} 2016, 26th International Conference on Computational Linguistics,
                  Proceedings of the Conference: Technical Papers, December 11-16, 2016,
                  Osaka, Japan},
  pages        = {33--43},
  publisher    = {{ACL}},
  year         = {2016},
  url          = {https://aclanthology.org/C16-1004/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/coling/RenWCMZ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "AttSum" is braced so that sentence-casing bibliography styles keep its camel-case spelling.
@inproceedings{DBLP:conf/coling/CaoLLWL16,
  author       = {Cao, Ziqiang and
                  Li, Wenjie and
                  Li, Sujian and
                  Wei, Furu and
                  Li, Yanran},
  editor       = {Calzolari, Nicoletta and
                  Matsumoto, Yuji and
                  Prasad, Rashmi},
  title        = {{AttSum}: Joint Learning of Focusing and Summarization with Neural Attention},
  booktitle    = {{COLING} 2016, 26th International Conference on Computational Linguistics,
                  Proceedings of the Conference: Technical Papers, December 11-16, 2016,
                  Osaka, Japan},
  pages        = {547--556},
  publisher    = {{ACL}},
  year         = {2016},
  url          = {https://aclanthology.org/C16-1053/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/coling/CaoLLWL16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Chinese" is braced so that sentence-casing bibliography styles keep the proper noun capitalised.
% The publisher is spelled without the leading "The", matching the other ACL-published entries in this file.
@inproceedings{DBLP:conf/emnlp/TanWDLZ16,
  author       = {Tan, Chuanqi and
                  Wei, Furu and
                  Dong, Li and
                  Lv, Weifeng and
                  Zhou, Ming},
  editor       = {Su, Jian and
                  Carreras, Xavier and
                  Duh, Kevin},
  title        = {Solving and Generating {Chinese} Character Riddles},
  booktitle    = {Proceedings of the 2016 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2016, Austin, Texas, USA, November 1-4,
                  2016},
  pages        = {846--855},
  publisher    = {Association for Computational Linguistics},
  year         = {2016},
  url          = {https://doi.org/10.18653/v1/d16-1081},
  doi          = {10.18653/V1/D16-1081},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/TanWDLZ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/YinWDXZZ16,
  author       = {Yin, Yichun and
                  Wei, Furu and
                  Dong, Li and
                  Xu, Kaimeng and
                  Zhang, Ming and
                  Zhou, Ming},
  editor       = {Kambhampati, Subbarao},
  title        = {Unsupervised Word and Dependency Path Embeddings for Aspect Term Extraction},
  booktitle    = {Proceedings of the Twenty-Fifth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2016, New York, NY, USA, 9-15 July
                  2016},
  pages        = {2979--2985},
  publisher    = {{IJCAI/AAAI} Press},
  year         = {2016},
  url          = {http://www.ijcai.org/Abstract/16/423},
  timestamp    = {Tue, 20 Aug 2019 16:19:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/YinWDXZZ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "AttSum" is braced so that sentence-casing bibliography styles keep its camel-case spelling.
@article{DBLP:journals/corr/CaoLLW16,
  author       = {Cao, Ziqiang and
                  Li, Wenjie and
                  Li, Sujian and
                  Wei, Furu},
  title        = {{AttSum}: Joint Learning of Focusing and Summarization with Neural Attention},
  journal      = {CoRR},
  volume       = {abs/1604.00125},
  year         = {2016},
  url          = {http://arxiv.org/abs/1604.00125},
  eprinttype   = {arXiv},
  eprint       = {1604.00125},
  timestamp    = {Fri, 29 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/CaoLLW16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/YinWDXZZ16,
  author       = {Yin, Yichun and
                  Wei, Furu and
                  Dong, Li and
                  Xu, Kaimeng and
                  Zhang, Ming and
                  Zhou, Ming},
  title        = {Unsupervised Word and Dependency Path Embeddings for Aspect Term Extraction},
  journal      = {CoRR},
  volume       = {abs/1605.07843},
  year         = {2016},
  url          = {http://arxiv.org/abs/1605.07843},
  eprinttype   = {arXiv},
  eprint       = {1605.07843},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/YinWDXZZ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/CaoLLW16a,
  author       = {Cao, Ziqiang and
                  Li, Wenjie and
                  Li, Sujian and
                  Wei, Furu},
  title        = {Improving Multi-Document Summarization via Text Classification},
  journal      = {CoRR},
  volume       = {abs/1611.09238},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.09238},
  eprinttype   = {arXiv},
  eprint       = {1611.09238},
  timestamp    = {Fri, 29 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/CaoLLW16a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/coling/GaoWLLZ15,
  author       = {Gao, Dehong and
                  Wei, Furu and
                  Li, Wenjie and
                  Liu, Xiaohua and
                  Zhou, Ming},
  title        = {Cross-lingual Sentiment Lexicon Learning With Bilingual Word Graph Label Propagation},
  journal      = {Comput. Linguistics},
  volume       = {41},
  number       = {1},
  pages        = {21--40},
  year         = {2015},
  url          = {https://doi.org/10.1162/COLI\_a\_00207},
  doi          = {10.1162/COLI\_A\_00207},
  timestamp    = {Mon, 11 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/coling/GaoWLLZ15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/coling/DongWLZX15,
  author       = {Dong, Li and
                  Wei, Furu and
                  Liu, Shujie and
                  Zhou, Ming and
                  Xu, Ke},
  title        = {A Statistical Parsing Framework for Sentiment Classification},
  journal      = {Comput. Linguistics},
  volume       = {41},
  number       = {2},
  pages        = {293--336},
  year         = {2015},
  url          = {https://doi.org/10.1162/COLI\_a\_00221},
  doi          = {10.1162/COLI\_A\_00221},
  timestamp    = {Mon, 11 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/coling/DongWLZX15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/TangQWDLZ15,
  author       = {Tang, Duyu and
                  Qin, Bing and
                  Wei, Furu and
                  Dong, Li and
                  Liu, Ting and
                  Zhou, Ming},
  title        = {A Joint Segmentation and Classification Framework for Sentence Level
                  Sentiment Classification},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {23},
  number       = {11},
  pages        = {1750--1761},
  year         = {2015},
  url          = {https://doi.org/10.1109/TASLP.2015.2449071},
  doi          = {10.1109/TASLP.2015.2449071},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/TangQWDLZ15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/CaoWDLZ15,
  author       = {Cao, Ziqiang and
                  Wei, Furu and
                  Dong, Li and
                  Li, Sujian and
                  Zhou, Ming},
  editor       = {Bonet, Blai and
                  Koenig, Sven},
  title        = {Ranking with Recursive Neural Networks and Its Application to Multi-Document
                  Summarization},
  booktitle    = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence,
                  January 25-30, 2015, Austin, Texas, {USA}},
  pages        = {2153--2159},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {https://doi.org/10.1609/aaai.v29i1.9490},
  doi          = {10.1609/AAAI.V29I1.9490},
  timestamp    = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/CaoWDLZ15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: publisher corrected to match the organisation named in booktitle; Freebase brace-protected in title.
@inproceedings{DBLP:conf/acl/DongWZX15,
  author       = {Dong, Li and
                  Wei, Furu and
                  Zhou, Ming and
                  Xu, Ke},
  title        = {Question Answering over {Freebase} with Multi-Column Convolutional Neural
                  Networks},
  booktitle    = {Proceedings of the 53rd Annual Meeting of the Association for Computational
                  Linguistics and the 7th International Joint Conference on Natural
                  Language Processing of the Asian Federation of Natural Language Processing,
                  {ACL} 2015, July 26-31, 2015, Beijing, China, Volume 1: Long Papers},
  pages        = {260--269},
  publisher    = {Association for Computational Linguistics},
  year         = {2015},
  url          = {https://doi.org/10.3115/v1/p15-1026},
  doi          = {10.3115/V1/P15-1026},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/DongWZX15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: publisher corrected to match the organisation named in booktitle.
@inproceedings{DBLP:conf/acl/LiuWLJZW15,
  author       = {Liu, Yang and
                  Wei, Furu and
                  Li, Sujian and
                  Ji, Heng and
                  Zhou, Ming and
                  Wang, Houfeng},
  title        = {A Dependency-Based Neural Network for Relation Classification},
  booktitle    = {Proceedings of the 53rd Annual Meeting of the Association for Computational
                  Linguistics and the 7th International Joint Conference on Natural
                  Language Processing of the Asian Federation of Natural Language Processing,
                  {ACL} 2015, July 26-31, 2015, Beijing, China, Volume 2: Short Papers},
  pages        = {285--290},
  publisher    = {Association for Computational Linguistics},
  year         = {2015},
  url          = {https://doi.org/10.3115/v1/p15-2047},
  doi          = {10.3115/V1/P15-2047},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LiuWLJZW15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: publisher corrected to match the organisation named in booktitle.
@inproceedings{DBLP:conf/acl/CaoWLLZW15,
  author       = {Cao, Ziqiang and
                  Wei, Furu and
                  Li, Sujian and
                  Li, Wenjie and
                  Zhou, Ming and
                  Wang, Houfeng},
  title        = {Learning Summary Prior Representation for Extractive Summarization},
  booktitle    = {Proceedings of the 53rd Annual Meeting of the Association for Computational
                  Linguistics and the 7th International Joint Conference on Natural
                  Language Processing of the Asian Federation of Natural Language Processing,
                  {ACL} 2015, July 26-31, 2015, Beijing, China, Volume 2: Short Papers},
  pages        = {829--833},
  publisher    = {Association for Computational Linguistics},
  year         = {2015},
  url          = {https://doi.org/10.3115/v1/p15-2136},
  doi          = {10.3115/V1/P15-2136},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/CaoWLLZW15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/dasfaa/ZhaoWZN15,
  author       = {Zhao, Zhou and
                  Wei, Furu and
                  Zhou, Ming and
                  Ng, Wilfred},
  editor       = {Renz, Matthias and
                  Shahabi, Cyrus and
                  Zhou, Xiaofang and
                  Cheema, Muhammad Aamir},
  title        = {Cold-Start Expert Finding in Community Question Answering via Graph
                  Regularization},
  booktitle    = {Database Systems for Advanced Applications - 20th International Conference,
                  {DASFAA} 2015, Hanoi, Vietnam, April 20-23, 2015, Proceedings, Part
                  {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {9049},
  pages        = {21--38},
  publisher    = {Springer},
  year         = {2015},
  url          = {https://doi.org/10.1007/978-3-319-18120-2\_2},
  doi          = {10.1007/978-3-319-18120-2\_2},
  timestamp    = {Thu, 21 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/dasfaa/ZhaoWZN15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: editor surname Van den Bussche is braced in comma form so BibTeX does not split it into first/von/last parts.
@inproceedings{DBLP:conf/edbt/ZhaoWZCN15,
  author       = {Zhao, Zhou and
                  Wei, Furu and
                  Zhou, Ming and
                  Chen, Weikeng and
                  Ng, Wilfred},
  editor       = {Alonso, Gustavo and
                  Geerts, Floris and
                  Popa, Lucian and
                  Barcel{\'{o}}, Pablo and
                  Teubner, Jens and
                  Ugarte, Mart{\'{\i}}n and
                  {Van den Bussche}, Jan and
                  Paredaens, Jan},
  title        = {Crowd-Selection Query Processing in Crowdsourcing Databases: {A} Task-Driven
                  Approach},
  booktitle    = {Proceedings of the 18th International Conference on Extending Database
                  Technology, {EDBT} 2015, Brussels, Belgium, March 23-27, 2015},
  pages        = {397--408},
  publisher    = {OpenProceedings.org},
  year         = {2015},
  url          = {https://doi.org/10.5441/002/edbt.2015.35},
  doi          = {10.5441/002/EDBT.2015.35},
  timestamp    = {Fri, 22 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/edbt/ZhaoWZCN15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/DongWSZX15,
  author       = {Dong, Li and
                  Wei, Furu and
                  Sun, Hong and
                  Zhou, Ming and
                  Xu, Ke},
  editor       = {Yang, Qiang and
                  Wooldridge, Michael J.},
  title        = {A Hybrid Neural Model for Type Classification of Entity Mentions},
  booktitle    = {Proceedings of the Twenty-Fourth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2015, Buenos Aires, Argentina, July
                  25-31, 2015},
  pages        = {1243--1249},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {http://ijcai.org/Abstract/15/179},
  timestamp    = {Tue, 20 Aug 2019 16:16:43 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/DongWSZX15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: publisher corrected from Computer Linguistics to Computational Linguistics.
@inproceedings{DBLP:conf/semeval/DongWYZX15,
  author       = {Dong, Li and
                  Wei, Furu and
                  Yin, Yichun and
                  Zhou, Ming and
                  Xu, Ke},
  editor       = {Cer, Daniel M. and
                  Jurgens, David and
                  Nakov, Preslav and
                  Zesch, Torsten},
  title        = {Splusplus: {A} Feature-Rich Two-stage Classifier for Sentiment Analysis
                  of Tweets},
  booktitle    = {Proceedings of the 9th International Workshop on Semantic Evaluation,
                  SemEval@NAACL-HLT 2015, Denver, Colorado, USA, June 4-5, 2015},
  pages        = {515--519},
  publisher    = {Association for Computational Linguistics},
  year         = {2015},
  url          = {https://doi.org/10.18653/v1/s15-2086},
  doi          = {10.18653/V1/S15-2086},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/semeval/DongWYZX15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: arXiv URL switched to https; eprinttype field realigned.
@article{DBLP:journals/corr/WanCWLZ15,
  author       = {Wan, Xiaojun and
                  Cao, Ziqiang and
                  Wei, Furu and
                  Li, Sujian and
                  Zhou, Ming},
  title        = {Multi-Document Summarization via Discriminative Summary Reranking},
  journal      = {CoRR},
  volume       = {abs/1507.02062},
  year         = {2015},
  url          = {https://arxiv.org/abs/1507.02062},
  eprinttype   = {arXiv},
  eprint       = {1507.02062},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/WanCWLZ15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: arXiv URL switched to https; eprinttype field realigned.
@article{DBLP:journals/corr/LiuWLJZW15,
  author       = {Liu, Yang and
                  Wei, Furu and
                  Li, Sujian and
                  Ji, Heng and
                  Zhou, Ming and
                  Wang, Houfeng},
  title        = {A Dependency-Based Neural Network for Relation Classification},
  journal      = {CoRR},
  volume       = {abs/1507.04646},
  year         = {2015},
  url          = {https://arxiv.org/abs/1507.04646},
  eprinttype   = {arXiv},
  eprint       = {1507.04646},
  timestamp    = {Wed, 17 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LiuWLJZW15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: TGSum brace-protected in title; arXiv URL switched to https; eprinttype field realigned.
@article{DBLP:journals/corr/CaoCLLWZ15,
  author       = {Cao, Ziqiang and
                  Chen, Chengyao and
                  Li, Wenjie and
                  Li, Sujian and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {{TGSum}: Build Tweet Guided Multi-Document Summarization Dataset},
  journal      = {CoRR},
  volume       = {abs/1511.08417},
  year         = {2015},
  url          = {https://arxiv.org/abs/1511.08417},
  eprinttype   = {arXiv},
  eprint       = {1511.08417},
  timestamp    = {Fri, 29 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/CaoCLLWZ15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: arXiv URL switched to https; eprinttype field realigned.
@article{DBLP:journals/corr/LiuLZLWP15,
  author       = {Liu, Mengchen and
                  Liu, Shixia and
                  Zhu, Xizhou and
                  Liao, Qinying and
                  Wei, Furu and
                  Pan, Shimei},
  title        = {An Uncertainty-Aware Approach for Exploratory Microblog Retrieval},
  journal      = {CoRR},
  volume       = {abs/1512.04038},
  year         = {2015},
  url          = {https://arxiv.org/abs/1512.04038},
  eprinttype   = {arXiv},
  eprint       = {1512.04038},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LiuLZLWP15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: stray space removed from the date range in booktitle.
@inproceedings{DBLP:conf/aaai/DongWZX14,
  author       = {Dong, Li and
                  Wei, Furu and
                  Zhou, Ming and
                  Xu, Ke},
  editor       = {Brodley, Carla E. and
                  Stone, Peter},
  title        = {Adaptive Multi-Compositionality for Recursive Neural Models with Applications
                  to Sentiment Analysis},
  booktitle    = {Proceedings of the Twenty-Eighth {AAAI} Conference on Artificial Intelligence,
                  July 27-31, 2014, Qu{\'{e}}bec City, Qu{\'{e}}bec, Canada},
  pages        = {1537--1543},
  publisher    = {{AAAI} Press},
  year         = {2014},
  url          = {https://doi.org/10.1609/aaai.v28i1.8930},
  doi          = {10.1609/AAAI.V28I1.8930},
  timestamp    = {Mon, 04 Sep 2023 15:06:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/DongWZX14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: publisher corrected to match the organisation named in booktitle; Twitter brace-protected in title.
@inproceedings{DBLP:conf/acl/DongWTTZX14,
  author       = {Dong, Li and
                  Wei, Furu and
                  Tan, Chuanqi and
                  Tang, Duyu and
                  Zhou, Ming and
                  Xu, Ke},
  title        = {Adaptive Recursive Neural Network for Target-dependent {Twitter} Sentiment
                  Classification},
  booktitle    = {Proceedings of the 52nd Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2014, June 22-27, 2014, Baltimore, MD, USA, Volume
                  2: Short Papers},
  pages        = {49--54},
  publisher    = {Association for Computational Linguistics},
  year         = {2014},
  url          = {https://doi.org/10.3115/v1/p14-2009},
  doi          = {10.3115/V1/P14-2009},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/DongWTTZX14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: publisher corrected to match the organisation named in booktitle; Twitter brace-protected in title.
@inproceedings{DBLP:conf/acl/TangWYZLQ14,
  author       = {Tang, Duyu and
                  Wei, Furu and
                  Yang, Nan and
                  Zhou, Ming and
                  Liu, Ting and
                  Qin, Bing},
  title        = {Learning Sentiment-Specific Word Embedding for {Twitter} Sentiment Classification},
  booktitle    = {Proceedings of the 52nd Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2014, June 22-27, 2014, Baltimore, MD, USA, Volume
                  1: Long Papers},
  pages        = {1555--1565},
  publisher    = {Association for Computational Linguistics},
  year         = {2014},
  url          = {https://doi.org/10.3115/v1/p14-1146},
  doi          = {10.3115/V1/P14-1146},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/TangWYZLQ14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: title typo Cowdsourcing fixed; duplicated words Conference on removed from booktitle; SocialTransfer brace-protected.
@inproceedings{DBLP:conf/cikm/ZhaoCWZNW14,
  author       = {Zhao, Zhou and
                  Cheng, James and
                  Wei, Furu and
                  Zhou, Ming and
                  Ng, Wilfred and
                  Wu, Yingjun},
  editor       = {Li, Jianzhong and
                  Wang, Xiaoyang Sean and
                  Garofalakis, Minos N. and
                  Soboroff, Ian and
                  Suel, Torsten and
                  Wang, Min},
  title        = {{SocialTransfer}: Transferring Social Knowledge for Cold-Start Crowdsourcing},
  booktitle    = {Proceedings of the 23rd {ACM} International Conference on Information
                  and Knowledge Management, {CIKM} 2014, Shanghai, China,
                  November 3-7, 2014},
  pages        = {779--788},
  publisher    = {{ACM}},
  year         = {2014},
  url          = {https://doi.org/10.1145/2661829.2661871},
  doi          = {10.1145/2661829.2661871},
  timestamp    = {Thu, 21 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cikm/ZhaoCWZNW14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: space before the colon removed from title; Twitter brace-protected.
@inproceedings{DBLP:conf/coling/TangWQZL14,
  author       = {Tang, Duyu and
                  Wei, Furu and
                  Qin, Bing and
                  Zhou, Ming and
                  Liu, Ting},
  editor       = {Hajic, Jan and
                  Tsujii, Junichi},
  title        = {Building Large-Scale {Twitter}-Specific Sentiment Lexicon: {A} Representation
                  Learning Approach},
  booktitle    = {{COLING} 2014, 25th International Conference on Computational Linguistics,
                  Proceedings of the Conference: Technical Papers, August 23-29, 2014,
                  Dublin, Ireland},
  pages        = {172--182},
  publisher    = {{ACL}},
  year         = {2014},
  url          = {https://aclanthology.org/C14-1018/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/coling/TangWQZL14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/TangWQDLZ14,
  author       = {Tang, Duyu and
                  Wei, Furu and
                  Qin, Bing and
                  Dong, Li and
                  Liu, Ting and
                  Zhou, Ming},
  editor       = {Moschitti, Alessandro and
                  Pang, Bo and
                  Daelemans, Walter},
  title        = {A Joint Segmentation and Classification Framework for Sentiment Analysis},
  booktitle    = {Proceedings of the 2014 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2014, October 25-29, 2014, Doha, Qatar,
                  {A} meeting of SIGDAT, a Special Interest Group of the {ACL}},
  pages        = {477--487},
  publisher    = {{ACL}},
  year         = {2014},
  url          = {https://doi.org/10.3115/v1/d14-1054},
  doi          = {10.3115/V1/D14-1054},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/TangWQDLZ14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nlpcc/SunWZ14,
  author       = {Sun, Hong and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Zong, Chengqing and
                  Nie, Jian{-}Yun and
                  Zhao, Dongyan and
                  Feng, Yansong},
  title        = {Answer Extraction with Multiple Extraction Engines for Web-Based Question
                  Answering},
  booktitle    = {Natural Language Processing and Chinese Computing - Third {CCF} Conference,
                  {NLPCC} 2014, Shenzhen, China, December 5-9, 2014. Proceedings},
  series       = {Communications in Computer and Information Science},
  volume       = {496},
  pages        = {321--332},
  publisher    = {Springer},
  year         = {2014},
  url          = {https://doi.org/10.1007/978-3-662-45924-9\_29},
  doi          = {10.1007/978-3-662-45924-9\_29},
  timestamp    = {Mon, 05 Feb 2024 20:32:21 +0100},
  biburl       = {https://dblp.org/rec/conf/nlpcc/SunWZ14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: publisher corrected from Computer Linguistics to Computational Linguistics; Twitter brace-protected in title.
@inproceedings{DBLP:conf/semeval/TangWQLZ14,
  author       = {Tang, Duyu and
                  Wei, Furu and
                  Qin, Bing and
                  Liu, Ting and
                  Zhou, Ming},
  editor       = {Nakov, Preslav and
                  Zesch, Torsten},
  title        = {Coooolll: {A} Deep Learning System for {Twitter} Sentiment Classification},
  booktitle    = {Proceedings of the 8th International Workshop on Semantic Evaluation,
                  SemEval@COLING 2014, Dublin, Ireland, August 23-24, 2014},
  pages        = {208--212},
  publisher    = {Association for Computational Linguistics},
  year         = {2014},
  url          = {https://doi.org/10.3115/v1/s14-2033},
  doi          = {10.3115/V1/S14-2033},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/semeval/TangWQLZ14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: arXiv URL switched to https; eprinttype field realigned.
@article{DBLP:journals/corr/DongWLZX14,
  author       = {Dong, Li and
                  Wei, Furu and
                  Liu, Shujie and
                  Zhou, Ming and
                  Xu, Ke},
  title        = {A Statistical Parsing Framework for Sentiment Classification},
  journal      = {CoRR},
  volume       = {abs/1401.6330},
  year         = {2014},
  url          = {https://arxiv.org/abs/1401.6330},
  eprinttype   = {arXiv},
  eprint       = {1401.6330},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/DongWLZX14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/isci/WangLLLW13,
  author       = {Wang, Wei and
                  Li, Sujian and
                  Li, Jiwei and
                  Li, Wenjie and
                  Wei, Furu},
  title        = {Exploring hypergraph-based semi-supervised ranking for query-oriented
                  summarization},
  journal      = {Inf. Sci.},
  volume       = {237},
  pages        = {271--286},
  year         = {2013},
  url          = {https://doi.org/10.1016/j.ins.2013.03.012},
  doi          = {10.1016/J.INS.2013.03.012},
  timestamp    = {Thu, 28 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/isci/WangLLLW13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tist/LiuWZZ13,
  author       = {Liu, Xiaohua and
                  Wei, Furu and
                  Zhang, Shaodian and
                  Zhou, Ming},
  title        = {Named entity recognition for tweets},
  journal      = {{ACM} Trans. Intell. Syst. Technol.},
  volume       = {4},
  number       = {1},
  pages        = {3:1--3:15},
  year         = {2013},
  url          = {https://doi.org/10.1145/2414425.2414428},
  doi          = {10.1145/2414425.2414428},
  timestamp    = {Mon, 11 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tist/LiuWZZ13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tkde/SongPLWZQ13,
  author       = {Song, Yangqiu and
                  Pan, Shimei and
                  Liu, Shixia and
                  Wei, Furu and
                  Zhou, Michelle X. and
                  Qian, Weihong},
  title        = {Constrained Text Coclustering with Supervised and Unsupervised Constraints},
  journal      = {{IEEE} Trans. Knowl. Data Eng.},
  volume       = {25},
  number       = {6},
  pages        = {1227--1239},
  year         = {2013},
  url          = {https://doi.org/10.1109/TKDE.2012.45},
  doi          = {10.1109/TKDE.2012.45},
  timestamp    = {Sat, 20 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tkde/SongPLWZQ13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/DongWDLZX13,
  author       = {Dong, Li and
                  Wei, Furu and
                  Duan, Yajuan and
                  Liu, Xiaohua and
                  Zhou, Ming and
                  Xu, Ke},
  editor       = {desJardins, Marie and
                  Littman, Michael L.},
  title        = {The Automated Acquisition of Suggestions from Tweets},
  booktitle    = {Proceedings of the Twenty-Seventh {AAAI} Conference on Artificial
                  Intelligence, July 14-18, 2013, Bellevue, Washington, {USA}},
  pages        = {239--245},
  publisher    = {{AAAI} Press},
  year         = {2013},
  url          = {https://doi.org/10.1609/aaai.v27i1.8630},
  doi          = {10.1609/AAAI.V27I1.8630},
  timestamp    = {Mon, 04 Sep 2023 15:56:33 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/DongWDLZX13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/GaoWLLZ13,
  author       = {Gao, Dehong and
                  Wei, Furu and
                  Li, Wenjie and
                  Liu, Xiaohua and
                  Zhou, Ming},
  title        = {Co-Training Based Bilingual Sentiment Lexicon Learning},
  booktitle    = {Late-Breaking Developments in the Field of Artificial Intelligence,
                  Bellevue, Washington, USA, July 14-18, 2013},
  series       = {{AAAI} Technical Report},
  volume       = {{WS-13-17}},
  publisher    = {{AAAI}},
  year         = {2013},
  url          = {http://www.aaai.org/ocs/index.php/WS/AAAIW13/paper/view/7069},
  timestamp    = {Tue, 05 Sep 2023 08:59:27 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/GaoWLLZ13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: publisher corrected to match the organisation named in booktitle.
@inproceedings{DBLP:conf/acl/LiuLWZWL13,
  author       = {Liu, Xiaohua and
                  Li, Yitong and
                  Wu, Haocheng and
                  Zhou, Ming and
                  Wei, Furu and
                  Lu, Yi},
  title        = {Entity Linking for Tweets},
  booktitle    = {Proceedings of the 51st Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2013, 4-9 August 2013, Sofia, Bulgaria, Volume
                  1: Long Papers},
  pages        = {1304--1311},
  publisher    = {Association for Computational Linguistics},
  year         = {2013},
  url          = {https://aclanthology.org/P13-1128/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LiuLWZWL13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/LiuFWZ12,
  author       = {Liu, Xiaohua and
                  Fu, Zhongyang and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Hoffmann, J{\"{o}}rg and
                  Selman, Bart},
  title        = {Collective Nominal Semantic Role Labeling for Tweets},
  booktitle    = {Proceedings of the Twenty-Sixth {AAAI} Conference on Artificial Intelligence,
                  July 22-26, 2012, Toronto, Ontario, Canada},
  pages        = {1685--1691},
  publisher    = {{AAAI} Press},
  year         = {2012},
  url          = {https://doi.org/10.1609/aaai.v26i1.8349},
  doi          = {10.1609/AAAI.V26I1.8349},
  timestamp    = {Mon, 04 Sep 2023 15:56:47 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/LiuFWZ12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/LiuZFWZ12,
  author       = {Liu, Xiaohua and
                  Zhou, Xiangyang and
                  Fu, Zhongyang and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Hoffmann, J{\"{o}}rg and
                  Selman, Bart},
  title        = {Exacting Social Events for Tweets Using a Factor Graph},
  booktitle    = {Proceedings of the Twenty-Sixth {AAAI} Conference on Artificial Intelligence,
                  July 22-26, 2012, Toronto, Ontario, Canada},
  pages        = {1692--1698},
  publisher    = {{AAAI} Press},
  year         = {2012},
  url          = {https://doi.org/10.1609/aaai.v26i1.8350},
  doi          = {10.1609/AAAI.V26I1.8350},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/LiuZFWZ12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: publisher corrected to match the organisation named in booktitle; QuickView and NLP brace-protected in title.
@inproceedings{DBLP:conf/acl/LiuWZ12,
  author       = {Liu, Xiaohua and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {{QuickView}: {NLP}-based Tweet Search},
  booktitle    = {The 50th Annual Meeting of the Association for Computational Linguistics,
                  Proceedings of the System Demonstrations, July 10, 2012, Jeju Island,
                  Korea},
  pages        = {13--18},
  publisher    = {Association for Computational Linguistics},
  year         = {2012},
  url          = {https://aclanthology.org/P12-3003/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LiuWZ12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: publisher corrected to match the organisation named in booktitle.
@inproceedings{DBLP:conf/acl/LiuZZFW12,
  author       = {Liu, Xiaohua and
                  Zhou, Ming and
                  Zhou, Xiangyang and
                  Fu, Zhongyang and
                  Wei, Furu},
  title        = {Joint Inference of Named Entity Recognition and Normalization for
                  Tweets},
  booktitle    = {The 50th Annual Meeting of the Association for Computational Linguistics,
                  Proceedings of the Conference, July 8-14, 2012, Jeju Island, Korea
                  - Volume 1: Long Papers},
  pages        = {526--535},
  publisher    = {Association for Computational Linguistics},
  year         = {2012},
  url          = {https://aclanthology.org/P12-1055/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LiuZZFW12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Deviates from the DBLP export: publisher corrected to match the organisation named in booktitle.
@inproceedings{DBLP:conf/acl/MengWLZXW12,
  author       = {Meng, Xinfan and
                  Wei, Furu and
                  Liu, Xiaohua and
                  Zhou, Ming and
                  Xu, Ge and
                  Wang, Houfeng},
  title        = {Cross-Lingual Mixture Model for Sentiment Classification},
  booktitle    = {The 50th Annual Meeting of the Association for Computational Linguistics,
                  Proceedings of the Conference, July 8-14, 2012, Jeju Island, Korea
                  - Volume 1: Long Papers},
  pages        = {572--581},
  publisher    = {Association for Computational Linguistics},
  year         = {2012},
  url          = {https://aclanthology.org/P12-1060/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/MengWLZXW12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/chi/HuLWWSM12,
  author       = {Hu, Mengdie and
                  Liu, Shixia and
                  Wei, Furu and
                  Wu, Yingcai and
                  Stasko, John T. and
                  Ma, Kwan{-}Liu},
  editor       = {Konstan, Joseph A. and
                  Chi, Ed H. and
                  H{\"{o}}{\"{o}}k, Kristina},
  title        = {Breaking news on twitter},
  booktitle    = {{CHI} Conference on Human Factors in Computing Systems, {CHI} '12,
                  Austin, TX, {USA} - May 05 - 10, 2012},
  pages        = {2751--2754},
  publisher    = {{ACM}},
  year         = {2012},
  url          = {https://doi.org/10.1145/2207676.2208672},
  doi          = {10.1145/2207676.2208672},
  timestamp    = {Tue, 01 Jun 2021 15:21:43 +0200},
  biburl       = {https://dblp.org/rec/conf/chi/HuLWWSM12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cikm/DuanWZS12,
  author       = {Duan, Yajuan and
                  Wei, Furu and
                  Zhou, Ming and
                  Shum, Heung{-}Yeung},
  editor       = {Chen, Xue{-}wen and
                  Lebanon, Guy and
                  Wang, Haixun and
                  Zaki, Mohammed J.},
  title        = {Graph-based collective classification for tweets},
  booktitle    = {21st {ACM} International Conference on Information and Knowledge Management,
                  CIKM'12, Maui, HI, USA, October 29 - November 02, 2012},
  pages        = {2323--2326},
  publisher    = {{ACM}},
  year         = {2012},
  url          = {https://doi.org/10.1145/2396761.2398631},
  doi          = {10.1145/2396761.2398631},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cikm/DuanWZS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/coling/DuanCWZS12,
  author    = {Duan, Yajuan and Chen, Zhimin and Wei, Furu and Zhou, Ming and
               Shum, Heung{-}Yeung},
  editor    = {Kay, Martin and Boitet, Christian},
  title     = {Twitter Topic Summarization by Ranking Tweets using Social Influence
               and Content Quality},
  booktitle = {{COLING} 2012, 24th International Conference on Computational Linguistics,
               Proceedings of the Conference: Technical Papers, 8-15 December 2012,
               Mumbai, India},
  pages     = {763--780},
  publisher = {Indian Institute of Technology Bombay},
  year      = {2012},
  url       = {https://aclanthology.org/C12-1047/},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/coling/DuanCWZS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/coling/MengWXZLZW12,
  author    = {Meng, Xinfan and Wei, Furu and Xu, Ge and Zhang, Longkai and
               Liu, Xiaohua and Zhou, Ming and Wang, Houfeng},
  editor    = {Kay, Martin and Boitet, Christian},
  title     = {Lost in Translations? Building Sentiment Lexicons using Context Based
               Machine Translation},
  booktitle = {{COLING} 2012, 24th International Conference on Computational Linguistics,
               Proceedings of the Conference: Posters, 8-15 December 2012, Mumbai,
               India},
  pages     = {829--838},
  publisher = {Indian Institute of Technology Bombay},
  year      = {2012},
  url       = {https://aclanthology.org/C12-2081/},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/coling/MengWXZLZW12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/coling/LiuLWZ12,
  author    = {Liu, Xiaohua and Li, Yitong and Wei, Furu and Zhou, Ming},
  editor    = {Kay, Martin and Boitet, Christian},
  title     = {Graph-Based Multi-Tweet Summarization using Social Signals},
  booktitle = {{COLING} 2012, 24th International Conference on Computational Linguistics,
               Proceedings of the Conference: Technical Papers, 8-15 December 2012,
               Mumbai, India},
  pages     = {1699--1714},
  publisher = {Indian Institute of Technology Bombay},
  year      = {2012},
  url       = {https://aclanthology.org/C12-1104/},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/coling/LiuLWZ12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/kdd/MengWLZLW12,
  author    = {Meng, Xinfan and Wei, Furu and Liu, Xiaohua and Zhou, Ming and
               Li, Sujian and Wang, Houfeng},
  editor    = {Yang, Qiang and Agarwal, Deepak and Pei, Jian},
  title     = {Entity-centric topic-oriented opinion summarization in twitter},
  booktitle = {The 18th {ACM} {SIGKDD} International Conference on Knowledge Discovery
               and Data Mining, {KDD} '12, Beijing, China, August 12-16, 2012},
  pages     = {379--387},
  publisher = {{ACM}},
  year      = {2012},
  url       = {https://doi.org/10.1145/2339530.2339592},
  doi       = {10.1145/2339530.2339592},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/kdd/MengWLZLW12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/cgf/WuPWLM11,
  author    = {Wu, Yingcai and Provan, Thomas and Wei, Furu and Liu, Shixia and
               Ma, Kwan{-}Liu},
  title     = {Semantic-Preserving Word Clouds by Seam Carving},
  journal   = {Comput. Graph. Forum},
  volume    = {30},
  number    = {3},
  pages     = {741--750},
  year      = {2011},
  url       = {https://doi.org/10.1111/j.1467-8659.2011.01923.x},
  doi       = {10.1111/J.1467-8659.2011.01923.X},
  timestamp = {Fri, 26 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/cgf/WuPWLM11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/LiuZWZ11,
  author       = {Xiaohua Liu and
                  Shaodian Zhang and
                  Furu Wei and
                  Ming Zhou},
  editor       = {Dekang Lin and
                  Yuji Matsumoto and
                  Rada Mihalcea},
  title        = {Recognizing Named Entities in Tweets},
  booktitle    = {The 49th Annual Meeting of the Association for Computational Linguistics:
                  Human Language Technologies, Proceedings of the Conference, 19-24
                  June, 2011, Portland, Oregon, {USA}},
  pages        = {359--367},
  publisher    = {The Association for Computational Linguistics},
  year         = {2011},
  url          = {https://aclanthology.org/P11-1037/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LiuZWZ11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cikm/WangWLZZ11,
  author    = {Wang, Xiaolong and Wei, Furu and Liu, Xiaohua and Zhou, Ming and
               Zhang, Ming},
  editor    = {Macdonald, Craig and Ounis, Iadh and Ruthven, Ian},
  title     = {Topic sentiment analysis in twitter: a graph-based hashtag sentiment
               classification approach},
  booktitle = {Proceedings of the 20th {ACM} Conference on Information and Knowledge
               Management, {CIKM} 2011, Glasgow, United Kingdom, October 24-28, 2011},
  pages     = {1031--1040},
  publisher = {{ACM}},
  year      = {2011},
  url       = {https://doi.org/10.1145/2063576.2063726},
  doi       = {10.1145/2063576.2063726},
  timestamp = {Tue, 28 Mar 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/cikm/WangWLZZ11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sigir/LiuJWZ11,
  author       = {Xiaohua Liu and
                  Long Jiang and
                  Furu Wei and
                  Ming Zhou},
  editor       = {Wei{-}Ying Ma and
                  Jian{-}Yun Nie and
                  Ricardo Baeza{-}Yates and
                  Tat{-}Seng Chua and
                  W. Bruce Croft},
  title        = {{QuickView}: advanced search of tweets},
  booktitle    = {Proceedings of the 34th International {ACM} {SIGIR} Conference on Research
                  and Development in Information Retrieval, {SIGIR} 2011, Beijing, China,
                  July 25-29, 2011},
  pages        = {1275--1276},
  publisher    = {{ACM}},
  year         = {2011},
  url          = {https://doi.org/10.1145/2009916.2010157},
  doi          = {10.1145/2009916.2010157},
  timestamp    = {Sun, 22 Sep 2019 18:15:38 +0200},
  biburl       = {https://dblp.org/rec/conf/sigir/LiuJWZ11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@incollection{DBLP:series/sci/WeiLH11,
  author       = {Furu Wei and
                  Wenjie Li and
                  Yanxiang He},
  editor       = {Weisi Lin and
                  Dacheng Tao and
                  Janusz Kacprzyk and
                  Zhu Li and
                  Ebroul Izquierdo and
                  Haohong Wang},
  title        = {Document-Aware Graph Models for Query-Oriented Multi-document Summarization},
  booktitle    = {Multimedia Analysis, Processing and Communications},
  series       = {Studies in Computational Intelligence},
  volume       = {346},
  pages        = {655--678},
  publisher    = {Springer},
  year         = {2011},
  url          = {https://doi.org/10.1007/978-3-642-19551-8\_24},
  doi          = {10.1007/978-3-642-19551-8\_24},
  timestamp    = {Thu, 28 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/series/sci/WeiLH11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/cga/CuiWLWZQ10,
  author    = {Cui, Weiwei and Wu, Yingcai and Liu, Shixia and Wei, Furu and
               Zhou, Michelle X. and Qu, Huamin},
  title     = {Context-Preserving, Dynamic Word Cloud Visualization},
  journal   = {{IEEE} Computer Graphics and Applications},
  volume    = {30},
  number    = {6},
  pages     = {42--53},
  year      = {2010},
  url       = {https://doi.org/10.1109/MCG.2010.102},
  doi       = {10.1109/MCG.2010.102},
  timestamp = {Sat, 30 May 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/cga/CuiWLWZQ10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jasis/WeiLL10,
  author       = {Furu Wei and
                  Wenjie Li and
                  Shixia Liu},
  title        = {{iRANK}: {A} rank-learn-combine framework for unsupervised ensemble
                  ranking},
  journal      = {J. Assoc. Inf. Sci. Technol.},
  volume       = {61},
  number       = {6},
  pages        = {1232--1243},
  year         = {2010},
  url          = {https://doi.org/10.1002/asi.21296},
  doi          = {10.1002/ASI.21296},
  timestamp    = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jasis/WeiLL10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/kais/WeiLLH10,
  author    = {Wei, Furu and Li, Wenjie and Lu, Qin and He, Yanxiang},
  title     = {A document-sensitive graph model for multi-document summarization},
  journal   = {Knowl. Inf. Syst.},
  volume    = {22},
  number    = {2},
  pages     = {245--259},
  year      = {2010},
  url       = {https://doi.org/10.1007/s10115-009-0194-2},
  doi       = {10.1007/S10115-009-0194-2},
  timestamp = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/kais/WeiLLH10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tvcg/WuWLACZQ10,
  author       = {Yingcai Wu and
                  Furu Wei and
                  Shixia Liu and
                  Norman Au and
                  Weiwei Cui and
                  Hong Zhou and
                  Huamin Qu},
  title        = {{OpinionSeer}: Interactive Visualization of Hotel Customer Feedback},
  journal      = {{IEEE} Trans. Vis. Comput. Graph.},
  volume       = {16},
  number       = {6},
  pages        = {1109--1118},
  year         = {2010},
  url          = {https://doi.org/10.1109/TVCG.2010.183},
  doi          = {10.1109/TVCG.2010.183},
  timestamp    = {Fri, 20 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tvcg/WuWLACZQ10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/SongPLWZQ10,
  author    = {Song, Yangqiu and Pan, Shimei and Liu, Shixia and Wei, Furu and
               Zhou, Michelle X. and Qian, Weihong},
  editor    = {Fox, Maria and Poole, David},
  title     = {Constrained Coclustering for Textual Documents},
  booktitle = {Proceedings of the Twenty-Fourth {AAAI} Conference on Artificial Intelligence,
               {AAAI} 2010, Atlanta, Georgia, USA, July 11-15, 2010},
  pages     = {581--586},
  publisher = {{AAAI} Press},
  year      = {2010},
  url       = {https://doi.org/10.1609/aaai.v24i1.7680},
  doi       = {10.1609/AAAI.V24I1.7680},
  timestamp = {Mon, 04 Sep 2023 16:23:45 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/SongPLWZQ10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/apvis/CuiWLWZQ10,
  author    = {Cui, Weiwei and Wu, Yingcai and Liu, Shixia and Wei, Furu and
               Zhou, Michelle X. and Qu, Huamin},
  title     = {Context preserving dynamic word cloud visualization},
  booktitle = {{IEEE} Pacific Visualization Symposium PacificVis 2010, Taipei, Taiwan,
               March 2-5, 2010},
  pages     = {121--128},
  publisher = {{IEEE} Computer Society},
  year      = {2010},
  url       = {https://doi.org/10.1109/PACIFICVIS.2010.5429600},
  doi       = {10.1109/PACIFICVIS.2010.5429600},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/apvis/CuiWLWZQ10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icebe/ZhangZSW10,
  author    = {Zhang, Xiaoxun and Zhang, Ethan and Song, Bin and Wei, Furu},
  title     = {Towards Building an Integrated Information Platform for Eco-city},
  booktitle = {{IEEE} 7th International Conference on e-Business Engineering, {ICEBE}
               2010, Shanghai, China, November 10-12, 2010},
  pages     = {393--398},
  publisher = {{IEEE} Computer Society},
  year      = {2010},
  url       = {https://doi.org/10.1109/ICEBE.2010.65},
  doi       = {10.1109/ICEBE.2010.65},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icebe/ZhangZSW10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ieeevast/ShiWLTLZ10,
  author    = {Shi, Lei and Wei, Furu and Liu, Shixia and Tan, Li and
               Lian, Xiaoxiao and Zhou, Michelle X.},
  title     = {Understanding text corpora with multiple facets},
  booktitle = {5th {IEEE} Conference on Visual Analytics Science and Technology,
               {IEEE} {VAST} 2010, Salt Lake City, UT, USA, October 24-29, 2010,
               part of VisWeek 2010},
  pages     = {99--106},
  publisher = {{IEEE} Computer Society},
  year      = {2010},
  url       = {https://doi.org/10.1109/VAST.2010.5652931},
  doi       = {10.1109/VAST.2010.5652931},
  timestamp = {Thu, 25 Apr 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ieeevast/ShiWLTLZ10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ieeevast/ShiQWT10,
  author       = {Lei Shi and
                  Weihong Qian and
                  Furu Wei and
                  Li Tan},
  title        = {{VisWorks} text and network visual analytics: {VAST} 2010 Mini Challenge
                  1 award: ``Effective interactive visualization of document contents''},
  booktitle    = {5th {IEEE} Conference on Visual Analytics Science and Technology,
                  {IEEE} {VAST} 2010, Salt Lake City, UT, USA, October 24-29, 2010,
                  part of VisWeek 2010},
  pages        = {269--270},
  publisher    = {{IEEE} Computer Society},
  year         = {2010},
  url          = {https://doi.org/10.1109/VAST.2010.5651204},
  doi          = {10.1109/VAST.2010.5651204},
  timestamp    = {Mon, 07 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ieeevast/ShiQWT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iitsi/HuangHWL10,
  author    = {Huang, Lei and He, Yanxiang and Wei, Furu and Li, Wenjie},
  title     = {Modeling Document Summarization as Multi-objective Optimization},
  booktitle = {Third International Symposium on Intelligent Information Technology
               and Security Informatics, {IITSI} 2010, Jinggangshan, China, April
               2-4, 2010},
  pages     = {382--386},
  publisher = {{IEEE} Computer Society},
  year      = {2010},
  url       = {https://doi.org/10.1109/IITSI.2010.80},
  doi       = {10.1109/IITSI.2010.80},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/iitsi/HuangHWL10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/kdd/WeiLSPZQSTZ10,
  author    = {Wei, Furu and Liu, Shixia and Song, Yangqiu and Pan, Shimei and
               Zhou, Michelle X. and Qian, Weihong and Shi, Lei and Tan, Li and
               Zhang, Qiang},
  editor    = {Rao, Bharat and Krishnapuram, Balaji and Tomkins, Andrew and
               Yang, Qiang},
  title     = {{TIARA:} a visual exploratory text analytic system},
  booktitle = {Proceedings of the 16th {ACM} {SIGKDD} International Conference on
               Knowledge Discovery and Data Mining, Washington, DC, USA, July 25-28,
               2010},
  pages     = {153--162},
  publisher = {{ACM}},
  year      = {2010},
  url       = {https://doi.org/10.1145/1835804.1835827},
  doi       = {10.1145/1835804.1835827},
  timestamp = {Thu, 25 Apr 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/kdd/WeiLSPZQSTZ10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jasis/WeiLLH09,
  author    = {Wei, Furu and Li, Wenjie and Lu, Qin and He, Yanxiang},
  title     = {Applying two-level reinforcement ranking in query-oriented multidocument
               summarization},
  journal   = {J. Assoc. Inf. Sci. Technol.},
  volume    = {60},
  number    = {10},
  pages     = {2119--2131},
  year      = {2009},
  url       = {https://doi.org/10.1002/asi.21127},
  doi       = {10.1002/ASI.21127},
  timestamp = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/jasis/WeiLLH09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/WeiLH09,
  author       = {Furu Wei and
                  Wenjie Li and
                  Yanxiang He},
  title        = {Co-Feedback Ranking for Query-Focused Summarization},
  booktitle    = {{ACL} 2009, Proceedings of the 47th Annual Meeting of the Association
                  for Computational Linguistics and the 4th International Joint Conference
                  on Natural Language Processing of the AFNLP, 2-7 August 2009, Singapore,
                  Short Papers},
  pages        = {117--120},
  publisher    = {The Association for Computational Linguistics},
  year         = {2009},
  url          = {https://aclanthology.org/P09-2030/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/WeiLH09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cikm/WeiLWH09,
  author       = {Furu Wei and
                  Wenjie Li and
                  Wei Wang and
                  Yanxiang He},
  editor       = {David Wai{-}Lok Cheung and
                  Il{-}Yeol Song and
                  Wesley W. Chu and
                  Xiaohua Hu and
                  Jimmy Lin},
  title        = {{iRANK}: an interactive ranking framework and its application in query-focused
                  summarization},
  booktitle    = {Proceedings of the 18th {ACM} Conference on Information and Knowledge
                  Management, {CIKM} 2009, Hong Kong, China, November 2-6, 2009},
  pages        = {1557--1560},
  publisher    = {{ACM}},
  year         = {2009},
  url          = {https://doi.org/10.1145/1645953.1646171},
  doi          = {10.1145/1645953.1646171},
  timestamp    = {Fri, 27 Aug 2021 11:13:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cikm/WeiLWH09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cikm/WangWLL09,
  author       = {Wei Wang and
                  Furu Wei and
                  Wenjie Li and
                  Sujian Li},
  editor       = {David Wai{-}Lok Cheung and
                  Il{-}Yeol Song and
                  Wesley W. Chu and
                  Xiaohua Hu and
                  Jimmy Lin},
  title        = {{HyperSum}: hypergraph based semi-supervised sentence ranking for query-oriented
                  summarization},
  booktitle    = {Proceedings of the 18th {ACM} Conference on Information and Knowledge
                  Management, {CIKM} 2009, Hong Kong, China, November 2-6, 2009},
  pages        = {1855--1858},
  publisher    = {{ACM}},
  year         = {2009},
  url          = {https://doi.org/10.1145/1645953.1646248},
  doi          = {10.1145/1645953.1646248},
  timestamp    = {Thu, 28 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cikm/WangWLL09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iccpol/WeiHLH09,
  author    = {Wei, Furu and He, Yanxiang and Li, Wenjie and Huang, Lei},
  editor    = {Wenjie Li and Diego Moll{\'{a}} Aliod},
  title     = {Query-Oriented Summarization Based on Neighborhood Graph Model},
  booktitle = {Computer Processing of Oriental Languages. Language Technology for
               the Knowledge-based Economy, 22nd International Conference, {ICCPOL}
               2009, Hong Kong, March 26-27, 2009. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {5459},
  pages     = {156--167},
  publisher = {Springer},
  year      = {2009},
  url       = {https://doi.org/10.1007/978-3-642-00831-3\_15},
  doi       = {10.1007/978-3-642-00831-3\_15},
  timestamp = {Thu, 28 Nov 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/iccpol/WeiHLH09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iccpol/OuyangLWL09,
  author       = {Ouyang, You and
                  Wenjie Li and
                  Furu Wei and
                  Qin Lu},
  editor       = {Wenjie Li and
                  Diego Moll{\'{a}} Aliod},
  title        = {Learning Similarity Functions in Graph-Based Document Summarization},
  booktitle    = {Computer Processing of Oriental Languages. Language Technology for
                  the Knowledge-based Economy, 22nd International Conference, {ICCPOL}
                  2009, Hong Kong, March 26-27, 2009. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {5459},
  pages        = {189--200},
  publisher    = {Springer},
  year         = {2009},
  url          = {https://doi.org/10.1007/978-3-642-00831-3\_18},
  doi          = {10.1007/978-3-642-00831-3\_18},
  timestamp    = {Thu, 28 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iccpol/OuyangLWL09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/LiZWHL08,
  author       = {Wenjie Li and
                  Peng Zhang and
                  Furu Wei and
                  Yuexian Hou and
                  Qin Lu},
  title        = {A Novel Feature-based Approach to {Chinese} Entity Relation Extraction},
  booktitle    = {{ACL} 2008, Proceedings of the 46th Annual Meeting of the Association
                  for Computational Linguistics, June 15-20, 2008, Columbus, Ohio, USA,
                  Short Papers},
  pages        = {89--92},
  publisher    = {The Association for Computational Linguistics},
  year         = {2008},
  url          = {https://aclanthology.org/P08-2023/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LiZWHL08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/coling/LiWLH08,
  author    = {Li, Wenjie and Wei, Furu and Lu, Qin and He, Yanxiang},
  editor    = {Scott, Donia and Uszkoreit, Hans},
  title     = {{PNR2:} Ranking Sentences with Positive and Negative Reinforcement
               for Query-Oriented Update Summarization},
  booktitle = {{COLING} 2008, 22nd International Conference on Computational Linguistics,
               Proceedings of the Conference, 18-22 August 2008, Manchester, {UK}},
  pages     = {489--496},
  year      = {2008},
  url       = {https://aclanthology.org/C08-1062/},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/coling/LiWLH08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ecir/WeiLLH08,
  author       = {Furu Wei and
                  Wenjie Li and
                  Qin Lu and
                  Yanxiang He},
  editor       = {Craig Macdonald and
                  Iadh Ounis and
                  Vassilis Plachouras and
                  Ian Ruthven and
                  Ryen W. White},
  title        = {A Cluster-Sensitive Graph Model for Query-Oriented Multi-document
                  Summarization},
  booktitle    = {Advances in Information Retrieval, 30th European Conference on {IR}
                  Research, {ECIR} 2008, Glasgow, UK, March 30-April 3, 2008. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {4956},
  pages        = {446--453},
  publisher    = {Springer},
  year         = {2008},
  url          = {https://doi.org/10.1007/978-3-540-78646-7\_42},
  doi          = {10.1007/978-3-540-78646-7\_42},
  timestamp    = {Thu, 28 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ecir/WeiLLH08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/isip/WeiHLL08,
  author    = {Wei, Furu and He, Yanxiang and Li, Wenjie and Lu, Qin},
  editor    = {Yu, Fei and Luo, Qi},
  title     = {A Query-Sensitive Graph-Based Sentence Ranking Algorithm for Query-Oriented
               Multi-document Summarization},
  booktitle = {International Symposium on Information Processing, {ISIP} 2008 / International
               Pacific Workshop on Web Mining, and Web-Based Application, {WMWA}
               2008, Moscow, Russia, 23-25 May 2008},
  pages     = {9--13},
  publisher = {{IEEE} Computer Society},
  year      = {2008},
  url       = {https://doi.org/10.1109/ISIP.2008.21},
  doi       = {10.1109/ISIP.2008.21},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/isip/WeiHLL08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/lrec/ZhangLWLH08,
  author       = {Peng Zhang and
                  Wenjie Li and
                  Furu Wei and
                  Qin Lu and
                  Yuexian Hou},
  title        = {Exploiting the Role of Position Feature in {Chinese} Relation Extraction},
  booktitle    = {Proceedings of the International Conference on Language Resources
                  and Evaluation, {LREC} 2008, 26 May - 1 June 2008, Marrakech, Morocco},
  publisher    = {European Language Resources Association},
  year         = {2008},
  url          = {http://www.lrec-conf.org/proceedings/lrec2008/summaries/540.html},
  timestamp    = {Thu, 28 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/lrec/ZhangLWLH08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/pricai/LiWYLH08,
  author       = {Wenjie Li and
                  Furu Wei and
                  Ouyang, You and
                  Qin Lu and
                  Yanxiang He},
  editor       = {Tu Bao Ho and
                  Zhi{-}Hua Zhou},
  title        = {Exploiting the Role of Named Entities in Query-Oriented Document Summarization},
  booktitle    = {{PRICAI} 2008: Trends in Artificial Intelligence, 10th Pacific Rim
                  International Conference on Artificial Intelligence, Hanoi, Vietnam,
                  December 15-19, 2008. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {5351},
  pages        = {740--749},
  publisher    = {Springer},
  year         = {2008},
  url          = {https://doi.org/10.1007/978-3-540-89197-0\_68},
  doi          = {10.1007/978-3-540-89197-0\_68},
  timestamp    = {Thu, 28 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/pricai/LiWYLH08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sigir/WeiLLH08,
  author    = {Wei, Furu and Li, Wenjie and Lu, Qin and He, Yanxiang},
  editor    = {Myaeng, Sung{-}Hyon and Oard, Douglas W. and Sebastiani, Fabrizio and
               Chua, Tat{-}Seng and Leong, Mun{-}Kew},
  title     = {Query-sensitive mutual reinforcement chain and its application in
               query-oriented multi-document summarization},
  booktitle = {Proceedings of the 31st Annual International {ACM} {SIGIR} Conference
               on Research and Development in Information Retrieval, {SIGIR} 2008,
               Singapore, July 20-24, 2008},
  pages     = {283--290},
  publisher = {{ACM}},
  year      = {2008},
  url       = {https://doi.org/10.1145/1390334.1390384},
  doi       = {10.1145/1390334.1390384},
  timestamp = {Thu, 28 Nov 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/sigir/WeiLLH08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/tac/LiYHW08,
  author       = {Wenjie Li and
                  Ouyang, You and
                  Yi Hu and
                  Furu Wei},
  title        = {{PolyU} at {TAC} 2008},
  booktitle    = {Proceedings of the First Text Analysis Conference, {TAC} 2008, Gaithersburg,
                  Maryland, USA, November 17-19, 2008},
  publisher    = {{NIST}},
  year         = {2008},
  url          = {https://tac.nist.gov/publications/2008/participant.papers/PolyU.proceedings.pdf},
  timestamp    = {Fri, 29 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/tac/LiYHW08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icwn/WeiPZH05,
  author       = {Furu Wei and
                  Min Peng and
                  Wei Zhang and
                  Yanxiang He},
  editor       = {Laurence Tianruo Yang and
                  Hamid R. Arabnia and
                  Li{-}Chun Wang},
  title        = {An Application of {FIPA-ACL} Based Agent Communication in Mobile-{GPS}
                  System},
  booktitle    = {Proceedings of the 2005 International Conference on Wireless Networks,
                  {ICWN} 2005, Las Vegas, Nevada, USA, June 27-30, 2005},
  pages        = {357--360},
  publisher    = {{CSREA} Press},
  year         = {2005},
  timestamp    = {Mon, 08 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icwn/WeiPZH05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics