BibTeX records: Shaohan Huang

download as .bib file

% Journal article, IEEE TPAMI 46(10), 2024. The coined name in the title is
% braced so that sentence-casing styles keep its capitalisation.
@article{DBLP:journals/pami/WangMDHZW24,
  author       = {Wang, Hongyu and
                  Ma, Shuming and
                  Dong, Li and
                  Huang, Shaohan and
                  Zhang, Dongdong and
                  Wei, Furu},
  title        = {{DeepNet}: Scaling Transformers to 1,000 Layers},
  journal      = {{IEEE} Trans. Pattern Anal. Mach. Intell.},
  volume       = {46},
  number       = {10},
  pages        = {6761--6774},
  year         = {2024},
  url          = {https://doi.org/10.1109/TPAMI.2024.3386927},
  doi          = {10.1109/TPAMI.2024.3386927},
  timestamp    = {Tue, 24 Sep 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/pami/WangMDHZW24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, IEEE Trans. Computers 73(7), 2024. The system name in the
% title is braced so that sentence-casing styles keep its capitalisation.
@article{DBLP:journals/tc/QiLHFY24,
  author       = {Qi, Jiaxing and
                  Luan, Zhongzhi and
                  Huang, Shaohan and
                  Fung, Carol J. and
                  Yang, Hailong},
  title        = {{LogSay}: An Efficient Comprehension System for Log Numerical Reasoning},
  journal      = {{IEEE} Trans. Computers},
  volume       = {73},
  number       = {7},
  pages        = {1809--1821},
  year         = {2024},
  url          = {https://doi.org/10.1109/TC.2024.3386068},
  doi          = {10.1109/TC.2024.3386068},
  timestamp    = {Thu, 04 Jul 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tc/QiLHFY24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2024 conference paper; an arXiv record with the same title and authors
% is DBLP:journals/corr/abs-2402-14843.
% The booktitle's EAAI year is corrected from 2014 to 2024 (Fourteenth symposium,
% co-located with AAAI 2024).
@inproceedings{DBLP:conf/aaai/LiuYHZHWDSZ24,
  author       = {Liu, Yuxuan and
                  Yang, Tianchi and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi},
  editor       = {Wooldridge, Michael J. and
                  Dy, Jennifer G. and
                  Natarajan, Sriraam},
  title        = {Text Diffusion with Reinforced Conditioning},
  booktitle    = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2024, Thirty-Sixth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver,
                  Canada},
  pages        = {14069--14077},
  publisher    = {{AAAI} Press},
  year         = {2024},
  url          = {https://doi.org/10.1609/aaai.v38i12.29316},
  doi          = {10.1609/AAAI.V38I12.29316},
  timestamp    = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/LiuYHZHWDSZ24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Findings of ACL 2024 paper; an arXiv record with the same title and authors
% is DBLP:journals/corr/abs-2402-13874.
@inproceedings{DBLP:conf/acl/LiuLHZSDW024,
  author       = {Liu, Haoyu and
                  Liu, Jianfeng and
                  Huang, Shaohan and
                  Zhan, Yuefeng and
                  Sun, Hao and
                  Deng, Weiwei and
                  Wei, Furu and
                  Zhang, Qi},
  editor       = {Ku, Lun{-}Wei and
                  Martins, Andre and
                  Srikumar, Vivek},
  title        = {Se{\({^2}\)}: Sequential Example Selection for In-Context Learning},
  booktitle    = {Findings of the Association for Computational Linguistics, {ACL} 2024,
                  Bangkok, Thailand and virtual meeting, August 11-16, 2024},
  pages        = {5262--5284},
  publisher    = {Association for Computational Linguistics},
  year         = {2024},
  url          = {https://doi.org/10.18653/v1/2024.findings-acl.312},
  doi          = {10.18653/V1/2024.FINDINGS-ACL.312},
  timestamp    = {Tue, 24 Sep 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LiuLHZSDW024.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2024 long paper; an arXiv record with the same title and authors is
% DBLP:journals/corr/abs-2402-15754.
% The method name in the title is braced so that sentence-casing styles keep it.
@inproceedings{DBLP:conf/acl/LiuYHZHWD0024,
  author       = {Liu, Yuxuan and
                  Yang, Tianchi and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi},
  editor       = {Ku, Lun{-}Wei and
                  Martins, Andre and
                  Srikumar, Vivek},
  title        = {{HD-Eval}: Aligning Large Language Model Evaluators Through Hierarchical
                  Criteria Decomposition},
  booktitle    = {Proceedings of the 62nd Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2024, Bangkok, Thailand,
                  August 11-16, 2024},
  pages        = {7641--7660},
  publisher    = {Association for Computational Linguistics},
  year         = {2024},
  url          = {https://doi.org/10.18653/v1/2024.acl-long.413},
  doi          = {10.18653/V1/2024.ACL-LONG.413},
  timestamp    = {Tue, 24 Sep 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LiuYHZHWD0024.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Findings of ACL 2024 paper; an arXiv record with the same title and authors
% is DBLP:journals/corr/abs-2402-18039.
% The method name in the title is braced so that sentence-casing styles keep it.
@inproceedings{DBLP:conf/acl/ShiHSLZHWD0Z24,
  author       = {Shi, Shuhua and
                  Huang, Shaohan and
                  Song, Minghui and
                  Li, Zhoujun and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi},
  editor       = {Ku, Lun{-}Wei and
                  Martins, Andre and
                  Srikumar, Vivek},
  title        = {{ResLoRA}: Identity Residual Mapping in Low-Rank Adaption},
  booktitle    = {Findings of the Association for Computational Linguistics, {ACL} 2024,
                  Bangkok, Thailand and virtual meeting, August 11-16, 2024},
  pages        = {8870--8884},
  publisher    = {Association for Computational Linguistics},
  year         = {2024},
  url          = {https://doi.org/10.18653/v1/2024.findings-acl.525},
  doi          = {10.18653/V1/2024.FINDINGS-ACL.525},
  timestamp    = {Tue, 24 Sep 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ShiHSLZHWD0Z24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% LREC/COLING 2024 paper. This record carries a URL but no DOI field.
% The acronym in the title is braced so that sentence-casing styles keep it.
@inproceedings{DBLP:conf/coling/LiuYHZHWDSZ24,
  author       = {Liu, Yuxuan and
                  Yang, Tianchi and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi},
  editor       = {Calzolari, Nicoletta and
                  Kan, Min{-}Yen and
                  Hoste, V{\'{e}}ronique and
                  Lenci, Alessandro and
                  Sakti, Sakriani and
                  Xue, Nianwen},
  title        = {Calibrating {LLM}-Based Evaluator},
  booktitle    = {Proceedings of the 2024 Joint International Conference on Computational
                  Linguistics, Language Resources and Evaluation, {LREC/COLING} 2024,
                  20-25 May, 2024, Torino, Italy},
  pages        = {2638--2656},
  publisher    = {{ELRA} and {ICCL}},
  year         = {2024},
  url          = {https://aclanthology.org/2024.lrec-main.237},
  timestamp    = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/coling/LiuYHZHWDSZ24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% HPDC 2024 paper (pp. 413-416).
@inproceedings{DBLP:conf/hpdc/HuangL24,
  author       = {Huang, Shaohan and
                  Luan, Zhongzhi},
  editor       = {Dazzi, Patrizio and
                  Mencagli, Gabriele and
                  Lowenthal, David K. and
                  Badia, Rosa M.},
  title        = {Semantic-Aware Log Understanding and Analysis},
  booktitle    = {Proceedings of the 33rd International Symposium on High-Performance
                  Parallel and Distributed Computing, {HPDC} 2024, Pisa, Italy, June
                  3-7, 2024},
  pages        = {413--416},
  publisher    = {{ACM}},
  year         = {2024},
  url          = {https://doi.org/10.1145/3625549.3658830},
  doi          = {10.1145/3625549.3658830},
  timestamp    = {Sun, 08 Sep 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/hpdc/HuangL24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2024 paper; the record links to OpenReview and has no pages or DOI field.
@inproceedings{DBLP:conf/iclr/ChengHW24,
  author       = {Cheng, Daixuan and
                  Huang, Shaohan and
                  Wei, Furu},
  title        = {Adapting Large Language Models via Reading Comprehension},
  booktitle    = {The Twelfth International Conference on Learning Representations,
                  {ICLR} 2024, Vienna, Austria, May 7-11, 2024},
  publisher    = {OpenReview.net},
  year         = {2024},
  url          = {https://openreview.net/forum?id=y886UXPEZ0},
  timestamp    = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ChengHW24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2024 paper; the record links to OpenReview and has no pages or DOI field.
% The model name in the title is braced so that sentence-casing styles keep it.
@inproceedings{DBLP:conf/iclr/Pan0HPCW24,
  author       = {Pan, Xichen and
                  Dong, Li and
                  Huang, Shaohan and
                  Peng, Zhiliang and
                  Chen, Wenhu and
                  Wei, Furu},
  title        = {{Kosmos-G}: Generating Images in Context with Multimodal Large Language
                  Models},
  booktitle    = {The Twelfth International Conference on Learning Representations,
                  {ICLR} 2024, Vienna, Austria, May 7-11, 2024},
  publisher    = {OpenReview.net},
  year         = {2024},
  url          = {https://openreview.net/forum?id=he6mX9LTyE},
  timestamp    = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/Pan0HPCW24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2024 paper; the record links to OpenReview and has no pages or DOI field.
@inproceedings{DBLP:conf/iclr/Peng00HHMYW24,
  author       = {Peng, Zhiliang and
                  Wang, Wenhui and
                  Dong, Li and
                  Hao, Yaru and
                  Huang, Shaohan and
                  Ma, Shuming and
                  Ye, Qixiang and
                  Wei, Furu},
  title        = {Grounding Multimodal Large Language Models to the World},
  booktitle    = {The Twelfth International Conference on Learning Representations,
                  {ICLR} 2024, Vienna, Austria, May 7-11, 2024},
  publisher    = {OpenReview.net},
  year         = {2024},
  url          = {https://openreview.net/forum?id=lLmqxkfSIw},
  timestamp    = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/Peng00HHMYW24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2024 paper; an arXiv record with the same title and authors is
% DBLP:journals/corr/abs-2404-13628.
% The acronym in the title is braced so that sentence-casing styles keep it.
@inproceedings{DBLP:conf/iclr/WuHW24,
  author       = {Wu, Xun and
                  Huang, Shaohan and
                  Wei, Furu},
  title        = {Mixture of {LoRA} Experts},
  booktitle    = {The Twelfth International Conference on Learning Representations,
                  {ICLR} 2024, Vienna, Austria, May 7-11, 2024},
  publisher    = {OpenReview.net},
  year         = {2024},
  url          = {https://openreview.net/forum?id=uWvKBCYh4S},
  timestamp    = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/WuHW24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% SANER 2024 paper (the DBLP key is filed under conf/wcre).
@inproceedings{DBLP:conf/wcre/Huang0QSXFWYLQ24,
  author       = {Huang, Shaohan and
                  Liu, Yi and
                  Qi, Jiaxing and
                  Shang, Jing and
                  Xiao, Zhiwen and
                  Fung, Carol J. and
                  Wu, Zhihui and
                  Yang, Hailong and
                  Luan, Zhongzhi and
                  Qian, Depei},
  title        = {Gloss: Guiding Large Language Models to Answer Questions from System
                  Logs},
  booktitle    = {{IEEE} International Conference on Software Analysis, Evolution and
                  Reengineering, {SANER} 2024, Rovaniemi, Finland, March 12-15, 2024},
  pages        = {91--101},
  publisher    = {{IEEE}},
  year         = {2024},
  url          = {https://doi.org/10.1109/SANER60148.2024.00017},
  doi          = {10.1109/SANER60148.2024.00017},
  timestamp    = {Tue, 30 Jul 2024 11:08:59 +0200},
  biburl       = {https://dblp.org/rec/conf/wcre/Huang0QSXFWYLQ24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2401.07284 (CoRR).
@article{DBLP:journals/corr/abs-2401-07284,
  author       = {Jiang, Ting and
                  Huang, Shaohan and
                  Luo, Shengyue and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi and
                  Wang, Deqing and
                  Zhuang, Fuzhen},
  title        = {Improving Domain Adaptation through Extended-Text Reading Comprehension},
  journal      = {CoRR},
  volume       = {abs/2401.07284},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2401.07284},
  doi          = {10.48550/ARXIV.2401.07284},
  eprinttype   = {arXiv},
  eprint       = {2401.07284},
  timestamp    = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2401-07284.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2402.13064 (CoRR).
@article{DBLP:journals/corr/abs-2402-13064,
  author       = {Li, Haoran and
                  Dong, Qingxiu and
                  Tang, Zhengyang and
                  Wang, Chaojun and
                  Zhang, Xingxing and
                  Huang, Haoyang and
                  Huang, Shaohan and
                  Huang, Xiaolong and
                  Huang, Zeqiang and
                  Zhang, Dongdong and
                  Gu, Yuxian and
                  Cheng, Xin and
                  Wang, Xun and
                  Chen, Si{-}Qing and
                  Dong, Li and
                  Lu, Wei and
                  Sui, Zhifang and
                  Wang, Benyou and
                  Lam, Wai and
                  Wei, Furu},
  title        = {Synthetic Data (Almost) from Scratch: Generalized Instruction Tuning
                  for Language Models},
  journal      = {CoRR},
  volume       = {abs/2402.13064},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.13064},
  doi          = {10.48550/ARXIV.2402.13064},
  eprinttype   = {arXiv},
  eprint       = {2402.13064},
  timestamp    = {Wed, 24 Jul 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-13064.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2402.13874 (CoRR); a Findings of ACL 2024 record with the same
% authors is DBLP:conf/acl/LiuLHZSDW024.
% The superscript math in the title is wrapped in a brace group, using the same
% markup as that ACL record.
@article{DBLP:journals/corr/abs-2402-13874,
  author       = {Liu, Haoyu and
                  Liu, Jianfeng and
                  Huang, Shaohan and
                  Zhan, Yuefeng and
                  Sun, Hao and
                  Deng, Weiwei and
                  Wei, Furu and
                  Zhang, Qi},
  title        = {Se{\({^2}\)}: Sequential Example Selection for In-Context Learning},
  journal      = {CoRR},
  volume       = {abs/2402.13874},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.13874},
  doi          = {10.48550/ARXIV.2402.13874},
  eprinttype   = {arXiv},
  eprint       = {2402.13874},
  timestamp    = {Tue, 23 Jul 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-13874.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2402.14843 (CoRR); an AAAI 2024 record with the same title and
% authors is DBLP:conf/aaai/LiuYHZHWDSZ24.
@article{DBLP:journals/corr/abs-2402-14843,
  author       = {Liu, Yuxuan and
                  Yang, Tianchi and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi},
  title        = {Text Diffusion with Reinforced Conditioning},
  journal      = {CoRR},
  volume       = {abs/2402.14843},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.14843},
  doi          = {10.48550/ARXIV.2402.14843},
  eprinttype   = {arXiv},
  eprint       = {2402.14843},
  timestamp    = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-14843.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2402.15754 (CoRR); an ACL 2024 record with the same title and
% authors is DBLP:conf/acl/LiuYHZHWD0024.
% The method name in the title is braced so that sentence-casing styles keep it.
@article{DBLP:journals/corr/abs-2402-15754,
  author       = {Liu, Yuxuan and
                  Yang, Tianchi and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi},
  title        = {{HD-Eval}: Aligning Large Language Model Evaluators Through Hierarchical
                  Criteria Decomposition},
  journal      = {CoRR},
  volume       = {abs/2402.15754},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.15754},
  doi          = {10.48550/ARXIV.2402.15754},
  eprinttype   = {arXiv},
  eprint       = {2402.15754},
  timestamp    = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-15754.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2402.17764 (CoRR).
% The acronym in the title is braced so that sentence-casing styles keep it.
@article{DBLP:journals/corr/abs-2402-17764,
  author       = {Ma, Shuming and
                  Wang, Hongyu and
                  Ma, Lingxiao and
                  Wang, Lei and
                  Wang, Wenhui and
                  Huang, Shaohan and
                  Dong, Li and
                  Wang, Ruiping and
                  Xue, Jilong and
                  Wei, Furu},
  title        = {The Era of 1-bit {LLMs}: All Large Language Models are in 1.58 Bits},
  journal      = {CoRR},
  volume       = {abs/2402.17764},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.17764},
  doi          = {10.48550/ARXIV.2402.17764},
  eprinttype   = {arXiv},
  eprint       = {2402.17764},
  timestamp    = {Fri, 19 Jul 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-17764.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2402.18039 (CoRR); a Findings of ACL 2024 record with the same
% title and authors is DBLP:conf/acl/ShiHSLZHWD0Z24.
% The method name in the title is braced so that sentence-casing styles keep it.
@article{DBLP:journals/corr/abs-2402-18039,
  author       = {Shi, Shuhua and
                  Huang, Shaohan and
                  Song, Minghui and
                  Li, Zhoujun and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi},
  title        = {{ResLoRA}: Identity Residual Mapping in Low-Rank Adaption},
  journal      = {CoRR},
  volume       = {abs/2402.18039},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.18039},
  doi          = {10.48550/ARXIV.2402.18039},
  eprinttype   = {arXiv},
  eprint       = {2402.18039},
  timestamp    = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-18039.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2403.09164 (CoRR).
% The product name and the proper adjective in the title are braced so that
% sentence-casing styles keep their capitalisation.
@article{DBLP:journals/corr/abs-2403-09164,
  author       = {Li, Yizhen and
                  Huang, Shaohan and
                  Qi, Jiaxing and
                  Quan, Lei and
                  Han, Dongran and
                  Luan, Zhongzhi},
  title        = {Exploring the Comprehension of {ChatGPT} in Traditional {Chinese} Medicine
                  Knowledge},
  journal      = {CoRR},
  volume       = {abs/2403.09164},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2403.09164},
  doi          = {10.48550/ARXIV.2403.09164},
  eprinttype   = {arXiv},
  eprint       = {2403.09164},
  timestamp    = {Fri, 05 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2403-09164.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2404.13628 (CoRR); an ICLR 2024 record with the same title and
% authors is DBLP:conf/iclr/WuHW24.
% The acronym in the title is braced so that sentence-casing styles keep it.
@article{DBLP:journals/corr/abs-2404-13628,
  author       = {Wu, Xun and
                  Huang, Shaohan and
                  Wei, Furu},
  title        = {Mixture of {LoRA} Experts},
  journal      = {CoRR},
  volume       = {abs/2404.13628},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2404.13628},
  doi          = {10.48550/ARXIV.2404.13628},
  eprinttype   = {arXiv},
  eprint       = {2404.13628},
  timestamp    = {Sat, 25 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2404-13628.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2404.15045 (CoRR).
@article{DBLP:journals/corr/abs-2404-15045,
  author       = {Wu, Xun and
                  Huang, Shaohan and
                  Wang, Wenhui and
                  Wei, Furu},
  title        = {Multi-Head Mixture-of-Experts},
  journal      = {CoRR},
  volume       = {abs/2404.15045},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2404.15045},
  doi          = {10.48550/ARXIV.2404.15045},
  eprinttype   = {arXiv},
  eprint       = {2404.15045},
  timestamp    = {Sat, 25 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2404-15045.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2404.15100 (CoRR).
@article{DBLP:journals/corr/abs-2404-15100,
  author       = {Wu, Xun and
                  Huang, Shaohan and
                  Wei, Furu},
  title        = {Multimodal Large Language Model is a Human-Aligned Annotator for Text-to-Image
                  Generation},
  journal      = {CoRR},
  volume       = {abs/2404.15100},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2404.15100},
  doi          = {10.48550/ARXIV.2404.15100},
  eprinttype   = {arXiv},
  eprint       = {2404.15100},
  timestamp    = {Sat, 25 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2404-15100.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2405.05254 (CoRR).
@article{DBLP:journals/corr/abs-2405-05254,
  author       = {Sun, Yutao and
                  Dong, Li and
                  Zhu, Yi and
                  Huang, Shaohan and
                  Wang, Wenhui and
                  Ma, Shuming and
                  Zhang, Quanlu and
                  Wang, Jianyong and
                  Wei, Furu},
  title        = {You Only Cache Once: Decoder-Decoder Architectures for Language Models},
  journal      = {CoRR},
  volume       = {abs/2405.05254},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2405.05254},
  doi          = {10.48550/ARXIV.2405.05254},
  eprinttype   = {arXiv},
  eprint       = {2405.05254},
  timestamp    = {Thu, 01 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2405-05254.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2405.12130 (CoRR).
% The method name in the title is braced so that sentence-casing styles keep it.
@article{DBLP:journals/corr/abs-2405-12130,
  author       = {Jiang, Ting and
                  Huang, Shaohan and
                  Luo, Shengyue and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi and
                  Wang, Deqing and
                  Zhuang, Fuzhen},
  title        = {{MoRA}: High-Rank Updating for Parameter-Efficient Fine-Tuning},
  journal      = {CoRR},
  volume       = {abs/2405.12130},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2405.12130},
  doi          = {10.48550/ARXIV.2405.12130},
  eprinttype   = {arXiv},
  eprint       = {2405.12130},
  timestamp    = {Tue, 23 Jul 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2405-12130.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2406.07925 (CoRR).
% The method name and acronym in the title are braced so that sentence-casing
% styles keep their capitalisation.
@article{DBLP:journals/corr/abs-2406-07925,
  author       = {Qi, Jiaxing and
                  Luan, Zhongzhi and
                  Huang, Shaohan and
                  Fung, Carol J. and
                  Yang, Hailong and
                  Qian, Depei},
  title        = {{FDLoRA}: Personalized Federated Learning of Large Language Model via
                  Dual {LoRA} Tuning},
  journal      = {CoRR},
  volume       = {abs/2406.07925},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2406.07925},
  doi          = {10.48550/ARXIV.2406.07925},
  eprinttype   = {arXiv},
  eprint       = {2406.07925},
  timestamp    = {Mon, 08 Jul 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2406-07925.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2406.14491 (CoRR).
@article{DBLP:journals/corr/abs-2406-14491,
  author       = {Cheng, Daixuan and
                  Gu, Yuxian and
                  Huang, Shaohan and
                  Bi, Junyu and
                  Huang, Minlie and
                  Wei, Furu},
  title        = {Instruction Pre-Training: Language Models are Supervised Multitask
                  Learners},
  journal      = {CoRR},
  volume       = {abs/2406.14491},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2406.14491},
  doi          = {10.48550/ARXIV.2406.14491},
  eprinttype   = {arXiv},
  eprint       = {2406.14491},
  timestamp    = {Tue, 16 Jul 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2406-14491.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, IEEE Trans. Computers 72(9), 2023.
@article{DBLP:journals/tc/HuangLFWYL23,
  author       = {Huang, Shaohan and
                  Liu, Yi and
                  Fung, Carol J. and
                  Wang, He and
                  Yang, Hailong and
                  Luan, Zhongzhi},
  title        = {Improving Log-Based Anomaly Detection by Pre-Training Hierarchical
                  Transformers},
  journal      = {{IEEE} Trans. Computers},
  volume       = {72},
  number       = {9},
  pages        = {2656--2667},
  year         = {2023},
  url          = {https://doi.org/10.1109/TC.2023.3257518},
  doi          = {10.1109/TC.2023.3257518},
  timestamp    = {Fri, 18 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tc/HuangLFWYL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, IEEE Trans. Netw. Serv. Manag. 20(2), 2023.
% The system name in the title is braced so that sentence-casing styles keep it.
@article{DBLP:journals/tnsm/QiLHFYLZQ23,
  author       = {Qi, Jiaxing and
                  Luan, Zhongzhi and
                  Huang, Shaohan and
                  Fung, Carol J. and
                  Yang, Hailong and
                  Li, Hanlu and
                  Zhu, Danfeng and
                  Qian, Depei},
  title        = {{LogEncoder}: Log-Based Contrastive Representation Learning for Anomaly
                  Detection},
  journal      = {{IEEE} Trans. Netw. Serv. Manag.},
  volume       = {20},
  number       = {2},
  pages        = {1378--1391},
  year         = {2023},
  url          = {https://doi.org/10.1109/TNSM.2023.3239522},
  doi          = {10.1109/TNSM.2023.3239522},
  timestamp    = {Fri, 07 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tnsm/QiLHFYLZQ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2023 conference paper.
% The method name in the title is braced so that sentence-casing styles keep it.
@inproceedings{DBLP:conf/aaai/XieHCW23,
  author       = {Xie, Yuan and
                  Huang, Shaohan and
                  Chen, Tianyu and
                  Wei, Furu},
  editor       = {Williams, Brian and
                  Chen, Yiling and
                  Neville, Jennifer},
  title        = {{MoEC}: Mixture of Expert Clusters},
  booktitle    = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2023, Thirty-Fifth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2023, Thirteenth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2023, Washington, DC, USA, February
                  7-14, 2023},
  pages        = {13807--13815},
  publisher    = {{AAAI} Press},
  year         = {2023},
  url          = {https://doi.org/10.1609/aaai.v37i11.26617},
  doi          = {10.1609/AAAI.V37I11.26617},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/XieHCW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Findings of ACL 2023 paper.
@inproceedings{DBLP:conf/acl/ChenHZGLHWDZ23,
  author       = {Chen, Beiduo and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Guo, Wu and
                  Ling, Zhenhua and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Zhang, Qi},
  editor       = {Rogers, Anna and
                  Boyd{-}Graber, Jordan L. and
                  Okazaki, Naoaki},
  title        = {Pre-training Language Model as a Multi-perspective Course Learner},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL} 2023,
                  Toronto, Canada, July 9-14, 2023},
  pages        = {114--128},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.findings-acl.9},
  doi          = {10.18653/V1/2023.FINDINGS-ACL.9},
  timestamp    = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ChenHZGLHWDZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2023 long paper.
@inproceedings{DBLP:conf/acl/LiHZDLHJWDZ23,
  author       = {Li, Ziheng and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Deng, Zhi{-}Hong and
                  Lou, Qiang and
                  Huang, Haizhen and
                  Jiao, Jian and
                  Wei, Furu and
                  Deng, Weiwei and
                  Zhang, Qi},
  editor       = {Rogers, Anna and
                  Boyd{-}Graber, Jordan L. and
                  Okazaki, Naoaki},
  title        = {Dual-Alignment Pre-training for Cross-lingual Sentence Embedding},
  booktitle    = {Proceedings of the 61st Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada,
                  July 9-14, 2023},
  pages        = {3466--3478},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-long.191},
  doi          = {10.18653/V1/2023.ACL-LONG.191},
  timestamp    = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LiHZDLHJWDZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2023 long paper.
% The model name in the title is braced so that sentence-casing styles keep it.
@inproceedings{DBLP:conf/acl/YangM0HHYZYWL23,
  author       = {Yang, Jian and
                  Ma, Shuming and
                  Dong, Li and
                  Huang, Shaohan and
                  Huang, Haoyang and
                  Yin, Yuwei and
                  Zhang, Dongdong and
                  Yang, Liqun and
                  Wei, Furu and
                  Li, Zhoujun},
  editor       = {Rogers, Anna and
                  Boyd{-}Graber, Jordan L. and
                  Okazaki, Naoaki},
  title        = {{GanLM}: Encoder-Decoder Pre-training with an Auxiliary Discriminator},
  booktitle    = {Proceedings of the 61st Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada,
                  July 9-14, 2023},
  pages        = {9394--9412},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-long.522},
  doi          = {10.18653/V1/2023.ACL-LONG.522},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/YangM0HHYZYWL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/SunDPMHBCSW23,
  author       = {Sun, Yutao and
                  Dong, Li and
                  Patra, Barun and
                  Ma, Shuming and
                  Huang, Shaohan and
                  Benhaim, Alon and
                  Chaudhary, Vishrav and
                  Song, Xia and
                  Wei, Furu},
  editor       = {Rogers, Anna and
                  Boyd{-}Graber, Jordan L. and
                  Okazaki, Naoaki},
  title        = {A Length-Extrapolatable Transformer},
  booktitle    = {Proceedings of the 61st Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada,
                  July 9-14, 2023},
  pages        = {14590--14604},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-long.816},
  doi          = {10.18653/V1/2023.ACL-LONG.816},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/SunDPMHBCSW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/PatraSHC0WCS23,
  author       = {Patra, Barun and
                  Singhal, Saksham and
                  Huang, Shaohan and
                  Chi, Zewen and
                  Dong, Li and
                  Wei, Furu and
                  Chaudhary, Vishrav and
                  Song, Xia},
  editor       = {Rogers, Anna and
                  Boyd{-}Graber, Jordan L. and
                  Okazaki, Naoaki},
  title        = {Beyond {English}-Centric Bitexts for Better Multilingual Language Representation
                  Learning},
  booktitle    = {Proceedings of the 61st Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada,
                  July 9-14, 2023},
  pages        = {15354--15373},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-long.856},
  doi          = {10.18653/V1/2023.ACL-LONG.856},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/PatraSHC0WCS23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/WangHLWSZHWDSZ23,
  author       = {Wang, Zhaoyang and
                  Huang, Shaohan and
                  Liu, Yuxuan and
                  Wang, Jiahai and
                  Song, Minghui and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi},
  editor       = {Bouamor, Houda and
                  Pino, Juan and
                  Bali, Kalika},
  title        = {Democratizing Reasoning Ability: Tailored Learning from Large Language
                  Model},
  booktitle    = {Proceedings of the 2023 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages        = {1948--1966},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.emnlp-main.120},
  doi          = {10.18653/V1/2023.EMNLP-MAIN.120},
  timestamp    = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/WangHLWSZHWDSZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ChengHBZLW0WDZ23,
  author       = {Cheng, Daixuan and
                  Huang, Shaohan and
                  Bi, Junyu and
                  Zhan, Yuefeng and
                  Liu, Jianfeng and
                  Wang, Yujing and
                  Sun, Hao and
                  Wei, Furu and
                  Deng, Weiwei and
                  Zhang, Qi},
  editor       = {Bouamor, Houda and
                  Pino, Juan and
                  Bali, Kalika},
  title        = {{UPRISE:} Universal Prompt Retrieval for Improving Zero-Shot Evaluation},
  booktitle    = {Proceedings of the 2023 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages        = {12318--12337},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.emnlp-main.758},
  doi          = {10.18653/V1/2023.EMNLP-MAIN.758},
  timestamp    = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/ChengHBZLW0WDZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/hpcc/QiHLYFYQSXW23,
  author       = {Qi, Jiaxing and
                  Huang, Shaohan and
                  Luan, Zhongzhi and
                  Yang, Shu and
                  Fung, Carol J. and
                  Yang, Hailong and
                  Qian, Depei and
                  Shang, Jing and
                  Xiao, Zhiwen and
                  Wu, Zhihui},
  title        = {{LogGPT:} Exploring {ChatGPT} for Log-Based Anomaly Detection},
  booktitle    = {{IEEE} International Conference on High Performance Computing {\&}
                  Communications, Data Science {\&} Systems, Smart City {\&}
                  Dependability in Sensor, Cloud {\&} Big Data Systems {\&}
                  Application, HPCC/DSS/SmartCity/DependSys 2023, Melbourne, Australia,
                  December 17-21, 2023},
  pages        = {273--280},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/HPCC-DSS-SmartCity-DependSys60770.2023.00045},
  doi          = {10.1109/HPCC-DSS-SMARTCITY-DEPENDSYS60770.2023.00045},
  timestamp    = {Wed, 10 Apr 2024 17:07:58 +0200},
  biburl       = {https://dblp.org/rec/conf/hpcc/QiHLYFYQSXW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/WangMH0WPWBSBPL23,
  author       = {Wang, Hongyu and
                  Ma, Shuming and
                  Huang, Shaohan and
                  Dong, Li and
                  Wang, Wenhui and
                  Peng, Zhiliang and
                  Wu, Yu and
                  Bajaj, Payal and
                  Singhal, Saksham and
                  Benhaim, Alon and
                  Patra, Barun and
                  Liu, Zhun and
                  Chaudhary, Vishrav and
                  Song, Xia and
                  Wei, Furu},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {Magneto: {A} Foundation Transformer},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {36077--36092},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/wang23u.html},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/WangMH0WPWBSBPL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/Huang0WHSML0MPL23,
  author       = {Huang, Shaohan and
                  Dong, Li and
                  Wang, Wenhui and
                  Hao, Yaru and
                  Singhal, Saksham and
                  Ma, Shuming and
                  Lv, Tengchao and
                  Cui, Lei and
                  Mohammed, Owais Khan and
                  Patra, Barun and
                  Liu, Qiang and
                  Aggarwal, Kriti and
                  Chi, Zewen and
                  Bjorck, Nils Johan Bertil and
                  Chaudhary, Vishrav and
                  Som, Subhojit and
                  Song, Xia and
                  Wei, Furu},
  editor       = {Oh, Alice and
                  Naumann, Tristan and
                  Globerson, Amir and
                  Saenko, Kate and
                  Hardt, Moritz and
                  Levine, Sergey},
  title        = {Language Is Not All You Need: Aligning Perception with Language Models},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans,
                  LA, USA, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper\_files/paper/2023/hash/e425b75bac5742a008d643826428787c-Abstract-Conference.html},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/Huang0WHSML0MPL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2302-14045,
  author       = {Huang, Shaohan and
                  Dong, Li and
                  Wang, Wenhui and
                  Hao, Yaru and
                  Singhal, Saksham and
                  Ma, Shuming and
                  Lv, Tengchao and
                  Cui, Lei and
                  Mohammed, Owais Khan and
                  Patra, Barun and
                  Liu, Qiang and
                  Aggarwal, Kriti and
                  Chi, Zewen and
                  Bjorck, Johan and
                  Chaudhary, Vishrav and
                  Som, Subhojit and
                  Song, Xia and
                  Wei, Furu},
  title        = {Language Is Not All You Need: Aligning Perception with Language Models},
  journal      = {CoRR},
  volume       = {abs/2302.14045},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2302.14045},
  doi          = {10.48550/ARXIV.2302.14045},
  eprinttype   = {arXiv},
  eprint       = {2302.14045},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2302-14045.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2303-08518,
  author       = {Cheng, Daixuan and
                  Huang, Shaohan and
                  Bi, Junyu and
                  Zhan, Yuefeng and
                  Liu, Jianfeng and
                  Wang, Yujing and
                  Sun, Hao and
                  Wei, Furu and
                  Deng, Denvy and
                  Zhang, Qi},
  title        = {{UPRISE:} Universal Prompt Retrieval for Improving Zero-Shot Evaluation},
  journal      = {CoRR},
  volume       = {abs/2303.08518},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2303.08518},
  doi          = {10.48550/ARXIV.2303.08518},
  eprinttype   = {arXiv},
  eprint       = {2303.08518},
  timestamp    = {Fri, 23 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2303-08518.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2303-11715,
  author       = {Huang, Shaohan and
                  Liu, Yi and
                  Fung, Carol J. and
                  Qi, Jiaxing and
                  Yang, Hailong and
                  Luan, Zhongzhi},
  title        = {{LogQA:} Question Answering in Unstructured Logs},
  journal      = {CoRR},
  volume       = {abs/2303.11715},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2303.11715},
  doi          = {10.48550/ARXIV.2303.11715},
  eprinttype   = {arXiv},
  eprint       = {2303.11715},
  timestamp    = {Sun, 16 Apr 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2303-11715.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-03981,
  author       = {Chen, Beiduo and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Guo, Wu and
                  Ling, Zhenhua and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Zhang, Qi},
  title        = {Pre-training Language Model as a Multi-perspective Course Learner},
  journal      = {CoRR},
  volume       = {abs/2305.03981},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.03981},
  doi          = {10.48550/ARXIV.2305.03981},
  eprinttype   = {arXiv},
  eprint       = {2305.03981},
  timestamp    = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-03981.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-09148,
  author       = {Li, Ziheng and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Deng, Zhi{-}Hong and
                  Lou, Qiang and
                  Huang, Haizhen and
                  Jiao, Jian and
                  Wei, Furu and
                  Deng, Weiwei and
                  Zhang, Qi},
  title        = {Dual-Alignment Pre-training for Cross-lingual Sentence Embedding},
  journal      = {CoRR},
  volume       = {abs/2305.09148},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.09148},
  doi          = {10.48550/ARXIV.2305.09148},
  eprinttype   = {arXiv},
  eprint       = {2305.09148},
  timestamp    = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-09148.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-19602,
  author       = {Chen, Tianyu and
                  Xie, Yuan and
                  Zhang, Shuai and
                  Huang, Shaohan and
                  Zhou, Haoyi and
                  Li, Jianxin},
  title        = {Learning Music Sequence Representation from Text Supervision},
  journal      = {CoRR},
  volume       = {abs/2305.19602},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.19602},
  doi          = {10.48550/ARXIV.2305.19602},
  eprinttype   = {arXiv},
  eprint       = {2305.19602},
  timestamp    = {Fri, 19 Jul 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-19602.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-14824,
  author       = {Peng, Zhiliang and
                  Wang, Wenhui and
                  Dong, Li and
                  Hao, Yaru and
                  Huang, Shaohan and
                  Ma, Shuming and
                  Wei, Furu},
  title        = {Kosmos-2: Grounding Multimodal Large Language Models to the World},
  journal      = {CoRR},
  volume       = {abs/2306.14824},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.14824},
  doi          = {10.48550/ARXIV.2306.14824},
  eprinttype   = {arXiv},
  eprint       = {2306.14824},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-14824.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2307-02486,
  author       = {Ding, Jiayu and
                  Ma, Shuming and
                  Dong, Li and
                  Zhang, Xingxing and
                  Huang, Shaohan and
                  Wang, Wenhui and
                  Zheng, Nanning and
                  Wei, Furu},
  title        = {{LongNet:} Scaling Transformers to 1,000,000,000 Tokens},
  journal      = {CoRR},
  volume       = {abs/2307.02486},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2307.02486},
  doi          = {10.48550/ARXIV.2307.02486},
  eprinttype   = {arXiv},
  eprint       = {2307.02486},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2307-02486.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2307-08621,
  author       = {Sun, Yutao and
                  Dong, Li and
                  Huang, Shaohan and
                  Ma, Shuming and
                  Xia, Yuqing and
                  Xue, Jilong and
                  Wang, Jianyong and
                  Wei, Furu},
  title        = {Retentive Network: {A} Successor to Transformer for Large Language
                  Models},
  journal      = {CoRR},
  volume       = {abs/2307.08621},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2307.08621},
  doi          = {10.48550/ARXIV.2307.08621},
  eprinttype   = {arXiv},
  eprint       = {2307.08621},
  timestamp    = {Tue, 25 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2307-08621.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2307-16645,
  author       = {Jiang, Ting and
                  Huang, Shaohan and
                  Luan, Zhongzhi and
                  Wang, Deqing and
                  Zhuang, Fuzhen},
  title        = {Scaling Sentence Embeddings with Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2307.16645},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2307.16645},
  doi          = {10.48550/ARXIV.2307.16645},
  eprinttype   = {arXiv},
  eprint       = {2307.16645},
  timestamp    = {Wed, 02 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2307-16645.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-01189,
  author       = {Qi, Jiaxing and
                  Huang, Shaohan and
                  Luan, Zhongzhi and
                  Fung, Carol J. and
                  Yang, Hailong and
                  Qian, Depei},
  title        = {{LogGPT:} Exploring {ChatGPT} for Log-Based Anomaly Detection},
  journal      = {CoRR},
  volume       = {abs/2309.01189},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.01189},
  doi          = {10.48550/ARXIV.2309.01189},
  eprinttype   = {arXiv},
  eprint       = {2309.01189},
  timestamp    = {Mon, 11 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-01189.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-09530,
  author       = {Cheng, Daixuan and
                  Huang, Shaohan and
                  Wei, Furu},
  title        = {Adapting Large Language Models via Reading Comprehension},
  journal      = {CoRR},
  volume       = {abs/2309.09530},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.09530},
  doi          = {10.48550/ARXIV.2309.09530},
  eprinttype   = {arXiv},
  eprint       = {2309.09530},
  timestamp    = {Fri, 22 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-09530.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-11419,
  author       = {Lv, Tengchao and
                  Huang, Yupan and
                  Chen, Jingye and
                  Cui, Lei and
                  Ma, Shuming and
                  Chang, Yaoyao and
                  Huang, Shaohan and
                  Wang, Wenhui and
                  Dong, Li and
                  Luo, Weiyao and
                  Wu, Shaoxiang and
                  Wang, Guoxin and
                  Zhang, Cha and
                  Wei, Furu},
  title        = {Kosmos-2.5: {A} Multimodal Literate Model},
  journal      = {CoRR},
  volume       = {abs/2309.11419},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.11419},
  doi          = {10.48550/ARXIV.2309.11419},
  eprinttype   = {arXiv},
  eprint       = {2309.11419},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-11419.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-13308,
  author       = {Liu, Yuxuan and
                  Yang, Tianchi and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi},
  title        = {Calibrating {LLM}-Based Evaluator},
  journal      = {CoRR},
  volume       = {abs/2309.13308},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.13308},
  doi          = {10.48550/ARXIV.2309.13308},
  eprinttype   = {arXiv},
  eprint       = {2309.13308},
  timestamp    = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-13308.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-02992,
  author       = {Pan, Xichen and
                  Dong, Li and
                  Huang, Shaohan and
                  Peng, Zhiliang and
                  Chen, Wenhu and
                  Wei, Furu},
  title        = {{Kosmos-G:} Generating Images in Context with Multimodal Large Language
                  Models},
  journal      = {CoRR},
  volume       = {abs/2310.02992},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.02992},
  doi          = {10.48550/ARXIV.2310.02992},
  eprinttype   = {arXiv},
  eprint       = {2310.02992},
  timestamp    = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-02992.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-11453,
  author       = {Wang, Hongyu and
                  Ma, Shuming and
                  Dong, Li and
                  Huang, Shaohan and
                  Wang, Huaijie and
                  Ma, Lingxiao and
                  Yang, Fan and
                  Wang, Ruiping and
                  Wu, Yi and
                  Wei, Furu},
  title        = {{BitNet:} Scaling 1-bit Transformers for Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2310.11453},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.11453},
  doi          = {10.48550/ARXIV.2310.11453},
  eprinttype   = {arXiv},
  eprint       = {2310.11453},
  timestamp    = {Tue, 16 Jul 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-11453.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-13332,
  author       = {Wang, Zhaoyang and
                  Huang, Shaohan and
                  Liu, Yuxuan and
                  Wang, Jiahai and
                  Song, Minghui and
                  Zhang, Zihan and
                  Huang, Haizhen and
                  Wei, Furu and
                  Deng, Weiwei and
                  Sun, Feng and
                  Zhang, Qi},
  title        = {Democratizing Reasoning Ability: Tailored Learning from Large Language
                  Model},
  journal      = {CoRR},
  volume       = {abs/2310.13332},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.13332},
  doi          = {10.48550/ARXIV.2310.13332},
  eprinttype   = {arXiv},
  eprint       = {2310.13332},
  timestamp    = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-13332.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/complexity/SuiSHHL22,
  author       = {Sui, Xin and
                  Shi, Guifen and
                  Hou, Guanchong and
                  Huang, Shaohan and
                  Li, Yanshuang},
  title        = {Impacts of {COVID-19} on the Return and Volatility Nexus among Cryptocurrency
                  Market},
  journal      = {Complex.},
  volume       = {2022},
  pages        = {5346080:1--5346080:15},
  year         = {2022},
  url          = {https://doi.org/10.1155/2022/5346080},
  doi          = {10.1155/2022/5346080},
  timestamp    = {Mon, 26 Sep 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/complexity/SuiSHHL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tnsm/DaiLHFWYQ22,
  author       = {Dai, Shaozhi and
                  Luan, Zhongzhi and
                  Huang, Shaohan and
                  Fung, Carol J. and
                  Wang, He and
                  Yang, Hailong and
                  Qian, Depei},
  title        = {{REVAL:} Recommend Which Variables to Log With Pretrained Model and
                  Graph Neural Network},
  journal      = {{IEEE} Trans. Netw. Serv. Manag.},
  volume       = {19},
  number       = {4},
  pages        = {4045--4057},
  year         = {2022},
  url          = {https://doi.org/10.1109/TNSM.2022.3209317},
  doi          = {10.1109/TNSM.2022.3209317},
  timestamp    = {Fri, 10 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tnsm/DaiLHFWYQ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ChenBHDJJZLW22,
  author       = {Chen, Tianyu and
                  Bao, Hangbo and
                  Huang, Shaohan and
                  Dong, Li and
                  Jiao, Binxing and
                  Jiang, Daxin and
                  Zhou, Haoyi and
                  Li, Jianxin and
                  Wei, Furu},
  editor       = {Muresan, Smaranda and
                  Nakov, Preslav and
                  Villavicencio, Aline},
  title        = {{THE-X:} Privacy-Preserving Transformer Inference with Homomorphic
                  Encryption},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL} 2022,
                  Dublin, Ireland, May 22-27, 2022},
  pages        = {3510--3520},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.findings-acl.277},
  doi          = {10.18653/V1/2022.FINDINGS-ACL.277},
  timestamp    = {Thu, 06 Apr 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ChenBHDJJZLW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ChiH0MZSBSMHW22,
  author       = {Chi, Zewen and
                  Huang, Shaohan and
                  Dong, Li and
                  Ma, Shuming and
                  Zheng, Bo and
                  Singhal, Saksham and
                  Bajaj, Payal and
                  Song, Xia and
                  Mao, Xian{-}Ling and
                  Huang, Heyan and
                  Wei, Furu},
  editor       = {Muresan, Smaranda and
                  Nakov, Preslav and
                  Villavicencio, Aline},
  title        = {{XLM-E:} Cross-lingual Language Model Pre-training via {ELECTRA}},
  booktitle    = {Proceedings of the 60th Annual Meeting of the Association for Computational
                  Linguistics (Volume 1: Long Papers), {ACL} 2022, Dublin, Ireland,
                  May 22-27, 2022},
  pages        = {6170--6182},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.acl-long.427},
  doi          = {10.18653/V1/2022.ACL-LONG.427},
  timestamp    = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ChiH0MZSBSMHW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cnsm/HuangLFYL22,
  author       = {Huang, Shaohan and
                  Liu, Yi and
                  Fung, Carol J. and
                  Yang, Hailong and
                  Luan, Zhongzhi},
  editor       = {Charalambides, Marinos and
                  Papadimitriou, Panagiotis and
                  Cerroni, Walter and
                  Kanhere, Salil S. and
                  Mamatas, Lefteris},
  title        = {Black-box Attacks to Log-based Anomaly Detection},
  booktitle    = {18th International Conference on Network and Service Management, {CNSM}
                  2022, Thessaloniki, Greece, October 31 - Nov. 4, 2022},
  pages        = {310--316},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.23919/CNSM55787.2022.9964935},
  doi          = {10.23919/CNSM55787.2022.9964935},
  timestamp    = {Thu, 08 Dec 2022 15:05:27 +0100},
  biburl       = {https://dblp.org/rec/conf/cnsm/HuangLFYL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/YangHMY0ZGLW22,
  author       = {Yang, Jian and
                  Huang, Shaohan and
                  Ma, Shuming and
                  Yin, Yuwei and
                  Dong, Li and
                  Zhang, Dongdong and
                  Guo, Hongcheng and
                  Li, Zhoujun and
                  Wei, Furu},
  editor       = {Goldberg, Yoav and
                  Kozareva, Zornitsa and
                  Zhang, Yue},
  title        = {{CROP:} Zero-shot Cross-lingual Named Entity Recognition with Multilingual
                  Labeled Sequence Translation},
  booktitle    = {Findings of the Association for Computational Linguistics: {EMNLP}
                  2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022},
  pages        = {486--496},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.findings-emnlp.34},
  doi          = {10.18653/V1/2022.FINDINGS-EMNLP.34},
  timestamp    = {Tue, 07 May 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/YangHMY0ZGLW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ChengHLZ0WDZ22,
  author       = {Cheng, Daixuan and
                  Huang, Shaohan and
                  Liu, Jianfeng and
                  Zhan, Yuefeng and
                  Sun, Hao and
                  Wei, Furu and
                  Deng, Denvy and
                  Zhang, Qi},
  editor       = {Goldberg, Yoav and
                  Kozareva, Zornitsa and
                  Zhang, Yue},
  title        = {Snapshot-Guided Domain Adaptation for {ELECTRA}},
  booktitle    = {Findings of the Association for Computational Linguistics: {EMNLP}
                  2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022},
  pages        = {2226--2232},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.findings-emnlp.163},
  doi          = {10.18653/V1/2022.FINDINGS-EMNLP.163},
  timestamp    = {Fri, 23 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/ChengHLZ0WDZ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/JiangJHZWZWHDZ22,
  author       = {Jiang, Ting and
                  Jiao, Jian and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Wang, Deqing and
                  Zhuang, Fuzhen and
                  Wei, Furu and
                  Huang, Haizhen and
                  Deng, Denvy and
                  Zhang, Qi},
  editor       = {Goldberg, Yoav and
                  Kozareva, Zornitsa and
                  Zhang, Yue},
  title        = {{PromptBERT:} Improving {BERT} Sentence Embeddings with Prompts},
  booktitle    = {Proceedings of the 2022 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2022, Abu Dhabi, United Arab Emirates,
                  December 7-11, 2022},
  pages        = {8826--8837},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.emnlp-main.603},
  doi          = {10.18653/V1/2022.EMNLP-MAIN.603},
  timestamp    = {Tue, 16 Jul 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/JiangJHZWZWHDZ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ChenXZHZL22,
  author       = {Chen, Tianyu and
                  Xie, Yuan and
                  Zhang, Shuai and
                  Huang, Shaohan and
                  Zhou, Haoyi and
                  Li, Jianxin},
  title        = {Learning Music Sequence Representation From Text Supervision},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2022, Virtual and Singapore, 23-27 May 2022},
  pages        = {4583--4587},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/ICASSP43922.2022.9746131},
  doi          = {10.1109/ICASSP43922.2022.9746131},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ChenXZHZL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/Chi0HDMPSBSMHW22,
  author       = {Chi, Zewen and
                  Dong, Li and
                  Huang, Shaohan and
                  Dai, Damai and
                  Ma, Shuming and
                  Patra, Barun and
                  Singhal, Saksham and
                  Bajaj, Payal and
                  Song, Xia and
                  Mao, Xian{-}Ling and
                  Huang, Heyan and
                  Wei, Furu},
  editor       = {Koyejo, Sanmi and
                  Mohamed, Shakir and
                  Agarwal, Alekh and
                  Belgrave, Danielle and
                  Cho, Kyunghyun and
                  Oh, Alice},
  title        = {On the Representation Collapse of Sparse Mixture of Experts},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, {NeurIPS} 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/df4f371f1f89ec8ba5014b3310578048-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/Chi0HDMPSBSMHW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nlpcc/YaoHDWCZ22,
  author       = {Yao, Yunzhi and
                  Huang, Shaohan and
                  Dong, Li and
                  Wei, Furu and
                  Chen, Huajun and
                  Zhang, Ningyu},
  editor       = {Lu, Wei and
                  Huang, Shujian and
                  Hong, Yu and
                  Zhou, Xiabing},
  title        = {Kformer: Knowledge Injection in Transformer Feed-Forward Layers},
  booktitle    = {Natural Language Processing and Chinese Computing - 11th {CCF} International
                  Conference, {NLPCC} 2022, Guilin, China, September 24-25, 2022, Proceedings,
                  Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {13551},
  pages        = {131--143},
  publisher    = {Springer},
  year         = {2022},
  url          = {https://doi.org/10.1007/978-3-031-17120-8\_11},
  doi          = {10.1007/978-3-031-17120-8\_11},
  timestamp    = {Tue, 27 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nlpcc/YaoHDWCZ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/noms/QiLHWFYQ22,
  author       = {Qi, Jiaxing and
                  Luan, Zhongzhi and
                  Huang, Shaohan and
                  Wang, Yukun and
                  Fung, Carol J. and
                  Yang, Hailong and
                  Qian, Depei},
  title        = {Adanomaly: Adaptive Anomaly Detection for System Logs with Adversarial
                  Learning},
  booktitle    = {2022 {IEEE/IFIP} Network Operations and Management Symposium, {NOMS}
                  2022, Budapest, Hungary, April 25-29, 2022},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/NOMS54207.2022.9789917},
  doi          = {10.1109/NOMS54207.2022.9789917},
  timestamp    = {Wed, 15 Jun 2022 16:45:18 +0200},
  biburl       = {https://dblp.org/rec/conf/noms/QiLHWFYQ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2201-04337,
  author       = {Jiang, Ting and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Wang, Deqing and
                  Zhuang, Fuzhen and
                  Wei, Furu and
                  Huang, Haizhen and
                  Zhang, Liangjie and
                  Zhang, Qi},
  title        = {{PromptBERT}: Improving {BERT} Sentence Embeddings with Prompts},
  journal      = {CoRR},
  volume       = {abs/2201.04337},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.04337},
  eprinttype   = {arXiv},
  eprint       = {2201.04337},
  timestamp    = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-04337.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2201-05742,
  author       = {Yao, Yunzhi and
                  Huang, Shaohan and
                  Zhang, Ningyu and
                  Dong, Li and
                  Wei, Furu and
                  Chen, Huajun},
  title        = {Kformer: Knowledge Injection in Transformer Feed-Forward Layers},
  journal      = {CoRR},
  volume       = {abs/2201.05742},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.05742},
  eprinttype   = {arXiv},
  eprint       = {2201.05742},
  timestamp    = {Tue, 27 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-05742.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2203-00555,
  author       = {Wang, Hongyu and
                  Ma, Shuming and
                  Dong, Li and
                  Huang, Shaohan and
                  Zhang, Dongdong and
                  Wei, Furu},
  title        = {{DeepNet}: Scaling Transformers to 1,000 Layers},
  journal      = {CoRR},
  volume       = {abs/2203.00555},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.00555},
  doi          = {10.48550/ARXIV.2203.00555},
  eprinttype   = {arXiv},
  eprint       = {2203.00555},
  timestamp    = {Tue, 20 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-00555.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2204-09179,
  author       = {Chi, Zewen and
                  Dong, Li and
                  Huang, Shaohan and
                  Dai, Damai and
                  Ma, Shuming and
                  Patra, Barun and
                  Singhal, Saksham and
                  Bajaj, Payal and
                  Song, Xia and
                  Wei, Furu},
  title        = {On the Representation Collapse of Sparse Mixture of Experts},
  journal      = {CoRR},
  volume       = {abs/2204.09179},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2204.09179},
  doi          = {10.48550/ARXIV.2204.09179},
  eprinttype   = {arXiv},
  eprint       = {2204.09179},
  timestamp    = {Mon, 25 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2204-09179.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2206-00216,
  author       = {Chen, Tianyu and
                  Bao, Hangbo and
                  Huang, Shaohan and
                  Dong, Li and
                  Jiao, Binxing and
                  Jiang, Daxin and
                  Zhou, Haoyi and
                  Li, Jianxin and
                  Wei, Furu},
  title        = {{THE-X:} Privacy-Preserving Transformer Inference with Homomorphic
                  Encryption},
  journal      = {CoRR},
  volume       = {abs/2206.00216},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.00216},
  doi          = {10.48550/ARXIV.2206.00216},
  eprinttype   = {arXiv},
  eprint       = {2206.00216},
  timestamp    = {Mon, 01 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-00216.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2206-00277,
  author       = {Chen, Tianyu and
                  Huang, Shaohan and
                  Xie, Yuan and
                  Jiao, Binxing and
                  Jiang, Daxin and
                  Zhou, Haoyi and
                  Li, Jianxin and
                  Wei, Furu},
  title        = {Task-Specific Expert Pruning for Sparse Mixture-of-Experts},
  journal      = {CoRR},
  volume       = {abs/2206.00277},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.00277},
  doi          = {10.48550/ARXIV.2206.00277},
  eprinttype   = {arXiv},
  eprint       = {2206.00277},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-00277.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2206-06336,
  author       = {Hao, Yaru and
                  Song, Haoyu and
                  Dong, Li and
                  Huang, Shaohan and
                  Chi, Zewen and
                  Wang, Wenhui and
                  Ma, Shuming and
                  Wei, Furu},
  title        = {Language Models are General-Purpose Interfaces},
  journal      = {CoRR},
  volume       = {abs/2206.06336},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.06336},
  doi          = {10.48550/ARXIV.2206.06336},
  eprinttype   = {arXiv},
  eprint       = {2206.06336},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-06336.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2207-09094,
  author       = {Xie, Yuan and
                  Huang, Shaohan and
                  Chen, Tianyu and
                  Wei, Furu},
  title        = {{MoEC}: Mixture of Expert Clusters},
  journal      = {CoRR},
  volume       = {abs/2207.09094},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2207.09094},
  doi          = {10.48550/ARXIV.2207.09094},
  eprinttype   = {arXiv},
  eprint       = {2207.09094},
  timestamp    = {Mon, 25 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2207-09094.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2210-06423,
  author       = {Wang, Hongyu and
                  Ma, Shuming and
                  Huang, Shaohan and
                  Dong, Li and
                  Wang, Wenhui and
                  Peng, Zhiliang and
                  Wu, Yu and
                  Bajaj, Payal and
                  Singhal, Saksham and
                  Benhaim, Alon and
                  Patra, Barun and
                  Liu, Zhun and
                  Chaudhary, Vishrav and
                  Song, Xia and
                  Wei, Furu},
  title        = {Foundation Transformers},
  journal      = {CoRR},
  volume       = {abs/2210.06423},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.06423},
  doi          = {10.48550/ARXIV.2210.06423},
  eprinttype   = {arXiv},
  eprint       = {2210.06423},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-06423.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2210-07022,
  author       = {Yang, Jian and
                  Huang, Shaohan and
                  Ma, Shuming and
                  Yin, Yuwei and
                  Dong, Li and
                  Zhang, Dongdong and
                  Guo, Hongcheng and
                  Li, Zhoujun and
                  Wei, Furu},
  title        = {{CROP:} Zero-shot Cross-lingual Named Entity Recognition with Multilingual
                  Labeled Sequence Translation},
  journal      = {CoRR},
  volume       = {abs/2210.07022},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.07022},
  doi          = {10.48550/ARXIV.2210.07022},
  eprinttype   = {arXiv},
  eprint       = {2210.07022},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-07022.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2210-14867,
  author       = {Patra, Barun and
                  Singhal, Saksham and
                  Huang, Shaohan and
                  Chi, Zewen and
                  Dong, Li and
                  Wei, Furu and
                  Chaudhary, Vishrav and
                  Song, Xia},
  title        = {Beyond {English}-Centric Bitexts for Better Multilingual Language Representation
                  Learning},
  journal      = {CoRR},
  volume       = {abs/2210.14867},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.14867},
  doi          = {10.48550/ARXIV.2210.14867},
  eprinttype   = {arXiv},
  eprint       = {2210.14867},
  timestamp    = {Wed, 02 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-14867.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2211-13184,
  author       = {Ma, Shuming and
                  Wang, Hongyu and
                  Huang, Shaohan and
                  Wang, Wenhui and
                  Chi, Zewen and
                  Dong, Li and
                  Benhaim, Alon and
                  Patra, Barun and
                  Chaudhary, Vishrav and
                  Song, Xia and
                  Wei, Furu},
  title        = {{TorchScale}: Transformers at Scale},
  journal      = {CoRR},
  volume       = {abs/2211.13184},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.13184},
  doi          = {10.48550/ARXIV.2211.13184},
  eprinttype   = {arXiv},
  eprint       = {2211.13184},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-13184.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2212-10218,
  author       = {Yang, Jian and
                  Ma, Shuming and
                  Dong, Li and
                  Huang, Shaohan and
                  Huang, Haoyang and
                  Yin, Yuwei and
                  Zhang, Dongdong and
                  Yang, Liqun and
                  Li, Zhoujun and
                  Wei, Furu},
  title        = {{GanLM}: Encoder-Decoder Pre-training with an Auxiliary Discriminator},
  journal      = {CoRR},
  volume       = {abs/2212.10218},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2212.10218},
  doi          = {10.48550/ARXIV.2212.10218},
  eprinttype   = {arXiv},
  eprint       = {2212.10218},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-10218.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2212-10554,
  author       = {Sun, Yutao and
                  Dong, Li and
                  Patra, Barun and
                  Ma, Shuming and
                  Huang, Shaohan and
                  Benhaim, Alon and
                  Chaudhary, Vishrav and
                  Song, Xia and
                  Wei, Furu},
  title        = {A Length-Extrapolatable Transformer},
  journal      = {CoRR},
  volume       = {abs/2212.10554},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2212.10554},
  doi          = {10.48550/ARXIV.2212.10554},
  eprinttype   = {arXiv},
  eprint       = {2212.10554},
  timestamp    = {Wed, 04 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-10554.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/YaoHWDW21,
  author       = {Yao, Yunzhi and
                  Huang, Shaohan and
                  Wang, Wenhui and
                  Dong, Li and
                  Wei, Furu},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {Adapt-and-Distill: Developing Small, Fast and Effective Pretrained
                  Language Models for Domains},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL/IJCNLP}
                  2021, Online Event, August 1-6, 2021},
  series       = {Findings of {ACL}},
  volume       = {{ACL/IJCNLP} 2021},
  pages        = {460--470},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.findings-acl.40},
  doi          = {10.18653/V1/2021.FINDINGS-ACL.40},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/YaoHWDW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/WangBHDW21,
  author       = {Wang, Wenhui and
                  Bao, Hangbo and
                  Huang, Shaohan and
                  Dong, Li and
                  Wei, Furu},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {{MiniLMv2}: Multi-Head Self-Attention Relation Distillation for Compressing
                  Pretrained Transformers},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL/IJCNLP}
                  2021, Online Event, August 1-6, 2021},
  series       = {Findings of {ACL}},
  volume       = {{ACL/IJCNLP} 2021},
  pages        = {2140--2151},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.findings-acl.188},
  doi          = {10.18653/V1/2021.FINDINGS-ACL.188},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/WangBHDW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/Zheng0HWCSC0SW20,
  author       = {Zheng, Bo and
                  Dong, Li and
                  Huang, Shaohan and
                  Wang, Wenhui and
                  Chi, Zewen and
                  Singhal, Saksham and
                  Che, Wanxiang and
                  Liu, Ting and
                  Song, Xia and
                  Wei, Furu},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {Consistency Regularization for Cross-Lingual Fine-Tuning},
  booktitle    = {Proceedings of the 59th Annual Meeting of the Association for Computational
                  Linguistics and the 11th International Joint Conference on Natural
                  Language Processing, {ACL/IJCNLP} 2021, (Volume 1: Long Papers), Virtual
                  Event, August 1-6, 2021},
  pages        = {3403--3417},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.acl-long.264},
  doi          = {10.18653/V1/2021.ACL-LONG.264},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/Zheng0HWCSC0SW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/Chi0ZHMHW20,
  author       = {Chi, Zewen and
                  Dong, Li and
                  Zheng, Bo and
                  Huang, Shaohan and
                  Mao, Xian{-}Ling and
                  Huang, Heyan and
                  Wei, Furu},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {Improving Pretrained Cross-Lingual Language Models via Self-Labeled
                  Word Alignment},
  booktitle    = {Proceedings of the 59th Annual Meeting of the Association for Computational
                  Linguistics and the 11th International Joint Conference on Natural
                  Language Processing, {ACL/IJCNLP} 2021, (Volume 1: Long Papers), Virtual
                  Event, August 1-6, 2021},
  pages        = {3418--3430},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.acl-long.265},
  doi          = {10.18653/V1/2021.ACL-LONG.265},
  timestamp    = {Thu, 08 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/Chi0ZHMHW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ccgrid/GaoYHDLLLQ21,
  author       = {Gao, Ruiyuan and
                  Yang, Hailong and
                  Huang, Shaohan and
                  Dun, Ming and
                  Li, Mingzhen and
                  Luan, Zerong and
                  Luan, Zhongzhi and
                  Qian, Depei},
  editor       = {Lef{\`{e}}vre, Laurent and
                  Patterson, Stacy and
                  Lee, Young Choon and
                  Shen, Haiying and
                  Ilager, Shashikant and
                  Goudarzi, Mohammad and
                  Toosi, Adel Nadjaran and
                  Buyya, Rajkumar},
  title        = {{PriPro}: Towards Effective Privacy Protection on Edge-Cloud System
                  running {DNN} Inference},
  booktitle    = {21st {IEEE/ACM} International Symposium on Cluster, Cloud and Internet
                  Computing, {CCGrid} 2021, Melbourne, Australia, May 10-13, 2021},
  pages        = {334--343},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/CCGrid51090.2021.00043},
  doi          = {10.1109/CCGRID51090.2021.00043},
  timestamp    = {Thu, 02 Sep 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ccgrid/GaoYHDLLLQ21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ChiDMHSMHSW21,
  author       = {Chi, Zewen and
                  Dong, Li and
                  Ma, Shuming and
                  Huang, Shaohan and
                  Singhal, Saksham and
                  Mao, Xian{-}Ling and
                  Huang, Heyan and
                  Song, Xia and
                  Wei, Furu},
  editor       = {Moens, Marie{-}Francine and
                  Huang, Xuanjing and
                  Specia, Lucia and
                  Yih, Scott Wen{-}tau},
  title        = {{mT6}: Multilingual Pretrained Text-to-Text Transformer with Translation
                  Pairs},
  booktitle    = {Proceedings of the 2021 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2021, Virtual Event / Punta Cana, Dominican
                  Republic, 7-11 November, 2021},
  pages        = {1671--1683},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.emnlp-main.125},
  doi          = {10.18653/V1/2021.EMNLP-MAIN.125},
  timestamp    = {Fri, 16 Feb 2024 08:27:36 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/ChiDMHSMHSW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ZhengDHSCLSW21,
  author       = {Zheng, Bo and
                  Dong, Li and
                  Huang, Shaohan and
                  Singhal, Saksham and
                  Che, Wanxiang and
                  Liu, Ting and
                  Song, Xia and
                  Wei, Furu},
  editor       = {Moens, Marie{-}Francine and
                  Huang, Xuanjing and
                  Specia, Lucia and
                  Yih, Scott Wen{-}tau},
  title        = {Allocating Large Vocabulary Capacity for Cross-Lingual Language Model
                  Pre-Training},
  booktitle    = {Proceedings of the 2021 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2021, Virtual Event / Punta Cana, Dominican
                  Republic, 7-11 November, 2021},
  pages        = {3203--3215},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.emnlp-main.257},
  doi          = {10.18653/V1/2021.EMNLP-MAIN.257},
  timestamp    = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/ZhengDHSCLSW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/wmt/YangMH00HMSHSW21,
  author       = {Yang, Jian and
                  Ma, Shuming and
                  Huang, Haoyang and
                  Zhang, Dongdong and
                  Dong, Li and
                  Huang, Shaohan and
                  Muzio, Alexandre and
                  Singhal, Saksham and
                  Hassan, Hany and
                  Song, Xia and
                  Wei, Furu},
  editor       = {Barrault, Lo{\"{\i}}c and
                  Bojar, Ondrej and
                  Bougares, Fethi and
                  Chatterjee, Rajen and
                  Costa{-}juss{\`{a}}, Marta R. and
                  Federmann, Christian and
                  Fishel, Mark and
                  Fraser, Alexander and
                  Freitag, Markus and
                  Graham, Yvette and
                  Grundkiewicz, Roman and
                  Guzman, Paco and
                  Haddow, Barry and
                  Huck, Matthias and
                  Jimeno{-}Yepes, Antonio and
                  Koehn, Philipp and
                  Kocmi, Tom and
                  Martins, Andr{\'{e}} and
                  Morishita, Makoto and
                  Monz, Christof},
  title        = {Multilingual Machine Translation Systems from {Microsoft} for {WMT21}
                  Shared Task},
  booktitle    = {Proceedings of the Sixth Conference on Machine Translation, {WMT@EMNLP}
                  2021, Online Event, November 10-11, 2021},
  pages        = {446--455},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://aclanthology.org/2021.wmt-1.54},
  timestamp    = {Wed, 07 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/wmt/YangMH00HMSHSW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2104-08692,
  author       = {Chi, Zewen and
                  Dong, Li and
                  Ma, Shuming and
                  Huang, Shaohan and
                  Mao, Xian{-}Ling and
                  Huang, Heyan and
                  Wei, Furu},
  title        = {{mT6}: Multilingual Pretrained Text-to-Text Transformer with Translation
                  Pairs},
  journal      = {CoRR},
  volume       = {abs/2104.08692},
  year         = {2021},
  url          = {https://arxiv.org/abs/2104.08692},
  eprinttype   = {arXiv},
  eprint       = {2104.08692},
  timestamp    = {Mon, 26 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2104-08692.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-06381,
  author       = {Chi, Zewen and
                  Dong, Li and
                  Zheng, Bo and
                  Huang, Shaohan and
                  Mao, Xian{-}Ling and
                  Huang, Heyan and
                  Wei, Furu},
  title        = {Improving Pretrained Cross-Lingual Language Models via Self-Labeled
                  Word Alignment},
  journal      = {CoRR},
  volume       = {abs/2106.06381},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.06381},
  eprinttype   = {arXiv},
  eprint       = {2106.06381},
  timestamp    = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-06381.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-08226,
  author       = {Zheng, Bo and
                  Dong, Li and
                  Huang, Shaohan and
                  Wang, Wenhui and
                  Chi, Zewen and
                  Singhal, Saksham and
                  Che, Wanxiang and
                  Liu, Ting and
                  Song, Xia and
                  Wei, Furu},
  title        = {Consistency Regularization for Cross-Lingual Fine-Tuning},
  journal      = {CoRR},
  volume       = {abs/2106.08226},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.08226},
  eprinttype   = {arXiv},
  eprint       = {2106.08226},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-08226.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-13474,
  author       = {Yao, Yunzhi and
                  Huang, Shaohan and
                  Wang, Wenhui and
                  Dong, Li and
                  Wei, Furu},
  title        = {Adapt-and-Distill: Developing Small, Fast and Effective Pretrained
                  Language Models for Domains},
  journal      = {CoRR},
  volume       = {abs/2106.13474},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.13474},
  eprinttype   = {arXiv},
  eprint       = {2106.13474},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-13474.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-13736,
  author       = {Ma, Shuming and
                  Dong, Li and
                  Huang, Shaohan and
                  Zhang, Dongdong and
                  Muzio, Alexandre and
                  Singhal, Saksham and
                  Awadalla, Hany Hassan and
                  Song, Xia and
                  Wei, Furu},
  title        = {{DeltaLM}: Encoder-Decoder Pre-training for Language Generation and
                  Translation by Augmenting Pretrained Multilingual Encoders},
  journal      = {CoRR},
  volume       = {abs/2106.13736},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.13736},
  eprinttype   = {arXiv},
  eprint       = {2106.13736},
  timestamp    = {Wed, 30 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-13736.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-16138,
  author       = {Chi, Zewen and
                  Huang, Shaohan and
                  Dong, Li and
                  Ma, Shuming and
                  Singhal, Saksham and
                  Bajaj, Payal and
                  Song, Xia and
                  Wei, Furu},
  title        = {{XLM-E:} Cross-lingual Language Model Pre-training via {ELECTRA}},
  journal      = {CoRR},
  volume       = {abs/2106.16138},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.16138},
  eprinttype   = {arXiv},
  eprint       = {2106.16138},
  timestamp    = {Mon, 05 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-16138.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2109.07306).
@article{DBLP:journals/corr/abs-2109-07306,
  author       = {Zheng, Bo and
                  Dong, Li and
                  Huang, Shaohan and
                  Singhal, Saksham and
                  Che, Wanxiang and
                  Liu, Ting and
                  Song, Xia and
                  Wei, Furu},
  title        = {Allocating Large Vocabulary Capacity for
                  Cross-lingual Language Model Pre-training},
  journal      = {CoRR},
  volume       = {abs/2109.07306},
  year         = {2021},
  url          = {https://arxiv.org/abs/2109.07306},
  eprinttype   = {arXiv},
  eprint       = {2109.07306},
  timestamp    = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-07306.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2110.11115).
@article{DBLP:journals/corr/abs-2110-11115,
  author       = {Jiang, Ting and
                  Huang, Shaohan and
                  Zhang, Zihan and
                  Wang, Deqing and
                  Zhuang, Fuzhen and
                  Wei, Furu and
                  Huang, Haizhen and
                  Zhang, Liangjie and
                  Zhang, Qi},
  title        = {Improving Non-autoregressive Generation with Mixup Training},
  journal      = {CoRR},
  volume       = {abs/2110.11115},
  year         = {2021},
  url          = {https://arxiv.org/abs/2110.11115},
  eprinttype   = {arXiv},
  eprint       = {2110.11115},
  timestamp    = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-11115.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2111.02086). The company name in the title is braced
% so that sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-2111-02086,
  author       = {Yang, Jian and
                  Ma, Shuming and
                  Huang, Haoyang and
                  Zhang, Dongdong and
                  Dong, Li and
                  Huang, Shaohan and
                  Muzio, Alexandre and
                  Singhal, Saksham and
                  Awadalla, Hany Hassan and
                  Song, Xia and
                  Wei, Furu},
  title        = {Multilingual Machine Translation Systems from {Microsoft} for {WMT21}
                  Shared Task},
  journal      = {CoRR},
  volume       = {abs/2111.02086},
  year         = {2021},
  url          = {https://arxiv.org/abs/2111.02086},
  eprinttype   = {arXiv},
  eprint       = {2111.02086},
  timestamp    = {Wed, 07 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2111-02086.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, IEEE/ACM TASLP volume 28 (2020).
@article{DBLP:journals/taslp/ZhouYWHZZ20,
  author       = {Zhou, Qingyu and
                  Yang, Nan and
                  Wei, Furu and
                  Huang, Shaohan and
                  Zhou, Ming and
                  Zhao, Tiejun},
  title        = {A Joint Sentence Scoring and Selection Framework for
                  Neural Extractive Document Summarization},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {28},
  pages        = {671--681},
  year         = {2020},
  url          = {https://doi.org/10.1109/TASLP.2020.2964427},
  doi          = {10.1109/TASLP.2020.2964427},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/ZhouYWHZZ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, IEEE TNSM 17(4), 2020. The system name in the title is braced
% so that sentence-casing styles keep its capitalisation.
@article{DBLP:journals/tnsm/HuangLFHZYL20,
  author       = {Huang, Shaohan and
                  Liu, Yi and
                  Fung, Carol J. and
                  He, Rong and
                  Zhao, Yining and
                  Yang, Hailong and
                  Luan, Zhongzhi},
  title        = {{HitAnomaly}: Hierarchical Transformers for Anomaly Detection in System
                  Log},
  journal      = {{IEEE} Trans. Netw. Serv. Manag.},
  volume       = {17},
  number       = {4},
  pages        = {2064--2076},
  year         = {2020},
  url          = {https://doi.org/10.1109/TNSM.2020.3034647},
  doi          = {10.1109/TNSM.2020.3034647},
  timestamp    = {Wed, 15 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tnsm/HuangLFHZYL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, CNSM 2020.
@inproceedings{DBLP:conf/cnsm/HuangLFHZYL20,
  author       = {Huang, Shaohan and
                  Liu, Yi and
                  Fung, Carol J. and
                  He, Rong and
                  Zhao, Yining and
                  Yang, Hailong and
                  Luan, Zhongzhi},
  editor       = {Zincir{-}Heywood, Nur and
                  Ulema, Mehmet and
                  Sayit, M{\"{u}}ge and
                  Clayman, Stuart and
                  Kim, Myung{-}Sup and
                  Cetinkaya, Cihat},
  title        = {Transfer Log-based Anomaly Detection with Pseudo Labels},
  booktitle    = {16th International Conference on Network and Service Management,
                  {CNSM} 2020, Izmir, Turkey, November 2-6, 2020},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.23919/CNSM50824.2020.9269069},
  doi          = {10.23919/CNSM50824.2020.9269069},
  timestamp    = {Fri, 08 Dec 2023 07:53:07 +0100},
  biburl       = {https://dblp.org/rec/conf/cnsm/HuangLFHZYL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, COLING 2020. The dataset name in the title is braced
% so that sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/coling/LiXCHWLZ20,
  author       = {Li, Minghao and
                  Xu, Yiheng and
                  Cui, Lei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Li, Zhoujun and
                  Zhou, Ming},
  editor       = {Scott, Donia and
                  Bel, N{\'{u}}ria and
                  Zong, Chengqing},
  title        = {{DocBank}: {A} Benchmark Dataset for Document Layout Analysis},
  booktitle    = {Proceedings of the 28th International Conference on Computational
                  Linguistics, {COLING} 2020, Barcelona, Spain (Online), December 8-13,
                  2020},
  pages        = {949--960},
  publisher    = {International Committee on Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.coling-main.82},
  doi          = {10.18653/V1/2020.COLING-MAIN.82},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/coling/LiXCHWLZ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, COLING 2020.
@inproceedings{DBLP:conf/coling/HuangWCZZ20,
  author       = {Huang, Shaohan and
                  Wei, Furu and
                  Cui, Lei and
                  Zhang, Xingxing and
                  Zhou, Ming},
  editor       = {Scott, Donia and
                  Bel, N{\'{u}}ria and
                  Zong, Chengqing},
  title        = {Unsupervised Fine-tuning for Text Clustering},
  booktitle    = {Proceedings of the 28th International Conference on
                  Computational Linguistics, {COLING} 2020, Barcelona,
                  Spain (Online), December 8-13, 2020},
  pages        = {5530--5534},
  publisher    = {International Committee on Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.coling-main.482},
  doi          = {10.18653/V1/2020.COLING-MAIN.482},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/coling/HuangWCZZ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, EMNLP 2020.
@inproceedings{DBLP:conf/emnlp/JiKHWZH20,
  author       = {Ji, Haozhe and
                  Ke, Pei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Zhu, Xiaoyan and
                  Huang, Minlie},
  editor       = {Webber, Bonnie and
                  Cohn, Trevor and
                  He, Yulan and
                  Liu, Yang},
  title        = {Language Generation with Multi-Hop Reasoning on
                  Commonsense Knowledge Graph},
  booktitle    = {Proceedings of the 2020 Conference on Empirical Methods in
                  Natural Language Processing, {EMNLP} 2020, Online,
                  November 16-20, 2020},
  pages        = {725--736},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.emnlp-main.54},
  doi          = {10.18653/V1/2020.EMNLP-MAIN.54},
  timestamp    = {Tue, 20 Aug 2024 07:54:43 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/JiKHWZH20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ICOIN 2020.
@inproceedings{DBLP:conf/icoin/HuangLFAHZYL20,
  author       = {Huang, Shaohan and
                  Liu, Yi and
                  Fung, Carol J. and
                  An, Wanhe and
                  He, Rong and
                  Zhao, Yining and
                  Yang, Hailong and
                  Luan, Zhongzhi},
  title        = {A Gated Few-shot Learning Model For Anomaly Detection},
  booktitle    = {2020 International Conference on Information Networking,
                  {ICOIN} 2020, Barcelona, Spain, January 7-10, 2020},
  pages        = {505--509},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ICOIN48656.2020.9016599},
  doi          = {10.1109/ICOIN48656.2020.9016599},
  timestamp    = {Thu, 13 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icoin/HuangLFAHZYL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AACL/IJCNLP 2020. The record carries no doi field, only an ACL Anthology URL.
@inproceedings{DBLP:conf/ijcnlp/JiKHWH20,
  author       = {Ji, Haozhe and
                  Ke, Pei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Huang, Minlie},
  editor       = {Wong, Kam{-}Fai and
                  Knight, Kevin and
                  Wu, Hua},
  title        = {Generating Commonsense Explanation by Extracting
                  Bridge Concepts from Reasoning Paths},
  booktitle    = {Proceedings of the 1st Conference of the Asia-Pacific Chapter of
                  the Association for Computational Linguistics and the 10th
                  International Joint Conference on Natural Language Processing,
                  {AACL/IJCNLP} 2020, Suzhou, China, December 4-7, 2020},
  pages        = {248--257},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://aclanthology.org/2020.aacl-main.28/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcnlp/JiKHWH20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, KDD 2020. The model name in the title is braced
% so that sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/kdd/XuL0HW020,
  author       = {Xu, Yiheng and
                  Li, Minghao and
                  Cui, Lei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Zhou, Ming},
  editor       = {Gupta, Rajesh and
                  Liu, Yan and
                  Tang, Jiliang and
                  Prakash, B. Aditya},
  title        = {{LayoutLM}: Pre-training of Text and Layout for Document Image Understanding},
  booktitle    = {{KDD} '20: The 26th {ACM} {SIGKDD} Conference on Knowledge Discovery
                  and Data Mining, Virtual Event, CA, USA, August 23-27, 2020},
  pages        = {1192--1200},
  publisher    = {{ACM}},
  year         = {2020},
  url          = {https://doi.org/10.1145/3394486.3403172},
  doi          = {10.1145/3394486.3403172},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/kdd/XuL0HW020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, LREC 2020. The dataset name in the title is braced
% so that sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/lrec/LiCHWZL20,
  author       = {Li, Minghao and
                  Cui, Lei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Zhou, Ming and
                  Li, Zhoujun},
  editor       = {Calzolari, Nicoletta and
                  B{\'{e}}chet, Fr{\'{e}}d{\'{e}}ric and
                  Blache, Philippe and
                  Choukri, Khalid and
                  Cieri, Christopher and
                  Declerck, Thierry and
                  Goggi, Sara and
                  Isahara, Hitoshi and
                  Maegaard, Bente and
                  Mariani, Joseph and
                  Mazo, H{\'{e}}l{\`{e}}ne and
                  Moreno, Asunci{\'{o}}n and
                  Odijk, Jan and
                  Piperidis, Stelios},
  title        = {{TableBank}: Table Benchmark for Image-based Table Detection and Recognition},
  booktitle    = {Proceedings of The 12th Language Resources and Evaluation Conference,
                  {LREC} 2020, Marseille, France, May 11-16, 2020},
  pages        = {1918--1925},
  publisher    = {European Language Resources Association},
  year         = {2020},
  url          = {https://aclanthology.org/2020.lrec-1.236/},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/lrec/LiCHWZL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, NOMS 2020.
@inproceedings{DBLP:conf/noms/HuangLFHZYL20,
  author       = {Huang, Shaohan and
                  Liu, Yi and
                  Fung, Carol J. and
                  He, Rong and
                  Zhao, Yining and
                  Yang, Hailong and
                  Luan, Zhongzhi},
  title        = {Paddy: An Event Log Parsing Approach using Dynamic Dictionary},
  booktitle    = {{NOMS} 2020 - {IEEE/IFIP} Network Operations and Management
                  Symposium, Budapest, Hungary, April 20-24, 2020},
  pages        = {1--8},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/NOMS47738.2020.9110435},
  doi          = {10.1109/NOMS47738.2020.9110435},
  timestamp    = {Wed, 15 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/noms/HuangLFHZYL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2006.01038); same title and authors as
% DBLP:conf/coling/LiXCHWLZ20. The dataset name in the title is braced
% so that sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2006-01038,
  author       = {Li, Minghao and
                  Xu, Yiheng and
                  Cui, Lei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Li, Zhoujun and
                  Zhou, Ming},
  title        = {{DocBank}: {A} Benchmark Dataset for Document Layout Analysis},
  journal      = {CoRR},
  volume       = {abs/2006.01038},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.01038},
  eprinttype   = {arXiv},
  eprint       = {2006.01038},
  timestamp    = {Thu, 16 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-01038.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2009.11692); same title and authors as
% DBLP:conf/emnlp/JiKHWZH20.
@article{DBLP:journals/corr/abs-2009-11692,
  author       = {Ji, Haozhe and
                  Ke, Pei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Zhu, Xiaoyan and
                  Huang, Minlie},
  title        = {Language Generation with Multi-Hop Reasoning on
                  Commonsense Knowledge Graph},
  journal      = {CoRR},
  volume       = {abs/2009.11692},
  year         = {2020},
  url          = {https://arxiv.org/abs/2009.11692},
  eprinttype   = {arXiv},
  eprint       = {2009.11692},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2009-11692.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2009.11753); same title and authors as
% DBLP:conf/ijcnlp/JiKHWH20.
@article{DBLP:journals/corr/abs-2009-11753,
  author       = {Ji, Haozhe and
                  Ke, Pei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Huang, Minlie},
  title        = {Generating Commonsense Explanation by Extracting
                  Bridge Concepts from Reasoning Paths},
  journal      = {CoRR},
  volume       = {abs/2009.11753},
  year         = {2020},
  url          = {https://arxiv.org/abs/2009.11753},
  eprinttype   = {arXiv},
  eprint       = {2009.11753},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2009-11753.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2012.15828). The model name in the title is braced
% so that sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2012-15828,
  author       = {Wang, Wenhui and
                  Bao, Hangbo and
                  Huang, Shaohan and
                  Dong, Li and
                  Wei, Furu},
  title        = {{MiniLMv2}: Multi-Head Self-Attention Relation Distillation for Compressing
                  Pretrained Transformers},
  journal      = {CoRR},
  volume       = {abs/2012.15828},
  year         = {2020},
  url          = {https://arxiv.org/abs/2012.15828},
  eprinttype   = {arXiv},
  eprint       = {2012.15828},
  timestamp    = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2012-15828.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAAI 2019.
@inproceedings{DBLP:conf/aaai/Huang0WL19,
  author       = {Huang, Shaohan and
                  Wu, Yu and
                  Wei, Furu and
                  Luan, Zhongzhi},
  title        = {Dictionary-Guided Editing Networks for Paraphrase Generation},
  booktitle    = {The Thirty-Third {AAAI} Conference on Artificial Intelligence,
                  {AAAI} 2019, The Thirty-First Innovative Applications of
                  Artificial Intelligence Conference, {IAAI} 2019, The Ninth
                  {AAAI} Symposium on Educational Advances in Artificial
                  Intelligence, {EAAI} 2019, Honolulu, Hawaii, USA,
                  January 27 - February 1, 2019},
  pages        = {6546--6553},
  publisher    = {{AAAI} Press},
  year         = {2019},
  url          = {https://doi.org/10.1609/aaai.v33i01.33016546},
  doi          = {10.1609/AAAI.V33I01.33016546},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/Huang0WL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAAI 2019.
@inproceedings{DBLP:conf/aaai/0006WHWL019,
  author       = {Wu, Yu and
                  Wei, Furu and
                  Huang, Shaohan and
                  Wang, Yunli and
                  Li, Zhoujun and
                  Zhou, Ming},
  title        = {Response Generation by Context-Aware Prototype Editing},
  booktitle    = {The Thirty-Third {AAAI} Conference on Artificial Intelligence,
                  {AAAI} 2019, The Thirty-First Innovative Applications of
                  Artificial Intelligence Conference, {IAAI} 2019, The Ninth
                  {AAAI} Symposium on Educational Advances in Artificial
                  Intelligence, {EAAI} 2019, Honolulu, Hawaii, USA,
                  January 27 - February 1, 2019},
  pages        = {7281--7288},
  publisher    = {{AAAI} Press},
  year         = {2019},
  url          = {https://doi.org/10.1609/aaai.v33i01.33017281},
  doi          = {10.1609/AAAI.V33I01.33017281},
  timestamp    = {Sun, 04 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/0006WHWL019.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, NLPCC 2019 (LNCS 11838). The doi and url fields hold the raw
% identifier with a plain underscore, since these fields are typeset verbatim
% by url-aware styles and a LaTeX escape would end up inside the link.
@inproceedings{DBLP:conf/nlpcc/BaoHWC0TPZ19,
  author       = {Bao, Hangbo and
                  Huang, Shaohan and
                  Wei, Furu and
                  Cui, Lei and
                  Wu, Yu and
                  Tan, Chuanqi and
                  Piao, Songhao and
                  Zhou, Ming},
  editor       = {Tang, Jie and
                  Kan, Min{-}Yen and
                  Zhao, Dongyan and
                  Li, Sujian and
                  Zan, Hongying},
  title        = {Neural Melody Composition from Lyrics},
  booktitle    = {Natural Language Processing and Chinese Computing - 8th {CCF} International
                  Conference, {NLPCC} 2019, Dunhuang, China, October 9-14, 2019, Proceedings,
                  Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {11838},
  pages        = {499--511},
  publisher    = {Springer},
  year         = {2019},
  url          = {https://doi.org/10.1007/978-3-030-32233-5_39},
  doi          = {10.1007/978-3-030-32233-5_39},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nlpcc/BaoHWC0TPZ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1903.01949); same title and authors as
% DBLP:conf/lrec/LiCHWZL20. The dataset name in the title is braced
% so that sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-1903-01949,
  author       = {Li, Minghao and
                  Cui, Lei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Zhou, Ming and
                  Li, Zhoujun},
  title        = {{TableBank}: Table Benchmark for Image-based Table Detection and Recognition},
  journal      = {CoRR},
  volume       = {abs/1903.01949},
  year         = {2019},
  url          = {https://arxiv.org/abs/1903.01949},
  eprinttype   = {arXiv},
  eprint       = {1903.01949},
  timestamp    = {Thu, 16 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-01949.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1912.13318); same title and authors as
% DBLP:conf/kdd/XuL0HW020. The model name in the title is braced
% so that sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-1912-13318,
  author       = {Xu, Yiheng and
                  Li, Minghao and
                  Cui, Lei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {{LayoutLM}: Pre-training of Text and Layout for Document Image Understanding},
  journal      = {CoRR},
  volume       = {abs/1912.13318},
  year         = {2019},
  url          = {https://arxiv.org/abs/1912.13318},
  eprinttype   = {arXiv},
  eprint       = {1912.13318},
  timestamp    = {Mon, 01 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1912-13318.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ACL 2018 (Volume 1: Long Papers).
@inproceedings{DBLP:conf/acl/ZhaoZWYHZ18,
  author       = {Zhou, Qingyu and
                  Yang, Nan and
                  Wei, Furu and
                  Huang, Shaohan and
                  Zhou, Ming and
                  Zhao, Tiejun},
  editor       = {Gurevych, Iryna and
                  Miyao, Yusuke},
  title        = {Neural Document Summarization by Jointly Learning to
                  Score and Select Sentences},
  booktitle    = {Proceedings of the 56th Annual Meeting of the Association for
                  Computational Linguistics, {ACL} 2018, Melbourne, Australia,
                  July 15-20, 2018, Volume 1: Long Papers},
  pages        = {654--663},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://aclanthology.org/P18-1061/},
  doi          = {10.18653/V1/P18-1061},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ZhaoZWYHZ18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1806.07042). The URL uses https, matching the newer
% arXiv records in this file.
@article{DBLP:journals/corr/abs-1806-07042,
  author       = {Wu, Yu and
                  Wei, Furu and
                  Huang, Shaohan and
                  Li, Zhoujun and
                  Zhou, Ming},
  title        = {Response Generation by Context-aware Prototype Editing},
  journal      = {CoRR},
  volume       = {abs/1806.07042},
  year         = {2018},
  url          = {https://arxiv.org/abs/1806.07042},
  eprinttype   = {arXiv},
  eprint       = {1806.07042},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-07042.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1806.08077). The URL uses https, matching the newer
% arXiv records in this file.
@article{DBLP:journals/corr/abs-1806-08077,
  author       = {Huang, Shaohan and
                  Wu, Yu and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {Dictionary-Guided Editing Networks for Paraphrase Generation},
  journal      = {CoRR},
  volume       = {abs/1806.08077},
  year         = {2018},
  url          = {https://arxiv.org/abs/1806.08077},
  eprinttype   = {arXiv},
  eprint       = {1806.08077},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-08077.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1807.02305); same title and authors as
% DBLP:conf/acl/ZhaoZWYHZ18. The URL uses https, matching the newer
% arXiv records in this file.
@article{DBLP:journals/corr/abs-1807-02305,
  author       = {Zhou, Qingyu and
                  Yang, Nan and
                  Wei, Furu and
                  Huang, Shaohan and
                  Zhou, Ming and
                  Zhao, Tiejun},
  title        = {Neural Document Summarization by Jointly Learning to Score and Select
                  Sentences},
  journal      = {CoRR},
  volume       = {abs/1807.02305},
  year         = {2018},
  url          = {https://arxiv.org/abs/1807.02305},
  eprinttype   = {arXiv},
  eprint       = {1807.02305},
  timestamp    = {Wed, 25 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-02305.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1809.04318); same title and authors as
% DBLP:conf/nlpcc/BaoHWC0TPZ19. The URL uses https, matching the newer
% arXiv records in this file.
@article{DBLP:journals/corr/abs-1809-04318,
  author       = {Bao, Hangbo and
                  Huang, Shaohan and
                  Wei, Furu and
                  Cui, Lei and
                  Wu, Yu and
                  Tan, Chuanqi and
                  Piao, Songhao and
                  Zhou, Ming},
  title        = {Neural Melody Composition from Lyrics},
  journal      = {CoRR},
  volume       = {abs/1809.04318},
  year         = {2018},
  url          = {https://arxiv.org/abs/1809.04318},
  eprinttype   = {arXiv},
  eprint       = {1809.04318},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-04318.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1810.00341). The URL uses https, matching the newer
% arXiv records in this file.
@article{DBLP:journals/corr/abs-1810-00341,
  author       = {Huang, Shaohan and
                  Wu, Yu and
                  Wei, Furu and
                  Zhou, Ming},
  title        = {Text Morphing},
  journal      = {CoRR},
  volume       = {abs/1810.00341},
  year         = {2018},
  url          = {https://arxiv.org/abs/1810.00341},
  eprinttype   = {arXiv},
  eprint       = {1810.00341},
  timestamp    = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-00341.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ACL 2017 System Demonstrations. The system name in the title
% is braced so that sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/acl/CuiHWTDZ17,
  author       = {Cui, Lei and
                  Huang, Shaohan and
                  Wei, Furu and
                  Tan, Chuanqi and
                  Duan, Chaoqun and
                  Zhou, Ming},
  editor       = {Bansal, Mohit and
                  Ji, Heng},
  title        = {{SuperAgent}: {A} Customer Service Chatbot for E-commerce Websites},
  booktitle    = {Proceedings of the 55th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, System
                  Demonstrations},
  pages        = {97--102},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/P17-4017},
  doi          = {10.18653/V1/P17-4017},
  timestamp    = {Fri, 06 Aug 2021 00:40:50 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/CuiHWTDZ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, CNSM 2017.
@inproceedings{DBLP:conf/cnsm/HuangFLZWLQ17,
  author       = {Huang, Shaohan and
                  Fung, Carol J. and
                  Liu, Chang and
                  Zhang, Shupeng and
                  Wei, Guang and
                  Luan, Zhongzhi and
                  Qian, Depei},
  title        = {Arena: Adaptive real-time update anomaly prediction in cloud systems},
  booktitle    = {13th International Conference on Network and Service Management,
                  {CNSM} 2017, Tokyo, Japan, November 26-30, 2017},
  pages        = {1--9},
  publisher    = {{IEEE} Computer Society},
  year         = {2017},
  url          = {https://doi.org/10.23919/CNSM.2017.8256031},
  doi          = {10.23919/CNSM.2017.8256031},
  timestamp    = {Wed, 16 Oct 2019 14:14:54 +0200},
  biburl       = {https://dblp.org/rec/conf/cnsm/HuangFLZWLQ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, EACL 2017 (Volume 1: Long Papers).
@inproceedings{DBLP:conf/eacl/ZhouLWDHX17,
  author       = {Dong, Li and
                  Huang, Shaohan and
                  Wei, Furu and
                  Lapata, Mirella and
                  Zhou, Ming and
                  Xu, Ke},
  editor       = {Lapata, Mirella and
                  Blunsom, Phil and
                  Koller, Alexander},
  title        = {Learning to Generate Product Reviews from Attributes},
  booktitle    = {Proceedings of the 15th Conference of the European Chapter of
                  the Association for Computational Linguistics, {EACL} 2017,
                  Valencia, Spain, April 3-7, 2017, Volume 1: Long Papers},
  pages        = {623--632},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/e17-1059},
  doi          = {10.18653/V1/E17-1059},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eacl/ZhouLWDHX17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, IWQoS 2017.
@inproceedings{DBLP:conf/iwqos/ZhangFHLQ17,
  author       = {Zhang, Shupeng and
                  Fung, Carol J. and
                  Huang, Shaohan and
                  Luan, Zhongzhi and
                  Qian, Depei},
  title        = {{PSOM:} Periodic Self-Organizing Maps for unsupervised
                  anomaly detection in periodic time series},
  booktitle    = {25th {IEEE/ACM} International Symposium on Quality of Service,
                  IWQoS 2017, Vilanova i la Geltr{\'{u}}, Spain, June 14-16, 2017},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/IWQoS.2017.7969174},
  doi          = {10.1109/IWQOS.2017.7969174},
  timestamp    = {Wed, 16 Oct 2019 14:14:53 +0200},
  biburl       = {https://dblp.org/rec/conf/iwqos/ZhangFHLQ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, IWQoS 2016.
@inproceedings{DBLP:conf/iwqos/HuangFWPLQ16,
  author       = {Huang, Shaohan and
                  Fung, Carol J. and
                  Wang, Kui and
                  Pei, Polo and
                  Luan, Zhongzhi and
                  Qian, Depei},
  title        = {Using recurrent neural networks toward black-box system anomaly prediction},
  booktitle    = {24th {IEEE/ACM} International Symposium on Quality of Service,
                  IWQoS 2016, Beijing, China, June 20-21, 2016},
  pages        = {1--10},
  publisher    = {{IEEE}},
  year         = {2016},
  url          = {https://doi.org/10.1109/IWQoS.2016.7590435},
  doi          = {10.1109/IWQOS.2016.7590435},
  timestamp    = {Wed, 16 Oct 2019 14:14:53 +0200},
  biburl       = {https://dblp.org/rec/conf/iwqos/HuangFWPLQ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, CloudNet 2015.
@inproceedings{DBLP:conf/cloudnet/HuangoFWYLQ15,
  author       = {Huang, Shaohan and
                  Fung, Carol J. and
                  Wang, Kui and
                  Yang, Yaqi and
                  Luan, Zhongzhi and
                  Qian, Depei},
  title        = {Revisit network anomaly ranking in datacenter network using re-ranking},
  booktitle    = {4th {IEEE} International Conference on Cloud Networking,
                  CloudNet 2015, Niagara Falls, ON, Canada, October 5-7, 2015},
  pages        = {178--183},
  publisher    = {{IEEE}},
  year         = {2015},
  url          = {https://doi.org/10.1109/CloudNet.2015.7335302},
  doi          = {10.1109/CLOUDNET.2015.7335302},
  timestamp    = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cloudnet/HuangoFWYLQ15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, IWQoS 2015.
@inproceedings{DBLP:conf/iwqos/WangFDPHLQ15,
  author       = {Wang, Kui and
                  Fung, Carol J. and
                  Ding, Chao and
                  Pei, Polo and
                  Huang, Shaohan and
                  Luan, Zhongzhi and
                  Qian, Depei},
  title        = {A methodology for root-cause analysis in component based systems},
  booktitle    = {23rd {IEEE} International Symposium on Quality of Service,
                  IWQoS 2015, Portland, OR, USA, June 15-16, 2015},
  pages        = {243--248},
  publisher    = {{IEEE}},
  year         = {2015},
  url          = {https://doi.org/10.1109/IWQoS.2015.7404741},
  doi          = {10.1109/IWQOS.2015.7404741},
  timestamp    = {Wed, 16 Oct 2019 14:14:53 +0200},
  biburl       = {https://dblp.org/rec/conf/iwqos/WangFDPHLQ15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}