default search action
BibTeX records: Shaohan Huang
% Journal article (IEEE TPAMI 46(10), 2024). "DeepNet" is braced so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/pami/WangMDHZW24,
  author     = {Hongyu Wang and Shuming Ma and Li Dong and Shaohan Huang and Dongdong Zhang and Furu Wei},
  title      = {{DeepNet}: Scaling Transformers to 1,000 Layers},
  journal    = {{IEEE} Trans. Pattern Anal. Mach. Intell.},
  volume     = {46},
  number     = {10},
  pages      = {6761--6774},
  year       = {2024},
  url        = {https://doi.org/10.1109/TPAMI.2024.3386927},
  doi        = {10.1109/TPAMI.2024.3386927},
  timestamp  = {Tue, 24 Sep 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/pami/WangMDHZW24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (IEEE Trans. Computers 73(7), 2024). "LogSay" is braced so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/tc/QiLHFY24,
  author     = {Jiaxing Qi and Zhongzhi Luan and Shaohan Huang and Carol J. Fung and Hailong Yang},
  title      = {{LogSay}: An Efficient Comprehension System for Log Numerical Reasoning},
  journal    = {{IEEE} Trans. Computers},
  volume     = {73},
  number     = {7},
  pages      = {1809--1821},
  year       = {2024},
  url        = {https://doi.org/10.1109/TC.2024.3386068},
  doi        = {10.1109/TC.2024.3386068},
  timestamp  = {Thu, 04 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tc/QiLHFY24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2024 paper. booktitle corrected: the co-located Fourteenth EAAI symposium is the 2024 edition (it was misprinted as 2014).
@inproceedings{DBLP:conf/aaai/LiuYHZHWDSZ24,
  author     = {Yuxuan Liu and Tianchi Yang and Shaohan Huang and Zihan Zhang and Haizhen Huang and Furu Wei and Weiwei Deng and Feng Sun and Qi Zhang},
  editor     = {Michael J. Wooldridge and Jennifer G. Dy and Sriraam Natarajan},
  title      = {Text Diffusion with Reinforced Conditioning},
  booktitle  = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI} 2024, Thirty-Sixth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver, Canada},
  pages      = {14069--14077},
  publisher  = {{AAAI} Press},
  year       = {2024},
  url        = {https://doi.org/10.1609/aaai.v38i12.29316},
  doi        = {10.1609/AAAI.V38I12.29316},
  timestamp  = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/LiuYHZHWDSZ24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Findings of ACL 2024 paper; the superscript in the title is already brace-protected.
@inproceedings{DBLP:conf/acl/LiuLHZSDW024,
  author     = {Haoyu Liu and Jianfeng Liu and Shaohan Huang and Yuefeng Zhan and Hao Sun and Weiwei Deng and Furu Wei and Qi Zhang},
  editor     = {Lun{-}Wei Ku and Andre Martins and Vivek Srikumar},
  title      = {Se{\({^2}\)}: Sequential Example Selection for In-Context Learning},
  booktitle  = {Findings of the Association for Computational Linguistics, {ACL} 2024, Bangkok, Thailand and virtual meeting, August 11-16, 2024},
  pages      = {5262--5284},
  publisher  = {Association for Computational Linguistics},
  year       = {2024},
  url        = {https://doi.org/10.18653/v1/2024.findings-acl.312},
  doi        = {10.18653/V1/2024.FINDINGS-ACL.312},
  timestamp  = {Tue, 24 Sep 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/LiuLHZSDW024.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2024 long paper. "HD-Eval" is braced so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/acl/LiuYHZHWD0024,
  author     = {Yuxuan Liu and Tianchi Yang and Shaohan Huang and Zihan Zhang and Haizhen Huang and Furu Wei and Weiwei Deng and Feng Sun and Qi Zhang},
  editor     = {Lun{-}Wei Ku and Andre Martins and Vivek Srikumar},
  title      = {{HD-Eval}: Aligning Large Language Model Evaluators Through Hierarchical Criteria Decomposition},
  booktitle  = {Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), {ACL} 2024, Bangkok, Thailand, August 11-16, 2024},
  pages      = {7641--7660},
  publisher  = {Association for Computational Linguistics},
  year       = {2024},
  url        = {https://doi.org/10.18653/v1/2024.acl-long.413},
  doi        = {10.18653/V1/2024.ACL-LONG.413},
  timestamp  = {Tue, 24 Sep 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/LiuYHZHWD0024.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Findings of ACL 2024 paper. "ResLoRA" is braced so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/acl/ShiHSLZHWD0Z24,
  author     = {Shuhua Shi and Shaohan Huang and Minghui Song and Zhoujun Li and Zihan Zhang and Haizhen Huang and Furu Wei and Weiwei Deng and Feng Sun and Qi Zhang},
  editor     = {Lun{-}Wei Ku and Andre Martins and Vivek Srikumar},
  title      = {{ResLoRA}: Identity Residual Mapping in Low-Rank Adaption},
  booktitle  = {Findings of the Association for Computational Linguistics, {ACL} 2024, Bangkok, Thailand and virtual meeting, August 11-16, 2024},
  pages      = {8870--8884},
  publisher  = {Association for Computational Linguistics},
  year       = {2024},
  url        = {https://doi.org/10.18653/v1/2024.findings-acl.525},
  doi        = {10.18653/V1/2024.FINDINGS-ACL.525},
  timestamp  = {Tue, 24 Sep 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/ShiHSLZHWD0Z24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% LREC/COLING 2024 paper. The acronym "LLM" is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/coling/LiuYHZHWDSZ24,
  author     = {Yuxuan Liu and Tianchi Yang and Shaohan Huang and Zihan Zhang and Haizhen Huang and Furu Wei and Weiwei Deng and Feng Sun and Qi Zhang},
  editor     = {Nicoletta Calzolari and Min{-}Yen Kan and V{\'{e}}ronique Hoste and Alessandro Lenci and Sakriani Sakti and Nianwen Xue},
  title      = {Calibrating {LLM}-Based Evaluator},
  booktitle  = {Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation, {LREC/COLING} 2024, 20-25 May, 2024, Torino, Italy},
  pages      = {2638--2656},
  publisher  = {{ELRA} and {ICCL}},
  year       = {2024},
  url        = {https://aclanthology.org/2024.lrec-main.237},
  timestamp  = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/coling/LiuYHZHWDSZ24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% HPDC 2024 paper (ACM).
@inproceedings{DBLP:conf/hpdc/HuangL24,
  author     = {Shaohan Huang and Zhongzhi Luan},
  editor     = {Patrizio Dazzi and Gabriele Mencagli and David K. Lowenthal and Rosa M. Badia},
  title      = {Semantic-Aware Log Understanding and Analysis},
  booktitle  = {Proceedings of the 33rd International Symposium on High-Performance Parallel and Distributed Computing, {HPDC} 2024, Pisa, Italy, June 3-7, 2024},
  pages      = {413--416},
  publisher  = {{ACM}},
  year       = {2024},
  url        = {https://doi.org/10.1145/3625549.3658830},
  doi        = {10.1145/3625549.3658830},
  timestamp  = {Sun, 08 Sep 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/hpdc/HuangL24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2024 paper (OpenReview); the record carries no pages or doi.
@inproceedings{DBLP:conf/iclr/ChengHW24,
  author     = {Daixuan Cheng and Shaohan Huang and Furu Wei},
  title      = {Adapting Large Language Models via Reading Comprehension},
  booktitle  = {The Twelfth International Conference on Learning Representations, {ICLR} 2024, Vienna, Austria, May 7-11, 2024},
  publisher  = {OpenReview.net},
  year       = {2024},
  url        = {https://openreview.net/forum?id=y886UXPEZ0},
  timestamp  = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/ChengHW24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2024 paper (OpenReview). "Kosmos-G" is braced so sentence-casing styles keep the capital G.
@inproceedings{DBLP:conf/iclr/Pan0HPCW24,
  author     = {Xichen Pan and Li Dong and Shaohan Huang and Zhiliang Peng and Wenhu Chen and Furu Wei},
  title      = {{Kosmos-G}: Generating Images in Context with Multimodal Large Language Models},
  booktitle  = {The Twelfth International Conference on Learning Representations, {ICLR} 2024, Vienna, Austria, May 7-11, 2024},
  publisher  = {OpenReview.net},
  year       = {2024},
  url        = {https://openreview.net/forum?id=he6mX9LTyE},
  timestamp  = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/Pan0HPCW24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2024 paper (OpenReview); the record carries no pages or doi.
@inproceedings{DBLP:conf/iclr/Peng00HHMYW24,
  author     = {Zhiliang Peng and Wenhui Wang and Li Dong and Yaru Hao and Shaohan Huang and Shuming Ma and Qixiang Ye and Furu Wei},
  title      = {Grounding Multimodal Large Language Models to the World},
  booktitle  = {The Twelfth International Conference on Learning Representations, {ICLR} 2024, Vienna, Austria, May 7-11, 2024},
  publisher  = {OpenReview.net},
  year       = {2024},
  url        = {https://openreview.net/forum?id=lLmqxkfSIw},
  timestamp  = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/Peng00HHMYW24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2024 paper (OpenReview). "LoRA" is braced so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/iclr/WuHW24,
  author     = {Xun Wu and Shaohan Huang and Furu Wei},
  title      = {Mixture of {LoRA} Experts},
  booktitle  = {The Twelfth International Conference on Learning Representations, {ICLR} 2024, Vienna, Austria, May 7-11, 2024},
  publisher  = {OpenReview.net},
  year       = {2024},
  url        = {https://openreview.net/forum?id=uWvKBCYh4S},
  timestamp  = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WuHW24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% SANER 2024 paper (IEEE); the citation key uses the dblp stream name wcre and is kept as exported.
@inproceedings{DBLP:conf/wcre/Huang0QSXFWYLQ24,
  author     = {Shaohan Huang and Yi Liu and Jiaxing Qi and Jing Shang and Zhiwen Xiao and Carol J. Fung and Zhihui Wu and Hailong Yang and Zhongzhi Luan and Depei Qian},
  title      = {Gloss: Guiding Large Language Models to Answer Questions from System Logs},
  booktitle  = {{IEEE} International Conference on Software Analysis, Evolution and Reengineering, {SANER} 2024, Rovaniemi, Finland, March 12-15, 2024},
  pages      = {91--101},
  publisher  = {{IEEE}},
  year       = {2024},
  url        = {https://doi.org/10.1109/SANER60148.2024.00017},
  doi        = {10.1109/SANER60148.2024.00017},
  timestamp  = {Tue, 30 Jul 2024 11:08:59 +0200},
  biburl     = {https://dblp.org/rec/conf/wcre/Huang0QSXFWYLQ24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2401.07284 (CoRR).
@article{DBLP:journals/corr/abs-2401-07284,
  author     = {Ting Jiang and Shaohan Huang and Shengyue Luo and Zihan Zhang and Haizhen Huang and Furu Wei and Weiwei Deng and Feng Sun and Qi Zhang and Deqing Wang and Fuzhen Zhuang},
  title      = {Improving Domain Adaptation through Extended-Text Reading Comprehension},
  journal    = {CoRR},
  volume     = {abs/2401.07284},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2401.07284},
  doi        = {10.48550/ARXIV.2401.07284},
  eprinttype = {arXiv},
  eprint     = {2401.07284},
  timestamp  = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-07284.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2402.13064 (CoRR).
@article{DBLP:journals/corr/abs-2402-13064,
  author     = {Haoran Li and Qingxiu Dong and Zhengyang Tang and Chaojun Wang and Xingxing Zhang and Haoyang Huang and Shaohan Huang and Xiaolong Huang and Zeqiang Huang and Dongdong Zhang and Yuxian Gu and Xin Cheng and Xun Wang and Si{-}Qing Chen and Li Dong and Wei Lu and Zhifang Sui and Benyou Wang and Wai Lam and Furu Wei},
  title      = {Synthetic Data (Almost) from Scratch: Generalized Instruction Tuning for Language Models},
  journal    = {CoRR},
  volume     = {abs/2402.13064},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.13064},
  doi        = {10.48550/ARXIV.2402.13064},
  eprinttype = {arXiv},
  eprint     = {2402.13064},
  timestamp  = {Wed, 24 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-13064.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2402.13874 (CoRR). The inline math superscript in the title is wrapped in a brace group
% so title-processing styles treat it as one protected unit, as the conference record of this paper does.
@article{DBLP:journals/corr/abs-2402-13874,
  author     = {Haoyu Liu and Jianfeng Liu and Shaohan Huang and Yuefeng Zhan and Hao Sun and Weiwei Deng and Furu Wei and Qi Zhang},
  title      = {Se{\({}^{\mbox{2}}\)}: Sequential Example Selection for In-Context Learning},
  journal    = {CoRR},
  volume     = {abs/2402.13874},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.13874},
  doi        = {10.48550/ARXIV.2402.13874},
  eprinttype = {arXiv},
  eprint     = {2402.13874},
  timestamp  = {Tue, 23 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-13874.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2402.14843 (CoRR).
@article{DBLP:journals/corr/abs-2402-14843,
  author     = {Yuxuan Liu and Tianchi Yang and Shaohan Huang and Zihan Zhang and Haizhen Huang and Furu Wei and Weiwei Deng and Feng Sun and Qi Zhang},
  title      = {Text Diffusion with Reinforced Conditioning},
  journal    = {CoRR},
  volume     = {abs/2402.14843},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.14843},
  doi        = {10.48550/ARXIV.2402.14843},
  eprinttype = {arXiv},
  eprint     = {2402.14843},
  timestamp  = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-14843.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2402.15754 (CoRR). "HD-Eval" is braced so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2402-15754,
  author     = {Yuxuan Liu and Tianchi Yang and Shaohan Huang and Zihan Zhang and Haizhen Huang and Furu Wei and Weiwei Deng and Feng Sun and Qi Zhang},
  title      = {{HD-Eval}: Aligning Large Language Model Evaluators Through Hierarchical Criteria Decomposition},
  journal    = {CoRR},
  volume     = {abs/2402.15754},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.15754},
  doi        = {10.48550/ARXIV.2402.15754},
  eprinttype = {arXiv},
  eprint     = {2402.15754},
  timestamp  = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-15754.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2402.17764 (CoRR). The acronym "LLMs" is braced so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-2402-17764,
  author     = {Shuming Ma and Hongyu Wang and Lingxiao Ma and Lei Wang and Wenhui Wang and Shaohan Huang and Li Dong and Ruiping Wang and Jilong Xue and Furu Wei},
  title      = {The Era of 1-bit {LLMs}: All Large Language Models are in 1.58 Bits},
  journal    = {CoRR},
  volume     = {abs/2402.17764},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.17764},
  doi        = {10.48550/ARXIV.2402.17764},
  eprinttype = {arXiv},
  eprint     = {2402.17764},
  timestamp  = {Fri, 19 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-17764.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2402.18039 (CoRR). "ResLoRA" is braced so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2402-18039,
  author     = {Shuhua Shi and Shaohan Huang and Minghui Song and Zhoujun Li and Zihan Zhang and Haizhen Huang and Furu Wei and Weiwei Deng and Feng Sun and Qi Zhang},
  title      = {{ResLoRA}: Identity Residual Mapping in Low-Rank Adaption},
  journal    = {CoRR},
  volume     = {abs/2402.18039},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.18039},
  doi        = {10.48550/ARXIV.2402.18039},
  eprinttype = {arXiv},
  eprint     = {2402.18039},
  timestamp  = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-18039.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2403.09164 (CoRR). "ChatGPT" and the proper adjective "Chinese" are braced so
% sentence-casing styles keep their capitalisation.
@article{DBLP:journals/corr/abs-2403-09164,
  author     = {Yizhen Li and Shaohan Huang and Jiaxing Qi and Lei Quan and Dongran Han and Zhongzhi Luan},
  title      = {Exploring the Comprehension of {ChatGPT} in Traditional {Chinese} Medicine Knowledge},
  journal    = {CoRR},
  volume     = {abs/2403.09164},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.09164},
  doi        = {10.48550/ARXIV.2403.09164},
  eprinttype = {arXiv},
  eprint     = {2403.09164},
  timestamp  = {Fri, 05 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-09164.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2404.13628 (CoRR). "LoRA" is braced so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2404-13628,
  author     = {Xun Wu and Shaohan Huang and Furu Wei},
  title      = {Mixture of {LoRA} Experts},
  journal    = {CoRR},
  volume     = {abs/2404.13628},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2404.13628},
  doi        = {10.48550/ARXIV.2404.13628},
  eprinttype = {arXiv},
  eprint     = {2404.13628},
  timestamp  = {Sat, 25 May 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2404-13628.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2404.15045 (CoRR).
@article{DBLP:journals/corr/abs-2404-15045,
  author     = {Xun Wu and Shaohan Huang and Wenhui Wang and Furu Wei},
  title      = {Multi-Head Mixture-of-Experts},
  journal    = {CoRR},
  volume     = {abs/2404.15045},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2404.15045},
  doi        = {10.48550/ARXIV.2404.15045},
  eprinttype = {arXiv},
  eprint     = {2404.15045},
  timestamp  = {Sat, 25 May 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2404-15045.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2404.15100 (CoRR).
@article{DBLP:journals/corr/abs-2404-15100,
  author     = {Xun Wu and Shaohan Huang and Furu Wei},
  title      = {Multimodal Large Language Model is a Human-Aligned Annotator for Text-to-Image Generation},
  journal    = {CoRR},
  volume     = {abs/2404.15100},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2404.15100},
  doi        = {10.48550/ARXIV.2404.15100},
  eprinttype = {arXiv},
  eprint     = {2404.15100},
  timestamp  = {Sat, 25 May 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2404-15100.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2405.05254 (CoRR).
@article{DBLP:journals/corr/abs-2405-05254,
  author     = {Yutao Sun and Li Dong and Yi Zhu and Shaohan Huang and Wenhui Wang and Shuming Ma and Quanlu Zhang and Jianyong Wang and Furu Wei},
  title      = {You Only Cache Once: Decoder-Decoder Architectures for Language Models},
  journal    = {CoRR},
  volume     = {abs/2405.05254},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2405.05254},
  doi        = {10.48550/ARXIV.2405.05254},
  eprinttype = {arXiv},
  eprint     = {2405.05254},
  timestamp  = {Thu, 01 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2405-05254.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2405.12130 (CoRR). "MoRA" is braced so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2405-12130,
  author     = {Ting Jiang and Shaohan Huang and Shengyue Luo and Zihan Zhang and Haizhen Huang and Furu Wei and Weiwei Deng and Feng Sun and Qi Zhang and Deqing Wang and Fuzhen Zhuang},
  title      = {{MoRA}: High-Rank Updating for Parameter-Efficient Fine-Tuning},
  journal    = {CoRR},
  volume     = {abs/2405.12130},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2405.12130},
  doi        = {10.48550/ARXIV.2405.12130},
  eprinttype = {arXiv},
  eprint     = {2405.12130},
  timestamp  = {Tue, 23 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2405-12130.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2406.07925 (CoRR). "FDLoRA" and "LoRA" are braced so sentence-casing styles keep their capitalisation.
@article{DBLP:journals/corr/abs-2406-07925,
  author     = {Jiaxing Qi and Zhongzhi Luan and Shaohan Huang and Carol J. Fung and Hailong Yang and Depei Qian},
  title      = {{FDLoRA}: Personalized Federated Learning of Large Language Model via Dual {LoRA} Tuning},
  journal    = {CoRR},
  volume     = {abs/2406.07925},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2406.07925},
  doi        = {10.48550/ARXIV.2406.07925},
  eprinttype = {arXiv},
  eprint     = {2406.07925},
  timestamp  = {Mon, 08 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2406-07925.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2406.14491 (CoRR).
@article{DBLP:journals/corr/abs-2406-14491,
  author     = {Daixuan Cheng and Yuxian Gu and Shaohan Huang and Junyu Bi and Minlie Huang and Furu Wei},
  title      = {Instruction Pre-Training: Language Models are Supervised Multitask Learners},
  journal    = {CoRR},
  volume     = {abs/2406.14491},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2406.14491},
  doi        = {10.48550/ARXIV.2406.14491},
  eprinttype = {arXiv},
  eprint     = {2406.14491},
  timestamp  = {Tue, 16 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2406-14491.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (IEEE Trans. Computers 72(9), 2023).
@article{DBLP:journals/tc/HuangLFWYL23,
  author     = {Shaohan Huang and Yi Liu and Carol J. Fung and He Wang and Hailong Yang and Zhongzhi Luan},
  title      = {Improving Log-Based Anomaly Detection by Pre-Training Hierarchical Transformers},
  journal    = {{IEEE} Trans. Computers},
  volume     = {72},
  number     = {9},
  pages      = {2656--2667},
  year       = {2023},
  url        = {https://doi.org/10.1109/TC.2023.3257518},
  doi        = {10.1109/TC.2023.3257518},
  timestamp  = {Fri, 18 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tc/HuangLFWYL23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (IEEE TNSM 20(2), 2023). "LogEncoder" is braced so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/tnsm/QiLHFYLZQ23,
  author     = {Jiaxing Qi and Zhongzhi Luan and Shaohan Huang and Carol J. Fung and Hailong Yang and Hanlu Li and Danfeng Zhu and Depei Qian},
  title      = {{LogEncoder}: Log-Based Contrastive Representation Learning for Anomaly Detection},
  journal    = {{IEEE} Trans. Netw. Serv. Manag.},
  volume     = {20},
  number     = {2},
  pages      = {1378--1391},
  year       = {2023},
  url        = {https://doi.org/10.1109/TNSM.2023.3239522},
  doi        = {10.1109/TNSM.2023.3239522},
  timestamp  = {Fri, 07 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tnsm/QiLHFYLZQ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2023 paper. "MoEC" is braced so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/aaai/XieHCW23,
  author     = {Yuan Xie and Shaohan Huang and Tianyu Chen and Furu Wei},
  editor     = {Brian Williams and Yiling Chen and Jennifer Neville},
  title      = {{MoEC}: Mixture of Expert Clusters},
  booktitle  = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI} 2023, Thirty-Fifth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2023, Thirteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2023, Washington, DC, USA, February 7-14, 2023},
  pages      = {13807--13815},
  publisher  = {{AAAI} Press},
  year       = {2023},
  url        = {https://doi.org/10.1609/aaai.v37i11.26617},
  doi        = {10.1609/AAAI.V37I11.26617},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/XieHCW23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Findings of ACL 2023 paper.
@inproceedings{DBLP:conf/acl/ChenHZGLHWDZ23,
  author     = {Beiduo Chen and Shaohan Huang and Zihan Zhang and Wu Guo and Zhenhua Ling and Haizhen Huang and Furu Wei and Weiwei Deng and Qi Zhang},
  editor     = {Anna Rogers and Jordan L. Boyd{-}Graber and Naoaki Okazaki},
  title      = {Pre-training Language Model as a Multi-perspective Course Learner},
  booktitle  = {Findings of the Association for Computational Linguistics: {ACL} 2023, Toronto, Canada, July 9-14, 2023},
  pages      = {114--128},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.findings-acl.9},
  doi        = {10.18653/V1/2023.FINDINGS-ACL.9},
  timestamp  = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/ChenHZGLHWDZ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2023 long paper.
@inproceedings{DBLP:conf/acl/LiHZDLHJWDZ23,
  author     = {Ziheng Li and Shaohan Huang and Zihan Zhang and Zhi{-}Hong Deng and Qiang Lou and Haizhen Huang and Jian Jiao and Furu Wei and Weiwei Deng and Qi Zhang},
  editor     = {Anna Rogers and Jordan L. Boyd{-}Graber and Naoaki Okazaki},
  title      = {Dual-Alignment Pre-training for Cross-lingual Sentence Embedding},
  booktitle  = {Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada, July 9-14, 2023},
  pages      = {3466--3478},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.acl-long.191},
  doi        = {10.18653/V1/2023.ACL-LONG.191},
  timestamp  = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/LiHZDLHJWDZ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2023 long paper. "GanLM" is braced so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/acl/YangM0HHYZYWL23,
  author     = {Jian Yang and Shuming Ma and Li Dong and Shaohan Huang and Haoyang Huang and Yuwei Yin and Dongdong Zhang and Liqun Yang and Furu Wei and Zhoujun Li},
  editor     = {Anna Rogers and Jordan L. Boyd{-}Graber and Naoaki Okazaki},
  title      = {{GanLM}: Encoder-Decoder Pre-training with an Auxiliary Discriminator},
  booktitle  = {Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada, July 9-14, 2023},
  pages      = {9394--9412},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.acl-long.522},
  doi        = {10.18653/V1/2023.ACL-LONG.522},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/acl/YangM0HHYZYWL23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2023 long paper.
@inproceedings{DBLP:conf/acl/SunDPMHBCSW23,
  author     = {Yutao Sun and Li Dong and Barun Patra and Shuming Ma and Shaohan Huang and Alon Benhaim and Vishrav Chaudhary and Xia Song and Furu Wei},
  editor     = {Anna Rogers and Jordan L. Boyd{-}Graber and Naoaki Okazaki},
  title      = {A Length-Extrapolatable Transformer},
  booktitle  = {Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada, July 9-14, 2023},
  pages      = {14590--14604},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.acl-long.816},
  doi        = {10.18653/V1/2023.ACL-LONG.816},
  timestamp  = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/SunDPMHBCSW23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2023 long paper. The proper adjective "English" is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/acl/PatraSHC0WCS23,
  author     = {Barun Patra and Saksham Singhal and Shaohan Huang and Zewen Chi and Li Dong and Furu Wei and Vishrav Chaudhary and Xia Song},
  editor     = {Anna Rogers and Jordan L. Boyd{-}Graber and Naoaki Okazaki},
  title      = {Beyond {English}-Centric Bitexts for Better Multilingual Language Representation Learning},
  booktitle  = {Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada, July 9-14, 2023},
  pages      = {15354--15373},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.acl-long.856},
  doi        = {10.18653/V1/2023.ACL-LONG.856},
  timestamp  = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/PatraSHC0WCS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2023 main-conference paper.
@inproceedings{DBLP:conf/emnlp/WangHLWSZHWDSZ23,
  author     = {Zhaoyang Wang and Shaohan Huang and Yuxuan Liu and Jiahai Wang and Minghui Song and Zihan Zhang and Haizhen Huang and Furu Wei and Weiwei Deng and Feng Sun and Qi Zhang},
  editor     = {Houda Bouamor and Juan Pino and Kalika Bali},
  title      = {Democratizing Reasoning Ability: Tailored Learning from Large Language Model},
  booktitle  = {Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages      = {1948--1966},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.emnlp-main.120},
  doi        = {10.18653/V1/2023.EMNLP-MAIN.120},
  timestamp  = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/WangHLWSZHWDSZ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2023 main-conference paper; the acronym in the title is already brace-protected.
@inproceedings{DBLP:conf/emnlp/ChengHBZLW0WDZ23,
  author     = {Daixuan Cheng and Shaohan Huang and Junyu Bi and Yuefeng Zhan and Jianfeng Liu and Yujing Wang and Hao Sun and Furu Wei and Weiwei Deng and Qi Zhang},
  editor     = {Houda Bouamor and Juan Pino and Kalika Bali},
  title      = {{UPRISE:} Universal Prompt Retrieval for Improving Zero-Shot Evaluation},
  booktitle  = {Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages      = {12318--12337},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.emnlp-main.758},
  doi        = {10.18653/V1/2023.EMNLP-MAIN.758},
  timestamp  = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/ChengHBZLW0WDZ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% HPCC/DSS/SmartCity/DependSys 2023 paper (IEEE). "LogGPT" and "ChatGPT" are braced so sentence-casing
% styles keep their capitalisation.
@inproceedings{DBLP:conf/hpcc/QiHLYFYQSXW23,
  author     = {Jiaxing Qi and Shaohan Huang and Zhongzhi Luan and Shu Yang and Carol J. Fung and Hailong Yang and Depei Qian and Jing Shang and Zhiwen Xiao and Zhihui Wu},
  title      = {{LogGPT}: Exploring {ChatGPT} for Log-Based Anomaly Detection},
  booktitle  = {{IEEE} International Conference on High Performance Computing {\&} Communications, Data Science {\&} Systems, Smart City {\&} Dependability in Sensor, Cloud {\&} Big Data Systems {\&} Application, HPCC/DSS/SmartCity/DependSys 2023, Melbourne, Australia, December 17-21, 2023},
  pages      = {273--280},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/HPCC-DSS-SmartCity-DependSys60770.2023.00045},
  doi        = {10.1109/HPCC-DSS-SMARTCITY-DEPENDSYS60770.2023.00045},
  timestamp  = {Wed, 10 Apr 2024 17:07:58 +0200},
  biburl     = {https://dblp.org/rec/conf/hpcc/QiHLYFYQSXW23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2023 paper (PMLR volume 202); the capital after the colon in the title is already brace-protected.
@inproceedings{DBLP:conf/icml/WangMH0WPWBSBPL23,
  author     = {Hongyu Wang and Shuming Ma and Shaohan Huang and Li Dong and Wenhui Wang and Zhiliang Peng and Yu Wu and Payal Bajaj and Saksham Singhal and Alon Benhaim and Barun Patra and Zhun Liu and Vishrav Chaudhary and Xia Song and Furu Wei},
  editor     = {Andreas Krause and Emma Brunskill and Kyunghyun Cho and Barbara Engelhardt and Sivan Sabato and Jonathan Scarlett},
  title      = {Magneto: {A} Foundation Transformer},
  booktitle  = {International Conference on Machine Learning, {ICML} 2023, 23-29 July 2023, Honolulu, Hawaii, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {202},
  pages      = {36077--36092},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v202/wang23u.html},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/WangMH0WPWBSBPL23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2023 paper. The url is stored raw (no backslash before the underscore) so that verbatim
% url handling produces a working link.
@inproceedings{DBLP:conf/nips/Huang0WHSML0MPL23,
  author     = {Shaohan Huang and Li Dong and Wenhui Wang and Yaru Hao and Saksham Singhal and Shuming Ma and Tengchao Lv and Lei Cui and Owais Khan Mohammed and Barun Patra and Qiang Liu and Kriti Aggarwal and Zewen Chi and Nils Johan Bertil Bjorck and Vishrav Chaudhary and Subhojit Som and Xia Song and Furu Wei},
  editor     = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title      = {Language Is Not All You Need: Aligning Perception with Language Models},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper_files/paper/2023/hash/e425b75bac5742a008d643826428787c-Abstract-Conference.html},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/Huang0WHSML0MPL23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2302.14045 (CoRR).
@article{DBLP:journals/corr/abs-2302-14045,
  author     = {Shaohan Huang and Li Dong and Wenhui Wang and Yaru Hao and Saksham Singhal and Shuming Ma and Tengchao Lv and Lei Cui and Owais Khan Mohammed and Barun Patra and Qiang Liu and Kriti Aggarwal and Zewen Chi and Johan Bjorck and Vishrav Chaudhary and Subhojit Som and Xia Song and Furu Wei},
  title      = {Language Is Not All You Need: Aligning Perception with Language Models},
  journal    = {CoRR},
  volume     = {abs/2302.14045},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.14045},
  doi        = {10.48550/ARXIV.2302.14045},
  eprinttype = {arXiv},
  eprint     = {2302.14045},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-14045.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2303.08518 (CoRR); the acronym in the title is already brace-protected.
@article{DBLP:journals/corr/abs-2303-08518,
  author     = {Daixuan Cheng and Shaohan Huang and Junyu Bi and Yuefeng Zhan and Jianfeng Liu and Yujing Wang and Hao Sun and Furu Wei and Denvy Deng and Qi Zhang},
  title      = {{UPRISE:} Universal Prompt Retrieval for Improving Zero-Shot Evaluation},
  journal    = {CoRR},
  volume     = {abs/2303.08518},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2303.08518},
  doi        = {10.48550/ARXIV.2303.08518},
  eprinttype = {arXiv},
  eprint     = {2303.08518},
  timestamp  = {Fri, 23 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2303-08518.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2303.11715 (CoRR). "LogQA" is braced so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2303-11715,
  author     = {Shaohan Huang and Yi Liu and Carol J. Fung and Jiaxing Qi and Hailong Yang and Zhongzhi Luan},
  title      = {{LogQA}: Question Answering in Unstructured Logs},
  journal    = {CoRR},
  volume     = {abs/2303.11715},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2303.11715},
  doi        = {10.48550/ARXIV.2303.11715},
  eprinttype = {arXiv},
  eprint     = {2303.11715},
  timestamp  = {Sun, 16 Apr 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2303-11715.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2305.03981 (CoRR, 2023).
@article{DBLP:journals/corr/abs-2305-03981,
  author     = {Beiduo Chen and Shaohan Huang and Zihan Zhang and Wu Guo and Zhenhua Ling and Haizhen Huang and Furu Wei and Weiwei Deng and Qi Zhang},
  title      = {Pre-training Language Model as a Multi-perspective Course Learner},
  journal    = {CoRR},
  volume     = {abs/2305.03981},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.03981},
  doi        = {10.48550/ARXIV.2305.03981},
  eprinttype = {arXiv},
  eprint     = {2305.03981},
  timestamp  = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-03981.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2305.09148 (CoRR, 2023).
@article{DBLP:journals/corr/abs-2305-09148,
  author     = {Ziheng Li and Shaohan Huang and Zihan Zhang and Zhi{-}Hong Deng and Qiang Lou and Haizhen Huang and Jian Jiao and Furu Wei and Weiwei Deng and Qi Zhang},
  title      = {Dual-Alignment Pre-training for Cross-lingual Sentence Embedding},
  journal    = {CoRR},
  volume     = {abs/2305.09148},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.09148},
  doi        = {10.48550/ARXIV.2305.09148},
  eprinttype = {arXiv},
  eprint     = {2305.09148},
  timestamp  = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-09148.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2305.19602 (CoRR, 2023). The ICASSP 2022 entry
% DBLP:conf/icassp/ChenXZHZL22 has the same authors and the same title up to capitalisation.
@article{DBLP:journals/corr/abs-2305-19602,
  author     = {Tianyu Chen and Yuan Xie and Shuai Zhang and Shaohan Huang and Haoyi Zhou and Jianxin Li},
  title      = {Learning Music Sequence Representation from Text Supervision},
  journal    = {CoRR},
  volume     = {abs/2305.19602},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.19602},
  doi        = {10.48550/ARXIV.2305.19602},
  eprinttype = {arXiv},
  eprint     = {2305.19602},
  timestamp  = {Fri, 19 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-19602.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2306.14824 (CoRR, 2023).
@article{DBLP:journals/corr/abs-2306-14824,
  author     = {Zhiliang Peng and Wenhui Wang and Li Dong and Yaru Hao and Shaohan Huang and Shuming Ma and Furu Wei},
  title      = {Kosmos-2: Grounding Multimodal Large Language Models to the World},
  journal    = {CoRR},
  volume     = {abs/2306.14824},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.14824},
  doi        = {10.48550/ARXIV.2306.14824},
  eprinttype = {arXiv},
  eprint     = {2306.14824},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-14824.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2307.02486 (CoRR, 2023).
% Title: stray spaces removed from the number (was written 1, 000, 000, 000);
% LongNet is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2307-02486,
  author     = {Jiayu Ding and Shuming Ma and Li Dong and Xingxing Zhang and Shaohan Huang and Wenhui Wang and Nanning Zheng and Furu Wei},
  title      = {{LongNet}: Scaling Transformers to 1,000,000,000 Tokens},
  journal    = {CoRR},
  volume     = {abs/2307.02486},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.02486},
  doi        = {10.48550/ARXIV.2307.02486},
  eprinttype = {arXiv},
  eprint     = {2307.02486},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-02486.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2307.08621 (CoRR, 2023).
@article{DBLP:journals/corr/abs-2307-08621,
  author     = {Yutao Sun and Li Dong and Shaohan Huang and Shuming Ma and Yuqing Xia and Jilong Xue and Jianyong Wang and Furu Wei},
  title      = {Retentive Network: {A} Successor to Transformer for Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2307.08621},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.08621},
  doi        = {10.48550/ARXIV.2307.08621},
  eprinttype = {arXiv},
  eprint     = {2307.08621},
  timestamp  = {Tue, 25 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-08621.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2307.16645 (CoRR, 2023).
@article{DBLP:journals/corr/abs-2307-16645,
  author     = {Ting Jiang and Shaohan Huang and Zhongzhi Luan and Deqing Wang and Fuzhen Zhuang},
  title      = {Scaling Sentence Embeddings with Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2307.16645},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.16645},
  doi        = {10.48550/ARXIV.2307.16645},
  eprinttype = {arXiv},
  eprint     = {2307.16645},
  timestamp  = {Wed, 02 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-16645.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2309.01189 (CoRR, 2023).
% Title: LogGPT and ChatGPT are brace-protected so sentence-casing styles keep their capitals.
@article{DBLP:journals/corr/abs-2309-01189,
  author     = {Jiaxing Qi and Shaohan Huang and Zhongzhi Luan and Carol J. Fung and Hailong Yang and Depei Qian},
  title      = {{LogGPT}: Exploring {ChatGPT} for Log-Based Anomaly Detection},
  journal    = {CoRR},
  volume     = {abs/2309.01189},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.01189},
  doi        = {10.48550/ARXIV.2309.01189},
  eprinttype = {arXiv},
  eprint     = {2309.01189},
  timestamp  = {Mon, 11 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-01189.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2309.09530 (CoRR, 2023).
@article{DBLP:journals/corr/abs-2309-09530,
  author     = {Daixuan Cheng and Shaohan Huang and Furu Wei},
  title      = {Adapting Large Language Models via Reading Comprehension},
  journal    = {CoRR},
  volume     = {abs/2309.09530},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.09530},
  doi        = {10.48550/ARXIV.2309.09530},
  eprinttype = {arXiv},
  eprint     = {2309.09530},
  timestamp  = {Fri, 22 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-09530.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2309.11419 (CoRR, 2023).
@article{DBLP:journals/corr/abs-2309-11419,
  author     = {Tengchao Lv and Yupan Huang and Jingye Chen and Lei Cui and Shuming Ma and Yaoyao Chang and Shaohan Huang and Wenhui Wang and Li Dong and Weiyao Luo and Shaoxiang Wu and Guoxin Wang and Cha Zhang and Furu Wei},
  title      = {Kosmos-2.5: {A} Multimodal Literate Model},
  journal    = {CoRR},
  volume     = {abs/2309.11419},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.11419},
  doi        = {10.48550/ARXIV.2309.11419},
  eprinttype = {arXiv},
  eprint     = {2309.11419},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-11419.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2309.13308 (CoRR, 2023).
% Title: the acronym LLM is brace-protected so sentence-casing styles keep it upper-case.
@article{DBLP:journals/corr/abs-2309-13308,
  author     = {Yuxuan Liu and Tianchi Yang and Shaohan Huang and Zihan Zhang and Haizhen Huang and Furu Wei and Weiwei Deng and Feng Sun and Qi Zhang},
  title      = {Calibrating {LLM}-Based Evaluator},
  journal    = {CoRR},
  volume     = {abs/2309.13308},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.13308},
  doi        = {10.48550/ARXIV.2309.13308},
  eprinttype = {arXiv},
  eprint     = {2309.13308},
  timestamp  = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-13308.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2310.02992 (CoRR, 2023).
% Title: Kosmos-G is brace-protected so sentence-casing styles keep the capital G.
@article{DBLP:journals/corr/abs-2310-02992,
  author     = {Xichen Pan and Li Dong and Shaohan Huang and Zhiliang Peng and Wenhu Chen and Furu Wei},
  title      = {{Kosmos-G}: Generating Images in Context with Multimodal Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2310.02992},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.02992},
  doi        = {10.48550/ARXIV.2310.02992},
  eprinttype = {arXiv},
  eprint     = {2310.02992},
  timestamp  = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-02992.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2310.11453 (CoRR, 2023).
% Title: BitNet is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2310-11453,
  author     = {Hongyu Wang and Shuming Ma and Li Dong and Shaohan Huang and Huaijie Wang and Lingxiao Ma and Fan Yang and Ruiping Wang and Yi Wu and Furu Wei},
  title      = {{BitNet}: Scaling 1-bit Transformers for Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2310.11453},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.11453},
  doi        = {10.48550/ARXIV.2310.11453},
  eprinttype = {arXiv},
  eprint     = {2310.11453},
  timestamp  = {Tue, 16 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-11453.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2310.13332 (CoRR, 2023).
@article{DBLP:journals/corr/abs-2310-13332,
  author     = {Zhaoyang Wang and Shaohan Huang and Yuxuan Liu and Jiahai Wang and Minghui Song and Zihan Zhang and Haizhen Huang and Furu Wei and Weiwei Deng and Feng Sun and Qi Zhang},
  title      = {Democratizing Reasoning Ability: Tailored Learning from Large Language Model},
  journal    = {CoRR},
  volume     = {abs/2310.13332},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.13332},
  doi        = {10.48550/ARXIV.2310.13332},
  eprinttype = {arXiv},
  eprint     = {2310.13332},
  timestamp  = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-13332.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 2022; the pages field carries the article number 5346080.
@article{DBLP:journals/complexity/SuiSHHL22,
  author     = {Xin Sui and Guifen Shi and Guanchong Hou and Shaohan Huang and Yanshuang Li},
  title      = {Impacts of {COVID-19} on the Return and Volatility Nexus among Cryptocurrency Market},
  journal    = {Complex.},
  volume     = {2022},
  pages      = {5346080:1--5346080:15},
  year       = {2022},
  url        = {https://doi.org/10.1155/2022/5346080},
  doi        = {10.1155/2022/5346080},
  timestamp  = {Mon, 26 Sep 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/complexity/SuiSHHL22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 19, number 4 (2022).
@article{DBLP:journals/tnsm/DaiLHFWYQ22,
  author     = {Shaozhi Dai and Zhongzhi Luan and Shaohan Huang and Carol J. Fung and He Wang and Hailong Yang and Depei Qian},
  title      = {{REVAL:} Recommend Which Variables to Log With Pretrained Model and Graph Neural Network},
  journal    = {{IEEE} Trans. Netw. Serv. Manag.},
  volume     = {19},
  number     = {4},
  pages      = {4045--4057},
  year       = {2022},
  url        = {https://doi.org/10.1109/TNSM.2022.3209317},
  doi        = {10.1109/TNSM.2022.3209317},
  timestamp  = {Fri, 10 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/tnsm/DaiLHFWYQ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Findings of ACL 2022 paper. The arXiv entry DBLP:journals/corr/abs-2206-00216
% has the same title and authors.
@inproceedings{DBLP:conf/acl/ChenBHDJJZLW22,
  author     = {Tianyu Chen and Hangbo Bao and Shaohan Huang and Li Dong and Binxing Jiao and Daxin Jiang and Haoyi Zhou and Jianxin Li and Furu Wei},
  editor     = {Smaranda Muresan and Preslav Nakov and Aline Villavicencio},
  title      = {{THE-X:} Privacy-Preserving Transformer Inference with Homomorphic Encryption},
  booktitle  = {Findings of the Association for Computational Linguistics: {ACL} 2022, Dublin, Ireland, May 22-27, 2022},
  pages      = {3510--3520},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://doi.org/10.18653/v1/2022.findings-acl.277},
  doi        = {10.18653/V1/2022.FINDINGS-ACL.277},
  timestamp  = {Thu, 06 Apr 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/ChenBHDJJZLW22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2022 main-conference paper (Volume 1: Long Papers).
@inproceedings{DBLP:conf/acl/ChiH0MZSBSMHW22,
  author     = {Zewen Chi and Shaohan Huang and Li Dong and Shuming Ma and Bo Zheng and Saksham Singhal and Payal Bajaj and Xia Song and Xian{-}Ling Mao and Heyan Huang and Furu Wei},
  editor     = {Smaranda Muresan and Preslav Nakov and Aline Villavicencio},
  title      = {{XLM-E:} Cross-lingual Language Model Pre-training via {ELECTRA}},
  booktitle  = {Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), {ACL} 2022, Dublin, Ireland, May 22-27, 2022},
  pages      = {6170--6182},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://doi.org/10.18653/v1/2022.acl-long.427},
  doi        = {10.18653/V1/2022.ACL-LONG.427},
  timestamp  = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/ChiH0MZSBSMHW22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CNSM 2022 conference paper.
@inproceedings{DBLP:conf/cnsm/HuangLFYL22,
  author     = {Shaohan Huang and Yi Liu and Carol J. Fung and Hailong Yang and Zhongzhi Luan},
  editor     = {Marinos Charalambides and Panagiotis Papadimitriou and Walter Cerroni and Salil S. Kanhere and Lefteris Mamatas},
  title      = {Black-box Attacks to Log-based Anomaly Detection},
  booktitle  = {18th International Conference on Network and Service Management, {CNSM} 2022, Thessaloniki, Greece, October 31 - Nov. 4, 2022},
  pages      = {310--316},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.23919/CNSM55787.2022.9964935},
  doi        = {10.23919/CNSM55787.2022.9964935},
  timestamp  = {Thu, 08 Dec 2022 15:05:27 +0100},
  biburl     = {https://dblp.org/rec/conf/cnsm/HuangLFYL22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Findings of EMNLP 2022 paper. The arXiv entry DBLP:journals/corr/abs-2210-07022
% has the same title and authors.
@inproceedings{DBLP:conf/emnlp/YangHMY0ZGLW22,
  author     = {Jian Yang and Shaohan Huang and Shuming Ma and Yuwei Yin and Li Dong and Dongdong Zhang and Hongcheng Guo and Zhoujun Li and Furu Wei},
  editor     = {Yoav Goldberg and Zornitsa Kozareva and Yue Zhang},
  title      = {{CROP:} Zero-shot Cross-lingual Named Entity Recognition with Multilingual Labeled Sequence Translation},
  booktitle  = {Findings of the Association for Computational Linguistics: {EMNLP} 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022},
  pages      = {486--496},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://doi.org/10.18653/v1/2022.findings-emnlp.34},
  doi        = {10.18653/V1/2022.FINDINGS-EMNLP.34},
  timestamp  = {Tue, 07 May 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/YangHMY0ZGLW22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Findings of EMNLP 2022 paper.
@inproceedings{DBLP:conf/emnlp/ChengHLZ0WDZ22,
  author     = {Daixuan Cheng and Shaohan Huang and Jianfeng Liu and Yuefeng Zhan and Hao Sun and Furu Wei and Denvy Deng and Qi Zhang},
  editor     = {Yoav Goldberg and Zornitsa Kozareva and Yue Zhang},
  title      = {Snapshot-Guided Domain Adaptation for {ELECTRA}},
  booktitle  = {Findings of the Association for Computational Linguistics: {EMNLP} 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022},
  pages      = {2226--2232},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://doi.org/10.18653/v1/2022.findings-emnlp.163},
  doi        = {10.18653/V1/2022.FINDINGS-EMNLP.163},
  timestamp  = {Fri, 23 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/ChengHLZ0WDZ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2022 main-conference paper. The arXiv entry DBLP:journals/corr/abs-2201-04337
% has the same title.
% Title: PromptBERT is brace-protected so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/emnlp/JiangJHZWZWHDZ22,
  author     = {Ting Jiang and Jian Jiao and Shaohan Huang and Zihan Zhang and Deqing Wang and Fuzhen Zhuang and Furu Wei and Haizhen Huang and Denvy Deng and Qi Zhang},
  editor     = {Yoav Goldberg and Zornitsa Kozareva and Yue Zhang},
  title      = {{PromptBERT}: Improving {BERT} Sentence Embeddings with Prompts},
  booktitle  = {Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2022, Abu Dhabi, United Arab Emirates, December 7-11, 2022},
  pages      = {8826--8837},
  publisher  = {Association for Computational Linguistics},
  year       = {2022},
  url        = {https://doi.org/10.18653/v1/2022.emnlp-main.603},
  doi        = {10.18653/V1/2022.EMNLP-MAIN.603},
  timestamp  = {Tue, 16 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/JiangJHZWZWHDZ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2022 conference paper. The arXiv entry DBLP:journals/corr/abs-2305-19602
% has the same authors and the same title up to capitalisation.
@inproceedings{DBLP:conf/icassp/ChenXZHZL22,
  author     = {Tianyu Chen and Yuan Xie and Shuai Zhang and Shaohan Huang and Haoyi Zhou and Jianxin Li},
  title      = {Learning Music Sequence Representation From Text Supervision},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2022, Virtual and Singapore, 23-27 May 2022},
  pages      = {4583--4587},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/ICASSP43922.2022.9746131},
  doi        = {10.1109/ICASSP43922.2022.9746131},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/ChenXZHZL22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 conference paper; the record has a url but no doi or pages field.
% The arXiv entry DBLP:journals/corr/abs-2204-09179 has the same title.
@inproceedings{DBLP:conf/nips/Chi0HDMPSBSMHW22,
  author     = {Zewen Chi and Li Dong and Shaohan Huang and Damai Dai and Shuming Ma and Barun Patra and Saksham Singhal and Payal Bajaj and Xia Song and Xian{-}Ling Mao and Heyan Huang and Furu Wei},
  editor     = {Sanmi Koyejo and S. Mohamed and A. Agarwal and Danielle Belgrave and K. Cho and A. Oh},
  title      = {On the Representation Collapse of Sparse Mixture of Experts},
  booktitle  = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year       = {2022},
  url        = {http://papers.nips.cc/paper\_files/paper/2022/hash/df4f371f1f89ec8ba5014b3310578048-Abstract-Conference.html},
  timestamp  = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/Chi0HDMPSBSMHW22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NLPCC 2022 conference paper (Lecture Notes in Computer Science, volume 13551).
% The arXiv entry DBLP:journals/corr/abs-2201-05742 has the same title.
@inproceedings{DBLP:conf/nlpcc/YaoHDWCZ22,
  author     = {Yunzhi Yao and Shaohan Huang and Li Dong and Furu Wei and Huajun Chen and Ningyu Zhang},
  editor     = {Wei Lu and Shujian Huang and Yu Hong and Xiabing Zhou},
  title      = {Kformer: Knowledge Injection in Transformer Feed-Forward Layers},
  booktitle  = {Natural Language Processing and Chinese Computing - 11th {CCF} International Conference, {NLPCC} 2022, Guilin, China, September 24-25, 2022, Proceedings, Part {I}},
  series     = {Lecture Notes in Computer Science},
  volume     = {13551},
  pages      = {131--143},
  publisher  = {Springer},
  year       = {2022},
  url        = {https://doi.org/10.1007/978-3-031-17120-8\_11},
  doi        = {10.1007/978-3-031-17120-8\_11},
  timestamp  = {Tue, 27 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nlpcc/YaoHDWCZ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NOMS 2022 conference paper.
@inproceedings{DBLP:conf/noms/QiLHWFYQ22,
  author     = {Jiaxing Qi and Zhongzhi Luan and Shaohan Huang and Yukun Wang and Carol J. Fung and Hailong Yang and Depei Qian},
  title      = {Adanomaly: Adaptive Anomaly Detection for System Logs with Adversarial Learning},
  booktitle  = {2022 {IEEE/IFIP} Network Operations and Management Symposium, {NOMS} 2022, Budapest, Hungary, April 25-29, 2022},
  pages      = {1--5},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/NOMS54207.2022.9789917},
  doi        = {10.1109/NOMS54207.2022.9789917},
  timestamp  = {Wed, 15 Jun 2022 16:45:18 +0200},
  biburl     = {https://dblp.org/rec/conf/noms/QiLHWFYQ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2201.04337 (CoRR, 2022); the record has no doi field.
% The EMNLP 2022 entry DBLP:conf/emnlp/JiangJHZWZWHDZ22 has the same title.
% Title: PromptBERT is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2201-04337,
  author     = {Ting Jiang and Shaohan Huang and Zihan Zhang and Deqing Wang and Fuzhen Zhuang and Furu Wei and Haizhen Huang and Liangjie Zhang and Qi Zhang},
  title      = {{PromptBERT}: Improving {BERT} Sentence Embeddings with Prompts},
  journal    = {CoRR},
  volume     = {abs/2201.04337},
  year       = {2022},
  url        = {https://arxiv.org/abs/2201.04337},
  eprinttype = {arXiv},
  eprint     = {2201.04337},
  timestamp  = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2201-04337.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2201.05742 (CoRR, 2022); the record has no doi field.
% The NLPCC 2022 entry DBLP:conf/nlpcc/YaoHDWCZ22 has the same title.
@article{DBLP:journals/corr/abs-2201-05742,
  author     = {Yunzhi Yao and Shaohan Huang and Ningyu Zhang and Li Dong and Furu Wei and Huajun Chen},
  title      = {Kformer: Knowledge Injection in Transformer Feed-Forward Layers},
  journal    = {CoRR},
  volume     = {abs/2201.05742},
  year       = {2022},
  url        = {https://arxiv.org/abs/2201.05742},
  eprinttype = {arXiv},
  eprint     = {2201.05742},
  timestamp  = {Tue, 27 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2201-05742.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2203.00555 (CoRR, 2022). The journal entry
% DBLP:journals/pami/WangMDHZW24 has the same authors and writes the number as 1,000.
% Title: stray space removed from the number (was written 1, 000);
% DeepNet is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2203-00555,
  author     = {Hongyu Wang and Shuming Ma and Li Dong and Shaohan Huang and Dongdong Zhang and Furu Wei},
  title      = {{DeepNet}: Scaling Transformers to 1,000 Layers},
  journal    = {CoRR},
  volume     = {abs/2203.00555},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2203.00555},
  doi        = {10.48550/ARXIV.2203.00555},
  eprinttype = {arXiv},
  eprint     = {2203.00555},
  timestamp  = {Tue, 20 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-00555.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2204.09179 (CoRR, 2022).
% The NeurIPS 2022 entry DBLP:conf/nips/Chi0HDMPSBSMHW22 has the same title.
@article{DBLP:journals/corr/abs-2204-09179,
  author     = {Zewen Chi and Li Dong and Shaohan Huang and Damai Dai and Shuming Ma and Barun Patra and Saksham Singhal and Payal Bajaj and Xia Song and Furu Wei},
  title      = {On the Representation Collapse of Sparse Mixture of Experts},
  journal    = {CoRR},
  volume     = {abs/2204.09179},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2204.09179},
  doi        = {10.48550/ARXIV.2204.09179},
  eprinttype = {arXiv},
  eprint     = {2204.09179},
  timestamp  = {Mon, 25 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-09179.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.00216 (CoRR, 2022).
% The Findings of ACL 2022 entry DBLP:conf/acl/ChenBHDJJZLW22 has the same title and authors.
@article{DBLP:journals/corr/abs-2206-00216,
  author     = {Tianyu Chen and Hangbo Bao and Shaohan Huang and Li Dong and Binxing Jiao and Daxin Jiang and Haoyi Zhou and Jianxin Li and Furu Wei},
  title      = {{THE-X:} Privacy-Preserving Transformer Inference with Homomorphic Encryption},
  journal    = {CoRR},
  volume     = {abs/2206.00216},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.00216},
  doi        = {10.48550/ARXIV.2206.00216},
  eprinttype = {arXiv},
  eprint     = {2206.00216},
  timestamp  = {Mon, 01 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-00216.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.00277 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2206-00277,
  author     = {Tianyu Chen and Shaohan Huang and Yuan Xie and Binxing Jiao and Daxin Jiang and Haoyi Zhou and Jianxin Li and Furu Wei},
  title      = {Task-Specific Expert Pruning for Sparse Mixture-of-Experts},
  journal    = {CoRR},
  volume     = {abs/2206.00277},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.00277},
  doi        = {10.48550/ARXIV.2206.00277},
  eprinttype = {arXiv},
  eprint     = {2206.00277},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-00277.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.06336 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2206-06336,
  author     = {Yaru Hao and Haoyu Song and Li Dong and Shaohan Huang and Zewen Chi and Wenhui Wang and Shuming Ma and Furu Wei},
  title      = {Language Models are General-Purpose Interfaces},
  journal    = {CoRR},
  volume     = {abs/2206.06336},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.06336},
  doi        = {10.48550/ARXIV.2206.06336},
  eprinttype = {arXiv},
  eprint     = {2206.06336},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-06336.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2207.09094 (CoRR, 2022).
% Title: MoEC is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2207-09094,
  author     = {Yuan Xie and Shaohan Huang and Tianyu Chen and Furu Wei},
  title      = {{MoEC}: Mixture of Expert Clusters},
  journal    = {CoRR},
  volume     = {abs/2207.09094},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2207.09094},
  doi        = {10.48550/ARXIV.2207.09094},
  eprinttype = {arXiv},
  eprint     = {2207.09094},
  timestamp  = {Mon, 25 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2207-09094.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.06423 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2210-06423,
  author     = {Hongyu Wang and Shuming Ma and Shaohan Huang and Li Dong and Wenhui Wang and Zhiliang Peng and Yu Wu and Payal Bajaj and Saksham Singhal and Alon Benhaim and Barun Patra and Zhun Liu and Vishrav Chaudhary and Xia Song and Furu Wei},
  title      = {Foundation Transformers},
  journal    = {CoRR},
  volume     = {abs/2210.06423},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.06423},
  doi        = {10.48550/ARXIV.2210.06423},
  eprinttype = {arXiv},
  eprint     = {2210.06423},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-06423.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.07022 (CoRR, 2022).
% The Findings of EMNLP 2022 entry DBLP:conf/emnlp/YangHMY0ZGLW22 has the same title and authors.
@article{DBLP:journals/corr/abs-2210-07022,
  author     = {Jian Yang and Shaohan Huang and Shuming Ma and Yuwei Yin and Li Dong and Dongdong Zhang and Hongcheng Guo and Zhoujun Li and Furu Wei},
  title      = {{CROP:} Zero-shot Cross-lingual Named Entity Recognition with Multilingual Labeled Sequence Translation},
  journal    = {CoRR},
  volume     = {abs/2210.07022},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.07022},
  doi        = {10.48550/ARXIV.2210.07022},
  eprinttype = {arXiv},
  eprint     = {2210.07022},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-07022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.14867 (CoRR, 2022).
% Title: the proper noun English is brace-protected so sentence-casing styles keep its capital.
@article{DBLP:journals/corr/abs-2210-14867,
  author     = {Barun Patra and Saksham Singhal and Shaohan Huang and Zewen Chi and Li Dong and Furu Wei and Vishrav Chaudhary and Xia Song},
  title      = {Beyond {English}-Centric Bitexts for Better Multilingual Language Representation Learning},
  journal    = {CoRR},
  volume     = {abs/2210.14867},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.14867},
  doi        = {10.48550/ARXIV.2210.14867},
  eprinttype = {arXiv},
  eprint     = {2210.14867},
  timestamp  = {Wed, 02 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-14867.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.13184 (CoRR, 2022).
% Title: TorchScale is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2211-13184,
  author     = {Shuming Ma and Hongyu Wang and Shaohan Huang and Wenhui Wang and Zewen Chi and Li Dong and Alon Benhaim and Barun Patra and Vishrav Chaudhary and Xia Song and Furu Wei},
  title      = {{TorchScale}: Transformers at Scale},
  journal    = {CoRR},
  volume     = {abs/2211.13184},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.13184},
  doi        = {10.48550/ARXIV.2211.13184},
  eprinttype = {arXiv},
  eprint     = {2211.13184},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-13184.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2212.10218 (CoRR, 2022).
% Title: GanLM is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2212-10218,
  author     = {Jian Yang and Shuming Ma and Li Dong and Shaohan Huang and Haoyang Huang and Yuwei Yin and Dongdong Zhang and Liqun Yang and Zhoujun Li and Furu Wei},
  title      = {{GanLM}: Encoder-Decoder Pre-training with an Auxiliary Discriminator},
  journal    = {CoRR},
  volume     = {abs/2212.10218},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.10218},
  doi        = {10.48550/ARXIV.2212.10218},
  eprinttype = {arXiv},
  eprint     = {2212.10218},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-10218.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2212.10554 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2212-10554,
  author     = {Yutao Sun and Li Dong and Barun Patra and Shuming Ma and Shaohan Huang and Alon Benhaim and Vishrav Chaudhary and Xia Song and Furu Wei},
  title      = {A Length-Extrapolatable Transformer},
  journal    = {CoRR},
  volume     = {abs/2212.10554},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.10554},
  doi        = {10.48550/ARXIV.2212.10554},
  eprinttype = {arXiv},
  eprint     = {2212.10554},
  timestamp  = {Wed, 04 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-10554.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Findings of ACL/IJCNLP 2021 paper.
@inproceedings{DBLP:conf/acl/YaoHWDW21,
  author     = {Yunzhi Yao and Shaohan Huang and Wenhui Wang and Li Dong and Furu Wei},
  editor     = {Chengqing Zong and Fei Xia and Wenjie Li and Roberto Navigli},
  title      = {Adapt-and-Distill: Developing Small, Fast and Effective Pretrained Language Models for Domains},
  booktitle  = {Findings of the Association for Computational Linguistics: {ACL/IJCNLP} 2021, Online Event, August 1-6, 2021},
  series     = {Findings of {ACL}},
  volume     = {{ACL/IJCNLP} 2021},
  pages      = {460--470},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.findings-acl.40},
  doi        = {10.18653/V1/2021.FINDINGS-ACL.40},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/YaoHWDW21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Findings of ACL/IJCNLP 2021 paper.
% Title: MiniLMv2 is brace-protected so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/acl/WangBHDW21,
  author     = {Wenhui Wang and Hangbo Bao and Shaohan Huang and Li Dong and Furu Wei},
  editor     = {Chengqing Zong and Fei Xia and Wenjie Li and Roberto Navigli},
  title      = {{MiniLMv2}: Multi-Head Self-Attention Relation Distillation for Compressing Pretrained Transformers},
  booktitle  = {Findings of the Association for Computational Linguistics: {ACL/IJCNLP} 2021, Online Event, August 1-6, 2021},
  series     = {Findings of {ACL}},
  volume     = {{ACL/IJCNLP} 2021},
  pages      = {2140--2151},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.findings-acl.188},
  doi        = {10.18653/V1/2021.FINDINGS-ACL.188},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/WangBHDW21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ACL/IJCNLP 2021 main-conference paper (Volume 1: Long Papers).
% The citation key ends in 20 although the year field is 2021; the key is kept unchanged.
@inproceedings{DBLP:conf/acl/Zheng0HWCSC0SW20,
  author     = {Bo Zheng and Li Dong and Shaohan Huang and Wenhui Wang and Zewen Chi and Saksham Singhal and Wanxiang Che and Ting Liu and Xia Song and Furu Wei},
  editor     = {Chengqing Zong and Fei Xia and Wenjie Li and Roberto Navigli},
  title      = {Consistency Regularization for Cross-Lingual Fine-Tuning},
  booktitle  = {Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing, {ACL/IJCNLP} 2021, (Volume 1: Long Papers), Virtual Event, August 1-6, 2021},
  pages      = {3403--3417},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.acl-long.264},
  doi        = {10.18653/V1/2021.ACL-LONG.264},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/Zheng0HWCSC0SW20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ACL/IJCNLP 2021 main-conference paper (Volume 1: Long Papers).
% The citation key ends in 20 although the year field is 2021; the key is kept unchanged.
@inproceedings{DBLP:conf/acl/Chi0ZHMHW20,
  author     = {Zewen Chi and Li Dong and Bo Zheng and Shaohan Huang and Xian{-}Ling Mao and Heyan Huang and Furu Wei},
  editor     = {Chengqing Zong and Fei Xia and Wenjie Li and Roberto Navigli},
  title      = {Improving Pretrained Cross-Lingual Language Models via Self-Labeled Word Alignment},
  booktitle  = {Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing, {ACL/IJCNLP} 2021, (Volume 1: Long Papers), Virtual Event, August 1-6, 2021},
  pages      = {3418--3430},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.acl-long.265},
  doi        = {10.18653/V1/2021.ACL-LONG.265},
  timestamp  = {Thu, 08 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/Chi0ZHMHW20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CCGrid 2021 conference paper.
% Title: PriPro is brace-protected so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/ccgrid/GaoYHDLLLQ21,
  author     = {Ruiyuan Gao and Hailong Yang and Shaohan Huang and Ming Dun and Mingzhen Li and Zerong Luan and Zhongzhi Luan and Depei Qian},
  editor     = {Laurent Lef{\`{e}}vre and Stacy Patterson and Young Choon Lee and Haiying Shen and Shashikant Ilager and Mohammad Goudarzi and Adel Nadjaran Toosi and Rajkumar Buyya},
  title      = {{PriPro}: Towards Effective Privacy Protection on Edge-Cloud System running {DNN} Inference},
  booktitle  = {21st {IEEE/ACM} International Symposium on Cluster, Cloud and Internet Computing, CCGrid 2021, Melbourne, Australia, May 10-13, 2021},
  pages      = {334--343},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/CCGrid51090.2021.00043},
  doi        = {10.1109/CCGRID51090.2021.00043},
  timestamp  = {Thu, 02 Sep 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ccgrid/GaoYHDLLLQ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2021 main-conference paper.
% Title: mT6 is brace-protected so sentence-casing styles keep the capital T.
@inproceedings{DBLP:conf/emnlp/ChiDMHSMHSW21,
  author     = {Zewen Chi and Li Dong and Shuming Ma and Shaohan Huang and Saksham Singhal and Xian{-}Ling Mao and Heyan Huang and Xia Song and Furu Wei},
  editor     = {Marie{-}Francine Moens and Xuanjing Huang and Lucia Specia and Scott Wen{-}tau Yih},
  title      = {{mT6}: Multilingual Pretrained Text-to-Text Transformer with Translation Pairs},
  booktitle  = {Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2021, Virtual Event / Punta Cana, Dominican Republic, 7-11 November, 2021},
  pages      = {1671--1683},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.emnlp-main.125},
  doi        = {10.18653/V1/2021.EMNLP-MAIN.125},
  timestamp  = {Fri, 16 Feb 2024 08:27:36 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/ChiDMHSMHSW21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ZhengDHSCLSW21,
  author     = {Bo Zheng and Li Dong and Shaohan Huang and Saksham Singhal and Wanxiang Che and Ting Liu and Xia Song and Furu Wei},
  editor     = {Marie{-}Francine Moens and Xuanjing Huang and Lucia Specia and Scott Wen{-}tau Yih},
  title      = {Allocating Large Vocabulary Capacity for Cross-Lingual Language Model Pre-Training},
  booktitle  = {Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2021, Virtual Event / Punta Cana, Dominican Republic, 7-11 November, 2021},
  pages      = {3203--3215},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.emnlp-main.257},
  doi        = {10.18653/V1/2021.EMNLP-MAIN.257},
  timestamp  = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/ZhengDHSCLSW21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% The proper noun "Microsoft" is brace-protected so sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/wmt/YangMH00HMSHSW21,
  author     = {Jian Yang and Shuming Ma and Haoyang Huang and Dongdong Zhang and Li Dong and Shaohan Huang and Alexandre Muzio and Saksham Singhal and Hany Hassan and Xia Song and Furu Wei},
  editor     = {Lo{\"{\i}}c Barrault and Ondrej Bojar and Fethi Bougares and Rajen Chatterjee and Marta R. Costa{-}juss{\`{a}} and Christian Federmann and Mark Fishel and Alexander Fraser and Markus Freitag and Yvette Graham and Roman Grundkiewicz and Paco Guzman and Barry Haddow and Matthias Huck and Antonio Jimeno{-}Yepes and Philipp Koehn and Tom Kocmi and Andr{\'{e}} Martins and Makoto Morishita and Christof Monz},
  title      = {Multilingual Machine Translation Systems from {Microsoft} for {WMT21} Shared Task},
  booktitle  = {Proceedings of the Sixth Conference on Machine Translation, WMT@EMNLP 2021, Online Event, November 10-11, 2021},
  pages      = {446--455},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://aclanthology.org/2021.wmt-1.54},
  timestamp  = {Wed, 07 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/wmt/YangMH00HMSHSW21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "mT6" is brace-protected so sentence-casing styles do not turn it into "mt6".
@article{DBLP:journals/corr/abs-2104-08692,
  author     = {Zewen Chi and Li Dong and Shuming Ma and Shaohan Huang and Xian{-}Ling Mao and Heyan Huang and Furu Wei},
  title      = {{mT6}: Multilingual Pretrained Text-to-Text Transformer with Translation Pairs},
  journal    = {CoRR},
  volume     = {abs/2104.08692},
  year       = {2021},
  url        = {https://arxiv.org/abs/2104.08692},
  eprinttype = {arXiv},
  eprint     = {2104.08692},
  timestamp  = {Mon, 26 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-08692.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-06381,
  author     = {Zewen Chi and Li Dong and Bo Zheng and Shaohan Huang and Xian{-}Ling Mao and Heyan Huang and Furu Wei},
  title      = {Improving Pretrained Cross-Lingual Language Models via Self-Labeled Word Alignment},
  journal    = {CoRR},
  volume     = {abs/2106.06381},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.06381},
  eprinttype = {arXiv},
  eprint     = {2106.06381},
  timestamp  = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-06381.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-08226,
  author     = {Bo Zheng and Li Dong and Shaohan Huang and Wenhui Wang and Zewen Chi and Saksham Singhal and Wanxiang Che and Ting Liu and Xia Song and Furu Wei},
  title      = {Consistency Regularization for Cross-Lingual Fine-Tuning},
  journal    = {CoRR},
  volume     = {abs/2106.08226},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.08226},
  eprinttype = {arXiv},
  eprint     = {2106.08226},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-08226.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-13474,
  author     = {Yunzhi Yao and Shaohan Huang and Wenhui Wang and Li Dong and Furu Wei},
  title      = {Adapt-and-Distill: Developing Small, Fast and Effective Pretrained Language Models for Domains},
  journal    = {CoRR},
  volume     = {abs/2106.13474},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.13474},
  eprinttype = {arXiv},
  eprint     = {2106.13474},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-13474.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "DeltaLM" is brace-protected so sentence-casing styles keep its capitalization.
@article{DBLP:journals/corr/abs-2106-13736,
  author     = {Shuming Ma and Li Dong and Shaohan Huang and Dongdong Zhang and Alexandre Muzio and Saksham Singhal and Hany Hassan Awadalla and Xia Song and Furu Wei},
  title      = {{DeltaLM}: Encoder-Decoder Pre-training for Language Generation and Translation by Augmenting Pretrained Multilingual Encoders},
  journal    = {CoRR},
  volume     = {abs/2106.13736},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.13736},
  eprinttype = {arXiv},
  eprint     = {2106.13736},
  timestamp  = {Wed, 30 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-13736.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-16138,
  author     = {Zewen Chi and Shaohan Huang and Li Dong and Shuming Ma and Saksham Singhal and Payal Bajaj and Xia Song and Furu Wei},
  title      = {{XLM-E:} Cross-lingual Language Model Pre-training via {ELECTRA}},
  journal    = {CoRR},
  volume     = {abs/2106.16138},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.16138},
  eprinttype = {arXiv},
  eprint     = {2106.16138},
  timestamp  = {Mon, 05 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-16138.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2109-07306,
  author     = {Bo Zheng and Li Dong and Shaohan Huang and Saksham Singhal and Wanxiang Che and Ting Liu and Xia Song and Furu Wei},
  title      = {Allocating Large Vocabulary Capacity for Cross-lingual Language Model Pre-training},
  journal    = {CoRR},
  volume     = {abs/2109.07306},
  year       = {2021},
  url        = {https://arxiv.org/abs/2109.07306},
  eprinttype = {arXiv},
  eprint     = {2109.07306},
  timestamp  = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2109-07306.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2110-11115,
  author     = {Ting Jiang and Shaohan Huang and Zihan Zhang and Deqing Wang and Fuzhen Zhuang and Furu Wei and Haizhen Huang and Liangjie Zhang and Qi Zhang},
  title      = {Improving Non-autoregressive Generation with Mixup Training},
  journal    = {CoRR},
  volume     = {abs/2110.11115},
  year       = {2021},
  url        = {https://arxiv.org/abs/2110.11115},
  eprinttype = {arXiv},
  eprint     = {2110.11115},
  timestamp  = {Mon, 17 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-11115.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% The proper noun "Microsoft" is brace-protected so sentence-casing styles keep its capital.
@article{DBLP:journals/corr/abs-2111-02086,
  author     = {Jian Yang and Shuming Ma and Haoyang Huang and Dongdong Zhang and Li Dong and Shaohan Huang and Alexandre Muzio and Saksham Singhal and Hany Hassan Awadalla and Xia Song and Furu Wei},
  title      = {Multilingual Machine Translation Systems from {Microsoft} for {WMT21} Shared Task},
  journal    = {CoRR},
  volume     = {abs/2111.02086},
  year       = {2021},
  url        = {https://arxiv.org/abs/2111.02086},
  eprinttype = {arXiv},
  eprint     = {2111.02086},
  timestamp  = {Wed, 07 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2111-02086.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/ZhouYWHZZ20,
  author     = {Qingyu Zhou and Nan Yang and Furu Wei and Shaohan Huang and Ming Zhou and Tiejun Zhao},
  title      = {A Joint Sentence Scoring and Selection Framework for Neural Extractive Document Summarization},
  journal    = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume     = {28},
  pages      = {671--681},
  year       = {2020},
  url        = {https://doi.org/10.1109/TASLP.2020.2964427},
  doi        = {10.1109/TASLP.2020.2964427},
  timestamp  = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/taslp/ZhouYWHZZ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "HitAnomaly" is brace-protected so sentence-casing styles keep its capitalization.
@article{DBLP:journals/tnsm/HuangLFHZYL20,
  author     = {Shaohan Huang and Yi Liu and Carol J. Fung and Rong He and Yining Zhao and Hailong Yang and Zhongzhi Luan},
  title      = {{HitAnomaly}: Hierarchical Transformers for Anomaly Detection in System Log},
  journal    = {{IEEE} Trans. Netw. Serv. Manag.},
  volume     = {17},
  number     = {4},
  pages      = {2064--2076},
  year       = {2020},
  url        = {https://doi.org/10.1109/TNSM.2020.3034647},
  doi        = {10.1109/TNSM.2020.3034647},
  timestamp  = {Wed, 15 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tnsm/HuangLFHZYL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cnsm/HuangLFHZYL20,
  author     = {Shaohan Huang and Yi Liu and Carol J. Fung and Rong He and Yining Zhao and Hailong Yang and Zhongzhi Luan},
  editor     = {Nur Zincir{-}Heywood and Mehmet Ulema and M{\"{u}}ge Sayit and Stuart Clayman and Myung{-}Sup Kim and Cihat Cetinkaya},
  title      = {Transfer Log-based Anomaly Detection with Pseudo Labels},
  booktitle  = {16th International Conference on Network and Service Management, {CNSM} 2020, Izmir, Turkey, November 2-6, 2020},
  pages      = {1--5},
  publisher  = {{IEEE}},
  year       = {2020},
  url        = {https://doi.org/10.23919/CNSM50824.2020.9269069},
  doi        = {10.23919/CNSM50824.2020.9269069},
  timestamp  = {Fri, 08 Dec 2023 07:53:07 +0100},
  biburl     = {https://dblp.org/rec/conf/cnsm/HuangLFHZYL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "DocBank" is brace-protected so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/coling/LiXCHWLZ20,
  author     = {Minghao Li and Yiheng Xu and Lei Cui and Shaohan Huang and Furu Wei and Zhoujun Li and Ming Zhou},
  editor     = {Donia Scott and N{\'{u}}ria Bel and Chengqing Zong},
  title      = {{DocBank}: {A} Benchmark Dataset for Document Layout Analysis},
  booktitle  = {Proceedings of the 28th International Conference on Computational Linguistics, {COLING} 2020, Barcelona, Spain (Online), December 8-13, 2020},
  pages      = {949--960},
  publisher  = {International Committee on Computational Linguistics},
  year       = {2020},
  url        = {https://doi.org/10.18653/v1/2020.coling-main.82},
  doi        = {10.18653/V1/2020.COLING-MAIN.82},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/coling/LiXCHWLZ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/coling/HuangWCZZ20,
  author     = {Shaohan Huang and Furu Wei and Lei Cui and Xingxing Zhang and Ming Zhou},
  editor     = {Donia Scott and N{\'{u}}ria Bel and Chengqing Zong},
  title      = {Unsupervised Fine-tuning for Text Clustering},
  booktitle  = {Proceedings of the 28th International Conference on Computational Linguistics, {COLING} 2020, Barcelona, Spain (Online), December 8-13, 2020},
  pages      = {5530--5534},
  publisher  = {International Committee on Computational Linguistics},
  year       = {2020},
  url        = {https://doi.org/10.18653/v1/2020.coling-main.482},
  doi        = {10.18653/V1/2020.COLING-MAIN.482},
  timestamp  = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/coling/HuangWCZZ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/JiKHWZH20,
  author     = {Haozhe Ji and Pei Ke and Shaohan Huang and Furu Wei and Xiaoyan Zhu and Minlie Huang},
  editor     = {Bonnie Webber and Trevor Cohn and Yulan He and Yang Liu},
  title      = {Language Generation with Multi-Hop Reasoning on Commonsense Knowledge Graph},
  booktitle  = {Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages      = {725--736},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  url        = {https://doi.org/10.18653/v1/2020.emnlp-main.54},
  doi        = {10.18653/V1/2020.EMNLP-MAIN.54},
  timestamp  = {Tue, 20 Aug 2024 07:54:43 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/JiKHWZH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icoin/HuangLFAHZYL20,
  author     = {Shaohan Huang and Yi Liu and Carol J. Fung and Wanhe An and Rong He and Yining Zhao and Hailong Yang and Zhongzhi Luan},
  title      = {A Gated Few-shot Learning Model For Anomaly Detection},
  booktitle  = {2020 International Conference on Information Networking, {ICOIN} 2020, Barcelona, Spain, January 7-10, 2020},
  pages      = {505--509},
  publisher  = {{IEEE}},
  year       = {2020},
  url        = {https://doi.org/10.1109/ICOIN48656.2020.9016599},
  doi        = {10.1109/ICOIN48656.2020.9016599},
  timestamp  = {Thu, 13 Jan 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icoin/HuangLFAHZYL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcnlp/JiKHWH20,
  author     = {Haozhe Ji and Pei Ke and Shaohan Huang and Furu Wei and Minlie Huang},
  editor     = {Kam{-}Fai Wong and Kevin Knight and Hua Wu},
  title      = {Generating Commonsense Explanation by Extracting Bridge Concepts from Reasoning Paths},
  booktitle  = {Proceedings of the 1st Conference of the Asia-Pacific Chapter of the Association for Computational Linguistics and the 10th International Joint Conference on Natural Language Processing, {AACL/IJCNLP} 2020, Suzhou, China, December 4-7, 2020},
  pages      = {248--257},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  url        = {https://aclanthology.org/2020.aacl-main.28/},
  timestamp  = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcnlp/JiKHWH20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "LayoutLM" is brace-protected so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/kdd/XuL0HW020,
  author     = {Yiheng Xu and Minghao Li and Lei Cui and Shaohan Huang and Furu Wei and Ming Zhou},
  editor     = {Rajesh Gupta and Yan Liu and Jiliang Tang and B. Aditya Prakash},
  title      = {{LayoutLM}: Pre-training of Text and Layout for Document Image Understanding},
  booktitle  = {{KDD} '20: The 26th {ACM} {SIGKDD} Conference on Knowledge Discovery and Data Mining, Virtual Event, CA, USA, August 23-27, 2020},
  pages      = {1192--1200},
  publisher  = {{ACM}},
  year       = {2020},
  url        = {https://doi.org/10.1145/3394486.3403172},
  doi        = {10.1145/3394486.3403172},
  timestamp  = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/kdd/XuL0HW020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "TableBank" is brace-protected so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/lrec/LiCHWZL20,
  author     = {Minghao Li and Lei Cui and Shaohan Huang and Furu Wei and Ming Zhou and Zhoujun Li},
  editor     = {Nicoletta Calzolari and Fr{\'{e}}d{\'{e}}ric B{\'{e}}chet and Philippe Blache and Khalid Choukri and Christopher Cieri and Thierry Declerck and Sara Goggi and Hitoshi Isahara and Bente Maegaard and Joseph Mariani and H{\'{e}}l{\`{e}}ne Mazo and Asunci{\'{o}}n Moreno and Jan Odijk and Stelios Piperidis},
  title      = {{TableBank}: Table Benchmark for Image-based Table Detection and Recognition},
  booktitle  = {Proceedings of The 12th Language Resources and Evaluation Conference, {LREC} 2020, Marseille, France, May 11-16, 2020},
  pages      = {1918--1925},
  publisher  = {European Language Resources Association},
  year       = {2020},
  url        = {https://aclanthology.org/2020.lrec-1.236/},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/lrec/LiCHWZL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/noms/HuangLFHZYL20,
  author     = {Shaohan Huang and Yi Liu and Carol J. Fung and Rong He and Yining Zhao and Hailong Yang and Zhongzhi Luan},
  title      = {Paddy: An Event Log Parsing Approach using Dynamic Dictionary},
  booktitle  = {{NOMS} 2020 - {IEEE/IFIP} Network Operations and Management Symposium, Budapest, Hungary, April 20-24, 2020},
  pages      = {1--8},
  publisher  = {{IEEE}},
  year       = {2020},
  url        = {https://doi.org/10.1109/NOMS47738.2020.9110435},
  doi        = {10.1109/NOMS47738.2020.9110435},
  timestamp  = {Wed, 15 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/noms/HuangLFHZYL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "DocBank" is brace-protected so sentence-casing styles keep its capitalization.
@article{DBLP:journals/corr/abs-2006-01038,
  author     = {Minghao Li and Yiheng Xu and Lei Cui and Shaohan Huang and Furu Wei and Zhoujun Li and Ming Zhou},
  title      = {{DocBank}: {A} Benchmark Dataset for Document Layout Analysis},
  journal    = {CoRR},
  volume     = {abs/2006.01038},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.01038},
  eprinttype = {arXiv},
  eprint     = {2006.01038},
  timestamp  = {Thu, 16 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-01038.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2009-11692,
  author     = {Haozhe Ji and Pei Ke and Shaohan Huang and Furu Wei and Xiaoyan Zhu and Minlie Huang},
  title      = {Language Generation with Multi-Hop Reasoning on Commonsense Knowledge Graph},
  journal    = {CoRR},
  volume     = {abs/2009.11692},
  year       = {2020},
  url        = {https://arxiv.org/abs/2009.11692},
  eprinttype = {arXiv},
  eprint     = {2009.11692},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2009-11692.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2009-11753,
  author     = {Haozhe Ji and Pei Ke and Shaohan Huang and Furu Wei and Minlie Huang},
  title      = {Generating Commonsense Explanation by Extracting Bridge Concepts from Reasoning Paths},
  journal    = {CoRR},
  volume     = {abs/2009.11753},
  year       = {2020},
  url        = {https://arxiv.org/abs/2009.11753},
  eprinttype = {arXiv},
  eprint     = {2009.11753},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2009-11753.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "MiniLMv2" is brace-protected so sentence-casing styles keep its capitalization.
@article{DBLP:journals/corr/abs-2012-15828,
  author     = {Wenhui Wang and Hangbo Bao and Shaohan Huang and Li Dong and Furu Wei},
  title      = {{MiniLMv2}: Multi-Head Self-Attention Relation Distillation for Compressing Pretrained Transformers},
  journal    = {CoRR},
  volume     = {abs/2012.15828},
  year       = {2020},
  url        = {https://arxiv.org/abs/2012.15828},
  eprinttype = {arXiv},
  eprint     = {2012.15828},
  timestamp  = {Fri, 19 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-15828.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/Huang0WL19,
  author     = {Shaohan Huang and Yu Wu and Furu Wei and Zhongzhi Luan},
  title      = {Dictionary-Guided Editing Networks for Paraphrase Generation},
  booktitle  = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI} 2019, The Thirty-First Innovative Applications of Artificial Intelligence Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii, USA, January 27 - February 1, 2019},
  pages      = {6546--6553},
  publisher  = {{AAAI} Press},
  year       = {2019},
  url        = {https://doi.org/10.1609/aaai.v33i01.33016546},
  doi        = {10.1609/AAAI.V33I01.33016546},
  timestamp  = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/Huang0WL19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/0006WHWL019,
  author     = {Yu Wu and Furu Wei and Shaohan Huang and Yunli Wang and Zhoujun Li and Ming Zhou},
  title      = {Response Generation by Context-Aware Prototype Editing},
  booktitle  = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI} 2019, The Thirty-First Innovative Applications of Artificial Intelligence Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii, USA, January 27 - February 1, 2019},
  pages      = {7281--7288},
  publisher  = {{AAAI} Press},
  year       = {2019},
  url        = {https://doi.org/10.1609/aaai.v33i01.33017281},
  doi        = {10.1609/AAAI.V33I01.33017281},
  timestamp  = {Sun, 04 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/0006WHWL019.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% The doi and url fields hold the raw identifier: the underscore is stored without a
% LaTeX escape so that verbatim-field handling does not leak a backslash into the link.
% NOTE(review): a style that typesets the DOI as plain text would need the escape back.
@inproceedings{DBLP:conf/nlpcc/BaoHWC0TPZ19,
  author     = {Hangbo Bao and Shaohan Huang and Furu Wei and Lei Cui and Yu Wu and Chuanqi Tan and Songhao Piao and Ming Zhou},
  editor     = {Jie Tang and Min{-}Yen Kan and Dongyan Zhao and Sujian Li and Hongying Zan},
  title      = {Neural Melody Composition from Lyrics},
  booktitle  = {Natural Language Processing and Chinese Computing - 8th {CCF} International Conference, {NLPCC} 2019, Dunhuang, China, October 9-14, 2019, Proceedings, Part {I}},
  series     = {Lecture Notes in Computer Science},
  volume     = {11838},
  pages      = {499--511},
  publisher  = {Springer},
  year       = {2019},
  url        = {https://doi.org/10.1007/978-3-030-32233-5_39},
  doi        = {10.1007/978-3-030-32233-5_39},
  timestamp  = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nlpcc/BaoHWC0TPZ19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "TableBank" is brace-protected against sentence-casing; the URL uses the https
% scheme, matching the 2020-2021 arXiv records in this file.
@article{DBLP:journals/corr/abs-1903-01949,
  author     = {Minghao Li and Lei Cui and Shaohan Huang and Furu Wei and Ming Zhou and Zhoujun Li},
  title      = {{TableBank}: Table Benchmark for Image-based Table Detection and Recognition},
  journal    = {CoRR},
  volume     = {abs/1903.01949},
  year       = {2019},
  url        = {https://arxiv.org/abs/1903.01949},
  eprinttype = {arXiv},
  eprint     = {1903.01949},
  timestamp  = {Thu, 16 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1903-01949.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "LayoutLM" is brace-protected against sentence-casing; the URL uses the https
% scheme, matching the 2020-2021 arXiv records in this file.
@article{DBLP:journals/corr/abs-1912-13318,
  author     = {Yiheng Xu and Minghao Li and Lei Cui and Shaohan Huang and Furu Wei and Ming Zhou},
  title      = {{LayoutLM}: Pre-training of Text and Layout for Document Image Understanding},
  journal    = {CoRR},
  volume     = {abs/1912.13318},
  year       = {2019},
  url        = {https://arxiv.org/abs/1912.13318},
  eprinttype = {arXiv},
  eprint     = {1912.13318},
  timestamp  = {Mon, 01 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1912-13318.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ZhaoZWYHZ18,
  author     = {Qingyu Zhou and Nan Yang and Furu Wei and Shaohan Huang and Ming Zhou and Tiejun Zhao},
  editor     = {Iryna Gurevych and Yusuke Miyao},
  title      = {Neural Document Summarization by Jointly Learning to Score and Select Sentences},
  booktitle  = {Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics, {ACL} 2018, Melbourne, Australia, July 15-20, 2018, Volume 1: Long Papers},
  pages      = {654--663},
  publisher  = {Association for Computational Linguistics},
  year       = {2018},
  url        = {https://aclanthology.org/P18-1061/},
  doi        = {10.18653/V1/P18-1061},
  timestamp  = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/ZhaoZWYHZ18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% The URL uses the https scheme, matching the 2020-2021 arXiv records in this file.
@article{DBLP:journals/corr/abs-1806-07042,
  author     = {Yu Wu and Furu Wei and Shaohan Huang and Zhoujun Li and Ming Zhou},
  title      = {Response Generation by Context-aware Prototype Editing},
  journal    = {CoRR},
  volume     = {abs/1806.07042},
  year       = {2018},
  url        = {https://arxiv.org/abs/1806.07042},
  eprinttype = {arXiv},
  eprint     = {1806.07042},
  timestamp  = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1806-07042.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% The URL uses the https scheme, matching the 2020-2021 arXiv records in this file.
@article{DBLP:journals/corr/abs-1806-08077,
  author     = {Shaohan Huang and Yu Wu and Furu Wei and Ming Zhou},
  title      = {Dictionary-Guided Editing Networks for Paraphrase Generation},
  journal    = {CoRR},
  volume     = {abs/1806.08077},
  year       = {2018},
  url        = {https://arxiv.org/abs/1806.08077},
  eprinttype = {arXiv},
  eprint     = {1806.08077},
  timestamp  = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1806-08077.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% The URL uses the https scheme, matching the 2020-2021 arXiv records in this file.
@article{DBLP:journals/corr/abs-1807-02305,
  author     = {Qingyu Zhou and Nan Yang and Furu Wei and Shaohan Huang and Ming Zhou and Tiejun Zhao},
  title      = {Neural Document Summarization by Jointly Learning to Score and Select Sentences},
  journal    = {CoRR},
  volume     = {abs/1807.02305},
  year       = {2018},
  url        = {https://arxiv.org/abs/1807.02305},
  eprinttype = {arXiv},
  eprint     = {1807.02305},
  timestamp  = {Wed, 25 Sep 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1807-02305.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% The URL uses the https scheme, matching the 2020-2021 arXiv records in this file.
@article{DBLP:journals/corr/abs-1809-04318,
  author     = {Hangbo Bao and Shaohan Huang and Furu Wei and Lei Cui and Yu Wu and Chuanqi Tan and Songhao Piao and Ming Zhou},
  title      = {Neural Melody Composition from Lyrics},
  journal    = {CoRR},
  volume     = {abs/1809.04318},
  year       = {2018},
  url        = {https://arxiv.org/abs/1809.04318},
  eprinttype = {arXiv},
  eprint     = {1809.04318},
  timestamp  = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1809-04318.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% The URL uses the https scheme, matching the 2020-2021 arXiv records in this file.
@article{DBLP:journals/corr/abs-1810-00341,
  author     = {Shaohan Huang and Yu Wu and Furu Wei and Ming Zhou},
  title      = {Text Morphing},
  journal    = {CoRR},
  volume     = {abs/1810.00341},
  year       = {2018},
  url        = {https://arxiv.org/abs/1810.00341},
  eprinttype = {arXiv},
  eprint     = {1810.00341},
  timestamp  = {Wed, 26 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1810-00341.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "SuperAgent" is brace-protected so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/acl/CuiHWTDZ17,
  author     = {Lei Cui and Shaohan Huang and Furu Wei and Chuanqi Tan and Chaoqun Duan and Ming Zhou},
  editor     = {Mohit Bansal and Heng Ji},
  title      = {{SuperAgent}: {A} Customer Service Chatbot for E-commerce Websites},
  booktitle  = {Proceedings of the 55th Annual Meeting of the Association for Computational Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, System Demonstrations},
  pages      = {97--102},
  publisher  = {Association for Computational Linguistics},
  year       = {2017},
  url        = {https://doi.org/10.18653/v1/P17-4017},
  doi        = {10.18653/V1/P17-4017},
  timestamp  = {Fri, 06 Aug 2021 00:40:50 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/CuiHWTDZ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cnsm/HuangFLZWLQ17,
  author     = {Shaohan Huang and Carol J. Fung and Chang Liu and Shupeng Zhang and Guang Wei and Zhongzhi Luan and Depei Qian},
  title      = {Arena: Adaptive real-time update anomaly prediction in cloud systems},
  booktitle  = {13th International Conference on Network and Service Management, {CNSM} 2017, Tokyo, Japan, November 26-30, 2017},
  pages      = {1--9},
  publisher  = {{IEEE} Computer Society},
  year       = {2017},
  url        = {https://doi.org/10.23919/CNSM.2017.8256031},
  doi        = {10.23919/CNSM.2017.8256031},
  timestamp  = {Wed, 16 Oct 2019 14:14:54 +0200},
  biburl     = {https://dblp.org/rec/conf/cnsm/HuangFLZWLQ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eacl/ZhouLWDHX17,
  author     = {Li Dong and Shaohan Huang and Furu Wei and Mirella Lapata and Ming Zhou and Ke Xu},
  editor     = {Mirella Lapata and Phil Blunsom and Alexander Koller},
  title      = {Learning to Generate Product Reviews from Attributes},
  booktitle  = {Proceedings of the 15th Conference of the European Chapter of the Association for Computational Linguistics, {EACL} 2017, Valencia, Spain, April 3-7, 2017, Volume 1: Long Papers},
  pages      = {623--632},
  publisher  = {Association for Computational Linguistics},
  year       = {2017},
  url        = {https://doi.org/10.18653/v1/e17-1059},
  doi        = {10.18653/V1/E17-1059},
  timestamp  = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/eacl/ZhouLWDHX17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iwqos/ZhangFHLQ17,
  author     = {Shupeng Zhang and Carol J. Fung and Shaohan Huang and Zhongzhi Luan and Depei Qian},
  title      = {{PSOM:} Periodic Self-Organizing Maps for unsupervised anomaly detection in periodic time series},
  booktitle  = {25th {IEEE/ACM} International Symposium on Quality of Service, IWQoS 2017, Vilanova i la Geltr{\'{u}}, Spain, June 14-16, 2017},
  pages      = {1--6},
  publisher  = {{IEEE}},
  year       = {2017},
  url        = {https://doi.org/10.1109/IWQoS.2017.7969174},
  doi        = {10.1109/IWQOS.2017.7969174},
  timestamp  = {Wed, 16 Oct 2019 14:14:53 +0200},
  biburl     = {https://dblp.org/rec/conf/iwqos/ZhangFHLQ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iwqos/HuangFWPLQ16,
  author     = {Shaohan Huang and Carol J. Fung and Kui Wang and Polo Pei and Zhongzhi Luan and Depei Qian},
  title      = {Using recurrent neural networks toward black-box system anomaly prediction},
  booktitle  = {24th {IEEE/ACM} International Symposium on Quality of Service, IWQoS 2016, Beijing, China, June 20-21, 2016},
  pages      = {1--10},
  publisher  = {{IEEE}},
  year       = {2016},
  url        = {https://doi.org/10.1109/IWQoS.2016.7590435},
  doi        = {10.1109/IWQOS.2016.7590435},
  timestamp  = {Wed, 16 Oct 2019 14:14:53 +0200},
  biburl     = {https://dblp.org/rec/conf/iwqos/HuangFWPLQ16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cloudnet/HuangoFWYLQ15,
  author     = {Shaohan Huang and Carol J. Fung and Kui Wang and Yaqi Yang and Zhongzhi Luan and Depei Qian},
  title      = {Revisit network anomaly ranking in datacenter network using re-ranking},
  booktitle  = {4th {IEEE} International Conference on Cloud Networking, CloudNet 2015, Niagara Falls, ON, Canada, October 5-7, 2015},
  pages      = {178--183},
  publisher  = {{IEEE}},
  year       = {2015},
  url        = {https://doi.org/10.1109/CloudNet.2015.7335302},
  doi        = {10.1109/CLOUDNET.2015.7335302},
  timestamp  = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/cloudnet/HuangoFWYLQ15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iwqos/WangFDPHLQ15,
  author     = {Kui Wang and Carol J. Fung and Chao Ding and Polo Pei and Shaohan Huang and Zhongzhi Luan and Depei Qian},
  title      = {A methodology for root-cause analysis in component based systems},
  booktitle  = {23rd {IEEE} International Symposium on Quality of Service, IWQoS 2015, Portland, OR, USA, June 15-16, 2015},
  pages      = {243--248},
  publisher  = {{IEEE}},
  year       = {2015},
  url        = {https://doi.org/10.1109/IWQoS.2015.7404741},
  doi        = {10.1109/IWQOS.2015.7404741},
  timestamp  = {Wed, 16 Oct 2019 14:14:53 +0200},
  biburl     = {https://dblp.org/rec/conf/iwqos/WangFDPHLQ15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
manage site settings
To protect your privacy, all features that rely on external API calls from your browser are turned off by default. You need to opt-in for them to become active. All settings here will be stored as cookies with your web browser. For more information see our F.A.Q.