BibTeX records: Tim Dettmers

download as .bib file

% Petals, from the ACL 2023 System Demonstrations volume.
% An arXiv record with the same title is DBLP:journals/corr/abs-2209-01188.
@inproceedings{DBLP:conf/acl/BorzunovBDRBCSR23,
  author       = {Borzunov, Alexander and
                  Baranchuk, Dmitry and
                  Dettmers, Tim and
                  Riabinin, Maksim and
                  Belkada, Younes and
                  Chumachenko, Artem and
                  Samygin, Pavel and
                  Raffel, Colin},
  editor       = {Bollegala, Danushka and
                  Huang, Ruihong and
                  Ritter, Alan},
  title        = {Petals: Collaborative Inference and Fine-tuning of Large Models},
  booktitle    = {Proceedings of the 61st Annual Meeting of the Association for Computational
                  Linguistics: System Demonstrations, {ACL} 2023, Toronto, Canada, July
                  10-12, 2023},
  pages        = {558--568},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.acl-demo.54},
  doi          = {10.18653/V1/2023.ACL-DEMO.54},
  timestamp    = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/BorzunovBDRBCSR23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% EMNLP 2023 paper. An arXiv record with the same title is
% DBLP:journals/corr/abs-2305-13999. The article "A" is left unbraced so that
% sentence-casing styles can lower-case it mid-title.
@inproceedings{DBLP:conf/emnlp/LiuDLSL23,
  author       = {Liu, Zeyu and
                  Dettmers, Tim and
                  Lin, Xi and
                  Stoyanov, Veselin and
                  Li, Xian},
  editor       = {Bouamor, Houda and
                  Pino, Juan and
                  Bali, Kalika},
  title        = {Towards A Unified View of Sparse Feed-Forward Network in Pretraining
                  Large Language Model},
  booktitle    = {Proceedings of the 2023 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages        = {15038--15061},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.emnlp-main.930},
  doi          = {10.18653/V1/2023.EMNLP-MAIN.930},
  timestamp    = {Fri, 12 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/LiuDLSL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2023 paper (PMLR volume 202). An arXiv record with the same title and
% authors is DBLP:journals/corr/abs-2212-09720.
@inproceedings{DBLP:conf/icml/DettmersZ23,
  author       = {Dettmers, Tim and
                  Zettlemoyer, Luke},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {The case for 4-bit precision: k-bit Inference Scaling Laws},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {7750--7774},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/dettmers23a.html},
  timestamp    = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/DettmersZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2023 paper (PMLR volume 202). An arXiv record with the same title and
% authors is DBLP:journals/corr/abs-2301-11913.
@inproceedings{DBLP:conf/icml/RyabininDDB23,
  author       = {Ryabinin, Max and
                  Dettmers, Tim and
                  Diskin, Michael and
                  Borzunov, Alexander},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {{SWARM} Parallelism: Training Large Models Can Be Surprisingly Communication-Efficient},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {29416--29440},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/ryabinin23a.html},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/RyabininDDB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 paper. An arXiv record with the same title is
% DBLP:journals/corr/abs-2312-08361. The url is stored raw (no LaTeX escape on
% the underscore) so verbatim-url toolchains produce a working link.
@inproceedings{DBLP:conf/nips/BorzunovRCBDBSR23,
  author       = {Borzunov, Alexander and
                  Ryabinin, Max and
                  Chumachenko, Artem and
                  Baranchuk, Dmitry and
                  Dettmers, Tim and
                  Belkada, Younes and
                  Samygin, Pavel and
                  Raffel, Colin A.},
  editor       = {Oh, Alice and
                  Naumann, Tristan and
                  Globerson, Amir and
                  Saenko, Kate and
                  Hardt, Moritz and
                  Levine, Sergey},
  title        = {Distributed Inference and Fine-tuning of Large Language Models Over
                  The Internet},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans,
                  LA, USA, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper_files/paper/2023/hash/28bf1419b9a1f908c15f6195f58cb865-Abstract-Conference.html},
  timestamp    = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/BorzunovRCBDBSR23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 paper. An arXiv record with the same title and authors is
% DBLP:journals/corr/abs-2305-14314. Mixed-case names in the title are braced
% so sentence-casing styles keep them; the url is stored raw (unescaped).
@inproceedings{DBLP:conf/nips/DettmersPHZ23,
  author       = {Dettmers, Tim and
                  Pagnoni, Artidoro and
                  Holtzman, Ari and
                  Zettlemoyer, Luke},
  editor       = {Oh, Alice and
                  Naumann, Tristan and
                  Globerson, Amir and
                  Saenko, Kate and
                  Hardt, Moritz and
                  Levine, Sergey},
  title        = {{QLoRA}: Efficient Finetuning of Quantized {LLMs}},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans,
                  LA, USA, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper_files/paper/2023/hash/1feb87871436031bdc0f2beaa62a049b-Abstract-Conference.html},
  timestamp    = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/DettmersPHZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 paper. An arXiv record with the same title and authors is
% DBLP:journals/corr/abs-2304-13013. The url is stored raw (no LaTeX escape on
% the underscore) so verbatim-url toolchains produce a working link.
@inproceedings{DBLP:conf/nips/WortsmanDZMFS23,
  author       = {Wortsman, Mitchell and
                  Dettmers, Tim and
                  Zettlemoyer, Luke and
                  Morcos, Ari and
                  Farhadi, Ali and
                  Schmidt, Ludwig},
  editor       = {Oh, Alice and
                  Naumann, Tristan and
                  Globerson, Amir and
                  Saenko, Kate and
                  Hardt, Moritz and
                  Levine, Sergey},
  title        = {Stable and low-precision training for large-scale vision-language
                  models},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans,
                  LA, USA, December 10 - 16, 2023},
  year         = {2023},
  url          = {http://papers.nips.cc/paper_files/paper/2023/hash/20bd42d82998bc61732c00452228e814-Abstract-Conference.html},
  timestamp    = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/WortsmanDZMFS23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2301.11913. A conference record with the same title and
% authors is DBLP:conf/icml/RyabininDDB23.
@article{DBLP:journals/corr/abs-2301-11913,
  author       = {Ryabinin, Max and
                  Dettmers, Tim and
                  Diskin, Michael and
                  Borzunov, Alexander},
  title        = {{SWARM} Parallelism: Training Large Models Can Be Surprisingly Communication-Efficient},
  journal      = {CoRR},
  volume       = {abs/2301.11913},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2301.11913},
  doi          = {10.48550/ARXIV.2301.11913},
  eprinttype   = {arXiv},
  eprint       = {2301.11913},
  timestamp    = {Tue, 31 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2301-11913.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2304.13013. A conference record with the same title and
% authors is DBLP:conf/nips/WortsmanDZMFS23.
@article{DBLP:journals/corr/abs-2304-13013,
  author       = {Wortsman, Mitchell and
                  Dettmers, Tim and
                  Zettlemoyer, Luke and
                  Morcos, Ari and
                  Farhadi, Ali and
                  Schmidt, Ludwig},
  title        = {Stable and low-precision training for large-scale vision-language
                  models},
  journal      = {CoRR},
  volume       = {abs/2304.13013},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2304.13013},
  doi          = {10.48550/ARXIV.2304.13013},
  eprinttype   = {arXiv},
  eprint       = {2304.13013},
  timestamp    = {Wed, 03 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2304-13013.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2305.13999. A conference record with the same title is
% DBLP:conf/emnlp/LiuDLSL23. The article "A" is left unbraced so that
% sentence-casing styles can lower-case it mid-title.
@article{DBLP:journals/corr/abs-2305-13999,
  author       = {Liu, Leo Z. and
                  Dettmers, Tim and
                  Lin, Xi Victoria and
                  Stoyanov, Veselin and
                  Li, Xian},
  title        = {Towards A Unified View of Sparse Feed-Forward Network in Pretraining
                  Large Language Model},
  journal      = {CoRR},
  volume       = {abs/2305.13999},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.13999},
  doi          = {10.48550/ARXIV.2305.13999},
  eprinttype   = {arXiv},
  eprint       = {2305.13999},
  timestamp    = {Mon, 05 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-13999.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2305.14314. A conference record with the same title and
% authors is DBLP:conf/nips/DettmersPHZ23. Mixed-case names in the title are
% braced so sentence-casing styles keep them.
@article{DBLP:journals/corr/abs-2305-14314,
  author       = {Dettmers, Tim and
                  Pagnoni, Artidoro and
                  Holtzman, Ari and
                  Zettlemoyer, Luke},
  title        = {{QLoRA}: Efficient Finetuning of Quantized {LLMs}},
  journal      = {CoRR},
  volume       = {abs/2305.14314},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.14314},
  doi          = {10.48550/ARXIV.2305.14314},
  eprinttype   = {arXiv},
  eprint       = {2305.14314},
  timestamp    = {Mon, 05 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-14314.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2306.03078. The mixed-case name SpQR is braced so
% sentence-casing styles do not turn it into "Spqr".
@article{DBLP:journals/corr/abs-2306-03078,
  author       = {Dettmers, Tim and
                  Svirschevski, Ruslan and
                  Egiazarian, Vage and
                  Kuznedelev, Denis and
                  Frantar, Elias and
                  Ashkboos, Saleh and
                  Borzunov, Alexander and
                  Hoefler, Torsten and
                  Alistarh, Dan},
  title        = {{SpQR}: {A} Sparse-Quantized Representation for Near-Lossless {LLM}
                  Weight Compression},
  journal      = {CoRR},
  volume       = {abs/2306.03078},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.03078},
  doi          = {10.48550/ARXIV.2306.03078},
  eprinttype   = {arXiv},
  eprint       = {2306.03078},
  timestamp    = {Tue, 13 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-03078.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2310.07707. The mixed-case name MatFormer is braced so
% sentence-casing styles keep its capitalisation. The first author is recorded
% with a single name.
@article{DBLP:journals/corr/abs-2310-07707,
  author       = {Devvrit and
                  Kudugunta, Sneha and
                  Kusupati, Aditya and
                  Dettmers, Tim and
                  Chen, Kaifeng and
                  Dhillon, Inderjit S. and
                  Tsvetkov, Yulia and
                  Hajishirzi, Hannaneh and
                  Kakade, Sham M. and
                  Farhadi, Ali and
                  Jain, Prateek},
  title        = {{MatFormer}: Nested Transformer for Elastic Inference},
  journal      = {CoRR},
  volume       = {abs/2310.07707},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.07707},
  doi          = {10.48550/ARXIV.2310.07707},
  eprinttype   = {arXiv},
  eprint       = {2310.07707},
  timestamp    = {Tue, 24 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-07707.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2312.08361. A conference record with the same title is
% DBLP:conf/nips/BorzunovRCBDBSR23.
@article{DBLP:journals/corr/abs-2312-08361,
  author       = {Borzunov, Alexander and
                  Ryabinin, Max and
                  Chumachenko, Artem and
                  Baranchuk, Dmitry and
                  Dettmers, Tim and
                  Belkada, Younes and
                  Samygin, Pavel and
                  Raffel, Colin},
  title        = {Distributed Inference and Fine-tuning of Large Language Models Over
                  The Internet},
  journal      = {CoRR},
  volume       = {abs/2312.08361},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2312.08361},
  doi          = {10.48550/ARXIV.2312.08361},
  eprinttype   = {arXiv},
  eprint       = {2312.08361},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2312-08361.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2022 paper (OpenReview). An arXiv record with the same title and
% authors is DBLP:journals/corr/abs-2110-02861.
@inproceedings{DBLP:conf/iclr/DettmersLSZ22,
  author       = {Dettmers, Tim and
                  Lewis, Mike and
                  Shleifer, Sam and
                  Zettlemoyer, Luke},
  title        = {8-bit Optimizers via Block-wise Quantization},
  booktitle    = {The Tenth International Conference on Learning Representations, {ICLR}
                  2022, Virtual Event, April 25-29, 2022},
  publisher    = {OpenReview.net},
  year         = {2022},
  url          = {https://openreview.net/forum?id=shpkpVXzo3h},
  timestamp    = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/DettmersLSZ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2022 paper. The arXiv record DBLP:journals/corr/abs-2208-07339 has
% the same authors and subtitle but is titled "LLM.int8()".
% Editor given names are spelled out (the style abbreviates if needed), the
% mixed-case name in the title is braced, and the url is stored raw.
@inproceedings{DBLP:conf/nips/DettmersLBZ22,
  author       = {Dettmers, Tim and
                  Lewis, Mike and
                  Belkada, Younes and
                  Zettlemoyer, Luke},
  editor       = {Koyejo, Sanmi and
                  Mohamed, Shakir and
                  Agarwal, Alekh and
                  Belgrave, Danielle and
                  Cho, Kyunghyun and
                  Oh, Alice},
  title        = {{GPT3.int8()}: 8-bit Matrix Multiplication for Transformers at Scale},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper_files/paper/2022/hash/c3ba4962c05c49636d4c6206a97e9c8a-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/DettmersLBZ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2207.03481. A proceedings record with the same title and
% authors is DBLP:conf/nips/BorzunovRDLSDJ021.
@article{DBLP:journals/corr/abs-2207-03481,
  author       = {Borzunov, Alexander and
                  Ryabinin, Max and
                  Dettmers, Tim and
                  Lhoest, Quentin and
                  Saulnier, Lucile and
                  Diskin, Michael and
                  Jernite, Yacine and
                  Wolf, Thomas},
  title        = {Training Transformers Together},
  journal      = {CoRR},
  volume       = {abs/2207.03481},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2207.03481},
  doi          = {10.48550/ARXIV.2207.03481},
  eprinttype   = {arXiv},
  eprint       = {2207.03481},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2207-03481.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2208.03306. The method name Branch-Train-Merge is braced
% so sentence-casing styles do not render it as "Branch-train-merge".
@article{DBLP:journals/corr/abs-2208-03306,
  author       = {Li, Margaret and
                  Gururangan, Suchin and
                  Dettmers, Tim and
                  Lewis, Mike and
                  Althoff, Tim and
                  Smith, Noah A. and
                  Zettlemoyer, Luke},
  title        = {{Branch-Train-Merge}: Embarrassingly Parallel Training of Expert Language
                  Models},
  journal      = {CoRR},
  volume       = {abs/2208.03306},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2208.03306},
  doi          = {10.48550/ARXIV.2208.03306},
  eprinttype   = {arXiv},
  eprint       = {2208.03306},
  timestamp    = {Wed, 10 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2208-03306.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2208.07339. The conference record
% DBLP:conf/nips/DettmersLBZ22 has the same authors and subtitle but is titled
% "GPT3.int8()". The mixed-case name is braced so sentence-casing styles do
% not turn it into "Llm.int8()".
@article{DBLP:journals/corr/abs-2208-07339,
  author       = {Dettmers, Tim and
                  Lewis, Mike and
                  Belkada, Younes and
                  Zettlemoyer, Luke},
  title        = {{LLM.int8()}: 8-bit Matrix Multiplication for Transformers at Scale},
  journal      = {CoRR},
  volume       = {abs/2208.07339},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2208.07339},
  doi          = {10.48550/ARXIV.2208.07339},
  eprinttype   = {arXiv},
  eprint       = {2208.07339},
  timestamp    = {Wed, 17 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2208-07339.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2209.01188. A conference record with the same title is
% DBLP:conf/acl/BorzunovBDRBCSR23.
@article{DBLP:journals/corr/abs-2209-01188,
  author       = {Borzunov, Alexander and
                  Baranchuk, Dmitry and
                  Dettmers, Tim and
                  Ryabinin, Max and
                  Belkada, Younes and
                  Chumachenko, Artem and
                  Samygin, Pavel and
                  Raffel, Colin},
  title        = {Petals: Collaborative Inference and Fine-tuning of Large Models},
  journal      = {CoRR},
  volume       = {abs/2209.01188},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2209.01188},
  doi          = {10.48550/ARXIV.2209.01188},
  eprinttype   = {arXiv},
  eprint       = {2209.01188},
  timestamp    = {Mon, 26 Sep 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2209-01188.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2212.09720. A conference record with the same title and
% authors is DBLP:conf/icml/DettmersZ23.
@article{DBLP:journals/corr/abs-2212-09720,
  author       = {Dettmers, Tim and
                  Zettlemoyer, Luke},
  title        = {The case for 4-bit precision: k-bit Inference Scaling Laws},
  journal      = {CoRR},
  volume       = {abs/2212.09720},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2212.09720},
  doi          = {10.48550/ARXIV.2212.09720},
  eprinttype   = {arXiv},
  eprint       = {2212.09720},
  timestamp    = {Tue, 03 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-09720.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2021 paper (PMLR volume 139). An arXiv record with the same title and
% authors is DBLP:journals/corr/abs-2103-16716.
@inproceedings{DBLP:conf/icml/LewisBDGZ21,
  author       = {Lewis, Mike and
                  Bhosale, Shruti and
                  Dettmers, Tim and
                  Goyal, Naman and
                  Zettlemoyer, Luke},
  editor       = {Meila, Marina and
                  Zhang, Tong},
  title        = {{BASE} Layers: Simplifying Training of Large, Sparse Models},
  booktitle    = {Proceedings of the 38th International Conference on Machine Learning,
                  {ICML} 2021, 18-24 July 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {139},
  pages        = {6265--6274},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {http://proceedings.mlr.press/v139/lewis21a.html},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/LewisBDGZ21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2021 Competitions and Demonstrations Track (PMLR volume 176).
% An arXiv record with the same title and authors is
% DBLP:journals/corr/abs-2207-03481.
@inproceedings{DBLP:conf/nips/BorzunovRDLSDJ021,
  author       = {Borzunov, Alexander and
                  Ryabinin, Max and
                  Dettmers, Tim and
                  Lhoest, Quentin and
                  Saulnier, Lucile and
                  Diskin, Michael and
                  Jernite, Yacine and
                  Wolf, Thomas},
  editor       = {Kiela, Douwe and
                  Ciccone, Marco and
                  Caputo, Barbara},
  title        = {Training Transformers Together},
  booktitle    = {NeurIPS 2021 Competitions and Demonstrations Track, 6-14 December
                  2021, Online},
  series       = {Proceedings of Machine Learning Research},
  volume       = {176},
  pages        = {335--342},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {https://proceedings.mlr.press/v176/borzunov22a.html},
  timestamp    = {Thu, 11 Aug 2022 12:07:10 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BorzunovRDLSDJ021.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2103.16716. A conference record with the same title and
% authors is DBLP:conf/icml/LewisBDGZ21.
@article{DBLP:journals/corr/abs-2103-16716,
  author       = {Lewis, Mike and
                  Bhosale, Shruti and
                  Dettmers, Tim and
                  Goyal, Naman and
                  Zettlemoyer, Luke},
  title        = {{BASE} Layers: Simplifying Training of Large, Sparse Models},
  journal      = {CoRR},
  volume       = {abs/2103.16716},
  year         = {2021},
  url          = {https://arxiv.org/abs/2103.16716},
  eprinttype   = {arXiv},
  eprint       = {2103.16716},
  timestamp    = {Wed, 07 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2103-16716.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2110.02861. A conference record with the same title and
% authors is DBLP:conf/iclr/DettmersLSZ22.
@article{DBLP:journals/corr/abs-2110-02861,
  author       = {Dettmers, Tim and
                  Lewis, Mike and
                  Shleifer, Sam and
                  Zettlemoyer, Luke},
  title        = {8-bit Optimizers via Block-wise Quantization},
  journal      = {CoRR},
  volume       = {abs/2110.02861},
  year         = {2021},
  url          = {https://arxiv.org/abs/2110.02861},
  eprinttype   = {arXiv},
  eprint       = {2110.02861},
  timestamp    = {Thu, 21 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-02861.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% EMNLP 2020 Tutorial Abstracts. The second editor's compound surname
% "Van Durme" is given in comma form so BibTeX does not treat "Van" as part
% of the given name.
@inproceedings{DBLP:conf/emnlp/IlharcoITDFL20,
  author       = {Ilharco, Gabriel and
                  Ilharco, Cesar and
                  Turc, Iulia and
                  Dettmers, Tim and
                  Ferreira, Felipe and
                  Lee, Kenton},
  editor       = {Villavicencio, Aline and
                  Van Durme, Benjamin},
  title        = {High Performance Natural Language Processing},
  booktitle    = {Proceedings of the 2020 Conference on Empirical Methods in Natural
                  Language Processing: Tutorial Abstracts, {EMNLP} 2020, Online, November
                  19-20, 2020},
  pages        = {24--27},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.emnlp-tutorials.4},
  doi          = {10.18653/V1/2020.EMNLP-TUTORIALS.4},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/IlharcoITDFL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 1907.04840.
@article{DBLP:journals/corr/abs-1907-04840,
  author       = {Dettmers, Tim and
                  Zettlemoyer, Luke},
  title        = {Sparse Networks from Scratch: Faster Training without Losing Performance},
  journal      = {CoRR},
  volume       = {abs/1907.04840},
  year         = {2019},
  url          = {http://arxiv.org/abs/1907.04840},
  eprinttype   = {arXiv},
  eprint       = {1907.04840},
  timestamp    = {Wed, 17 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-04840.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% AAAI-18 paper. An arXiv record with the same title and authors is
% DBLP:journals/corr/DettmersMSR17. "2D" is braced so sentence-casing styles
% do not print "2d"; "Innovative" is capitalised as part of the IAAI
% conference name.
@inproceedings{DBLP:conf/aaai/DettmersMS018,
  author       = {Dettmers, Tim and
                  Minervini, Pasquale and
                  Stenetorp, Pontus and
                  Riedel, Sebastian},
  editor       = {McIlraith, Sheila A. and
                  Weinberger, Kilian Q.},
  title        = {Convolutional {2D} Knowledge Graph Embeddings},
  booktitle    = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence,
                  (AAAI-18), the 30th Innovative Applications of Artificial Intelligence
                  (IAAI-18), and the 8th {AAAI} Symposium on Educational Advances in
                  Artificial Intelligence (EAAI-18), New Orleans, Louisiana, USA, February
                  2-7, 2018},
  pages        = {1811--1818},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://doi.org/10.1609/aaai.v32i1.11573},
  doi          = {10.1609/AAAI.V32I1.11573},
  timestamp    = {Sat, 21 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/DettmersMS018.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% ACL 2018 System Demonstrations paper. An arXiv record with the same title is
% DBLP:journals/corr/abs-1806-08727 (its author order differs). The system
% name "Jack the Reader" is braced so sentence-casing styles keep "Reader"
% capitalised.
@inproceedings{DBLP:conf/acl/WeissenbornMAWR18,
  author       = {Weissenborn, Dirk and
                  Minervini, Pasquale and
                  Augenstein, Isabelle and
                  Welbl, Johannes and
                  Rockt{\"{a}}schel, Tim and
                  Bosnjak, Matko and
                  Mitchell, Jeff and
                  Demeester, Thomas and
                  Dettmers, Tim and
                  Stenetorp, Pontus and
                  Riedel, Sebastian},
  editor       = {Liu, Fei and
                  Solorio, Thamar},
  title        = {{Jack the Reader} - {A} Machine Reading Framework},
  booktitle    = {Proceedings of {ACL} 2018, Melbourne, Australia, July 15-20, 2018,
                  System Demonstrations},
  pages        = {25--30},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://aclanthology.org/P18-4005/},
  doi          = {10.18653/V1/P18-4005},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/WeissenbornMAWR18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 1806.08727. A conference record with the same title is
% DBLP:conf/acl/WeissenbornMAWR18 (its author order differs). The system name
% "Jack the Reader" is braced so sentence-casing styles keep "Reader"
% capitalised.
@article{DBLP:journals/corr/abs-1806-08727,
  author       = {Weissenborn, Dirk and
                  Minervini, Pasquale and
                  Dettmers, Tim and
                  Augenstein, Isabelle and
                  Welbl, Johannes and
                  Rockt{\"{a}}schel, Tim and
                  Bosnjak, Matko and
                  Mitchell, Jeff and
                  Demeester, Thomas and
                  Stenetorp, Pontus and
                  Riedel, Sebastian},
  title        = {{Jack the Reader} - {A} Machine Reading Framework},
  journal      = {CoRR},
  volume       = {abs/1806.08727},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.08727},
  eprinttype   = {arXiv},
  eprint       = {1806.08727},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-08727.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 1707.01476. A conference record with the same title and
% authors is DBLP:conf/aaai/DettmersMS018. "2D" is braced so sentence-casing
% styles do not print "2d".
@article{DBLP:journals/corr/DettmersMSR17,
  author       = {Dettmers, Tim and
                  Minervini, Pasquale and
                  Stenetorp, Pontus and
                  Riedel, Sebastian},
  title        = {Convolutional {2D} Knowledge Graph Embeddings},
  journal      = {CoRR},
  volume       = {abs/1707.01476},
  year         = {2017},
  url          = {http://arxiv.org/abs/1707.01476},
  eprinttype   = {arXiv},
  eprint       = {1707.01476},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/DettmersMSR17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2016 conference-track paper. The url points at arXiv 1511.04561, so the
% eprint fields are filled in like the other arXiv-linked records in this file.
@inproceedings{DBLP:journals/corr/Dettmers15,
  author       = {Dettmers, Tim},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {8-Bit Approximations for Parallelism in Deep Learning},
  booktitle    = {4th International Conference on Learning Representations, {ICLR} 2016,
                  San Juan, Puerto Rico, May 2-4, 2016, Conference Track Proceedings},
  year         = {2016},
  url          = {http://arxiv.org/abs/1511.04561},
  eprinttype   = {arXiv},
  eprint       = {1511.04561},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/Dettmers15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics