% Source: dblp publication search, results exported as a .bib file.
% Query: "pipeline parallelism"

@article{DBLP:journals/access/JangYY24,
  author  = {Jang, Bongwon and Yoo, In{-}Chul and Yook, Dongsuk},
  title   = {Pipeline Parallelism With Elastic Averaging},
  journal = {{IEEE} Access},
  volume  = {12},
  pages   = {5477--5489},
  year    = {2024}
}
% Braces keep the system name's capitalization under sentence-casing styles.
@inproceedings{DBLP:conf/asplos/SunCWF0WC24,
  author       = {Zhenbo Sun and
                  Huanqi Cao and
                  Yuanwei Wang and
                  Guanyu Feng and
                  Shengqi Chen and
                  Haojie Wang and
                  Wenguang Chen},
  title        = {{AdaPipe}: Optimizing Pipeline Parallelism with Adaptive Recomputation
                  and Partitioning},
  booktitle    = {{ASPLOS} {(3)}},
  pages        = {86--100},
  publisher    = {{ACM}},
  year         = {2024}
}
@inproceedings{DBLP:conf/hpca/CragoDSK24,
  author    = {Crago, Neal Clayton and Damani, Sana and
               Sankaralingam, Karthikeyan and Keckler, Stephen W.},
  title     = {{WASP:} Exploiting {GPU} Pipeline Parallelism with Hardware-Accelerated Automatic Warp Specialization},
  booktitle = {{HPCA}},
  pages     = {1--16},
  publisher = {{IEEE}},
  year      = {2024}
}
% Braces keep the system name's capitalization under sentence-casing styles.
@inproceedings{DBLP:conf/pdp/DreuningLOBN24,
  author       = {Henk Dreuning and
                  Anna Badia Liokouras and
                  Xiaowei Ouyang and
                  Henri E. Bal and
                  Rob V. van Nieuwpoort},
  title        = {{CAPSlog}: Scalable Memory-Centric Partitioning for Pipeline Parallelism},
  booktitle    = {{PDP}},
  pages        = {17--25},
  publisher    = {{IEEE}},
  year         = {2024}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume for eprint-aware styles. {BPipe} is case-protected.
@article{DBLP:journals/corr/abs-2401-02088,
  author       = {Mincong Huang and
                  Chao Wang and
                  Chi Ma and
                  Yineng Zhang and
                  Peng Zhang and
                  Lei Yu},
  title        = {Re-evaluating the Memory-balanced Pipeline Parallelism: {BPipe}},
  journal      = {CoRR},
  volume       = {abs/2401.02088},
  eprinttype   = {arXiv},
  eprint       = {2401.02088},
  year         = {2024}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume for eprint-aware styles.
@article{DBLP:journals/corr/abs-2401-10241,
  author       = {Penghui Qi and
                  Xinyi Wan and
                  Guangxing Huang and
                  Min Lin},
  title        = {Zero Bubble Pipeline Parallelism},
  journal      = {CoRR},
  volume       = {abs/2401.10241},
  eprinttype   = {arXiv},
  eprint       = {2401.10241},
  year         = {2024}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume for eprint-aware styles.
@article{DBLP:journals/corr/abs-2402-03791,
  author       = {Ding Tang and
                  Lijuan Jiang and
                  Minxi Jin and
                  Jiecheng Zhou and
                  Hengjie Li and
                  Xingcheng Zhang and
                  Zhilin Pei},
  title        = {Adaptive Blockwise Task-interleaved Pipeline Parallelism},
  journal      = {CoRR},
  volume       = {abs/2402.03791},
  eprinttype   = {arXiv},
  eprint       = {2402.03791},
  year         = {2024}
}
% {6G} is braced so sentence-casing styles do not render it as "6g".
@article{DBLP:journals/jsac/ShiZLMG23,
  author       = {Hongjian Shi and
                  Weichu Zheng and
                  Zifei Liu and
                  Ruhui Ma and
                  Haibing Guan},
  title        = {Automatic Pipeline Parallelism: {A} Parallel Inference Framework for
                  Deep Learning Applications in {6G} Mobile Communication Systems},
  journal      = {{IEEE} J. Sel. Areas Commun.},
  volume       = {41},
  number       = {7},
  pages        = {2041--2056},
  year         = {2023}
}
% Braces keep the system name's capitalization under sentence-casing styles.
@inproceedings{DBLP:conf/dac/ZhangZTWH23,
  author       = {Weigang Zhang and
                  Biyu Zhou and
                  Xuehai Tang and
                  Zhaoxing Wang and
                  Songlin Hu},
  title        = {{MixPipe}: Efficient Bidirectional Pipeline Parallelism for Training
                  Large-Scale Models},
  booktitle    = {{DAC}},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2023}
}
@inproceedings{DBLP:conf/europar/VontzalidisPBDIDBCEKZT23,
  author    = {Vontzalidis, Aristotelis and Psomadakis, Stratos and
               Bitsakos, Constantinos and Dokter, Mark and
               Innerebner, Kevin and Damme, Patrick and
               Boehm, Matthias and Ciorba, Florina M. and
               Eleliemy, Ahmed and Karakostas, Vasileios and
               Zamuda, Ales and Tsoumakos, Dimitrios},
  title     = {{DAPHNE} Runtime: Harnessing Parallelism for Integrated Data Analysis Pipelines},
  booktitle = {Euro-Par Workshops},
  series    = {Lecture Notes in Computer Science},
  volume    = {14352},
  pages     = {242--246},
  publisher = {Springer},
  year      = {2023}
}
@inproceedings{DBLP:conf/hpca/NguyenS23,
  author    = {Nguyen, Quan M. and S{\'{a}}nchez, Daniel},
  title     = {Phloem: Automatic Acceleration of Irregular Applications with Fine-Grain Pipeline Parallelism},
  booktitle = {{HPCA}},
  pages     = {1262--1274},
  publisher = {{IEEE}},
  year      = {2023}
}
@inproceedings{DBLP:conf/hpcc/LiuLLW023,
  author    = {Liu, Yujie and Lai, Zhiquan and Liu, Weijie and
               Wang, Wei and Li, Dongsheng},
  title     = {Efficient Large Models Fine-tuning on Commodity Servers via Memory-balanced Pipeline Parallelism},
  booktitle = {HPCC/DSS/SmartCity/DependSys},
  pages     = {726--727},
  publisher = {{IEEE}},
  year      = {2023}
}
@inproceedings{DBLP:conf/hpdc/XiaZWYZC23,
  author    = {Xia, Yaqi and Zhang, Zheng and Wang, Hulin and
               Yang, Donglin and Zhou, Xiaobo and Cheng, Dazhao},
  title     = {Redundancy-Free High-Performance Dynamic {GNN} Training with Hierarchical Pipeline Parallelism},
  booktitle = {{HPDC}},
  pages     = {17--30},
  publisher = {{ACM}},
  year      = {2023}
}
% Braces keep the system name's capitalization under sentence-casing styles.
@inproceedings{DBLP:conf/icml/KimKYC23,
  author       = {Taebum Kim and
                  Hyoungjoo Kim and
                  Gyeong{-}In Yu and
                  Byung{-}Gon Chun},
  title        = {{BPipe}: Memory-Balanced Pipeline Parallelism for Training Large Language
                  Models},
  booktitle    = {{ICML}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {16639--16653},
  publisher    = {{PMLR}},
  year         = {2023}
}
% Braces keep the system name's capitalization under sentence-casing styles.
@inproceedings{DBLP:conf/icpads/NiknamiSW23,
  author       = {Nadia Niknami and
                  Abdalaziz Sawwan and
                  Jie Wu},
  title        = {{SmartPipe}: Intelligently Freezing Layers in Pipeline Parallelism for
                  Distributed {DNN} Training},
  booktitle    = {{ICPADS}},
  pages        = {1885--1894},
  publisher    = {{IEEE}},
  year         = {2023}
}
% Braces keep {MPipeMoE} and {MoE} from being downcased by sentence-casing styles.
@inproceedings{DBLP:conf/ipps/ZhangYXDTZC23,
  author       = {Zheng Zhang and
                  Donglin Yang and
                  Yaqi Xia and
                  Liang Ding and
                  Dacheng Tao and
                  Xiaobo Zhou and
                  Dazhao Cheng},
  title        = {{MPipeMoE}: Memory Efficient {MoE} for Pre-trained Models with Adaptive
                  Pipeline Parallelism},
  booktitle    = {{IPDPS}},
  pages        = {167--177},
  publisher    = {{IEEE}},
  year         = {2023}
}
% Same title and authors as the CoRR record DBLP:journals/corr/abs-2308-15762.
@inproceedings{DBLP:conf/sc/LiuCZ023,
  author    = {Liu, Ziming and Cheng, Shenggan and Zhou, Haotian and You, Yang},
  title     = {Hanayo: Harnessing Wave-like Pipeline Parallelism for Enhanced Large Model Training Efficiency},
  booktitle = {{SC}},
  pages     = {56:1--56:13},
  publisher = {{ACM}},
  year      = {2023}
}
@inproceedings{DBLP:conf/spawc/WangDZHCL23,
  author    = {Wang, Luya and Dong, Yanjie and Zhang, Lei and
               Hu, Xiping and Cui, Laizhong and Leung, Victor C. M.},
  title     = {Wireless Model Splitting for Communication-Efficient Personalized Federated Learning with Pipeline Parallelism},
  booktitle = {{SPAWC}},
  pages     = {421--425},
  publisher = {{IEEE}},
  year      = {2023}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume for eprint-aware styles. {PipeLearn} is case-protected.
@article{DBLP:journals/corr/abs-2302-12803,
  author       = {Zihan Zhang and
                  Philip Rodgers and
                  Peter Kilpatrick and
                  Ivor T. A. Spence and
                  Blesson Varghese},
  title        = {{PipeLearn}: Pipeline Parallelism for Collaborative Machine Learning},
  journal      = {CoRR},
  volume       = {abs/2302.12803},
  eprinttype   = {arXiv},
  eprint       = {2302.12803},
  year         = {2023}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume for eprint-aware styles. {Ada-Grouper} is case-protected.
@article{DBLP:journals/corr/abs-2303-01675,
  author       = {Siyu Wang and
                  Zongyan Cao and
                  Chang Si and
                  Lansong Diao and
                  Jiamang Wang and
                  Wei Lin},
  title        = {{Ada-Grouper}: Accelerating Pipeline Parallelism in Preempted Network
                  by Adaptive Group-Scheduling for Micro-Batches},
  journal      = {CoRR},
  volume       = {abs/2303.01675},
  eprinttype   = {arXiv},
  eprint       = {2303.01675},
  year         = {2023}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume for eprint-aware styles. {MoE} is case-protected.
@article{DBLP:journals/corr/abs-2304-11414,
  author       = {Xin Chen and
                  Hengheng Zhang and
                  Xiaotao Gu and
                  Kaifeng Bi and
                  Lingxi Xie and
                  Qi Tian},
  title        = {Pipeline {MoE}: {A} Flexible {MoE} Implementation with Pipeline Parallelism},
  journal      = {CoRR},
  volume       = {abs/2304.11414},
  eprinttype   = {arXiv},
  eprint       = {2304.11414},
  year         = {2023}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume for eprint-aware styles. {GNNPipe} is case-protected.
@article{DBLP:journals/corr/abs-2308-10087,
  author       = {Jingji Chen and
                  Zhuoming Chen and
                  Xuehai Qian},
  title        = {{GNNPipe}: Accelerating Distributed Full-Graph {GNN} Training with Pipelined
                  Model Parallelism},
  journal      = {CoRR},
  volume       = {abs/2308.10087},
  eprinttype   = {arXiv},
  eprint       = {2308.10087},
  year         = {2023}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume. Same title and authors as DBLP:conf/sc/LiuCZ023.
@article{DBLP:journals/corr/abs-2308-15762,
  author       = {Ziming Liu and
                  Shenggan Cheng and
                  Haotian Zhou and
                  Yang You},
  title        = {Hanayo: Harnessing Wave-like Pipeline Parallelism for Enhanced Large
                  Model Training Efficiency},
  journal      = {CoRR},
  volume       = {abs/2308.15762},
  eprinttype   = {arXiv},
  eprint       = {2308.15762},
  year         = {2023}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume for eprint-aware styles.
@article{DBLP:journals/corr/abs-2311-03703,
  author       = {Aaron Archer and
                  Matthew Fahrbach and
                  Kuikui Liu and
                  Prakash Prabhu},
  title        = {Pipeline Parallelism for {DNN} Inference with Practical Performance
                  Guarantees},
  journal      = {CoRR},
  volume       = {abs/2311.03703},
  eprinttype   = {arXiv},
  eprint       = {2311.03703},
  year         = {2023}
}
@article{DBLP:journals/et/SparkmanSD22,
  author  = {Sparkman, Brett and Smith, Scott C. and Di, Jia},
  title   = {Built-In Self-Test for Multi-Threshold {NULL} Convention Logic Asynchronous Circuits using Pipeline Stage Parallelism},
  journal = {J. Electron. Test.},
  volume  = {38},
  number  = {3},
  pages   = {321--334},
  year    = {2022}
}
% Braces keep the system name's capitalization under sentence-casing styles.
@article{DBLP:journals/iotj/YoonBKL22,
  author       = {JinYi Yoon and
                  Yeongsin Byeon and
                  Jeewoon Kim and
                  HyungJune Lee},
  title        = {{EdgePipe}: Tailoring Pipeline Parallelism With Deep Neural Networks
                  for Volatile Wireless Edge Devices},
  journal      = {{IEEE} Internet Things J.},
  volume       = {9},
  number       = {14},
  pages        = {11633--11647},
  year         = {2022}
}
% Braces keep the system name's capitalization under sentence-casing styles.
@article{DBLP:journals/ppl/ZhaoXWTWWIJ22,
  author       = {Letian Zhao and
                  Rui Xu and
                  Tianqi Wang and
                  Teng Tian and
                  Xiaotian Wang and
                  Wei Wu and
                  Chio{-}in Ieong and
                  Xi Jin},
  title        = {{BaPipe}: Balanced Pipeline Parallelism for {DNN} Training},
  journal      = {Parallel Process. Lett.},
  volume       = {32},
  number       = {3{\&}4},
  pages        = {2250005:1--2250005:17},
  year         = {2022}
}
% Braces keep the system name's capitalization under sentence-casing styles.
@inproceedings{DBLP:conf/asplos/ZhaoLCSCWZLC22,
  author       = {Shixiong Zhao and
                  Fanxin Li and
                  Xusheng Chen and
                  Tianxiang Shen and
                  Li Chen and
                  Sen Wang and
                  Nicholas Zhang and
                  Cheng Li and
                  Heming Cui},
  title        = {{NASPipe}: high performance and reproducible pipeline parallel supernet
                  training via causal synchronous parallelism},
  booktitle    = {{ASPLOS}},
  pages        = {374--387},
  publisher    = {{ACM}},
  year         = {2022}
}
% Braces keep the system name's capitalization under sentence-casing styles.
@inproceedings{DBLP:conf/cluster/LiuLLDGL22,
  author       = {Weijie Liu and
                  Zhiquan Lai and
                  Shengwei Li and
                  Yabo Duan and
                  Keshi Ge and
                  Dongsheng Li},
  title        = {{AutoPipe}: {A} Fast Pipeline Parallelism Approach with Balanced Partitioning
                  and Micro-batch Slicing},
  booktitle    = {{CLUSTER}},
  pages        = {301--312},
  publisher    = {{IEEE}},
  year         = {2022}
}
@inproceedings{DBLP:conf/dac/ChiuH22,
  author    = {Chiu, Cheng{-}Hsiang and Huang, Tsung{-}Wei},
  title     = {Efficient timing propagation with simultaneous structural and pipeline parallelisms: late breaking results},
  booktitle = {{DAC}},
  pages     = {1388--1389},
  publisher = {{ACM}},
  year      = {2022}
}
% Braces keep the system name's capitalization under sentence-casing styles.
@inproceedings{DBLP:conf/dsd/HuIZKBCW22,
  author       = {Yang Hu and
                  Connor Imes and
                  Xuanang Zhao and
                  Souvik Kundu and
                  Peter A. Beerel and
                  Stephen P. Crago and
                  John Paul Walters},
  title        = {{PipeEdge}: Pipeline Parallelism for Large-Scale Model Inference on
                  Heterogeneous Edge Devices},
  booktitle    = {{DSD}},
  pages        = {298--307},
  publisher    = {{IEEE}},
  year         = {2022}
}
% NOTE(review): "Taskflow" is braced on the assumption that it is a proper
% (system) name that should keep its capital under sentence casing; confirm.
@inproceedings{DBLP:conf/hpdc/ChiuH22,
  author       = {Cheng{-}Hsiang Chiu and
                  Tsung{-}Wei Huang},
  title        = {Composing Pipeline Parallelism using Control {Taskflow} Graph},
  booktitle    = {{HPDC}},
  pages        = {283--284},
  publisher    = {{ACM}},
  year         = {2022}
}
% Braces keep the system name's capitalization under sentence-casing styles.
@inproceedings{DBLP:conf/ica3pp/JiangWMHHDF22,
  author       = {Wei Jiang and
                  Bo Wang and
                  Sheng Ma and
                  Xiang Hou and
                  Libo Huang and
                  Yi Dai and
                  Jianbin Fang},
  title        = {{PipeFB}: An Optimized Pipeline Parallelism Scheme to Reduce the Peak
                  Memory Usage},
  booktitle    = {{ICA3PP}},
  series       = {Lecture Notes in Computer Science},
  volume       = {13777},
  pages        = {590--604},
  publisher    = {Springer},
  year         = {2022}
}
@inproceedings{DBLP:conf/iclr/YangZZYW22,
  author    = {Yang, Pengcheng and Zhang, Xiaoming and Zhang, Wenpeng and
               Yang, Ming and Wei, Hong},
  title     = {Group-based Interleaved Pipeline Parallelism for Large-scale {DNN} Training},
  booktitle = {{ICLR}},
  publisher = {OpenReview.net},
  year      = {2022}
}
@inproceedings{DBLP:conf/icpads/DuanW22,
  author    = {Duan, Yubin and Wu, Jie},
  title     = {Optimizing Resource Allocation in Pipeline Parallelism for Distributed {DNN} Training},
  booktitle = {{ICPADS}},
  pages     = {161--168},
  publisher = {{IEEE}},
  year      = {2022}
}
% Braces keep the system name's capitalization under sentence-casing styles.
@inproceedings{DBLP:conf/ipps/BeaumontES22,
  author       = {Olivier Beaumont and
                  Lionel Eyraud{-}Dubois and
                  Alena Shilova},
  title        = {{MadPipe}: Memory Aware Dynamic Programming Algorithm for Pipelined
                  Model Parallelism},
  booktitle    = {{IPDPS} Workshops},
  pages        = {1063--1073},
  publisher    = {{IEEE}},
  year         = {2022}
}
@inproceedings{DBLP:conf/vee/BlanaruSFK22,
  author    = {Blanaru, Florin and Stratikopoulos, Athanasios and
               Fumero, Juan and Kotselidis, Christos},
  title     = {Enabling pipeline parallelism in heterogeneous managed runtime environments via batch processing},
  booktitle = {{VEE}},
  pages     = {58--71},
  publisher = {{ACM}},
  year      = {2022}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume for eprint-aware styles.
@article{DBLP:journals/corr/abs-2211-05953,
  author       = {Joel Lamy{-}Poirier},
  title        = {Breadth-First Pipeline Parallelism},
  journal      = {CoRR},
  volume       = {abs/2211.05953},
  eprinttype   = {arXiv},
  eprint       = {2211.05953},
  year         = {2022}
}
% {Pthreads} is braced so sentence-casing styles keep the capitalization
% used in the title.
@article{DBLP:journals/ijpp/JanjicBB21,
  author       = {Vladimir Janjic and
                  Christopher Brown and
                  Adam D. Barwell},
  title        = {Restoration of Legacy Parallelism: Transforming {Pthreads} into Farm
                  and Pipeline Patterns},
  journal      = {Int. J. Parallel Program.},
  volume       = {49},
  number       = {6},
  pages        = {886--910},
  year         = {2021}
}
% {multi-GPU} is braced so the acronym is not downcased. The CoRR record
% DBLP:journals/corr/abs-2106-12863 has the same authors and title wording.
@article{DBLP:journals/paapp/AndoKT21,
  author       = {Ruo Ando and
                  Youki Kadobayashi and
                  Hiroki Takakura},
  title        = {Choice of parallelism: {multi-GPU} driven pipeline for huge academic
                  backbone network},
  journal      = {Int. J. Parallel Emergent Distributed Syst.},
  volume       = {36},
  number       = {6},
  pages        = {609--622},
  year         = {2021}
}
@article{DBLP:journals/tcyb/LiZLWKZ21,
  author  = {Li, Jian{-}Yu and Zhan, Zhi{-}Hui and Liu, Run{-}Dong and
             Wang, Chuan and Kwong, Sam and Zhang, Jun},
  title   = {Generation-Level Parallelism for Evolutionary Computation: {A} Pipeline-Based Parallel Particle Swarm Optimization},
  journal = {{IEEE} Trans. Cybern.},
  volume  = {51},
  number  = {10},
  pages   = {4848--4859},
  year    = {2021}
}
@inproceedings{DBLP:conf/europar/BeaumontES21,
  author    = {Beaumont, Olivier and Eyraud{-}Dubois, Lionel and Shilova, Alena},
  title     = {Pipelined Model Parallelism: Complexity Results and Memory Considerations},
  booktitle = {Euro-Par},
  series    = {Lecture Notes in Computer Science},
  volume    = {12820},
  pages     = {183--198},
  publisher = {Springer},
  year      = {2021}
}
% {TeraPipe} is case-protected. Same title and authors as the CoRR record
% DBLP:journals/corr/abs-2102-07988.
@inproceedings{DBLP:conf/icml/LiZGZZSS21,
  author       = {Zhuohan Li and
                  Siyuan Zhuang and
                  Shiyuan Guo and
                  Danyang Zhuo and
                  Hao Zhang and
                  Dawn Song and
                  Ion Stoica},
  title        = {{TeraPipe}: Token-Level Pipeline Parallelism for Training Large-Scale
                  Language Models},
  booktitle    = {{ICML}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {139},
  pages        = {6543--6552},
  publisher    = {{PMLR}},
  year         = {2021}
}
@inproceedings{DBLP:conf/ispa/JiangXMWHL21,
  author    = {Jiang, Wei and Xu, Rui and Ma, Sheng and
               Wang, Qiong and Hou, Xiang and Lu, Hongyi},
  title     = {A Memory Saving Mechanism Based on Data Transferring for Pipeline Parallelism},
  booktitle = {ISPA/BDCloud/SocialCom/SustainCom},
  pages     = {1230--1235},
  publisher = {{IEEE}},
  year      = {2021}
}
% Braces keep {LineFS} and {SmartNIC} from being downcased by sentence-casing styles.
@inproceedings{DBLP:conf/sosp/KimJRICKKPW21,
  author       = {Jongyul Kim and
                  Insu Jang and
                  Waleed Reda and
                  Jaeseong Im and
                  Marco Canini and
                  Dejan Kostic and
                  Youngjin Kwon and
                  Simon Peter and
                  Emmett Witchel},
  title        = {{LineFS}: Efficient {SmartNIC} Offload of a Distributed File System with
                  Pipeline Parallelism},
  booktitle    = {{SOSP}},
  pages        = {756--771},
  publisher    = {{ACM}},
  year         = {2021}
}
% NOTE(review): in "First Last" form BibTeX reads "Alon De Jagger" as
% first = "Alon De", last = "Jagger" (a capitalized "De" is not a von part).
% If "De" belongs to the surname, switch to comma form; confirm the name.
@inproceedings{DBLP:conf/usenix/EliadHJSS21,
  author       = {Saar Eliad and
                  Ido Hakimi and
                  Alon De Jagger and
                  Mark Silberstein and
                  Assaf Schuster},
  title        = {Fine-tuning giant neural networks on commodity hardware with automatic
                  pipeline model parallelism},
  booktitle    = {{USENIX} Annual Technical Conference},
  pages        = {381--396},
  publisher    = {{USENIX} Association},
  year         = {2021}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume. Same title and authors as DBLP:conf/icml/LiZGZZSS21.
@article{DBLP:journals/corr/abs-2102-07988,
  author       = {Zhuohan Li and
                  Siyuan Zhuang and
                  Shiyuan Guo and
                  Danyang Zhuo and
                  Hao Zhang and
                  Dawn Song and
                  Ion Stoica},
  title        = {{TeraPipe}: Token-Level Pipeline Parallelism for Training Large-Scale
                  Language Models},
  journal      = {CoRR},
  volume       = {abs/2102.07988},
  eprinttype   = {arXiv},
  eprint       = {2102.07988},
  year         = {2021}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume for eprint-aware styles.
@article{DBLP:journals/corr/abs-2106-02679,
  author       = {Joel Lamy{-}Poirier},
  title        = {Layered gradient accumulation and modular pipeline parallelism: fast
                  and efficient training of large language models},
  journal      = {CoRR},
  volume       = {abs/2106.02679},
  eprinttype   = {arXiv},
  eprint       = {2106.02679},
  year         = {2021}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume. {Multi-GPU} is case-protected. The journal record
% DBLP:journals/paapp/AndoKT21 has the same authors and title wording.
@article{DBLP:journals/corr/abs-2106-12863,
  author       = {Ruo Ando and
                  Youki Kadobayashi and
                  Hiroki Takakura},
  title        = {Choice of Parallelism: {Multi-GPU} Driven Pipeline for Huge Academic
                  Backbone Network},
  journal      = {CoRR},
  volume       = {abs/2106.12863},
  eprinttype   = {arXiv},
  eprint       = {2106.12863},
  year         = {2021}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume for eprint-aware styles.
@article{DBLP:journals/corr/abs-2110-14895,
  author       = {Yang Hu and
                  Connor Imes and
                  Xuanang Zhao and
                  Souvik Kundu and
                  Peter A. Beerel and
                  Stephen P. Crago and
                  John Paul Walters},
  title        = {Pipeline Parallelism for Inference on Heterogeneous Edge Computing},
  journal      = {CoRR},
  volume       = {abs/2110.14895},
  eprinttype   = {arXiv},
  eprint       = {2110.14895},
  year         = {2021}
}
% {ResNet50} is braced so its capitalization survives sentence-casing styles.
@inproceedings{DBLP:conf/ic-nc/TakisawaYI20,
  author       = {Naoki Takisawa and
                  Syunji Yazaki and
                  Hiroaki Ishihata},
  title        = {Distributed Deep Learning of {ResNet50} and {VGG16} with Pipeline Parallelism},
  booktitle    = {{CANDAR} (Workshops)},
  pages        = {130--136},
  publisher    = {{IEEE}},
  year         = {2020}
}
@inproceedings{DBLP:conf/micro/NguyenS20,
  author    = {Nguyen, Quan M. and S{\'{a}}nchez, Daniel},
  title     = {Pipette: Improving Core Utilization on Irregular Applications through Intra-Core Pipeline Parallelism},
  booktitle = {{MICRO}},
  pages     = {596--608},
  publisher = {{IEEE}},
  year      = {2020}
}
% {PipeTune} is case-protected. Same title and authors as the CoRR record
% DBLP:journals/corr/abs-2010-00501.
@inproceedings{DBLP:conf/middleware/RochaMCFBS20,
  author       = {Isabelly Rocha and
                  Nathaniel Morris and
                  Lydia Y. Chen and
                  Pascal Felber and
                  Robert Birke and
                  Valerio Schiavoni},
  title        = {{PipeTune}: Pipeline Parallelism of Hyper and System Parameters Tuning
                  for Deep Learning Clusters},
  booktitle    = {Middleware},
  pages        = {89--104},
  publisher    = {{ACM}},
  year         = {2020}
}
% {HetPipe} is case-protected. Same title and authors as the CoRR record
% DBLP:journals/corr/abs-2005-14038.
@inproceedings{DBLP:conf/usenix/ParkYYNLCNC20,
  author       = {Jay H. Park and
                  Gyeongchan Yun and
                  Chang M. Yi and
                  Nguyen T. Nguyen and
                  Seungmin Lee and
                  Jaesik Choi and
                  Sam H. Noh and
                  Young{-}ri Choi},
  title        = {{HetPipe}: Enabling Large {DNN} Training on (Whimpy) Heterogeneous {GPU}
                  Clusters through Integration of Pipelined Model Parallelism and Data
                  Parallelism},
  booktitle    = {{USENIX} Annual Technical Conference},
  pages        = {307--321},
  publisher    = {{USENIX} Association},
  year         = {2020}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume for eprint-aware styles.
@article{DBLP:journals/corr/abs-2004-09910,
  author       = {Chiheon Kim and
                  Heungsub Lee and
                  Myungryong Jeong and
                  Woonhyuk Baek and
                  Boogeon Yoon and
                  Ildoo Kim and
                  Sungbin Lim and
                  Sungwoong Kim},
  title        = {torchgpipe: On-the-fly Pipeline Parallelism for Training Giant Models},
  journal      = {CoRR},
  volume       = {abs/2004.09910},
  eprinttype   = {arXiv},
  eprint       = {2004.09910},
  year         = {2020}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume. {HetPipe} is case-protected. Same title and authors
% as DBLP:conf/usenix/ParkYYNLCNC20.
@article{DBLP:journals/corr/abs-2005-14038,
  author       = {Jay H. Park and
                  Gyeongchan Yun and
                  Chang M. Yi and
                  Nguyen T. Nguyen and
                  Seungmin Lee and
                  Jaesik Choi and
                  Sam H. Noh and
                  Young{-}ri Choi},
  title        = {{HetPipe}: Enabling Large {DNN} Training on (Whimpy) Heterogeneous {GPU}
                  Clusters through Integration of Pipelined Model Parallelism and Data
                  Parallelism},
  journal      = {CoRR},
  volume       = {abs/2005.14038},
  eprinttype   = {arXiv},
  eprint       = {2005.14038},
  year         = {2020}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume. {PipeTune} is case-protected. Same title and authors
% as DBLP:conf/middleware/RochaMCFBS20.
@article{DBLP:journals/corr/abs-2010-00501,
  author       = {Isabelly Rocha and
                  Nathaniel Morris and
                  Lydia Y. Chen and
                  Pascal Felber and
                  Robert Birke and
                  Valerio Schiavoni},
  title        = {{PipeTune}: Pipeline Parallelism of Hyper and System Parameters Tuning
                  for Deep Learning Clusters},
  journal      = {CoRR},
  volume       = {abs/2010.00501},
  eprinttype   = {arXiv},
  eprint       = {2010.00501},
  year         = {2020}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume for eprint-aware styles. {BaPipe} is case-protected.
@article{DBLP:journals/corr/abs-2012-12544,
  author       = {Letian Zhao and
                  Rui Xu and
                  Tianqi Wang and
                  Teng Tian and
                  Xiaotian Wang and
                  Wei Wu and
                  Chio{-}in Ieong and
                  Xi Jin},
  title        = {{BaPipe}: Exploration of Balanced Pipeline Parallelism for {DNN} Training},
  journal      = {CoRR},
  volume       = {abs/2012.12544},
  eprinttype   = {arXiv},
  eprint       = {2012.12544},
  year         = {2020}
}
% {GPipe} is case-protected. The CoRR record DBLP:journals/corr/abs-1811-06965
% carries the same title with a shorter author list.
@inproceedings{DBLP:conf/nips/HuangCBFCCLNLWC19,
  author       = {Yanping Huang and
                  Youlong Cheng and
                  Ankur Bapna and
                  Orhan Firat and
                  Dehao Chen and
                  Mia Xu Chen and
                  HyoukJoong Lee and
                  Jiquan Ngiam and
                  Quoc V. Le and
                  Yonghui Wu and
                  Zhifeng Chen},
  title        = {{GPipe}: Efficient Training of Giant Neural Networks using Pipeline
                  Parallelism},
  booktitle    = {NeurIPS},
  pages        = {103--112},
  year         = {2019}
}
% Braces keep the system name's capitalization under sentence-casing styles.
@inproceedings{DBLP:conf/sosp/NarayananHPSDGG19,
  author       = {Deepak Narayanan and
                  Aaron Harlap and
                  Amar Phanishayee and
                  Vivek Seshadri and
                  Nikhil R. Devanur and
                  Gregory R. Ganger and
                  Phillip B. Gibbons and
                  Matei Zaharia},
  title        = {{PipeDream}: generalized pipeline parallelism for {DNN} training},
  booktitle    = {{SOSP}},
  pages        = {1--15},
  publisher    = {{ACM}},
  year         = {2019}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume. {XPipe} and {Multi-GPU} are case-protected.
@article{DBLP:journals/corr/abs-1911-04610,
  author       = {Lei Guan and
                  Wotao Yin and
                  Dongsheng Li and
                  Xicheng Lu},
  title        = {{XPipe}: Efficient Pipeline Model Parallelism for {Multi-GPU} {DNN} Training},
  journal      = {CoRR},
  volume       = {abs/1911.04610},
  eprinttype   = {arXiv},
  eprint       = {1911.04610},
  year         = {2019}
}
% arXiv preprint (dblp CoRR record); the eprint fields repeat the identifier
% from the CoRR volume. {GPipe} is case-protected.
% NOTE(review): the export spelled the second author "Yonglong Cheng"; it is
% aligned here with "Youlong Cheng" as in DBLP:conf/nips/HuangCBFCCLNLWC19
% (same title). Confirm against the arXiv record.
@article{DBLP:journals/corr/abs-1811-06965,
  author       = {Yanping Huang and
                  Youlong Cheng and
                  Dehao Chen and
                  HyoukJoong Lee and
                  Jiquan Ngiam and
                  Quoc V. Le and
                  Zhifeng Chen},
  title        = {{GPipe}: Efficient Training of Giant Neural Networks using Pipeline
                  Parallelism},
  journal      = {CoRR},
  volume       = {abs/1811.06965},
  eprinttype   = {arXiv},
  eprint       = {1811.06965},
  year         = {2018}
}
@inproceedings{DBLP:conf/ispa/WangTLF17,
  author    = {Wang, Junchang and Tian, Yangfeng and Li, Tao and Fu, Xiong},
  title     = {A Flexible Communication Mechanism for Pipeline Parallelism},
  booktitle = {{ISPA/IUCC}},
  pages     = {778--785},
  publisher = {{IEEE}},
  year      = {2017}
}
% {Java} is braced so the language name is not downcased by sentence-casing styles.
@inproceedings{DBLP:conf/pdp/WangK17,
  author       = {Yang Wang and
                  Kenneth B. Kent},
  title        = {A Region-Based Approach to Pipeline Parallelism in {Java} Programs on
                  Multicores},
  booktitle    = {{PDP}},
  pages        = {124--131},
  publisher    = {{IEEE} Computer Society},
  year         = {2017}
}
% The standard's name is braced so it keeps its capitals under sentence casing.
@article{DBLP:journals/jcsc/KamaliH16,
  author       = {Hadi Mardani Kamali and
                  Shaahin Hessabi},
  title        = {A Fault Tolerant Parallelism Approach for Implementing High-Throughput
                  Pipelined {Advanced Encryption Standard}},
  journal      = {J. Circuits Syst. Comput.},
  volume       = {25},
  number       = {9},
  pages        = {1650113:1--1650113:14},
  year         = {2016}
}
% {GPUs} is braced so the acronym is not downcased by sentence-casing styles.
@inproceedings{DBLP:conf/IEEEpact/KimJKS16,
  author       = {Gwangsun Kim and
                  Jiyun Jeong and
                  John Kim and
                  Mark Stephenson},
  title        = {Automatically Exploiting Implicit Pipeline Parallelism from Multiple
                  Dependent Kernels for {GPUs}},
  booktitle    = {{PACT}},
  pages        = {341--352},
  publisher    = {{ACM}},
  year         = {2016}
}
@inproceedings{DBLP:conf/asap/ChoiLBA16,
  author    = {Choi, Jongsok and Lian, Ruolong and
               Brown, Stephen Dean and Anderson, Jason Helge},
  title     = {A unified software approach to specify pipeline and spatial parallelism in {FPGA} hardware},
  booktitle = {{ASAP}},
  pages     = {75--82},
  publisher = {{IEEE} Computer Society},
  year      = {2016}
}
@inproceedings{DBLP:conf/europar/ParkB16,
  author    = {Park, Jinsu and Baek, Woongki},
  title     = {{HAP:} {A} Heterogeneity-Conscious Runtime System for Adaptive Pipeline Parallelism},
  booktitle = {Euro-Par},
  series    = {Lecture Notes in Computer Science},
  volume    = {9833},
  pages     = {518--530},
  publisher = {Springer},
  year      = {2016}
}
% {CSDFa} is braced so its mixed capitalization survives sentence-casing styles.
@inproceedings{DBLP:conf/scopes/KoekGHCB16,
  author       = {Peter Koek and
                  Stefan J. Geuns and
                  Joost P. H. M. Hausmans and
                  Henk Corporaal and
                  Marco Jan Gerrit Bekooij},
  title        = {{CSDFa}: {A} Model for Exploiting the Trade-Off between Data and Pipeline
                  Parallelism},
  booktitle    = {{SCOPES}},
  pages        = {30--39},
  publisher    = {{ACM}},
  year         = {2016}
}
@article{DBLP:journals/ieicet/ChenLWZW15,
  author  = {Chen, Chen and Lu, Kai and Wang, Xiaoping and
             Zhou, Xu and Wu, Zhendong},
  title   = {A Load-Balanced Deterministic Runtime for Pipeline Parallelism},
  journal = {{IEICE} Trans. Inf. Syst.},
  volume  = {98-D},
  number  = {2},
  pages   = {433--436},
  year    = {2015}
}
@article{DBLP:journals/ijnc/YamagiwaWW15,
  author       = {Yamagiwa, Shinichi and
                  Wang, Guyue and
                  Wada, Koichi},
  title        = {Development of an Algorithm for Extracting Parallelism and Pipeline
                  Structure from Stream-based Processing flow with Spanning Tree},
  journal      = {Int. J. Netw. Comput.},
  volume       = {5},
  number       = {1},
  pages        = {159--179},
  year         = {2015},
}
@article{DBLP:journals/jcst/ZhangLC15,
  author       = {Zhang, Yu and
                  Li, Zhaopeng and
                  Cao, Hui{-}Fang},
  title        = {System-Enforced Deterministic Streaming for Efficient Pipeline Parallelism},
  journal      = {J. Comput. Sci. Technol.},
  volume       = {30},
  number       = {1},
  pages        = {57--73},
  year         = {2015},
}
@article{DBLP:journals/topc/LeeLSZS15,
  author       = {Lee, I{-}Ting Angelina and
                  Leiserson, Charles E. and
                  Schardl, Tao B. and
                  Zhang, Zhunping and
                  Sukha, Jim},
  title        = {On-the-Fly Pipeline Parallelism},
  journal      = {{ACM} Trans. Parallel Comput.},
  volume       = {2},
  number       = {3},
  pages        = {17:1--17:42},
  year         = {2015},
}
@inproceedings{DBLP:conf/bigdataconf/TranPS15,
  author       = {Tran, Nam{-}Luc and
                  Peel, Thomas and
                  Skhiri, Sabri},
  title        = {Distributed {Frank-Wolfe} under pipelined stale synchronous parallelism},
  booktitle    = {{IEEE} BigData},
  pages        = {184--192},
  publisher    = {{IEEE} Computer Society},
  year         = {2015},
}
@inproceedings{DBLP:conf/memocode/HausmansGWB14,
  author       = {Hausmans, Joost P. H. M. and
                  Geuns, Stefan J. and
                  Wiggers, Maarten and
                  Bekooij, Marco Jan Gerrit},
  title        = {Unified dataflow model for the analysis of data and pipeline parallelism,
                  and buffer sizing},
  booktitle    = {{MEMOCODE}},
  pages        = {12--21},
  publisher    = {{IEEE}},
  year         = {2014},
}
@inproceedings{DBLP:conf/springsim/KhammassiL14,
  author       = {Khammassi, Nader and
                  Le Lann, Jean{-}Christophe},
  title        = {A high-level programming model to ease pipeline parallelism expression
                  on shared memory multicore architectures},
  booktitle    = {SpringSim {(HPS)}},
  pages        = {9},
  publisher    = {{ACM}},
  year         = {2014},
}
@phdthesis{DBLP:phd/hal/PreudHomme13,
  author       = {Preud'homme, Thomas},
  title        = {Communication inter-c{\oe}urs optimis{\'{e}}e pour le parall{\'{e}}lisme
                  de flux. (Optimized inter-core communication for pipeline parallelism)},
  school       = {Pierre and Marie Curie University, Paris, France},
  year         = {2013},
}
@article{DBLP:journals/ieicet/MuLCDW13,
  author       = {Mu, Shuai and
                  Li, Dongdong and
                  Chen, Yubei and
                  Deng, Yangdong and
                  Wang, Zhihua},
  title        = {Exploiting the Task-Pipelined Parallelism of Stream Programs on Many-Core
                  {GPUs}},
  journal      = {{IEICE} Trans. Inf. Syst.},
  volume       = {96-D},
  number       = {10},
  pages        = {2194--2207},
  year         = {2013},
}
@article{DBLP:journals/jsa/LinLLHS13,
  author       = {Lin, Chih{-}Sheng and
                  Lin, Chao{-}Sheng and
                  Lin, Yu{-}Shin and
                  Hsiung, Pao{-}Ann and
                  Shih, Chihhsiong},
  title        = {Multi-objective exploitation of pipeline parallelism using clustering,
                  replication and duplication in embedded multi-core systems},
  journal      = {J. Syst. Archit.},
  volume       = {59},
  number       = {10-C},
  pages        = {1083--1094},
  year         = {2013},
}
@inproceedings{DBLP:conf/cases/CordesENM13,
  author       = {Cordes, Daniel and
                  Engel, Michael and
                  Neugebauer, Olaf and
                  Marwedel, Peter},
  title        = {Automatic Extraction of pipeline parallelism for embedded heterogeneous
                  multi-core platforms},
  booktitle    = {{CASES}},
  pages        = {4:1--4:10},
  publisher    = {{IEEE}},
  year         = {2013},
}
@inproceedings{DBLP:conf/cases/SchorYBT13,
  author       = {Schor, Lars and
                  Yang, Hoeseok and
                  Bacivarov, Iuliana and
                  Thiele, Lothar},
  title        = {Expandable process networks to efficiently specify and explore task,
                  data, and pipeline parallelism},
  booktitle    = {{CASES}},
  pages        = {5:1--5:10},
  publisher    = {{IEEE}},
  year         = {2013},
}
@inproceedings{DBLP:conf/hipc/LiABC13,
  author       = {Li, Peng and
                  Agrawal, Kunal and
                  Buhler, Jeremy and
                  Chamberlain, Roger D.},
  title        = {Adding data parallelism to streaming pipelines for throughput optimization},
  booktitle    = {HiPC},
  pages        = {20--29},
  publisher    = {{IEEE} Computer Society},
  year         = {2013},
}
@inproceedings{DBLP:conf/icpp/YamagiwaJZZX13,
  author       = {Yamagiwa, Shinichi and
                  Jozaki, Ryo and
                  Zhang, Shixun and
                  Zaizen, Ryo and
                  Xu, Dewen},
  title        = {Exploiting Execution Order and Parallelism from Processing Flow Applying
                  Pipeline-Based Programming Method on Manycore Accelerators},
  booktitle    = {{ICPP}},
  pages        = {708--717},
  publisher    = {{IEEE} Computer Society},
  year         = {2013},
}
@inproceedings{DBLP:conf/pldi/Ragan-KelleyBAPDA13,
  author       = {Ragan{-}Kelley, Jonathan and
                  Barnes, Connelly and
                  Adams, Andrew and
                  Paris, Sylvain and
                  Durand, Fr{\'{e}}do and
                  Amarasinghe, Saman P.},
  title        = {Halide: a language and compiler for optimizing parallelism, locality,
                  and recomputation in image processing pipelines},
  booktitle    = {{PLDI}},
  pages        = {519--530},
  publisher    = {{ACM}},
  year         = {2013},
}
@inproceedings{DBLP:conf/sc/KamruzzamanST13,
  author       = {Kamruzzaman, Md. and
                  Swanson, Steven and
                  Tullsen, Dean M.},
  title        = {Load-balanced pipeline parallelism},
  booktitle    = {{SC}},
  pages        = {14:1--14:12},
  publisher    = {{ACM}},
  year         = {2013},
}
@inproceedings{DBLP:conf/sc/VandierendonckCN13,
  author       = {Vandierendonck, Hans and
                  Chronaki, Kallia and
                  Nikolopoulos, Dimitrios S.},
  title        = {Deterministic scale-free pipeline parallelism with hyperqueues},
  booktitle    = {{SC}},
  pages        = {32:1--32:12},
  publisher    = {{ACM}},
  year         = {2013},
}
@inproceedings{DBLP:conf/spaa/LeeLSSZ13,
  author       = {Lee, I{-}Ting Angelina and
                  Leiserson, Charles E. and
                  Schardl, Tao B. and
                  Sukha, Jim and
                  Zhang, Zhunping},
  title        = {On-the-fly pipeline parallelism},
  booktitle    = {{SPAA}},
  pages        = {140--151},
  publisher    = {{ACM}},
  year         = {2013},
}
@inproceedings{DBLP:conf/codes/CordesEMN12,
  author       = {Cordes, Daniel and
                  Engel, Michael and
                  Marwedel, Peter and
                  Neugebauer, Olaf},
  title        = {Automatic extraction of multi-objective aware pipeline parallelism
                  using genetic algorithms},
  booktitle    = {{CODES+ISSS}},
  pages        = {73--82},
  publisher    = {{ACM}},
  year         = {2012},
}
@inproceedings{DBLP:conf/europar/BenknerBMSNT12,
  author       = {Benkner, Siegfried and
                  Bajrovic, Enes and
                  Marth, Erich and
                  Sandrieser, Martin and
                  Namyst, Raymond and
                  Thibault, Samuel},
  title        = {High-Level Support for Pipeline Parallelism on Many-Core Architectures},
  booktitle    = {Euro-Par},
  series       = {Lecture Notes in Computer Science},
  volume       = {7484},
  pages        = {614--625},
  publisher    = {Springer},
  year         = {2012},
}
@inproceedings{DBLP:conf/icpads/PreudhommeS0F12,
  author       = {Preud'homme, Thomas and
                  Sopena, Julien and
                  Thomas, Ga{\"{e}}l and
                  Folliot, Bertil},
  title        = {An Improvement of {OpenMP} Pipeline Parallelism with the {BatchQueue}
                  Algorithm},
  booktitle    = {{ICPADS}},
  pages        = {348--355},
  publisher    = {{IEEE} Computer Society},
  year         = {2012},
}
@inproceedings{DBLP:conf/icpp/ChenYZLZC12,
  author       = {Chen, Peng and
                  Yang, Donglei and
                  Zhang, Weihua and
                  Li, Yi and
                  Zang, Binyu and
                  Chen, Haibo},
  title        = {Adaptive Pipeline Parallelism for Image Feature Extraction Algorithms},
  booktitle    = {{ICPP}},
  pages        = {299--308},
  publisher    = {{IEEE} Computer Society},
  year         = {2012},
}
@inproceedings{DBLP:conf/ppopp/Qasem12,
  author       = {Qasem, Apan},
  title        = {Efficient execution of time-step computations with pipelined parallelism
                  and inter-thread data locality optimizations},
  booktitle    = {{PMAM}},
  pages        = {27--35},
  publisher    = {{ACM}},
  year         = {2012},
}
@inproceedings{DBLP:conf/IEEEpact/SanchezLYSK11,
  author       = {S{\'{a}}nchez, Daniel and
                  Lo, David and
                  Yoo, Richard M. and
                  Sugerman, Jeremy and
                  Kozyrakis, Christos},
  title        = {Dynamic Fine-Grain Scheduling of Pipeline Parallelism},
  booktitle    = {{PACT}},
  pages        = {22--32},
  publisher    = {{IEEE} Computer Society},
  year         = {2011},
}
@inproceedings{DBLP:conf/ica3pp/LiYHSCP11,
  author       = {Li, Shigang and
                  Yao, Shucai and
                  He, Haohu and
                  Sun, Lili and
                  Chen, Yi and
                  Peng, Yunfeng},
  title        = {Extending Synchronization Constructs in {OpenMP} to Exploit Pipeline
                  Parallelism on Heterogeneous Multi-core},
  booktitle    = {{ICA3PP} {(2)}},
  series       = {Lecture Notes in Computer Science},
  volume       = {7017},
  pages        = {54--63},
  publisher    = {Springer},
  year         = {2011},
}
@inproceedings{DBLP:conf/icpads/CordesHMM11,
  author       = {Cordes, Daniel and
                  Heinig, Andreas and
                  Marwedel, Peter and
                  Mallik, Arindam},
  title        = {Automatic Extraction of Pipeline Parallelism for Embedded Software
                  Using Linear Programming},
  booktitle    = {{ICPADS}},
  pages        = {699--706},
  publisher    = {{IEEE} Computer Society},
  year         = {2011},
}
@inproceedings{DBLP:conf/oopsla/ReedCJ11,
  author       = {Reed, Eric C. and
                  Chen, Nicholas and
                  Johnson, Ralph E.},
  title        = {Expressing pipeline parallelism using {TBB} constructs: a case study
                  on what works and what doesn't},
  booktitle    = {{SPLASH} Workshops},
  pages        = {133--138},
  publisher    = {{ACM}},
  year         = {2011},
}
@article{DBLP:journals/concurrency/Gonzalez-VelezC10,
  author       = {Gonz{\'{a}}lez{-}V{\'{e}}lez, Horacio and
                  Cole, Murray},
  title        = {Adaptive structured parallelism for distributed heterogeneous architectures:
                  a methodological approach with pipelines and farms},
  journal      = {Concurr. Comput. Pract. Exp.},
  volume       = {22},
  number       = {15},
  pages        = {2073--2094},
  year         = {2010},
}
@article{DBLP:journals/pc/RulVB10,
  author       = {Rul, Sean and
                  Vandierendonck, Hans and
                  De Bosschere, Koen},
  title        = {A profile-based tool for finding pipeline parallelism in sequential
                  programs},
  journal      = {Parallel Comput.},
  volume       = {36},
  number       = {9},
  pages        = {531--551},
  year         = {2010},
}
@inproceedings{DBLP:conf/IEEEpact/SulemanQKP10,
  author       = {Suleman, M. Aater and
                  Qureshi, Moinuddin K. and
                  Khubaib and
                  Patt, Yale N.},
  title        = {Feedback-directed pipeline parallelism},
  booktitle    = {{PACT}},
  pages        = {147--156},
  publisher    = {{ACM}},
  year         = {2010},
}
@inproceedings{DBLP:conf/IEEEpact/TournavitisF10,
  author       = {Tournavitis, Georgios and
                  Franke, Bj{\"{o}}rn},
  title        = {Semi-automatic extraction and exploitation of hierarchical pipeline
                  parallelism using profiling information},
  booktitle    = {{PACT}},
  pages        = {377--388},
  publisher    = {{ACM}},
  year         = {2010},
}
@inproceedings{DBLP:conf/europar/OttoSDT10,
  author       = {Otto, Frank and
                  Schaefer, Christoph A. and
                  Dempe, Matthias and
                  Tichy, Walter F.},
  title        = {A Language-Based Tuning Mechanism for Task and Pipeline Parallelism},
  booktitle    = {Euro-Par {(2)}},
  series       = {Lecture Notes in Computer Science},
  volume       = {6272},
  pages        = {328--340},
  publisher    = {Springer},
  year         = {2010},
}
@inproceedings{DBLP:conf/IEEEpact/NavarroATC09,
  author       = {Navarro, Angeles G. and
                  Asenjo, Rafael and
                  Tabik, Siham and
                  Cascaval, Calin},
  title        = {Analytical Modeling of Pipeline Parallelism},
  booktitle    = {{PACT}},
  pages        = {281--290},
  publisher    = {{IEEE} Computer Society},
  year         = {2009},
}
@inproceedings{DBLP:conf/arcs/SyrivelisL09,
  author       = {Syrivelis, Dimitris and
                  Lalis, Spyros},
  title        = {Extracting Coarse-Grained Pipelined Parallelism Out of Sequential
                  Applications for Parallel Processor Arrays},
  booktitle    = {{ARCS}},
  series       = {Lecture Notes in Computer Science},
  volume       = {5455},
  pages        = {4--15},
  publisher    = {Springer},
  year         = {2009},
}
@inproceedings{DBLP:conf/icppw/WuWDX09,
  author       = {Wu, Guiming and
                  Wang, Miao and
                  Dou, Yong and
                  Xia, Fei},
  title        = {Exploiting Fine-Grained Pipeline Parallelism for Wavefront Computations
                  on Multicore Platforms},
  booktitle    = {{ICPP} Workshops},
  pages        = {402--408},
  publisher    = {{IEEE} Computer Society},
  year         = {2009},
}
@inproceedings{DBLP:conf/ics/NavarroATC09,
  author       = {Navarro, Angeles G. and
                  Asenjo, Rafael and
                  Tabik, Siham and
                  Cascaval, Calin},
  title        = {Load balancing using work-stealing for pipeline parallelism in emerging
                  applications},
  booktitle    = {{ICS}},
  pages        = {517--518},
  publisher    = {{ACM}},
  year         = {2009},
}
@incollection{DBLP:reference/db/X09xqs,
  key          = {Pipelined and Independent Parallelism},
  title        = {Pipelined and Independent Parallelism},
  booktitle    = {Encyclopedia of Database Systems},
  pages        = {2117},
  publisher    = {Springer {US}},
  year         = {2009},
}
@article{DBLP:journals/jilp/PuzakHESN08,
  author       = {Puzak, Thomas R. and
                  Hartstein, Allan and
                  Emma, Philip G. and
                  Srinivasan, Vijayalakshmi and
                  Nadas, Arthur},
  title        = {Analyzing the Cost of a Cache Miss Using Pipeline Spectroscopy},
  journal      = {J. Instr. Level Parallelism},
  volume       = {10},
  year         = {2008},
}
@inproceedings{DBLP:conf/icsoft/HassanB08,
  author       = {Hassan, Mohamad Al Hajj and
                  Bamha, Mostafa},
  title        = {Pipelined Parallelism in Multi-Join Queries on Heterogeneous Shared
                  Nothing Architectures},
  booktitle    = {{ICSOFT} {(PL/DPS/KE)}},
  pages        = {127--134},
  publisher    = {{INSTICC} Press},
  year         = {2008},
}
@inproceedings{DBLP:conf/ppopp/GiacomoniMV08,
  author       = {Giacomoni, John and
                  Moseley, Tipp and
                  Vachharajani, Manish},
  title        = {{FastForward} for efficient pipeline parallelism: a cache-optimized
                  concurrent lock-free queue},
  booktitle    = {PPoPP},
  pages        = {43--52},
  publisher    = {{ACM}},
  year         = {2008},
}
@inproceedings{DBLP:conf/IEEEpact/GiacomoniMV07,
  author       = {Giacomoni, John and
                  Moseley, Tipp and
                  Vachharajani, Manish},
  title        = {{FastForward} for Efficient Pipeline Parallelism},
  booktitle    = {{PACT}},
  pages        = {407},
  publisher    = {{IEEE} Computer Society},
  year         = {2007},
}
@inproceedings{DBLP:conf/micro/ThiesCA07,
  author       = {Thies, William and
                  Chandrasekhar, Vikram and
                  Amarasinghe, Saman P.},
  title        = {A Practical Approach to Exploiting Coarse-Grained Pipeline Parallelism
                  in {C} Programs},
  booktitle    = {{MICRO}},
  pages        = {356--369},
  publisher    = {{IEEE} Computer Society},
  year         = {2007},
}
@article{DBLP:journals/mst/ChungGMV06,
  author       = {Chung, Fan R. K. and
                  Graham, Ronald L. and
                  Mao, Jia and
                  Varghese, George},
  title        = {Parallelism versus Memory Allocation in Pipelined Router Forwarding
                  Engines},
  journal      = {Theory Comput. Syst.},
  volume       = {39},
  number       = {6},
  pages        = {829--849},
  year         = {2006},
}
@article{DBLP:journals/pcs/AdutskevichL06,
  author       = {Adutskevich, Evgeniya V. and
                  Likhoded, Nickolai A.},
  title        = {A consistent generation of pipeline parallelism and distribution of
                  operations and data among processors},
  journal      = {Program. Comput. Softw.},
  volume       = {32},
  number       = {3},
  pages        = {166--176},
  year         = {2006},
}
@inproceedings{DBLP:conf/asplos/GordonTA06,
  author       = {Gordon, Michael I. and
                  Thies, William and
                  Amarasinghe, Saman P.},
  title        = {Exploiting coarse-grained task, data, and pipeline parallelism in
                  stream programs},
  booktitle    = {{ASPLOS}},
  pages        = {151--162},
  publisher    = {{ACM}},
  year         = {2006},
}
@inproceedings{DBLP:conf/ispa/Gonzalez-VelezC06,
  author       = {Gonz{\'{a}}lez{-}V{\'{e}}lez, Horacio and
                  Cole, Murray},
  title        = {Towards Fully Adaptive Pipeline Parallelism for Heterogeneous Distributed
                  Environments},
  booktitle    = {{ISPA}},
  series       = {Lecture Notes in Computer Science},
  volume       = {4330},
  pages        = {916--926},
  publisher    = {Springer},
  year         = {2006},
}
@inproceedings{DBLP:conf/icpp/DuA05,
  author       = {Du, Wei and
                  Agrawal, Gagan},
  title        = {Filter Decomposition for Supporting Coarse-Grained Pipelined Parallelism},
  booktitle    = {{ICPP}},
  pages        = {539--546},
  publisher    = {{IEEE} Computer Society},
  year         = {2005},
}
@inproceedings{DBLP:conf/micro/LarsenRA05,
  author       = {Larsen, Samuel and
                  Rabbah, Rodric M. and
                  Amarasinghe, Saman P.},
  title        = {Exploiting Vector Parallelism in Software Pipelined Loops},
  booktitle    = {{MICRO}},
  pages        = {119--129},
  publisher    = {{IEEE} Computer Society},
  year         = {2005},
}
@inproceedings{DBLP:conf/vldb/LiuR05,
  author       = {Liu, Bin and
                  Rundensteiner, Elke A.},
  title        = {Revisiting Pipelined Parallelism in Multi-Join Query Processing},
  booktitle    = {{VLDB}},
  pages        = {829--840},
  publisher    = {{ACM}},
  year         = {2005},
}
@inproceedings{DBLP:conf/icpp/DuA04,
  author       = {Du, Wei and
                  Agrawal, Gagan},
  title        = {Packet Size Optimization for Supporting Coarse-Grained Pipelined Parallelism},
  booktitle    = {{ICPP}},
  pages        = {259--266},
  publisher    = {{IEEE} Computer Society},
  year         = {2004},
}
@inproceedings{DBLP:conf/spaa/ChungGV04,
  author       = {Chung, Fan R. K. and
                  Graham, Ronald L. and
                  Varghese, George},
  title        = {Parallelism versus memory allocation in pipelined router forwarding
                  engines},
  booktitle    = {{SPAA}},
  pages        = {103--111},
  publisher    = {{ACM}},
  year         = {2004},
}
@inproceedings{DBLP:conf/ipps/DuA03,
  author       = {Du, Wei and
                  Agrawal, Gagan},
  title        = {Compiler Supported Coarse-Grained Pipelined Parallelism: Why and How},
  booktitle    = {{IPDPS}},
  pages        = {204},
  publisher    = {{IEEE} Computer Society},
  year         = {2003},
}
@inproceedings{DBLP:conf/parco/BahmaE03,
  author       = {Bamha, Mostafa and
                  Exbrayat, Matthieu},
  title        = {Pipelined parallelism for multi-join queries on shared nothing machines},
  booktitle    = {{PARCO}},
  series       = {Advances in Parallel Computing},
  volume       = {13},
  pages        = {47--54},
  publisher    = {Elsevier},
  year         = {2003},
}
@inproceedings{DBLP:conf/sc/DuFA03,
  author       = {Du, Wei and
                  Ferreira, Renato and
                  Agrawal, Gagan},
  title        = {Compiler Support for Exploiting Coarse-Grained Pipelined Parallelism},
  booktitle    = {{SC}},
  pages        = {8},
  publisher    = {{ACM}},
  year         = {2003},
}
@article{DBLP:journals/jpdc/SubhlokV00,
  author       = {Subhlok, Jaspal and
                  Vondran, Gary},
  title        = {Optimal Use of Mixed Task and Data Parallelism for Pipelined Computations},
  journal      = {J. Parallel Distributed Comput.},
  volume       = {60},
  number       = {3},
  pages        = {297--319},
  year         = {2000},
}
@inproceedings{DBLP:conf/iscas/ZimmermannL94,
  author       = {Zimmermann, Steffen and
                  Lueder, Ernst},
  title        = {A Formal Approach To Pipeline Optimization in Synthesis of Digital
                  Signal Processors with Fine Grain Parallelism},
  booktitle    = {{ISCAS}},
  pages        = {325--328},
  publisher    = {{IEEE}},
  year         = {1994},
}
@inproceedings{DBLP:conf/vldb/HasanM94,
  author       = {Hasan, Waqar and
                  Motwani, Rajeev},
  title        = {Optimization Algorithms for Exploiting the Parallelism-Communication
                  Tradeoff in Pipelined Parallelism},
  booktitle    = {{VLDB}},
  pages        = {36--47},
  publisher    = {Morgan Kaufmann},
  year         = {1994},
}
@inproceedings{DBLP:conf/parle/SpiliopoulouHV92,
  author       = {Spiliopoulou, Myra and
                  Hatzopoulos, Michael and
                  Vassilakis, Costas},
  title        = {Using Parallelism and Pipeline for the Optimisation of Join Queries},
  booktitle    = {{PARLE}},
  series       = {Lecture Notes in Computer Science},
  volume       = {605},
  pages        = {279--294},
  publisher    = {Springer},
  year         = {1992},
}
@inproceedings{DBLP:conf/icpp/LiljaY90,
  author       = {Lilja, David J. and
                  Yew, Pen{-}Chung},
  title        = {Comparing Parallelism Extraction Techniques: Superscalar Processors,
                  Pipelined Processors, and Multiprocessors},
  booktitle    = {{ICPP} {(1)}},
  pages        = {563--564},
  publisher    = {Pennsylvania State University Press},
  year         = {1990},
}
@inproceedings{DBLP:conf/ieaaie/SarmaW90,
  author       = {Sarma, D. and
                  Wu, C. P.},
  title        = {Pipelined {OR}-Parallelism Architecture for Parallel Execution of {Prolog}},
  booktitle    = {{IEA/AIE} (Vol. 2)},
  pages        = {864--873},
  publisher    = {{ACM}},
  year         = {1990},
}
@article{DBLP:journals/tsp/ParhiM89,
  author       = {Parhi, Keshab K. and
                  Messerschmitt, David G.},
  title        = {Pipeline interleaving and parallelism in recursive digital filters.
                  {I.} Pipelining using scattered look-ahead and decomposition},
  journal      = {{IEEE} Trans. Acoust. Speech Signal Process.},
  volume       = {37},
  number       = {7},
  pages        = {1099--1117},
  year         = {1989},
}
@article{DBLP:journals/tsp/ParhiM89a,
  author       = {Parhi, Keshab K. and
                  Messerschmitt, David G.},
  title        = {Pipeline interleaving and parallelism in recursive digital filters.
                  {II.} Pipelined incremental block filtering},
  journal      = {{IEEE} Trans. Acoust. Speech Signal Process.},
  volume       = {37},
  number       = {7},
  pages        = {1118--1134},
  year         = {1989},
}
@inproceedings{DBLP:conf/eurographics/ChapmanL89,
  author       = {Chapman, Paul A. and
                  Lewis, Eric},
  title        = {Adding Parallelism in Object Space to the Rendering Pipeline},
  booktitle    = {Eurographics},
  publisher    = {North-Holland / Eurographics Association},
  year         = {1989},
}
@article{DBLP:journals/computer/Witt85a,
  author       = {Witt, Bernard I.},
  title        = {Parallelism, Pipelines, and Partitions: Variations on Communicating
                  Modules},
  journal      = {Computer},
  volume       = {18},
  number       = {2},
  pages        = {105--112},
  year         = {1985},
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics