% AsHES 2012 workshop paper on MPI communication over CUDA IPC.
% Review notes: added a citation key (the entry had none); authors are now
% separated by " and " in "Last, First" form; the venue moved from the
% non-standard `conference` field to the required `booktitle`; the
% placeholder `location = {None}` was dropped. `source` is an unrecognised
% (ignored) field kept for provenance: it points at the publication listing
% the entry was taken from, not at the paper itself.
@inproceedings{potluri2012optimizing,
  author    = {Potluri, S. and Wang, H. and Bureddy, D. and Singh, A. and Rosales, C. and Panda, D.},
  title     = {Optimizing {MPI} Communication on {Multi-GPU} Systems using {CUDA} Inter-Process Communication},
  booktitle = {International Workshop on Accelerators and Hybrid Exascale Systems ({AsHES})},
  year      = {2012},
  month     = may,
  source    = {http://nowlab.cse.ohio-state.edu/publications/},
}