cudpp.bib

@incollection{Allusse:2008:GAG,
  author    = {Yannick Allusse and Patrick Horain and Ankit Agarwal and
               Cindula Saipriyadarshan},
  title     = {{GpuCV}: A {GPU}-Accelerated Framework for Image Processing
               and Computer Vision},
  booktitle = {Advances in Visual Computing},
  series    = {Lecture Notes in Computer Science},
  volume    = {5359},
  pages     = {430--439},
  publisher = {Springer},
  month     = dec,
  year      = {2008},
  doi       = {10.1007/978-3-540-89646-3},
}

@incollection{Aubert:2009:API,
  author = {Dominique Aubert and Mehdi Amini and Romaric David},
  title = {A Particle-Mesh Integrator for Galactic Dynamics
                  Powered by {GPGPU}s},
  booktitle = {Proceedings of the 9th International Conference on
                  Computational Science},
  series = {Lecture Notes in Computer Science},
  publisher = {Springer},
  volume = 5544,
  year = 2009,
  month = may,
  pages = {874--883},
  doi = {10.1007/978-3-642-01970-8_88}
}

@inproceedings{Bailer:2010:TAC,
  author    = {Bailer, W. and Fassold, H. and Lee, F. and Rosner, J.},
  title     = {Tracking and Clustering Salient Features in Image Sequences},
  booktitle = {2010 Conference on Visual Media Production (CVMP)},
  pages     = {17--24},
  year      = {2010},
  doi       = {10.1109/CVMP.2010.10},
  keywords  = {computer graphic equipment;coprocessors;data
               visualisation;image sequences;object
               tracking;pattern clustering;GPU accelerated
               approach;audio rendering;computer generated
               objects;image sequences;media production;object
               trajectories visualization;salient features
               clustering;Clustering algorithms;Feature
               extraction;Graphics processing unit;Hidden Markov
               models;Image
               sequences;Tracking;Trajectory;GPU;clustering;motion
               segmentation;tracking},
}

@inproceedings{Billeter:2009:ESC,
  author    = {Markus Billeter and Ola Olsson and Ulf Assarsson},
  title     = {Efficient Stream Compaction on Wide {SIMD} Many-Core
               Architectures},
  booktitle = {Proceedings of High Performance Graphics 2009},
  pages     = {159--166},
  month     = aug,
  year      = {2009},
  doi       = {10.1145/1572769.1572795},
}

@inproceedings{Bosnacki:2010:GAE,
  author = {Bo{\v{s}}na{\v{c}}ki, Dragan and Edelkamp, Stefan
                  and Sulewski, Damien and Wijs, Anton},
  booktitle = {2010 Ninth International Workshop on Parallel and
                  Distributed Methods in Verification, and Second
                  International Workshop on High Performance
                  Computational Systems Biology},
  title = {{GPU-PRISM}: An extension of {PRISM} for General
                  Purpose Graphics Processing Units},
  year = 2010,
  pages = {17--19},
  month = sep,
  keywords = {computer graphic equipment;coprocessors;formal
                  verification;matrix multiplication;parallel
                  algorithms;parallel architectures;CUDA
                  architecture;GPU-PRISM;PRISM model
                  checker;coprocessor;general purpose graphics
                  processing units;linear algebraic operation;linear
                  equation;matrix vector multiplication;parallel
                  algorithm;probabilistic model checking;runtime
                  improvement;GPU;model checker PRISM;parallel
                  algorithms;probabilistic model checking},
  doi = {10.1109/PDMC-HiBi.2010.11}
}

@inproceedings{Cabido:2010:DEF,
  title = {Differential Evolution for Global Optimization on
                  {GPU}},
  author = {Cabido, R. and Duarte, A. and Montemayor, A. S. and
                  Pantrigo, J. J.},
  booktitle = {International Conference on Metaheuristics and Nature
                  Inspired Computing},
  year = 2010
}

@article{Chang:2012:SDP,
  author    = {Chang, Yue-Shan and Sheu, Ruey-Kai and Yuan, Shyan-Ming and
               Hsu, Jyn-Jie},
  title     = {Scaling database performance on {GPU}s},
  journal   = {Information Systems Frontiers},
  volume    = {14},
  number    = {4},
  pages     = {909--924},
  year      = {2012},
  publisher = {Springer US},
  issn      = {1387-3326},
  doi       = {10.1007/s10796-011-9322-0},
  keywords  = {GPU; CUDA; SQLite; In-Memory Database},
  language  = {English},
}

@inproceedings{Chiu:2011:DTU,
  author    = {Chiu, Chun-Chieh and Luo, Guo-Heng and Yuan, Shyan-Ming},
  title     = {A decision tree using {CUDA} {GPU}s},
  booktitle = {Proceedings of the 13th International Conference on
               Information Integration and Web-based Applications and
               Services},
  series    = {iiWAS '11},
  location  = {Ho Chi Minh City, Vietnam},
  pages     = {399--402},
  numpages  = {4},
  year      = {2011},
  publisher = {ACM},
  address   = {New York, NY, USA},
  isbn      = {978-1-4503-0784-0},
  doi       = {10.1145/2095536.2095615},
  acmid     = {2095615},
  keywords  = {CUDA, GPGPU, classification, data mining, decision tree},
}

@inproceedings{Chong:2008:DLV,
  author    = {Jike Chong and Youngmin Yi and Arlo Faria and Nadathur
               Satish and Kurt Keutzer},
  title     = {Data-Parallel Large Vocabulary Continuous Speech Recognition
               on Graphics Processors},
  booktitle = {Proceedings of the 1st Annual Workshop on Emerging
               Applications and Many Core Architecture (EAMA)},
  year      = {2008},
  month     = jun,
  pages     = {23--35},
  url       = {http://www.gigascale.org/pubs/1499.html},
}

@inproceedings{Davidson:2012:EPM,
  author = {Andrew Davidson and David Tarjan and Michael Garland
                  and John D. Owens},
  title = {Efficient Parallel Merge Sort for Fixed and Variable
                  Length Keys},
  booktitle = {Proceedings of Innovative Parallel Computing (InPar
                  '12)},
  year = 2012,
  month = may,
  url = {http://www.idav.ucdavis.edu/publications/print_pub?pub_id=1085},
  doi = {10.1109/InPar.2012.6339592},
  acceptance = {25/62 (40.3\%)}
}

@mastersthesis{Dukehart:2009:GRW,
  author = {Sean Peter Dukehart},
  title  = {{GPU} Random Walkers for Iterative Image Segmentation},
  school = {Department of Computer Science, University of Maryland
            Baltimore County},
  month  = feb,
  year   = {2009},
}

@inproceedings{Eisenacher:2009:RTV,
  author    = {Christian Eisenacher and Quirin Meyer and Charles Loop},
  title     = {Real-Time View-Dependent Rendering of Parametric Surfaces},
  booktitle = {I3D '09: Proceedings of the 2009 Symposium on Interactive 3D
               Graphics and Games},
  pages     = {137--143},
  year      = {2009},
  month     = feb # {\slash } # mar,
  doi       = {10.1145/1507149.1507172},
}

@article{Garanzha:2010:FRS,
  author = {Garanzha, Kirill and Loop, Charles},
  title = {Fast Ray Sorting and Breadth-First Packet Traversal
                  for {GPU} Ray Tracing},
  journal = {Computer Graphics Forum},
  year = 2010,
  month = may,
  volume = 29,
  number = 2,
  pages = {289--298},
  issn = {1467-8659},
  doi = {10.1111/j.1467-8659.2009.01598.x},
  publisher = {Blackwell Publishing Ltd}
}

@article{Goclawski:2012:AGA,
  author  = {Goc{\l}awski, Jaros{\l}aw and Sekulska-Nalewajko, Joanna},
  title   = {A Graph-Based Approach to the Segmentation of Images with
             Mould Filled Foam Matrices},
  journal = {Image Processing \& Communications},
  year    = {2012},
  volume  = {17},
  number  = {4},
  pages   = {59--70},
}

@incollection{Godiyal:2009:RMG,
  author    = {Apeksha Godiyal and Jared Hoberock and Michael Garland and
               John C. Hart},
  title     = {Rapid Multipole Graph Drawing on the {GPU}},
  booktitle = {Proceedings of the 16th International Symposium on Graph
               Drawing},
  series    = {Lecture Notes in Computer Science},
  volume    = {5417},
  publisher = {Springer},
  year      = {2009},
  month     = sep,
  pages     = {90--101},
  doi       = {10.1007/978-3-642-00219-9},
}

@incollection{Guo:2010:AIP,
  author    = {Guo, Yupeng and Liu, Xiaoguang and Wang, Gang and Zhang, Fan
               and Zhao, Xin},
  title     = {An Improved Parallel {MEMS} Processing-Level Simulation
               Implementation Using Graphic Processing Unit},
  editor    = {Hsu, Ching-Hsien and Yang, Laurence T. and Park, JongHyuk
               and Yeo, Sang-Soo},
  booktitle = {Algorithms and Architectures for Parallel Processing},
  series    = {Lecture Notes in Computer Science},
  volume    = {6082},
  pages     = {289--296},
  publisher = {Springer Berlin Heidelberg},
  year      = {2010},
  isbn      = {978-3-642-13135-6},
  doi       = {10.1007/978-3-642-13136-3_30},
  keywords  = {MEMS; Processing-level Simulation; Parallel; GPU; CUDA},
}

@article{Ha:2009:FFP,
  author = {Ha, Linh and Kr{\"{u}}ger, Jens and Silva,
                  Cl{\'{a}}udio T.},
  title = {Fast Four-Way Parallel Radix Sorting on {GPU}s},
  journal = {Computer Graphics Forum},
  volume = 28,
  number = 8,
  publisher = {Blackwell Publishing Ltd},
  issn = {1467-8659},
  url = {http://dx.doi.org/10.1111/j.1467-8659.2009.01542.x},
  doi = {10.1111/j.1467-8659.2009.01542.x},
  pages = {2368--2378},
  keywords = {HPC, GPGPU, GPU sorting, collision detection,
                  parallel sorting, I.3.1: Parallel processing on
                  Graphic Processing Units, G.1.0: Parallel
                  algorithms},
  year = 2009
}

@incollection{Harish:2011:FMS,
  title = {Fast Minimum Spanning Tree Computation},
  editor = {Wen-{m}ei W. Hwu},
  booktitle = {GPU Computing Gems Jade Edition},
  publisher = {Morgan Kaufmann},
  address = {Boston},
  year = 2012,
  pages = {77--88},
  isbn = {978-0-12-385963-1},
  doi = {10.1016/B978-0-12-385963-1.00007-1},
  author = {Pawan Harish and P. J. Narayanan and Vibhav Vineet
                  and Suryakant Patidar}
}

@inproceedings{Hoberock:2009:SCF,
  author    = {Jared Hoberock and Victor Lu and Yuntao Jia and John C.
               Hart},
  title     = {Stream Compaction for Deferred Shading},
  booktitle = {Proceedings of High Performance Graphics 2009},
  pages     = {173--180},
  month     = aug,
  year      = {2009},
  doi       = {10.1145/1572769.1572797},
}

@article{Hou:2008:BBG,
  author  = {Qiming Hou and Kun Zhou and Baining Guo},
  title   = {{BSGP}: Bulk-Synchronous {GPU} Programming},
  journal = {ACM Transactions on Graphics},
  year    = {2008},
  month   = aug,
  volume  = {27},
  number  = {3},
  pages   = {19:1--19:13},
}

@inproceedings{Huang:2009:AEO,
  author    = {Huang, B. and Jinlan Gao and Xiaoming Li},
  title     = {An Empirically Optimized Radix Sort for {GPU}},
  booktitle = {2009 IEEE International Symposium on Parallel and
               Distributed Processing with Applications},
  pages     = {234--241},
  year      = {2009},
  doi       = {10.1109/ISPA.2009.89},
  keywords  = {computer graphic equipment;computer
               graphics;optimisation;sorting;GPU architectural
               factors;GPU sort routines;NVIDIA GPU;algorithmic
               parameters;empirical optimization
               technique;empirically optimized radix sort;radix
               sort implementations;sorting routines;Application
               software;Central Processing Unit;Concurrent
               computing;Distributed
               processing;Frequency;Graphics;High performance
               computing;Programming
               profession;Sorting;Tuning;GPU;performance
               tuning;radix sort},
}

@article{Kouassi:2011:EPL,
  title = {Efficient Probabilistic Latent Semantic Indexing
                  using Graphics Processing Unit},
  journal = {Procedia Computer Science},
  volume = 4,
  pages = {382--391},
  year = 2011,
  note = {Proceedings of the International Conference on
                  Computational Science},
  issn = {1877-0509},
  doi = {10.1016/j.procs.2011.04.040},
  author = {Eli Koffi Kouassi and Toshiyuki Amagasa and Hiroyuki
                  Kitagawa},
  keywords = {Graphic Processing Unit (GPGPU), Clustering,
                  Algorithms, Probabilistic Latent Semantic Indexing
                  (PLSI), Expectation Maximization (EM) Algorithm}
}

@inproceedings{Ladikos:2008:EVH,
  author    = {Alexander Ladikos and Selim Benhimane and Nassir Navab},
  title     = {Efficient Visual Hull Computation for Real-Time 3{D}
               Reconstruction using {CUDA}},
  booktitle = {CVPRW '08: Computer Vision and Pattern Recognition
               Workshops},
  pages     = {1--8},
  month     = jun,
  year      = {2008},
  doi       = {10.1109/CVPRW.2008.4563098},
}

@inproceedings{Lin:2011:TDA,
  author = {Chia-Feng Lin and Shyan-Ming Yuan},
  booktitle = {2011 Fifth International Conference on Genetic and
                  Evolutionary Computing (ICGEC)},
  title = {The Design and Evaluation of {GPU} Based Memory
                  Database},
  year = 2011,
  pages = {224--231},
  keywords = {SQL;computer graphic equipment;coprocessors;storage
                  management;C language;CUDA;GPU based memory
                  database;NVIDIA;SQLite;graphics processing
                  unit;memory capacity;parallel computing
                  language;rational database;Algorithm design and
                  analysis;Arrays;Databases;Graphics processing
                  unit;Instruction
                  sets;Libraries;Sorting;Database;GPU;memory},
  doi = {10.1109/ICGEC.2011.61}
}

@inproceedings{Lipscomb:2012:PVN,
  author    = {Lipscomb, Tyson J. and Zou, Anqi and Cho, Samuel S.},
  title     = {Parallel {V}erlet Neighbor List Algorithm for
               {GPU}-Optimized {MD} Simulations},
  booktitle = {Proceedings of the ACM Conference on Bioinformatics,
               Computational Biology and Biomedicine},
  series    = {BCB '12},
  location  = {Orlando, Florida},
  pages     = {321--328},
  numpages  = {8},
  year      = {2012},
  publisher = {ACM},
  address   = {New York, NY, USA},
  isbn      = {978-1-4503-1670-5},
  doi       = {10.1145/2382936.2382977},
  acmid     = {2382977},
  keywords  = {CUDPP, CURAND, coarse-grained MD simulations, energy drift,
               floating point analysis},
}

@incollection{Feng:2011:TDM,
  author    = {Wu{-chun} Feng and Yong Cao and Debprakash Patnaik and Naren
               Ramakrishnan},
  title     = {Temporal Data Mining for Neuroscience},
  editor    = {Wen{-mei} W. Hwu},
  booktitle = {GPU Computing Gems},
  volume    = {1},
  chapter   = {15},
  pages     = {211--227},
  publisher = {Morgan Kaufmann},
  year      = {2011},
  month     = feb,
  doi       = {10.1016/B978-0-12-384988-5.00015-2},
}

@inproceedings{Oikonomidis:2011:EM3,
  title = {Efficient Model-based 3{D} Tracking of Hand
                  Articulations using {K}inect},
  author = {Iason Oikonomidis and Nikolaos Kyriazis and Antonis
                  Argyros},
  year = 2011,
  pages = {101.1--101.11},
  booktitle = {Proceedings of the British Machine Vision
                  Conference},
  publisher = {BMVA Press},
  editor = {Hoey, Jesse and McKenna, Stephen and Trucco,
                  Emanuele},
  isbn = {1-901725-43-X},
  doi = {10.5244/C.25.101},
  month = sep
}

@inproceedings{Patel:2012:PLD,
  author = {Ritesh A. Patel and Yao Zhang and Jason Mak and John
                  D. Owens},
  title = {Parallel Lossless Data Compression on the {GPU}},
  booktitle = {Proceedings of Innovative Parallel Computing (InPar
                  '12)},
  year = 2012,
  month = may,
  url = {http://www.idav.ucdavis.edu/publications/print_pub?pub_id=1087},
  doi = {10.1109/InPar.2012.6339599},
  acceptance = {25/62 (40.3\%)}
}

@inproceedings{Patnaik:2009:AAT,
  author    = {Patnaik, D. and Ponce, S. P. and Yong Cao and Ramakrishnan,
               N.},
  title     = {Accelerator-Oriented Algorithm Transformation for Temporal
               Data Mining},
  booktitle = {Sixth IFIP International Conference on Network and Parallel
               Computing (NPC '09)},
  pages     = {93--100},
  month     = oct,
  year      = {2009},
  doi       = {10.1109/NPC.2009.26},
  keywords  = {data analysis;data mining;temporal databases;GPU
               architectures;Nvidias GTX 280;accelerator-oriented
               algorithm transformation;computational
               neuroscience;episode discovery
               algorithm;multineuronal datasets;port existing
               algorithms;spike train data analysis;temporal data
               mining;Acceleration;Algorithm design and
               analysis;Application software;Central Processing
               Unit;Computer architecture;Concurrent computing;Data
               mining;Neurons;Neuroscience;Parallel
               processing;Frequent episodes;GPGPU;Spike train
               analysis;Temporal data mining},
}

@article{Patney:2008:RRA,
  author  = {Anjul Patney and John D. Owens},
  title   = {Real-Time {R}eyes-Style Adaptive Surface Subdivision},
  journal = {ACM Transactions on Graphics},
  volume  = {27},
  number  = {5},
  pages   = {143:1--143:8},
  month   = dec,
  year    = {2008},
  doi     = {10.1145/1409060.1409096},
  url     = {http://graphics.idav.ucdavis.edu/publications/print_pub?pub_id=952},
}

@inproceedings{Patney:2009:PVT,
  author    = {Anjul Patney and Mohamed S. Ebeida and John D. Owens},
  title     = {Parallel View-Dependent Tessellation of {C}atmull-{C}lark
               Subdivision Surfaces},
  booktitle = {Proceedings of High Performance Graphics 2009},
  pages     = {99--108},
  month     = aug,
  year      = {2009},
  doi       = {10.1145/1572769.1572785},
  url       = {http://graphics.idav.ucdavis.edu/publications/print_pub?pub_id=964},
}

@article{Patney:2010:FCA,
  author     = {Anjul Patney and Stanley Tzeng and John D. Owens},
  title      = {Fragment-Parallel Composite and Filter},
  journal    = {Computer Graphics Forum (Proceedings of the Eurographics
                Symposium on Rendering)},
  volume     = {29},
  number     = {4},
  pages      = {1251--1258},
  month      = jun,
  year       = {2010},
  doi        = {10.1111/j.1467-8659.2010.01720.x},
  url        = {http://www.idav.ucdavis.edu/publications/print_pub?pub_id=1037},
  acceptance = {38.9\% (28/72)},
  ucdcite    = {a54},
}

@inproceedings{Peters:2009:FCI,
  author    = {Hagen Peters and Ole Schulz-Hildebrandt and Norbert
               Luttenberger},
  title     = {Fast comparison-based in-place sorting with {CUDA}},
  booktitle = {Eighth International Conference on Parallel Processing and
               Applied Mathematics},
  month     = sep,
  year      = {2009},
}

@mastersthesis{Ponce:2009:TAT,
  author = {Sean P. Ponce},
  title  = {Towards Algorithm Transformation for Temporal Data Mining on
            {GPU}},
  school = {Department of Computer Science, Virginia Polytechnic Institute
            and State University},
  month  = {7~} # jul,
  year   = {2009},
}

@inproceedings{Qiu:2009:GNN,
  author = {Deyuan Qiu and Stefan May and Andreas N{\"{u}}chter},
  title = {{GPU}-accelerated Nearest Neighbor Search for 3{D}
                  Registration},
  booktitle = {ICVS 2009: Proceedings of the 7th
                  International Conference on Computer Vision Systems},
  year = 2009,
  month = oct
}

@incollection{Saetra:2013:SWS,
  year = 2013,
  isbn = {978-3-642-33133-6},
  booktitle = {Numerical Mathematics and Advanced Applications
                  2011},
  editor = {Cangiani, Andrea and Davidchack, Ruslan L. and
                  Georgoulis, Emmanuil and Gorban, Alexander N. and
                  Levesley, Jeremy and Tretyakov, Michael V.},
  doi = {10.1007/978-3-642-33134-3_71},
  title = {Shallow Water Simulation on {GPU}s for Sparse
                  Domains},
  publisher = {Springer Berlin Heidelberg},
  author = {S{\ae}tra, M. L.},
  pages = {673--680}
}

@inproceedings{Satish:2009:DES,
  author = {Nadathur Satish and Mark Harris and Michael Garland},
  title = {Designing Efficient Sorting Algorithms for Manycore
                  {GPU}s},
  booktitle = {Proceedings of the 23rd IEEE International
                  Parallel and Distributed Processing Symposium},
  month = may,
  year = 2009
}

@inproceedings{Sengupta:2007:SPF,
  title = {Scan Primitives for {GPU} Computing},
  author = {Shubhabrata Sengupta and Mark Harris and Yao Zhang
                  and John D. Owens},
  booktitle = {Graphics Hardware 2007},
  year = 2007,
  month = aug,
  pages = {97--106},
  url = {http://graphics.idav.ucdavis.edu/publications/print_pub?pub_id=915}
}

@techreport{Sengupta:2008:SPF,
  author      = {Shubhabrata Sengupta and Mark Harris and Michael Garland},
  title       = {Efficient Parallel Scan Algorithms for {GPUs}},
  institution = {NVIDIA Corporation},
  number      = {NVR-2008-003},
  month       = dec,
  year        = {2008},
  url         = {http://mgarland.org/papers.html#segscan-tr},
}

@article{Stantchev:2008:FPP,
  author  = {George Stantchev and William Dorland and Nail Gumerov},
  title   = {Fast parallel Particle-To-Grid interpolation for plasma {PIC}
             simulations on the {GPU}},
  journal = {Journal of Parallel and Distributed Computing},
  year    = {2008},
  month   = oct,
  volume  = {68},
  number  = {10},
  pages   = {1339--1349},
  doi     = {10.1016/j.jpdc.2008.05.009},
  url     = {http://www.sciencedirect.com/science/article/B6WKJ-4SW144M-1/2/914e9b94290a555f36b8238a9781aa1d},
}

@article{Stein:2012:CFP,
  title = {{CudaHull}: Fast parallel 3{D} convex hull on the
                  {GPU}},
  journal = {Computers \& Graphics},
  volume = 36,
  number = 4,
  pages = {265--271},
  year = 2012,
  month = mar,
  note = {Applications of Geometry Processing},
  issn = {0097-8493},
  doi = {10.1016/j.cag.2012.02.012},
  author = {Ayal Stein and Eran Geva and Jihad El-Sana},
  keywords = {Convex hull, Parallel processing, GPU processing,
                  CUDA programming}
}

@inproceedings{Sun:2010:FSE,
  author    = {Weidong Sun and Weiwei Wang and Zongmin Ma},
  title     = {Fast Short Exact Repeats Finding on {GPU}},
  booktitle = {2010 3rd International Conference on Biomedical Engineering
               and Informatics (BMEI)},
  volume    = {5},
  pages     = {2197--2200},
  month     = oct,
  year      = {2010},
  doi       = {10.1109/BMEI.2010.5639638},
  keywords  = {DNA;biology computing;computer architecture;computer
               graphics;genomics;proteomics;CUDA
               platform;DNA;GPU;NVIDIA Corporation;compute unified
               device architecture;exact repeats finding;fast short
               exact repeats;genome sequencing;graphic processing
               unit;proteome sequence analysis;scalable parallel
               algorithm;text processing task;vital biological
               functions;Algorithm design and
               analysis;Arrays;Bioinformatics;DNA;Genomics;Graphics
               processing unit;Instruction sets;CUDA;Regulator
               Detect;Repeats Finding},
}

@inproceedings{Thall:2011:FMP,
  author = {Thall, Andrew},
  title = {Fast {Mersenne} Prime Testing on the {GPU}},
  booktitle = {Proceedings of the Fourth Workshop on General
                  Purpose Processing on Graphics Processing Units},
  series = {GPGPU-4},
  year = 2011,
  month = mar,
  isbn = {978-1-4503-0569-3},
  location = {Newport Beach, California},
  pages = {6:1--6:8},
  articleno = 6,
  numpages = 8,
  doi = {10.1145/1964179.1964188},
  acmid = 1964188,
  publisher = {ACM},
  address = {New York, NY, USA},
  keywords = {CUDA, GPGPU, IBDWT, Lucas-Lehmer test, Mersenne
                  primes, discrete weighted transforms, fast carry
                  propagation, multiprecision arithmetic, parallel
                  carry-save arithmetic}
}

@inproceedings{Vineet:2009:FMS,
  author    = {Vibhav Vineet and Pawan Harish and Suryakant Patidar and P.
               J. Narayanan},
  title     = {Fast Minimum Spanning Tree for Large Graphs on the {GPU}},
  booktitle = {Proceedings of High Performance Graphics 2009},
  pages     = {167--171},
  month     = aug,
  year      = {2009},
  doi       = {10.1145/1572769.1572796},
}

@incollection{Wang:2012:GAO,
  author    = {Wang, Guilan and Zhou, Guoliang},
  title     = {{GPU}-Based Aggregation of On-Line Analytical Processing},
  editor    = {Zhao, Maotai and Sha, Junpin},
  booktitle = {Communications and Information Processing},
  series    = {Communications in Computer and Information Science},
  volume    = {288},
  pages     = {234--245},
  publisher = {Springer Berlin Heidelberg},
  year      = {2012},
  isbn      = {978-3-642-31964-8},
  doi       = {10.1007/978-3-642-31965-5_28},
  keywords  = {Real-time Aggregation; OLAP; CUDA; GPUOLAP},
}

@incollection{Zeng:2012:AMK,
  author    = {Zeng, Ming and Zhao, Fukai and Zheng, Jiaxiang and Liu,
               Xinguo},
  title     = {A Memory-Efficient {KinectFusion} Using Octree},
  editor    = {Hu, Shi-Min and Martin, Ralph R.},
  booktitle = {Computational Visual Media},
  series    = {Lecture Notes in Computer Science},
  volume    = {7633},
  pages     = {234--241},
  publisher = {Springer Berlin Heidelberg},
  year      = {2012},
  isbn      = {978-3-642-34262-2},
  doi       = {10.1007/978-3-642-34263-9_30},
  keywords  = {Octree; GPU; KinectFusion; 3D Reconstruction},
}

@techreport{Zhou:2008:HPS,
  author      = {Kun Zhou and Minmin Gong and Xin Huang and Baining Guo},
  title       = {Highly Parallel Surface Reconstruction},
  institution = {Microsoft Research},
  number      = {MSR-TR-2008-53},
  month       = {1~} # apr,
  year        = {2008},
}

@article{Zhou:2008:RKC,
  author  = {Kun Zhou and Qiming Hou and Rui Wang and Baining Guo},
  title   = {Real-time {KD}-tree Construction on Graphics Hardware},
  journal = {ACM Transactions on Graphics},
  year    = {2008},
  month   = dec,
  volume  = {27},
  number  = {5},
  pages   = {126:1--126:11},
}

@article{Zhou:2012:GPC,
  author    = {Zhou, Kun},
  title     = {{GPU} parallel computing: Programming language, debugging
               tools and data structures},
  journal   = {Frontiers of Electrical and Electronic Engineering},
  volume    = {7},
  number    = {1},
  pages     = {5--15},
  year      = {2012},
  publisher = {SP Higher Education Press},
  issn      = {2095-2732},
  doi       = {10.1007/s11460-012-0187-x},
  keywords  = {graphics processing unit (GPU); parallel computing;
               programming languages; debugging tools; data structures},
  language  = {English},
}