/* * Copyright (c) 2016 University of Cordoba and University of Illinois * All rights reserved. * * Developed by: IMPACT Research Group * University of Cordoba and University of Illinois * http://impact.crhc.illinois.edu/ * * Permission is hereby granted, free of charge, to any person obtaining a copy * of this software and associated documentation files (the "Software"), to deal * with the Software without restriction, including without limitation the * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or * sell copies of the Software, and to permit persons to whom the Software is * furnished to do so, subject to the following conditions: * * > Redistributions of source code must retain the above copyright notice, * this list of conditions and the following disclaimers. * > Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimers in the * documentation and/or other materials provided with the distribution. * > Neither the names of IMPACT Research Group, University of Cordoba, * University of Illinois nor the names of its contributors may be used * to endorse or promote products derived from this Software without * specific prior written permission. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE * CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS WITH * THE SOFTWARE. * */ #include "kernel.h" #include "support/partitioner.h" #include #include #include #include // CPU threads-------------------------------------------------------------------------------------- void run_cpu_threads(std::atomic_uint *histo, unsigned int *data, int size, int bins, int n_threads, int chunk, int n_tasks, float alpha #ifdef CUDA_8_0 , std::atomic_int *worklist #endif ) { std::vector cpu_threads; for(int k = 0; k < n_threads; k++) { cpu_threads.push_back(std::thread([=]() { #ifdef CUDA_8_0 Partitioner p = partitioner_create(n_tasks, alpha, k, n_threads, worklist); #else Partitioner p = partitioner_create(n_tasks, alpha, k, n_threads); #endif unsigned int Hs[bins]; // Local histogram initialization for(int i = 0; i < bins; i++) { Hs[i] = 0; } for(int i = cpu_first(&p); cpu_more(&p); i = cpu_next(&p)) { for(int j = 0; j < chunk; j++) { // Read pixel unsigned int d = ((data[i * chunk + j] * bins) >> 12); // Vote in histogram Hs[d]++; } } // Merge to global histogram for(int i = 0; i < bins; i++) { (&histo[i])->fetch_add(Hs[i]); } })); } std::for_each(cpu_threads.begin(), cpu_threads.end(), [](std::thread &t) { t.join(); }); }