// This file is part of BOINC. // http://boinc.berkeley.edu // Copyright (C) 2008 University of California // // BOINC is free software; you can redistribute it and/or modify it // under the terms of the GNU Lesser General Public License // as published by the Free Software Foundation, // either version 3 of the License, or (at your option) any later version. // // BOINC is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. // See the GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public License // along with BOINC. If not, see . // // See http://boinc.berkeley.edu/trac/wiki/GPUApp for any compiling issues. // Contributor: Tuan Le (tuanle86@berkeley.edu) #ifndef NVOPENCL_H_ #define NVOPENCL_H_ #include #include #include #include #include #include #include #include #include #define INPUT_FILENAME "input" #define OUTPUT_FILENAME "output" #define KERNELS_FILENAME "nvopencl_kernels.cl" #define KERNELS_FILEPATH "../../nvopencl_kernels.cl" // for Linux and Mac #define CHECKPOINT_FILE "matrix_inversion_state" #define LOCAL_WORK_SIZE 1 #define GLOBAL_WORK_SIZE 400 #define MATRIX_SIZE 10 #define NUM_ITERATIONS 501 // execute the kernel NUM_ITERATIONS times #ifdef _WIN32 #include "boinc_win.h" #else #include "config.h" #include #include #include #include #include #include #include #endif #include "str_util.h" #include "util.h" #include "filesys.h" #include "boinc_api.h" #include "mfile.h" #include "graphics2.h" struct UC_SHMEM { double update_time; double fraction_done; double cpu_time; BOINC_STATUS status; int countdown; // graphics app sets this to 5 repeatedly, // main program decrements it once/sec. // If it's zero, don't bother updating shmem }; #ifdef APP_GRAPHICS UC_SHMEM* shmem; #endif /*** GLOBALS ***/ bool run_slow = false; bool early_exit = false; bool early_crash = false; bool early_sleep = false; double cpu_time = 20, comp_result; bool isStateFileInUse = false; const char *source; size_t globalThreads[1]; // 1D var for Total # of work items size_t localThreads[1]; // 1D var for # of work items in the work group /* * Input data is stored here. */ cl_float *input; /* * Output data is stored here. */ cl_float *output; /* problem size for a 2D matrix. */ // Note: we will handle the problem as a 1D matrix. cl_uint width; cl_uint height; /* The memory buffer that is used as input/output for OpenCL kernel */ cl_mem inputBuffer; //in this sample app, we will read the result //from the device back to host from inputBuffer as well. cl_context context; cl_device_id *devices; cl_command_queue commandQueue; cl_program program; /* This program uses three kernels */ cl_kernel GEStep1A_kernel; cl_kernel GEStep2_kernel; cl_kernel GEStep3_kernel; /*** FUNCTION DECLARATIONS ***/ /* * Create an input file filled with random data of type cl_float. */ void generate_random_input_file(int n); /* * Parse the input file and determine the size of the matrix. * This is an nxn matrix. Note: if width<> height, the matrix is * non-invertible. */ int get_matrix_size(FILE *infile); /* * Read the float values from input file into "input" array. */ void fetch_elements_into_host_memory(FILE *infile, cl_float *input); /* * BOINC functions */ /* Do a billion floating-point ops */ static double do_a_giga_flop(int foo); /* Save the computation state into checkpoint file */ int do_checkpoint(MFILE& mf, int n, cl_float *input, int matrixSize); #ifdef APP_GRAPHICS void update_shmem() { if (!shmem) return; // always do this; otherwise a graphics app will immediately // assume we're not alive shmem->update_time = dtime(); // Check whether a graphics app is running, // and don't bother updating shmem if so. // This doesn't matter here, // but may be worth doing if updating shmem is expensive. // if (shmem->countdown > 0) { // the graphics app sets this to 5 every time it renders a frame shmem->countdown--; } else { return; } shmem->fraction_done = boinc_get_fraction_done(); shmem->cpu_time = boinc_worker_thread_cpu_time();; boinc_get_status(&shmem->status); } #endif /* * OpenCL related initialisations are done here. * Context, Device list, Command Queue are set up. * Calls are made to set up OpenCL memory buffers that this program uses * and to load the programs into memory and get kernel handles. */ int initialize_cl(void); int initialize_host(FILE *infile); /* * Read the file which contains kernel definitions, and stores the file content * into a char array which is used as an argument to clCreateProgramWithSource. */ char *convert_to_string(const char * filename); /* * This is called once the OpenCL context, memory etc. are set up, * the program is loaded into memory and the kernel handles are ready. * * It sets the values for kernels' arguments and enqueues calls to the kernels * on to the command queue and waits till the calls have finished execution. * * It also gets kernel start and end time if profiling is enabled. */ int run_cl_kernels(void); /* Releases OpenCL resources (Context, Memory etc.) */ int cleanup_cl(void); /* Releases program's resources */ void cleanup_host(void); /* Write the result to output file */ void print_to_file(MFILE *out, float *h_odata, int n); /* * Check if the device is able to support the requested number of work items. */ int check_device_capability(size_t *globalThreads, size_t *localThreads); /* * Functions used to inverst matrix. Call kernels inside. */ void invert(cl_float * input, cl_float *output, int n); void invertge(cl_float * AI_d, int lda, int n); #endif /* #ifndef NVOPENCL_H_ */