// This file is part of BOINC. // http://boinc.berkeley.edu // Copyright (C) 2008 University of California // // BOINC is free software; you can redistribute it and/or modify it // under the terms of the GNU Lesser General Public License // as published by the Free Software Foundation, // either version 3 of the License, or (at your option) any later version. // // BOINC is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. // See the GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public License // along with BOINC. If not, see . // #include using std::string; #include "str_util.h" #include "util.h" #include "sched_config.h" #include "sched_main.h" #include "sched_msgs.h" #include "sched_send.h" #include "sched_score.h" #include "sched_shmem.h" #include "sched_version.h" #include "sched_customize.h" #include "plan_class_spec.h" int PLAN_CLASS_SPECS::parse_file(char*path) { #ifndef _USING_FCGI_ FILE* f = fopen(path, "r"); #else FCGI_FILE *f = FCGI::fopen(path, "r"); #endif if (!f) return ERR_FOPEN; int retval = parse_specs(f); fclose(f); if(!retval) parsed = true; return retval; } // parse_file() bool PLAN_CLASS_SPEC::check(SCHEDULER_REQUEST& sreq, HOST_USAGE& hu) { // fill HOST_USAGE with defaults hu.ncudas = 0; hu.natis = 0; hu.gpu_ram = 0; hu.avg_ncpus = 1; hu.max_ncpus = 1; hu.projected_flops = sreq.host.p_fpops; hu.peak_flops = sreq.host.p_fpops; hu.cmdline[0] = '\0'; { char buf[256]; sprintf(buf, "No work sent. " "See scheduler log messages on %s", config.master_url, sreq.hostid / 1000, sreq.hostid, config.long_name); add_no_work_message(buf); } // CPU features if (!cpu_features.empty()) { char features[512+3] = {0}; char *c; strcpy(features, " "); if(strlen(sreq.host.p_features)) { strcat(features, sreq.host.p_features); strcat(features, " "); } if((c = strrchr(sreq.host.p_model, '['))) { strcat(features, c+1); if((c = strrchr(features, ']'))) *c = ' '; } downcase_string(features); for (unsigned int i=0; i v) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] OS version required min: %d, supplied: %d\n", min_macos_version, v); return false; } if(max_macos_version && max_macos_version < v) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] OS version required max: %d, supplied: %d\n", max_macos_version, v); return false; } } // OS version (regexp match) if(*os_version_string && regexec(&(os_version_regex), sreq.host.os_version, 0, NULL, 0)) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] Couldn't match OS version '%s' with required regexp '%s'\n", sreq.host.os_version, os_version_string); return false; } // project-specific preference if (*project_prefs_tag) { char tag[256]; char buf[65536]; double v = 0; extract_venue(g_reply->user.project_prefs, g_reply->host.venue, buf); sprintf(tag,"<%s>",project_prefs_tag); bool p = parse_double(buf, tag, v); if (config.debug_version_select) { log_messages.printf(MSG_NORMAL, "[version] parsed project prefs setting '%s' : %s : %f\n", project_prefs_tag, p?"true":"false", v); } if ((v < project_prefs_min) || (v > project_prefs_max)) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] project prefs setting '%s' (%f) prevents using plan class.\n", project_prefs_tag, v); return false; } } double gpu_utilization = 1.0; // user defined gpu_utilization if (*gpu_utilization_tag) { char tag[256]; char buf[65536]; double v = 0; extract_venue(g_reply->user.project_prefs, g_reply->host.venue, buf); sprintf(tag,"<%s>",gpu_utilization_tag); bool p = parse_double(buf, tag, v); if (config.debug_version_select) { log_messages.printf(MSG_NORMAL, "[version] parsed project prefs setting '%s' : %s : %f\n", gpu_utilization_tag, p?"true":"false", v); } if (v) { gpu_utilization = v; } } // CUDA GPU if (type == 1) { COPROC_NVIDIA& cp = sreq.coprocs.nvidia; // devices if (!cp.count) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] No CUDA devices found\n"); return false; } // update requirements if (min_gpu_ram_mb) cuda_requirements.update(0, min_gpu_ram_mb * MEGA); if (min_driver_version) cuda_requirements.update(abs(min_driver_version), 0); // GPU RAM if (min_gpu_ram_mb && min_gpu_ram_mb * MEGA > cp.prop.dtotalGlobalMem) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] GPU RAM required min: %f, supplied: %f\n", min_gpu_ram_mb * MEGA, cp.prop.dtotalGlobalMem); return false; } // compute capability int v = (cp.prop.major)*100 + cp.prop.minor; if (min_cuda_compcap && min_cuda_compcap > v) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] CUDA compute capability required min: %d, supplied: %d\n", min_cuda_compcap, v); return false; } if (max_cuda_compcap && max_cuda_compcap < v) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] CUDA compute capability required max: %d, supplied: %d\n", max_cuda_compcap, v); return false; } // CUDA version if (min_cuda_version && min_cuda_version > cp.cuda_version) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] CUDA version required min: %d, supplied: %d\n", min_cuda_version, cp.cuda_version); return false; } if (max_cuda_version && max_cuda_version < cp.cuda_version) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] CUDA version required max: %d, supplied: %d\n", max_cuda_version, cp.cuda_version); return false; } // (display) driver version if (min_driver_version && (min_driver_version > 0 || cp.display_driver_version) && abs(min_driver_version) > cp.display_driver_version) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] driver version required min: %d, supplied: %d\n", abs(min_driver_version), cp.display_driver_version); return false; } if (max_driver_version && (max_driver_version > 0 || cp.display_driver_version) && abs(max_driver_version) < cp.display_driver_version) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] driver version required max: %d, supplied: %d\n", abs(max_driver_version), cp.display_driver_version); return false; } hu.gpu_ram = (gpu_ram_used_mb?gpu_ram_used_mb:min_gpu_ram_mb) * MEGA; // if ngpus < 0, set ncudas by the fraction of the total video RAM a tasks would take // i.e. fill the device memory with tasks if(ngpus < 0) hu.ncudas = (floor(cp.prop.dtotalGlobalMem / hu.gpu_ram) * hu.gpu_ram) / cp.prop.dtotalGlobalMem; else if (ngpus > 0) hu.ncudas = ngpus * gpu_utilization; else hu.ncudas = gpu_utilization; cp.set_peak_flops(); hu.peak_flops = cp.peak_flops * hu.ncudas * peak_flops_factor; if (gpu_flops && cpu_flops) { hu.avg_ncpus = avg_ncpus * sreq.host.p_fpops / cpu_flops; hu.projected_flops = cp.peak_flops / gpu_flops * speedup + 1.0 / hu.avg_ncpus; } else { hu.projected_flops = sreq.host.p_fpops * speedup; hu.avg_ncpus = avg_ncpus; } } // CUDA // NVidia OpenCL GPU else if (type == 3) { COPROC_NVIDIA& cp = sreq.coprocs.nvidia; // devices if (!cp.count) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] No NVidia devices found\n"); return false; } // check for OpenCL at all if (!cp.have_opencl) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] NVidia device (or driver) doesn't support OpenCL\n"); return false; } // update requirements if (min_gpu_ram_mb) cuda_requirements.update(0, min_gpu_ram_mb * MEGA); if (min_driver_version) cuda_requirements.update(abs(min_driver_version), 0); // GPU RAM if (min_gpu_ram_mb && min_gpu_ram_mb * MEGA > cp.opencl_prop.global_mem_size) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] OpenCL GPU RAM required min: %f, supplied: %lu\n", min_gpu_ram_mb * MEGA, cp.opencl_prop.global_mem_size); return false; } // OpenCL device version if (min_opencl_version && min_opencl_version > cp.opencl_prop.opencl_device_version_int) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] OpenCL device version required min: %d, supplied: %d\n", min_opencl_version, cp.opencl_prop.opencl_device_version_int); return false; } // (display) driver version if (min_driver_version && (min_driver_version > 0 || cp.display_driver_version) && abs(min_driver_version) > cp.display_driver_version) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] driver version required min: %d, supplied: %d\n", abs(min_driver_version), cp.display_driver_version); return false; } if (max_driver_version && (max_driver_version > 0 || cp.display_driver_version) && abs(max_driver_version) < cp.display_driver_version) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] driver version required max: %d, supplied: %d\n", abs(max_driver_version), cp.display_driver_version); return false; } hu.gpu_ram = (gpu_ram_used_mb?gpu_ram_used_mb:min_gpu_ram_mb) * MEGA; // if ngpus < 0, set ncudas by the fraction of the total video RAM a tasks would take // i.e. fill the device memory with tasks if(ngpus < 0) hu.ncudas = (floor(cp.opencl_prop.global_mem_size / hu.gpu_ram) * hu.gpu_ram) / cp.opencl_prop.global_mem_size; else if (ngpus > 0) hu.ncudas = ngpus * gpu_utilization; else hu.ncudas = gpu_utilization; cp.set_peak_flops(); hu.peak_flops = cp.peak_flops * hu.ncudas * peak_flops_factor; if (gpu_flops && cpu_flops) { hu.avg_ncpus = avg_ncpus * sreq.host.p_fpops / cpu_flops; hu.projected_flops = cp.peak_flops / gpu_flops * speedup + 1.0 / hu.avg_ncpus; } else { hu.projected_flops = sreq.host.p_fpops * speedup; hu.avg_ncpus = avg_ncpus; } } // NVidia OpenCL // ATI OpenCL GPU else if (type == 4) { COPROC_ATI& cp = sreq.coprocs.ati; // devices if (!cp.count) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] No ATI devices found\n"); return false; } // check for OpenCL at all if (!cp.have_opencl) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] ATI device (or driver) doesn't support OpenCL\n"); return false; } // update requirements if (min_gpu_ram_mb) ati_requirements.update(0, min_gpu_ram_mb * MEGA); if (min_driver_version) ati_requirements.update(abs(min_driver_version), 0); // GPU RAM if (min_gpu_ram_mb && min_gpu_ram_mb * MEGA > cp.opencl_prop.global_mem_size) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] OpenCL GPU RAM required min: %f, supplied: %lu\n", min_gpu_ram_mb * MEGA, cp.opencl_prop.global_mem_size); return false; } // OpenCL device version if (min_opencl_version && min_opencl_version > cp.opencl_prop.opencl_device_version_int) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] OpenCL device version required min: %d, supplied: %d\n", min_opencl_version, cp.opencl_prop.opencl_device_version_int); return false; } // (display) driver version if (min_driver_version || max_driver_version) { int driver_version = 0; if(cp.have_cal) { int major, minor, release, scanned; scanned = sscanf(cp.version, "%d.%d.%d", &major, &minor, &release); if (scanned != 3) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] driver version '%s' couldn't be parsed\n", cp.version); return false; } else { driver_version = release + minor * 10000 + major * 1000000; } } else { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] no CAL, driver version couldn't be determined\n", cp.version); } if (min_driver_version && (min_driver_version > 0 || driver_version) && abs(min_driver_version) > driver_version) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] driver version required min: %d, supplied: %d\n", abs(min_driver_version), driver_version); return false; } if (max_driver_version && (max_driver_version > 0 || driver_version) && abs(max_driver_version) < driver_version) { if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] driver version required max: %d, supplied: %d\n", abs(max_driver_version), driver_version); return false; } } hu.gpu_ram = (gpu_ram_used_mb?gpu_ram_used_mb:min_gpu_ram_mb) * MEGA; // if ngpus < 0, set natis by the fraction of the total video RAM a tasks would take // i.e. fill the device memory with tasks if(ngpus < 0) hu.natis = (floor(cp.opencl_prop.global_mem_size / hu.gpu_ram) * hu.gpu_ram) / cp.opencl_prop.global_mem_size; else if (ngpus > 0) hu.natis = ngpus * gpu_utilization; else hu.natis = gpu_utilization; cp.set_peak_flops(); hu.peak_flops = cp.peak_flops * hu.natis * peak_flops_factor; if (gpu_flops && cpu_flops) { hu.avg_ncpus = avg_ncpus * sreq.host.p_fpops / cpu_flops; hu.projected_flops = cp.peak_flops / gpu_flops * speedup + 1.0 / hu.avg_ncpus; } else { hu.projected_flops = sreq.host.p_fpops * speedup; hu.avg_ncpus = avg_ncpus; } } // ATI OpenCL else { // CPU only hu.avg_ncpus = avg_ncpus; hu.peak_flops = sreq.host.p_fpops * hu.max_ncpus; hu.projected_flops = sreq.host.p_fpops * speedup * peak_flops_factor; } hu.max_ncpus = max_ncpus; if (config.debug_version_select) log_messages.printf(MSG_NORMAL, "[version] host_flops: %e, \tspeedup: %.2f, \tprojected_flops: %e, \tpeak_flops: %e, \tpeak_flops_factor: %.2f\n", sreq.host.p_fpops, speedup, hu.projected_flops, hu.peak_flops, peak_flops_factor); return true; } // check() bool PLAN_CLASS_SPECS::check(SCHEDULER_REQUEST& sreq, char* plan_class, HOST_USAGE& hu) { for (unsigned int i=0; i\n"); fprintf(stderr, " %s \n", name); fprintf(stderr, " %d \n", type); if(min_cuda_compcap) fprintf(stderr, " %d \n", min_cuda_compcap); if(max_cuda_compcap) fprintf(stderr, " %d \n", max_cuda_compcap); if(min_cuda_version) fprintf(stderr, " %d \n", min_cuda_version); if(max_cuda_version) fprintf(stderr, " %d \n", max_cuda_version); if(min_opencl_version) fprintf(stderr, " %d \n", min_opencl_version); if(min_driver_version) fprintf(stderr, " %d \n", min_driver_version); if(max_driver_version) fprintf(stderr, " %d \n", max_driver_version); if(min_gpu_ram_mb) fprintf(stderr, " %f \n", min_gpu_ram_mb); if(gpu_ram_used_mb) fprintf(stderr, " %f \n", gpu_ram_used_mb); if(*project_prefs_tag) { fprintf(stderr, " %s \n", project_prefs_tag); fprintf(stderr, " %f \n", project_prefs_min); fprintf(stderr, " %f \n", project_prefs_max); } if(*gpu_utilization_tag) fprintf(stderr, " %s \n", project_prefs_tag); if(min_macos_version) fprintf(stderr, " %d \n", min_macos_version); if(max_macos_version) fprintf(stderr, " %d \n", max_macos_version); if(*os_version_string) fprintf(stderr, " %s \n", os_version_string); if(speedup) fprintf(stderr, " %f \n", speedup); if(peak_flops_factor) fprintf(stderr, " %f \n", peak_flops_factor); if(gpu_flops) fprintf(stderr, " %f \n", gpu_flops); if(cpu_flops) fprintf(stderr, " %f \n", cpu_flops); if(avg_ncpus) fprintf(stderr, " %f \n", avg_ncpus); if(max_ncpus) fprintf(stderr, " %f \n", max_ncpus); if(ngpus) fprintf(stderr, " %f \n", ngpus); for (unsigned int i=0; i %s \n", cpu_features[i].c_str()); fprintf(stderr, "\n"); } int PLAN_CLASS_SPECS::parse_specs(FILE* f) { char buf[256]; MIOFILE mf; XML_PARSER xp(&mf); mf.init_file(f); if (!xp.parse_start("plan_classes")) return ERR_XML_PARSE; while (!xp.get_tag()) { if (!xp.is_tag) { fprintf(stderr, "PLAN_CLASS_SPECS::parse(): unexpected text %s\n", xp.parsed_tag); continue; } if (xp.match_tag("/plan_classes")) { return 0; } if (xp.match_tag("plan_class")) { PLAN_CLASS_SPEC pc; while (!xp.get_tag()) { if (xp.match_tag("/plan_class")) { break; } if(xp.parse_str("name", pc.name, sizeof(pc.name))) { strcpy(buf,pc.name); downcase_string(buf); if (strstr(buf,"cuda")) { pc.type = 1; } else if (strstr(buf,"nvidia")) { pc.type = 1; } else if (strstr(buf,"ati")) { pc.type = 2; } continue; } if(xp.parse_str("type", buf, sizeof(buf))) { downcase_string(buf); if (!strcmp(buf,"cpu")) { pc.type = 0; } else if (!strcmp(buf,"cuda")) { pc.type = 1; } else if (strstr(buf,"nvidia")) { pc.type = 1; } else if (!strcmp(buf,"ati")) { pc.type = 2; } else { pc.type = atoi(buf); } continue; } if(xp.parse_int("min_cuda_compcap", pc.min_cuda_compcap)) continue; if(xp.parse_int("max_cuda_compcap", pc.max_cuda_compcap)) continue; if(xp.parse_int("min_cuda_version", pc.min_cuda_version)) continue; if(xp.parse_int("max_cuda_version", pc.max_cuda_version)) continue; if(xp.parse_int("min_opencl_version", pc.min_opencl_version)) continue; if(xp.parse_int("min_opencl_device_version", pc.min_opencl_version)) continue; if(xp.parse_int("min_driver_version", pc.min_driver_version)) continue; if(xp.parse_int("max_driver_version", pc.max_driver_version)) continue; if(xp.parse_double("min_gpu_ram_mb", pc.min_gpu_ram_mb)) continue; if(xp.parse_double("gpu_ram_used_mb", pc.gpu_ram_used_mb)) continue; if(xp.parse_str("project_prefs_tag", pc.project_prefs_tag, sizeof(pc.project_prefs_tag))) continue; if(xp.parse_str("gpu_utilization_tag", pc.gpu_utilization_tag, sizeof(pc.gpu_utilization_tag))) continue; if(xp.parse_double("project_prefs_min", pc.project_prefs_min)) continue; if(xp.parse_double("project_prefs_max", pc.project_prefs_max)) continue; if(xp.parse_int("min_macos_version", pc.min_macos_version)) continue; if(xp.parse_int("max_macos_version", pc.max_macos_version)) continue; if(xp.parse_str("os_version", pc.os_version_string, sizeof(pc.os_version_string))) { if ( regcomp(&(pc.os_version_regex), pc.os_version_string, REG_EXTENDED|REG_NOSUB) ) { log_messages.printf(MSG_CRITICAL, "BAD REGEXP: %s\n", pc.os_version_string); return ERR_XML_PARSE; } continue; } if(xp.parse_double("speedup", pc.speedup)) continue; if(xp.parse_double("peak_flops_factor", pc.peak_flops_factor)) continue; if(xp.parse_double("gpu_flops", pc.gpu_flops)) continue; if(xp.parse_double("cpu_flops", pc.cpu_flops)) continue; if(xp.parse_double("avg_ncpus", pc.avg_ncpus)) continue; if(xp.parse_double("max_ncpus", pc.max_ncpus)) continue; if(xp.parse_double("ngpus", pc.ngpus)) continue; if(xp.parse_str("cpu_feature", buf, sizeof(buf))) { pc.cpu_features.push_back(" " + (string)buf + " "); continue; } } classes.push_back(pc); } } return ERR_XML_PARSE; } // parse_specs() PLAN_CLASS_SPEC::PLAN_CLASS_SPEC() { type = 0; min_cuda_compcap = 0; max_cuda_compcap = 0; min_cuda_version = 0; max_cuda_version = 0; min_opencl_version = 0; min_driver_version = 0; max_driver_version = 0; min_gpu_ram_mb = 0; gpu_ram_used_mb = 0; *project_prefs_tag = '\0'; *gpu_utilization_tag = '\0'; project_prefs_min = 0; project_prefs_max = 0; min_macos_version = 0; max_macos_version = 0; *os_version_string = '\0'; speedup = 1.0; peak_flops_factor = 1.0; cpu_flops = 0; gpu_flops = 0; avg_ncpus = 1.0; max_ncpus = 1.0; ngpus = 0; /* defaults to CPU plan classes */ }; PLAN_CLASS_SPECS::PLAN_CLASS_SPECS() { // classes.get_allocator().allocate(0); parsed = false; };