// Berkeley Open Infrastructure for Network Computing // http://boinc.berkeley.edu // Copyright (C) 2005 University of California // // This is free software; you can redistribute it and/or // modify it under the terms of the GNU Lesser General Public // License as published by the Free Software Foundation; // either version 2.1 of the License, or (at your option) any later version. // // This software is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. // See the GNU Lesser General Public License for more details. // // To view the GNU Lesser General Public License visit // http://www.gnu.org/copyleft/lesser.html // or write to the Free Software Foundation, Inc., // 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA #include "config.h" #include #include #include #include #include #include #include #include #include #include "boinc_db.h" #include "crypt.h" #include "error_numbers.h" #include "md5_file.h" #include "parse.h" #include "str_util.h" #include "common_defs.h" #include "filesys.h" #include "sched_util.h" #include "backend_lib.h" #ifdef _USING_FCGI_ #include "fcgi_stdio.h" #else #define FCGI_ToFILE(x) (x) #endif using std::string; static struct random_init { random_init() { srand48(getpid() + time(0)); } } random_init; int read_file(FILE* f, char* buf, int len) { int n = fread(buf, 1, len, f); buf[n] = 0; return 0; } int read_filename(const char* path, char* buf, int len) { int retval; FILE* f = fopen(path, "r"); if (!f) return -1; retval = read_file(f, buf, len); fclose(f); return retval; } // see checkin notes Dec 30 2004 // static bool got_md5_info( const char *path, char *md5data, double *nbytes ) { bool retval=false; // look for file named FILENAME.md5 containing md5sum and length. // If found, and newer mod time than file, read md5 sum and file // length from it. FILE *fp; char md5name[512]; struct stat md5stat, filestat; char endline='\0'; sprintf(md5name, "%s.md5", path); // get mod times for file if (stat(path, &filestat)) return retval; // get mod time for md5 cache file if (stat(md5name, &md5stat)) return retval; // if cached md5 newer, then open it if (!(fp=fopen(md5name, "r"))) return retval; // read two quantities: md5 sum and length. If we can't read // these, or there is MORE stuff in the file' it's not an md5 // cache file if (3 == fscanf(FCGI_ToFILE(fp), "%s %lf%c", md5data, nbytes, &endline) && endline=='\n' && EOF==fgetc(FCGI_ToFILE(fp)) ) retval=true; fclose(fp); // if this is one of our cached md5 files, but it's OLDER than the // data file which it supposedly corresponds to, delete it. if (retval && md5stat.st_mtime")) { bool generated_locally = false; file_number = -1; out += "\n"; while (1) { p = strtok(0, "\n"); if (!p) break; if (parse_int(p, "", file_number)) { continue; } else if (parse_bool(p, "generated_locally", generated_locally)) { continue; } else if (match_tag(p, "")) { if (file_number < 0) { fprintf(stderr, "No file number found\n"); return ERR_XML_PARSE; } if (file_number >= ninfiles) { fprintf(stderr, "Too few input files given; need at least %d\n", file_number+1 ); return ERR_XML_PARSE; } nfiles_parsed++; if (generated_locally) { sprintf(buf, " %s\n" " \n" "\n", infiles[file_number] ); } else { dir_hier_path( infiles[file_number], config.download_dir, config.uldl_dir_fanout, path, true ); // if file isn't found in hierarchy, // look for it at top level and copy // if (!boinc_file_exists(path)) { sprintf(top_download_path, "%s/%s",config.download_dir, infiles[file_number] ); boinc_copy(top_download_path, path); } if (!config.cache_md5_info || !got_md5_info(path, md5, &nbytes)) { retval = md5_file(path, md5, nbytes); if (retval) { fprintf(stderr, "process_wu_template: md5_file %d\n", retval); return retval; } else if (config.cache_md5_info) { write_md5_info(path, md5, nbytes); } } dir_hier_url( infiles[file_number], config.download_url, config.uldl_dir_fanout, url ); sprintf(buf, " %s\n" " %s\n" " %s\n" " %.0f\n" "\n", infiles[file_number], url, md5, nbytes ); } out += buf; break; } else { out += p; out += "\n"; } } } else if (match_tag(p, "")) { found = true; out += "\n"; if (command_line) { out += "\n"; out += command_line; out += "\n\n"; } } else if (match_tag(p, "")) { if (additional_xml && strlen(additional_xml)) { out += additional_xml; out += "\n"; } out += "\n"; } else if (match_tag(p, "")) { out += "\n"; bool found_file_number = false, found_open_name = false; while (1) { p = strtok(0, "\n"); if (!p) break; if (parse_int(p, "", file_number)) { sprintf(buf, " %s\n", infiles[file_number] ); out += buf; found_file_number = true; continue; } else if (parse_str(p, "", open_name, sizeof(open_name))) { sprintf(buf, " %s\n", open_name); out += buf; found_open_name = true; continue; } else if (match_tag(p, "")) { if (!found_file_number) { fprintf(stderr, "No file number found\n"); return ERR_XML_PARSE; } if (!found_open_name) { fprintf(stderr, "No open name found\n"); return ERR_XML_PARSE; } out += "\n"; break; } else { sprintf(buf, "%s\n", p); out += buf; } } } else if (parse_str(p, "", cmdline)) { if (command_line) { fprintf(stderr, "Can't specify command line twice"); return ERR_XML_PARSE; } out += "\n"; out += cmdline; out += "\n\n"; } else if (parse_double(p, "", wu.rsc_fpops_est)) { continue; } else if (parse_double(p, "", wu.rsc_fpops_bound)) { continue; } else if (parse_double(p, "", wu.rsc_memory_bound)) { continue; } else if (parse_double(p, "", wu.rsc_bandwidth_bound)) { continue; } else if (parse_double(p, "", wu.rsc_disk_bound)) { continue; } else if (parse_int(p, "", wu.batch)) { continue; } else if (parse_int(p, "", wu.delay_bound)) { continue; } else if (parse_int(p, "", wu.min_quorum)) { continue; } else if (parse_int(p, "", wu.target_nresults)) { continue; } else if (parse_int(p, "", wu.max_error_results)) { continue; } else if (parse_int(p, "", wu.max_total_results)) { continue; } else if (parse_int(p, "", wu.max_success_results)) { continue; } else { out += p; out += "\n"; } } if (!found) { fprintf(stderr, "process_wu_template: bad WU template - no \n"); return -1; } if (nfiles_parsed != ninfiles) { fprintf(stderr, "process_wu_template: %d input files listed, but template has %d\n", ninfiles, nfiles_parsed ); return -1; } if (out.size() > sizeof(wu.xml_doc)-1) { fprintf(stderr, "create_work: WU XML field is too long (%d bytes; max is %d)\n", out.size(), sizeof(wu.xml_doc)-1 ); return ERR_BUFFER_OVERFLOW; } strcpy(wu.xml_doc, out.c_str()); return 0; } // initialize an about-to-be-created result, given its WU // static void initialize_result(DB_RESULT& result, WORKUNIT& wu) { result.id = 0; result.create_time = time(0); result.workunitid = wu.id; result.server_state = RESULT_SERVER_STATE_UNSENT; result.hostid = 0; result.report_deadline = 0; result.sent_time = 0; result.received_time = 0; result.client_state = 0; result.cpu_time = 0; strcpy(result.xml_doc_out, ""); strcpy(result.stderr_out, ""); result.outcome = RESULT_OUTCOME_INIT; result.file_delete_state = ASSIMILATE_INIT; result.validate_state = VALIDATE_STATE_INIT; result.claimed_credit = 0; result.granted_credit = 0; result.appid = wu.appid; result.priority = wu.priority; result.batch = wu.batch; } int create_result_ti( TRANSITIONER_ITEM& ti, char* result_template_filename, char* result_name_suffix, R_RSA_PRIVATE_KEY& key, SCHED_CONFIG& config, char* query_string, // if nonzero, write value list here; else do insert int priority_increase ) { WORKUNIT wu; // copy relevant fields from TRANSITIONER_ITEM to WORKUNIT // strcpy(wu.name, ti.name); wu.id = ti.id; wu.appid = ti.appid; wu.priority = ti.priority; wu.batch = ti.batch; return create_result( wu, result_template_filename, result_name_suffix, key, config, query_string, priority_increase ); } // Create a new result for the given WU. // This is called ONLY from the transitioner // int create_result( WORKUNIT& wu, char* result_template_filename, char* result_name_suffix, R_RSA_PRIVATE_KEY& key, SCHED_CONFIG& config, char* query_string, // if nonzero, write value list here; else do insert int priority_increase ) { DB_RESULT result; char base_outfile_name[256]; char result_template[LARGE_BLOB_SIZE]; int retval; result.clear(); initialize_result(result, wu); result.priority = result.priority + priority_increase; sprintf(result.name, "%s_%s", wu.name, result_name_suffix); sprintf(base_outfile_name, "%s_", result.name); retval = read_filename( result_template_filename, result_template, sizeof(result_template) ); if (retval) { fprintf(stderr, "Failed to read result template file '%s': %d\n", result_template_filename, retval ); return retval; } retval = process_result_template( result_template, key, base_outfile_name, config ); if (retval) { fprintf(stderr, "process_result_template() error: %d\n", retval); } if (strlen(result_template) > sizeof(result.xml_doc_in)-1) { fprintf(stderr, "result XML doc is too long: %d bytes, max is %d\n", strlen(result_template), sizeof(result.xml_doc_in)-1 ); return ERR_BUFFER_OVERFLOW; } strlcpy(result.xml_doc_in, result_template, sizeof(result.xml_doc_in)); result.random = lrand48(); if (query_string) { result.db_print_values(query_string); } else { retval = result.insert(); if (retval) { fprintf(stderr, "result.insert(): %d\n", retval); return retval; } } // if using locality scheduling, advertise data file // associated with this newly-created result // if (config.locality_scheduling) { char datafilename[512]; char *last=strstr(result.name, "__"); if (result.name sizeof(wu.result_template_file)-1) { fprintf(stderr, "result template filename is too big: %d bytes, max is %d\n", strlen(result_template_filename), sizeof(wu.result_template_file)-1 ); return ERR_BUFFER_OVERFLOW; } strlcpy(wu.result_template_file, result_template_filename, sizeof(wu.result_template_file)); if (wu.rsc_fpops_est == 0) { fprintf(stderr, "no rsc_fpops_est given; can't create job\n"); return ERR_NO_OPTION; } if (wu.rsc_fpops_bound == 0) { fprintf(stderr, "no rsc_fpops_bound given; can't create job\n"); return ERR_NO_OPTION; } if (wu.rsc_disk_bound == 0) { fprintf(stderr, "no rsc_disk_bound given; can't create job\n"); return ERR_NO_OPTION; } if (wu.target_nresults == 0) { fprintf(stderr, "no target_nresults given; can't create job\n"); return ERR_NO_OPTION; } if (wu.max_error_results == 0) { fprintf(stderr, "no max_error_results given; can't create job\n"); return ERR_NO_OPTION; } if (wu.max_total_results == 0) { fprintf(stderr, "no max_total_results given; can't create job\n"); return ERR_NO_OPTION; } if (wu.max_success_results == 0) { fprintf(stderr, "no max_success_results given; can't create job\n"); return ERR_NO_OPTION; } if (strstr(wu.name, ASSIGNED_WU_STR)) { wu.transition_time = INT_MAX; } else { wu.transition_time = time(0); } if (wu.id) { retval = wu.update(); if (retval) { fprintf(stderr, "create_work: workunit.update() %d\n", retval); return retval; } } else { retval = wu.insert(); if (retval) { fprintf(stderr, "create_work: workunit.insert() %d\n", retval); return retval; } wu.id = boinc_db.insert_id(); } return 0; } const char *BOINC_RCSID_b5f8b10eb5 = "$Id$";