// This file is part of BOINC. // http://boinc.berkeley.edu // Copyright (C) 2011 University of California // // BOINC is free software; you can redistribute it and/or modify it // under the terms of the GNU Lesser General Public License // as published by the Free Software Foundation, // either version 3 of the License, or (at your option) any later version. // // BOINC is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. // See the GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public License // along with BOINC. If not, see . #include #include #include #include #include #include "filesys.h" #include "md5_file.h" #include "sched_config.h" #include "sched_util.h" #include "process_input_template.h" using std::string; // look for file named FILENAME.md5 containing md5sum and length. // If found, and newer mod time than file, // read md5 sum and file length from it. // See checkin notes Dec 30 2004 // static bool got_md5_info( const char *path, char *md5data, double *nbytes ) { char md5name[512]; struct stat md5stat, filestat; char endline='\0'; sprintf(md5name, "%s.md5", path); // get mod times for file // if (stat(path, &filestat)) { return false; } // get mod time for md5 cache file // if (stat(md5name, &md5stat)) { return false; } // if cached md5 newer, then open it #ifndef _USING_FCGI_ FILE *fp=fopen(md5name, "r"); #else FCGI_FILE *fp=FCGI::fopen(md5name, "r"); #endif if (!fp) { return false; } // read two quantities: md5 sum and length. // If we can't read these, or there is MORE stuff in the file, // it's not an md5 cache file // int n = fscanf(fp, "%s %lf%c", md5data, nbytes, &endline); int c = fgetc(fp); fclose(fp); if (n != 3) return false; if (endline !='\n') return false; if (c != EOF) return false; // if this is one of our cached md5 files, but it's OLDER than the // data file which it supposedly corresponds to, delete it. // if (md5stat.st_mtime urls; bool generated_locally = false; int retval, file_number = -1; double nbytes, nbytesdef = -1; string md5str, urlstr, tmpstr; char buf[BLOB_SIZE], path[MAXPATHLEN], top_download_path[MAXPATHLEN], md5[33], url[256]; out += "\n"; while (!xp.get_tag()) { if (xp.parse_int("number", file_number)) { continue; } else if (xp.parse_bool("generated_locally", generated_locally)) { continue; } else if (xp.parse_string("url", urlstr)) { urls.push_back(urlstr); continue; } else if (xp.parse_string("md5_cksum", md5str)) { continue; } else if (xp.parse_double("nbytes", nbytesdef)) { continue; } else if (xp.match_tag("/file_info")) { if (nbytesdef != -1 || md5str != "" || urlstr != "") { if (nbytesdef == -1 || md5str == "" || urlstr == "") { fprintf(stderr, "All file properties must be defined " "if at least one is defined (url, md5_cksum, nbytes)!\n" ); return ERR_XML_PARSE; } } if (file_number < 0) { fprintf(stderr, "No file number found\n"); return ERR_XML_PARSE; } if (file_number >= ninfiles) { fprintf(stderr, "Too few input files given; need at least %d\n", file_number+1 ); return ERR_XML_PARSE; } if (input_file_found[file_number]) { fprintf(stderr, "Input file %d listed twice\n", file_number ); return ERR_XML_PARSE; } input_file_found[file_number] = true; if (generated_locally) { sprintf(buf, " %s\n" " \n" "\n", infiles[file_number] ); } else if (nbytesdef == -1) { // here if nybtes was not supplied; stage the file // dir_hier_path( infiles[file_number], config_loc.download_dir, config_loc.uldl_dir_fanout, path, true ); // if file isn't found in hierarchy, // look for it at top level and copy // if (!boinc_file_exists(path)) { sprintf(top_download_path, "%s/%s",config_loc.download_dir, infiles[file_number] ); boinc_copy(top_download_path, path); } if (!config_loc.cache_md5_info || !got_md5_info(path, md5, &nbytes)) { retval = md5_file(path, md5, nbytes); if (retval) { fprintf(stderr, "process_input_template: md5_file %s\n", boincerror(retval) ); return retval; } else if (config_loc.cache_md5_info) { write_md5_info(path, md5, nbytes); } } dir_hier_url( infiles[file_number], config_loc.download_url, config_loc.uldl_dir_fanout, url ); sprintf(buf, " %s\n" " %s\n" " %s\n" " %.0f\n" "\n", infiles[file_number], url, md5, nbytes ); } else { // here if nbytes etc. was supplied, // i.e the file is already staged, possibly remotely // urlstr = ""; for (unsigned int i=0; i\n"; } sprintf(buf, " %s\n" "%s" " %s\n" " %.0f\n" "\n", infiles[file_number], urlstr.c_str(), md5str.c_str(), nbytesdef ); } out += buf; break; } else { retval = xp.copy_element(tmpstr); if (retval) return retval; out += tmpstr; out += "\n"; } } return 0; } static int process_workunit( XML_PARSER& xp, WORKUNIT& wu, string& out, const char** infiles, const char* command_line, const char* additional_xml ) { char buf[256], open_name[256]; int file_number; string tmpstr, cmdline; int retval; out += "\n"; if (command_line) { //fprintf(stderr, "appending command line: %s\n", command_line); out += "\n"; out += command_line; out += "\n\n"; } while (!xp.get_tag()) { if (xp.match_tag("/workunit")) { if (additional_xml && strlen(additional_xml)) { out += additional_xml; out += "\n"; } out += ""; break; } else if (xp.match_tag("file_ref")) { out += "\n"; bool found_file_number = false, found_open_name = false; while (!xp.get_tag()) { if (xp.parse_int("file_number", file_number)) { sprintf(buf, " %s\n", infiles[file_number] ); out += buf; found_file_number = true; continue; } else if (xp.parse_str("open_name", open_name, sizeof(open_name))) { sprintf(buf, " %s\n", open_name); out += buf; found_open_name = true; continue; } else if (xp.match_tag("/file_ref")) { if (!found_file_number) { fprintf(stderr, "No file number found\n"); return ERR_XML_PARSE; } if (!found_open_name) { fprintf(stderr, "No open name found\n"); return ERR_XML_PARSE; } out += "\n"; break; } else if (xp.parse_string("file_name", tmpstr)) { fprintf(stderr, " ignored in element.\n"); continue; } else { retval = xp.copy_element(tmpstr); if (retval) return retval; out += tmpstr; out += "\n"; } } } else if (xp.parse_string("command_line", cmdline)) { if (command_line) { fprintf(stderr, "Can't specify command line twice"); return ERR_XML_PARSE; } out += "\n"; out += cmdline; out += "\n\n"; } else if (xp.parse_double("rsc_fpops_est", wu.rsc_fpops_est)) { continue; } else if (xp.parse_double("rsc_fpops_bound", wu.rsc_fpops_bound)) { continue; } else if (xp.parse_double("rsc_memory_bound", wu.rsc_memory_bound)) { continue; } else if (xp.parse_double("rsc_bandwidth_bound", wu.rsc_bandwidth_bound)) { continue; } else if (xp.parse_double("rsc_disk_bound", wu.rsc_disk_bound)) { continue; } else if (xp.parse_int("batch", wu.batch)) { continue; } else if (xp.parse_int("delay_bound", wu.delay_bound)){ continue; } else if (xp.parse_int("min_quorum", wu.min_quorum)) { continue; } else if (xp.parse_int("target_nresults", wu.target_nresults)) { continue; } else if (xp.parse_int("max_error_results", wu.max_error_results)) { continue; } else if (xp.parse_int("max_total_results", wu.max_total_results)) { continue; } else if (xp.parse_int("max_success_results", wu.max_success_results)) { continue; } else { retval = xp.copy_element(tmpstr); if (retval) return retval; out += tmpstr; out += "\n"; } } return 0; } // fill in the workunit's XML document (wu.xml_doc) // by scanning the input template, macro-substituting the input files, // and putting in the command line element and additional XML // int process_input_template( WORKUNIT& wu, char* tmplate, const char** infiles, int ninfiles, SCHED_CONFIG& config_loc, const char* command_line, const char* additional_xml ) { string out; int retval; bool found_workunit=false; int nfiles_parsed = 0; for (int i=0; i<1024; i++) { input_file_found[i] = false; } out = ""; MIOFILE mf; XML_PARSER xp(&mf); mf.init_buf_read(tmplate); while (!xp.get_tag()) { if (!xp.is_tag) continue; if (xp.match_tag("input_template")) continue; if (xp.match_tag("/input_template")) continue; if (xp.match_tag("file_info")) { retval = process_file_info(xp, out, ninfiles, infiles, config_loc); if (retval) return retval; nfiles_parsed++; } else if (xp.match_tag("workunit")) { found_workunit = true; retval = process_workunit( xp, wu, out, infiles, command_line, additional_xml ); if (retval) return retval; } } if (!found_workunit) { fprintf(stderr, "process_input_template: bad WU template - no \n"); return ERR_XML_PARSE; } if (nfiles_parsed != ninfiles) { fprintf(stderr, "process_input_template: %d input files listed, but template has %d\n", ninfiles, nfiles_parsed ); return ERR_XML_PARSE; } if (out.size() > sizeof(wu.xml_doc)-1) { fprintf(stderr, "create_work: WU XML field is too long (%d bytes; max is %d)\n", (int)out.size(), (int)sizeof(wu.xml_doc)-1 ); return ERR_BUFFER_OVERFLOW; } //fprintf(stderr, "copying to xml_doc: %s\n", out.c_str()); strcpy(wu.xml_doc, out.c_str()); return 0; }