// This file is part of BOINC. // http://boinc.berkeley.edu // Copyright (C) 2008 University of California // // BOINC is free software; you can redistribute it and/or modify it // under the terms of the GNU Lesser General Public License // as published by the Free Software Foundation, // either version 3 of the License, or (at your option) any later version. // // BOINC is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. // See the GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public License // along with BOINC. If not, see . // This is a framework for an assimilator. // You need to link this with an (application-specific) function // assimilate_handler() // in order to make a complete program. // #include "config.h" #include #include #include #include #include #include "boinc_db.h" #include "parse.h" #include "util.h" #include "error_numbers.h" #include "str_util.h" #include "sched_config.h" #include "sched_util.h" #include "sched_msgs.h" #include "assimilate_handler.h" using std::vector; #define LOCKFILE "assimilator.out" #define PIDFILE "assimilator.pid" #define SLEEP_INTERVAL 10 bool update_db = true; bool noinsert = false; int wu_id_modulus=0, wu_id_remainder=0; int sleep_interval = SLEEP_INTERVAL; int one_pass_N_WU=0; int g_argc; char** g_argv; void usage(char** argv) { fprintf(stderr, "This program is an 'assimilator'; it handles completed jobs.\n" "Normally it is run as a daemon from config.xml.\n" "See: http://boinc.berkeley.edu/trac/wiki/BackendPrograms\n\n" ); fprintf(stderr, "usage: %s [options]\n" " Options:\n" " -app name Process jobs for the given application\n" " [-sleep_interval X] Sleep X seconds if no jobs to process (default 10)\n" " [-mod N R] Process jobs with mod(ID, N) == R\n" " [-one_pass] Do one DB enumeration, then exit\n" " [-one_pass_N_WU N] Process at most N jobs\n" " [-d N] Set verbosity level (1, 2, 3=most verbose)\n" " [-dont_update_db] Don't update DB (for testing)\n" " [-noinsert] Don't insert records in app-specific DB\n", argv[0] ); exit(0); } // assimilate all WUs that need it // return nonzero (true) if did anything // bool do_pass(APP& app) { DB_WORKUNIT wu; DB_RESULT canonical_result, result; bool did_something = false; char buf[256]; char mod_clause[256]; int retval; int num_assimilated=0; check_stop_daemons(); if (wu_id_modulus) { sprintf(mod_clause, " and workunit.id %% %d = %d ", wu_id_modulus, wu_id_remainder ); } else { strcpy(mod_clause, ""); } sprintf(buf, "where appid=%d and assimilate_state=%d %s limit %d", app.id, ASSIMILATE_READY, mod_clause, one_pass_N_WU ? one_pass_N_WU : 1000 ); while (1) { retval = wu.enumerate(buf); if (retval) { if (retval != ERR_DB_NOT_FOUND) { log_messages.printf(MSG_DEBUG, "DB connection lost, exiting\n" ); exit(0); } break; } vector results; // must be inside while()! // for testing purposes, pretend we did nothing // if (update_db) { did_something = true; } log_messages.printf(MSG_DEBUG, "[%s] assimilating WU %d; state=%d\n", wu.name, wu.id, wu.assimilate_state ); sprintf(buf, "where workunitid=%d", wu.id); canonical_result.clear(); bool found = false; while (!result.enumerate(buf)) { results.push_back(result); if (result.id == wu.canonical_resultid) { canonical_result = result; found = true; } } // If no canonical result found and WU had no other errors, // something is wrong, e.g. result records got deleted prematurely. // This is probably unrecoverable, so mark the WU as having // an assimilation error and keep going. // if (!found && !wu.error_mask) { log_messages.printf(MSG_CRITICAL, "[%s] no canonical result\n", wu.name ); wu.error_mask = WU_ERROR_NO_CANONICAL_RESULT; sprintf(buf, "error_mask=%d", wu.error_mask); wu.update_field(buf); } retval = assimilate_handler(wu, results, canonical_result); if (retval && retval != DEFER_ASSIMILATION) { log_messages.printf(MSG_CRITICAL, "[%s] handler returned error %d; exiting\n", wu.name, retval ); exit(retval); } if (update_db) { // Defer assimilation until next result is returned int assimilate_state = ASSIMILATE_DONE; if (retval == DEFER_ASSIMILATION) { assimilate_state = ASSIMILATE_INIT; } sprintf( buf, "assimilate_state=%d, transition_time=%d", assimilate_state, (int)time(0) ); retval = wu.update_field(buf); if (retval) { log_messages.printf(MSG_CRITICAL, "[%s] update failed: %d\n", wu.name, retval ); exit(1); } } num_assimilated++; } if (did_something) { boinc_db.commit_transaction(); } if (num_assimilated) { log_messages.printf(MSG_NORMAL, "Assimilated %d workunits.\n", num_assimilated ); } return did_something; } int main(int argc, char** argv) { int retval; bool one_pass = false; DB_APP app; int i; char buf[256]; strcpy(app.name, ""); check_stop_daemons(); g_argc = argc; g_argv = argv; for (i=1; i