2012-02-16 16:52:07 +00:00
|
|
|
// This file is part of BOINC.
|
|
|
|
// http://boinc.berkeley.edu
|
|
|
|
// Copyright (C) 2012 University of California
|
|
|
|
//
|
|
|
|
// BOINC is free software; you can redistribute it and/or modify it
|
|
|
|
// under the terms of the GNU Lesser General Public License
|
|
|
|
// as published by the Free Software Foundation,
|
|
|
|
// either version 3 of the License, or (at your option) any later version.
|
|
|
|
//
|
|
|
|
// BOINC is distributed in the hope that it will be useful,
|
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
|
|
|
|
// See the GNU Lesser General Public License for more details.
|
|
|
|
//
|
|
|
|
// You should have received a copy of the GNU Lesser General Public License
|
|
|
|
// along with BOINC. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
|
|
|
|
// scheduler component for data archival.
|
|
|
|
// Called on each scheduler request.
|
|
|
|
|
2012-03-14 23:31:15 +00:00
|
|
|
#ifdef _USING_FCGI_
|
|
|
|
#include "boinc_fcgi.h"
|
|
|
|
#else
|
|
|
|
#include <cstdio>
|
|
|
|
#endif
|
|
|
|
|
2012-02-16 16:52:07 +00:00
|
|
|
#include <map>
|
|
|
|
#include <string>
|
|
|
|
|
2012-02-29 01:11:28 +00:00
|
|
|
#include "filesys.h"
|
|
|
|
|
|
|
|
#include "backend_lib.h"
|
|
|
|
|
2012-02-28 06:57:28 +00:00
|
|
|
#include "sched_config.h"
|
2012-02-16 23:59:26 +00:00
|
|
|
#include "sched_msgs.h"
|
2012-02-28 06:57:28 +00:00
|
|
|
#include "sched_types.h"
|
2012-02-29 01:11:28 +00:00
|
|
|
#include "sched_util.h"
|
|
|
|
|
|
|
|
#include "vda_lib.h"
|
|
|
|
|
|
|
|
#include "sched_vda.h"
|
2012-02-16 16:52:07 +00:00
|
|
|
|
|
|
|
using std::map;
|
|
|
|
using std::string;
|
2012-02-16 23:59:26 +00:00
|
|
|
using std::pair;
|
2012-02-16 16:52:07 +00:00
|
|
|
|
2012-02-29 01:11:28 +00:00
|
|
|
// mark a vda_file for update by vdad
|
|
|
|
//
|
2012-02-16 23:59:26 +00:00
|
|
|
static int mark_for_update(int vda_file_id) {
|
|
|
|
DB_VDA_FILE f;
|
|
|
|
f.id = vda_file_id;
|
|
|
|
return f.update_field("need_update=1");
|
|
|
|
}
|
|
|
|
|
2012-02-29 01:11:28 +00:00
|
|
|
typedef map<string, DB_VDA_CHUNK_HOST> CHUNK_LIST;
|
|
|
|
|
|
|
|
// get the path to the chunk's directory
|
|
|
|
//
|
|
|
|
static void get_chunk_dir(DB_VDA_FILE& vf, const char* chunk_name, char* dir) {
|
|
|
|
char chunk_dirs[256];
|
|
|
|
strcpy(chunk_dirs, chunk_name);
|
|
|
|
while (1) {
|
|
|
|
char* p = strchr(chunk_dirs, '.');
|
|
|
|
if (!p) break;
|
|
|
|
*p = '/';
|
|
|
|
}
|
|
|
|
sprintf(dir, "%s/%s", vf.dir, chunk_dirs);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void get_chunk_url(DB_VDA_FILE& vf, const char* chunk_name, char* url) {
|
2012-03-29 07:58:47 +00:00
|
|
|
char chunk_dirs[256], buf[1024];
|
2012-02-29 01:11:28 +00:00
|
|
|
strcpy(chunk_dirs, chunk_name);
|
|
|
|
while (1) {
|
|
|
|
char* p = strchr(chunk_dirs, '.');
|
|
|
|
if (!p) break;
|
|
|
|
*p = '/';
|
|
|
|
}
|
2012-03-29 07:58:47 +00:00
|
|
|
dir_hier_url(vf.name, config.download_url, config.uldl_dir_fanout, buf);
|
|
|
|
sprintf(url, "%s/%s/data.vda", buf, chunk_dirs);
|
2012-02-29 01:11:28 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// read the chunk's MD5 file into a buffer
|
|
|
|
//
|
|
|
|
static int get_chunk_md5(char* chunk_dir, char* md5_buf) {
|
|
|
|
char md5_path[1024];
|
|
|
|
sprintf(md5_path, "%s/md5.txt", chunk_dir);
|
2012-03-14 23:31:15 +00:00
|
|
|
#ifndef _USING_FCGI_
|
2012-02-29 01:11:28 +00:00
|
|
|
FILE* f = fopen(md5_path, "r");
|
2012-03-14 23:31:15 +00:00
|
|
|
#else
|
|
|
|
FCGI_FILE* f = FCGI::fopen(md5_path, "r");
|
|
|
|
#endif
|
2012-02-29 01:11:28 +00:00
|
|
|
if (!f) return ERR_FOPEN;
|
|
|
|
char* p = fgets(md5_buf, 64, f);
|
|
|
|
fclose(f);
|
|
|
|
if (p == NULL) return ERR_GETS;
|
|
|
|
strip_whitespace(md5_buf);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
// process a completed upload:
|
|
|
|
// if vda_chunk_host found
|
|
|
|
// verify md5 of upload
|
|
|
|
// move it from upload dir to vda_file dir
|
|
|
|
// mark vda_file for update
|
|
|
|
// clear transfer_in_progress flag in vda_chunk_host
|
|
|
|
// else
|
|
|
|
// delete from upload dir
|
|
|
|
//
|
|
|
|
static int process_completed_upload(char* chunk_name, CHUNK_LIST& chunks) {
|
|
|
|
char path[1024], client_filename[1024], dir[1024];
|
|
|
|
int retval;
|
|
|
|
|
|
|
|
sprintf(client_filename, "%d_%s", g_reply->host.id, chunk_name);
|
|
|
|
dir_hier_path(
|
|
|
|
client_filename, config.upload_dir, config.uldl_dir_fanout, dir, false
|
|
|
|
);
|
|
|
|
sprintf(path, "%s/%s", dir, client_filename);
|
|
|
|
CHUNK_LIST::iterator i2 = chunks.find(string(chunk_name));
|
|
|
|
if (i2 == chunks.end()) {
|
|
|
|
if (config.debug_vda) {
|
|
|
|
log_messages.printf(MSG_NORMAL,
|
|
|
|
"[vda] chunk_host not found for %s\n", chunk_name
|
|
|
|
);
|
|
|
|
}
|
|
|
|
boinc_delete_file(path);
|
|
|
|
} else {
|
|
|
|
char client_md5[64], server_md5[64];
|
|
|
|
char chunk_dir[1024];
|
|
|
|
DB_VDA_CHUNK_HOST& ch = i2->second;
|
|
|
|
DB_VDA_FILE vf;
|
|
|
|
double size;
|
|
|
|
|
|
|
|
retval = vf.lookup_id(ch.vda_file_id);
|
|
|
|
get_chunk_dir(vf, chunk_name, chunk_dir);
|
|
|
|
retval = get_chunk_md5(chunk_dir, server_md5);
|
|
|
|
if (retval) return retval;
|
|
|
|
retval = md5_file(path, client_md5, size);
|
|
|
|
if (retval) return retval;
|
|
|
|
if (strcmp(client_md5, server_md5)) {
|
|
|
|
if (config.debug_vda) {
|
|
|
|
log_messages.printf(MSG_NORMAL,
|
|
|
|
"[vda] MD5 mismatch %s %s\n", client_md5, server_md5
|
|
|
|
);
|
|
|
|
}
|
|
|
|
boinc_delete_file(path);
|
|
|
|
} else {
|
|
|
|
retval = vf.update_field("need_update=1");
|
|
|
|
if (retval) return retval;
|
|
|
|
retval = ch.update_field("transfer_in_progress=0");
|
|
|
|
if (retval) return retval;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2012-07-05 20:24:17 +00:00
|
|
|
// Process a present file; possibilities:
|
|
|
|
// - a download finished
|
|
|
|
// - this host hasn't communicated in a while, and we deleted the
|
|
|
|
// VDA_CHUNK_HOST record
|
|
|
|
// So:
|
2012-02-29 01:11:28 +00:00
|
|
|
// - create a vda_chunk_host record if needed
|
|
|
|
// - set present_on_host flag in vda_chunk_host
|
|
|
|
// - mark our in-memory vda_chunk_host record as "found"
|
|
|
|
// - mark vda_file for update
|
|
|
|
//
|
|
|
|
static int process_present_file(FILE_INFO& fi, CHUNK_LIST& chunks) {
|
2012-07-05 20:24:17 +00:00
|
|
|
DB_VDA_CHUNK_HOST* ch;
|
|
|
|
CHUNK_LIST::iterator cli = chunks.find(string(fi.name));
|
|
|
|
if (cli == chunks.end()) {
|
|
|
|
// don't have a record of this chunk on this host; make one
|
|
|
|
//
|
|
|
|
ch = new DB_VDA_CHUNK_HOST;
|
|
|
|
ch->create_time = dtime();
|
|
|
|
|
|
|
|
} else {
|
|
|
|
ch = &(cli->second);
|
|
|
|
}
|
|
|
|
ch->transfer_in_progress = false;
|
|
|
|
mark_for_update(ch->vda_file_id);
|
2012-02-29 01:11:28 +00:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
// for each vda_chunk_host not in file list:
|
|
|
|
// - delete from DB
|
|
|
|
// - mark vda_file for update
|
|
|
|
//
|
|
|
|
static int process_missing_chunks(CHUNK_LIST& chunks) {
|
|
|
|
CHUNK_LIST::iterator it;
|
2012-02-29 07:22:59 +00:00
|
|
|
for (it = chunks.begin(); it != chunks.end(); it++) {
|
2012-02-29 01:11:28 +00:00
|
|
|
DB_VDA_CHUNK_HOST& ch = it->second;
|
2012-02-29 07:22:59 +00:00
|
|
|
if (!ch.present_on_host && ch.transfer_in_progress) continue;
|
2012-02-29 01:11:28 +00:00
|
|
|
if (!ch.found) {
|
|
|
|
if (config.debug_vda) {
|
|
|
|
log_messages.printf(MSG_NORMAL,
|
|
|
|
"[vda] in DB but not on client: %s\n", ch.name
|
|
|
|
);
|
|
|
|
}
|
|
|
|
ch.delete_from_db();
|
2012-02-29 07:22:59 +00:00
|
|
|
ch.transfer_in_progress = false;
|
2012-02-29 01:11:28 +00:00
|
|
|
mark_for_update(ch.vda_file_id);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
// if process is using more than its share of disk space,
|
|
|
|
// remove some chunks and mark vda_files for update
|
|
|
|
//
|
|
|
|
static int enforce_quota(CHUNK_LIST& chunks) {
|
|
|
|
if (!g_request->host.d_project_share) return 0;
|
|
|
|
|
|
|
|
double x = g_request->host.d_boinc_used_project;
|
|
|
|
if (config.debug_vda) {
|
|
|
|
log_messages.printf(MSG_NORMAL,
|
|
|
|
"[vda] share: %f used: %f\n",
|
|
|
|
g_request->host.d_project_share, x
|
|
|
|
);
|
|
|
|
}
|
|
|
|
CHUNK_LIST::iterator it = chunks.begin();
|
|
|
|
while (x > g_request->host.d_project_share && it != chunks.end()) {
|
|
|
|
DB_VDA_CHUNK_HOST& ch = it->second;
|
2012-02-29 07:22:59 +00:00
|
|
|
if (!ch.found) continue;
|
2012-02-29 01:11:28 +00:00
|
|
|
FILE_INFO fi;
|
|
|
|
strcpy(fi.name, ch.name);
|
|
|
|
if (config.debug_vda) {
|
|
|
|
log_messages.printf(MSG_NORMAL,
|
|
|
|
"[vda] deleting: %s\n", ch.name
|
|
|
|
);
|
|
|
|
}
|
|
|
|
x -= ch.size;
|
|
|
|
g_reply->file_deletes.push_back(fi);
|
|
|
|
it++;
|
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
// issue upload and download commands
|
|
|
|
//
|
|
|
|
static int issue_transfer_commands(CHUNK_LIST& chunks) {
|
2012-02-29 07:22:59 +00:00
|
|
|
char xml_buf[8192], file_name[1024];
|
2012-02-29 01:11:28 +00:00
|
|
|
int retval;
|
|
|
|
char url[1024];
|
|
|
|
|
2012-02-29 20:58:45 +00:00
|
|
|
CHUNK_LIST::iterator it;
|
|
|
|
for (it = chunks.begin(); it != chunks.end(); it++) {
|
|
|
|
vector<const char*> urls;
|
2012-02-29 01:11:28 +00:00
|
|
|
DB_VDA_CHUNK_HOST& ch = it->second;
|
|
|
|
if (!ch.transfer_in_progress) continue;
|
|
|
|
if (!ch.transfer_wait) continue;
|
|
|
|
DB_VDA_FILE vf;
|
|
|
|
retval = vf.lookup_id(ch.vda_file_id);
|
|
|
|
if (retval) return retval;
|
|
|
|
if (ch.present_on_host) {
|
|
|
|
if (config.debug_vda) {
|
|
|
|
log_messages.printf(MSG_NORMAL,
|
|
|
|
"[vda] sending upload command: %s\n", ch.name
|
|
|
|
);
|
|
|
|
}
|
|
|
|
// upload
|
|
|
|
//
|
|
|
|
sprintf(file_name, "%d_%s__%s", g_reply->host.id, ch.name, vf.name);
|
|
|
|
urls.push_back(config.upload_url);
|
|
|
|
R_RSA_PRIVATE_KEY key;
|
|
|
|
retval = get_file_xml(
|
|
|
|
file_name,
|
|
|
|
urls,
|
|
|
|
ch.size,
|
|
|
|
dtime() + VDA_HOST_TIMEOUT,
|
|
|
|
false,
|
|
|
|
key,
|
|
|
|
xml_buf
|
|
|
|
);
|
|
|
|
} else {
|
|
|
|
if (config.debug_vda) {
|
|
|
|
log_messages.printf(MSG_NORMAL,
|
|
|
|
"[vda] sending download command: %s\n", ch.name
|
|
|
|
);
|
|
|
|
}
|
|
|
|
// download
|
|
|
|
//
|
|
|
|
char md5[64], chunk_dir[1024];
|
|
|
|
sprintf(file_name, "%s__%s", ch.name, vf.name);
|
|
|
|
get_chunk_url(vf, ch.name, url);
|
|
|
|
urls.push_back(url);
|
|
|
|
get_chunk_dir(vf, ch.name, chunk_dir);
|
2012-02-29 07:22:59 +00:00
|
|
|
retval = get_chunk_md5(chunk_dir, md5);
|
|
|
|
if (retval) return retval;
|
2012-02-29 01:11:28 +00:00
|
|
|
retval = put_file_xml(
|
|
|
|
file_name,
|
|
|
|
urls,
|
|
|
|
md5,
|
|
|
|
ch.size,
|
|
|
|
dtime() + VDA_HOST_TIMEOUT,
|
|
|
|
xml_buf
|
|
|
|
);
|
|
|
|
}
|
|
|
|
g_reply->file_transfer_requests.push_back(string(xml_buf));
|
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2012-02-24 22:55:11 +00:00
|
|
|
// handle a scheduler request:
|
2012-02-29 01:11:28 +00:00
|
|
|
//
|
2012-02-24 22:55:11 +00:00
|
|
|
// - handle completed uploads
|
|
|
|
// - handle set of files present on client
|
|
|
|
// (update or create VDA_CHUNK_HOST record)
|
|
|
|
// - handle files expected but not present
|
|
|
|
// - issue delete commands if needed to enforce share
|
|
|
|
// - issue upload or download commands to client
|
|
|
|
//
|
2012-02-16 23:59:26 +00:00
|
|
|
// relevant fields of SCHEDULER_REQUEST
|
|
|
|
// file_infos: list of sticky files
|
|
|
|
// file_xfer_results: list of completed file xfers
|
|
|
|
//
|
2012-02-16 16:52:07 +00:00
|
|
|
void handle_vda() {
|
2012-02-16 23:59:26 +00:00
|
|
|
int retval;
|
|
|
|
unsigned int i;
|
2012-02-29 01:11:28 +00:00
|
|
|
CHUNK_LIST chunks;
|
2012-02-16 16:52:07 +00:00
|
|
|
// chunks that are supposed to be on this host
|
|
|
|
|
2012-02-29 01:11:28 +00:00
|
|
|
// enumerate the vda_chunk_host records for this host from DB
|
2012-02-16 23:59:26 +00:00
|
|
|
//
|
2012-02-16 16:52:07 +00:00
|
|
|
DB_VDA_CHUNK_HOST ch;
|
|
|
|
char buf[256];
|
2012-02-29 07:22:59 +00:00
|
|
|
sprintf(buf, "where host_id=%d", g_reply->host.id);
|
2012-02-16 16:52:07 +00:00
|
|
|
while (1) {
|
|
|
|
retval = ch.enumerate(buf);
|
|
|
|
if (retval == ERR_DB_NOT_FOUND) break;
|
|
|
|
if (retval) {
|
2012-02-29 01:11:28 +00:00
|
|
|
// if we didn't get a complete enumeration,
|
|
|
|
// give up rather than continuing with partial info
|
2012-02-16 16:52:07 +00:00
|
|
|
//
|
|
|
|
log_messages.printf(MSG_NORMAL,
|
|
|
|
"[vda]: ch.enumerate() failed %d\n", retval
|
|
|
|
);
|
|
|
|
return;
|
|
|
|
}
|
2012-02-28 06:57:28 +00:00
|
|
|
if (config.debug_vda) {
|
|
|
|
log_messages.printf(MSG_NORMAL,
|
|
|
|
"[vda] DB: has chunk %s\n", ch.name
|
|
|
|
);
|
|
|
|
}
|
2012-02-16 23:59:26 +00:00
|
|
|
chunks.insert(pair<string, DB_VDA_CHUNK_HOST>(string(ch.name), ch));
|
|
|
|
}
|
|
|
|
|
2012-02-29 01:11:28 +00:00
|
|
|
// process completed uploads
|
2012-07-05 20:24:17 +00:00
|
|
|
// NOTE: completed downloads are handled below
|
2012-02-16 23:59:26 +00:00
|
|
|
//
|
|
|
|
for (i=0; i<g_request->file_xfer_results.size(); i++) {
|
|
|
|
RESULT& r = g_request->file_xfer_results[i];
|
2012-07-05 20:24:17 +00:00
|
|
|
if (strstr(r.name, "vda_upload")) {
|
|
|
|
char* chunk_name = r.name + strlen("vda_upload_");
|
|
|
|
if (config.debug_vda) {
|
|
|
|
log_messages.printf(MSG_NORMAL,
|
|
|
|
"[vda] DB: completed upload %s\n", chunk_name
|
|
|
|
);
|
|
|
|
}
|
|
|
|
retval = process_completed_upload(chunk_name, chunks);
|
|
|
|
if (retval) {
|
|
|
|
log_messages.printf(MSG_CRITICAL,
|
|
|
|
"[vda] process_completed_upload(): %d\n", retval
|
|
|
|
);
|
|
|
|
return;
|
|
|
|
}
|
2012-02-29 01:11:28 +00:00
|
|
|
}
|
2012-02-16 23:59:26 +00:00
|
|
|
}
|
|
|
|
|
2012-02-29 01:11:28 +00:00
|
|
|
// process files present on host
|
2012-02-16 23:59:26 +00:00
|
|
|
//
|
|
|
|
for (i=0; i<g_request->file_infos.size(); i++) {
|
|
|
|
FILE_INFO& fi = g_request->file_infos[i];
|
2012-02-29 01:11:28 +00:00
|
|
|
if (!starts_with(fi.name, "vda_")) {
|
|
|
|
continue;
|
|
|
|
}
|
2012-02-28 06:57:28 +00:00
|
|
|
if (config.debug_vda) {
|
|
|
|
log_messages.printf(MSG_NORMAL,
|
|
|
|
"[vda] request: client has file %s\n", fi.name
|
|
|
|
);
|
|
|
|
}
|
2012-02-29 01:11:28 +00:00
|
|
|
process_present_file(fi, chunks);
|
2012-02-16 23:59:26 +00:00
|
|
|
}
|
|
|
|
|
2012-02-29 01:11:28 +00:00
|
|
|
process_missing_chunks(chunks);
|
2012-02-16 16:52:07 +00:00
|
|
|
|
2012-02-29 01:11:28 +00:00
|
|
|
enforce_quota(chunks);
|
2012-02-24 22:55:11 +00:00
|
|
|
|
2012-02-29 01:11:28 +00:00
|
|
|
issue_transfer_commands(chunks);
|
2012-02-16 16:52:07 +00:00
|
|
|
}
|