mirror of https://github.com/BOINC/boinc.git
449 lines
12 KiB
C++
449 lines
12 KiB
C++
// This file is part of BOINC.
|
|
// http://boinc.berkeley.edu
|
|
// Copyright (C) 2008 University of California
|
|
//
|
|
// BOINC is free software; you can redistribute it and/or modify it
|
|
// under the terms of the GNU Lesser General Public License
|
|
// as published by the Free Software Foundation,
|
|
// either version 3 of the License, or (at your option) any later version.
|
|
//
|
|
// BOINC is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
|
|
// See the GNU Lesser General Public License for more details.
|
|
//
|
|
// You should have received a copy of the GNU Lesser General Public License
|
|
// along with BOINC. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
#ifndef _SERVER_TYPES_
|
|
#define _SERVER_TYPES_
|
|
|
|
#include <cstdio>
|
|
#include <vector>
|
|
|
|
#include "boinc_db.h"
|
|
#include "common_defs.h"
|
|
#include "md5_file.h"
|
|
#include "coproc.h"
|
|
|
|
#include "edf_sim.h"
|
|
|
|
// One application for which the user has said they will accept work.
// Only relevant for projects that support filtering work by app.
//
struct APP_INFO {
    int appid;
    int work_available;
        // NOTE(review): stored as int; presumably a flag or count - confirm
};
|
|
|
|
// A resource (disk etc.) of which the client may have too little.
//
struct RESOURCE {
    bool insufficient;
    double needed;
        // the min extra amount needed

    // Flag the resource as insufficient and remember the smallest
    // shortfall reported so far.
    // A stored value of zero is treated as "nothing recorded yet",
    // so it is always overwritten by x.
    //
    void set_insufficient(double x) {
        insufficient = true;
        if (!needed || x < needed) {
            needed = x;
        }
    }
};
|
|
|
|
// A message meant to be read by a person.
// Holds the message text together with a priority string.
//
struct USER_MESSAGE {
    std::string message;
    std::string priority;

    // m: message text, p: priority (defined outside this header)
    USER_MESSAGE(const char* m, const char* p);
};
|
|
|
|
// Resource-usage figures (CUDA device count, CPU counts, FLOPS)
// plus a command line, as attached to an app version.
//
struct HOST_USAGE {
    int ncudas;
    double avg_ncpus;
    double max_ncpus;
    double flops;
    char cmdline[256];

    // Default: no CUDA devices, one CPU, zero FLOPS, empty command line.
    //
    HOST_USAGE(): ncudas(0), avg_ncpus(1), max_ncpus(1), flops(0) {
        // store the terminator directly; avoids depending on <cstring>,
        // which this header does not include
        cmdline[0] = '\0';
    }

    // Reset to a single-CPU, non-CUDA app running at x FLOPS.
    // A value of x that is <= 0 is replaced by 1e9.
    //
    void sequential_app(double x) {
        ncudas = 0;
        avg_ncpus = 1;
        max_ncpus = 1;
        flops = x;
        if (flops <= 0) flops = 1e9;
        cmdline[0] = '\0';
    }

    // kept user-declared (and empty) exactly as before
    ~HOST_USAGE(){}
};
|
|
|
|
// summary of a client's request for work, and our response to it
|
|
// Note: this is zeroed out in SCHEDULER_REPLY constructor
|
|
//
|
|
struct WORK_REQ {
|
|
bool anonymous_platform;
|
|
|
|
// Flags used by old-style scheduling,
|
|
// while making multiple passes through the work array
|
|
bool infeasible_only;
|
|
bool reliable_only;
|
|
bool user_apps_only;
|
|
bool beta_only;
|
|
|
|
// user preferences
|
|
bool no_gpus;
|
|
bool no_cpu;
|
|
bool allow_non_preferred_apps;
|
|
bool allow_beta_work;
|
|
std::vector<APP_INFO> preferred_apps;
|
|
|
|
bool reliable;
|
|
// whether the host is classified as "reliable"
|
|
// (misnomer: means low turnaround time and low error rate
|
|
|
|
bool trust;
|
|
// whether to send unreplicated jobs
|
|
int effective_ncpus;
|
|
int effective_ngpus;
|
|
|
|
// 6.7+ clients send separate requests for different resource types:
|
|
//
|
|
double cpu_req_secs; // instance-seconds requested
|
|
double cpu_req_instances; // number of idle instances, use if possible
|
|
double cuda_req_secs;
|
|
double cuda_req_instances;
|
|
inline bool need_cpu() {
|
|
return (cpu_req_secs>0) || (cpu_req_instances>0);
|
|
}
|
|
inline bool need_cuda() {
|
|
return (cuda_req_secs>0) || (cuda_req_instances>0);
|
|
}
|
|
inline void clear_cpu_req() {
|
|
cpu_req_secs = 0;
|
|
cpu_req_instances = 0;
|
|
}
|
|
inline void clear_gpu_req() {
|
|
cuda_req_secs = 0;
|
|
cuda_req_instances = 0;
|
|
}
|
|
|
|
// older clients send send a single number, the requested duration of jobs
|
|
//
|
|
double seconds_to_fill;
|
|
|
|
// true if new-type request
|
|
//
|
|
bool rsc_spec_request;
|
|
|
|
double disk_available;
|
|
double ram, usable_ram;
|
|
double running_frac;
|
|
double dcf;
|
|
int njobs_sent;
|
|
|
|
// The following keep track of the "easiest" job that was rejected
|
|
// by EDF simulation.
|
|
// Any jobs harder than this can be rejected without doing the simulation.
|
|
//
|
|
double edf_reject_min_cpu;
|
|
int edf_reject_max_delay_bound;
|
|
bool have_edf_reject;
|
|
void edf_reject(double cpu, int delay_bound) {
|
|
if (have_edf_reject) {
|
|
if (cpu < edf_reject_min_cpu) edf_reject_min_cpu = cpu;
|
|
if (delay_bound> edf_reject_max_delay_bound) edf_reject_max_delay_bound = delay_bound;
|
|
} else {
|
|
edf_reject_min_cpu = cpu;
|
|
edf_reject_max_delay_bound = delay_bound;
|
|
have_edf_reject = true;
|
|
}
|
|
}
|
|
bool edf_reject_test(double cpu, int delay_bound) {
|
|
if (!have_edf_reject) return false;
|
|
if (cpu < edf_reject_min_cpu) return false;
|
|
if (delay_bound > edf_reject_max_delay_bound) return false;
|
|
return true;
|
|
}
|
|
|
|
RESOURCE disk;
|
|
RESOURCE mem;
|
|
RESOURCE speed;
|
|
RESOURCE bandwidth;
|
|
|
|
std::vector<USER_MESSAGE> no_work_messages;
|
|
std::vector<BEST_APP_VERSION*> best_app_versions;
|
|
|
|
// various reasons for not sending jobs (used to explain why)
|
|
//
|
|
bool no_allowed_apps_available;
|
|
bool excessive_work_buf;
|
|
bool hr_reject_temp;
|
|
bool hr_reject_perm;
|
|
bool outdated_client;
|
|
bool no_gpus_prefs;
|
|
bool no_cpu_prefs;
|
|
bool daily_result_quota_exceeded;
|
|
bool max_jobs_on_host_exceeded;
|
|
bool max_jobs_on_host_cpu_exceeded;
|
|
bool max_jobs_on_host_gpu_exceeded;
|
|
bool no_jobs_available; // project has no work right now
|
|
|
|
int max_jobs_per_day;
|
|
// host.max_results_day * (NCPUS + NCUDA*cuda_multiplier)
|
|
int max_jobs_per_rpc;
|
|
int njobs_on_host;
|
|
// How many jobs from this project are in progress on the host.
|
|
// Initially this is the number of "other_results"
|
|
// reported in the request message.
|
|
// If the resend_lost_results option is used,
|
|
// it's set to the number of outstanding results taken from the DB
|
|
// (those that were lost are resent).
|
|
// As new results are sent, it's incremented.
|
|
int njobs_on_host_cpu;
|
|
// same, but just CPU jobs.
|
|
int njobs_on_host_gpu;
|
|
// same, but just GPU jobs.
|
|
int max_jobs_on_host;
|
|
int max_jobs_on_host_cpu;
|
|
int max_jobs_on_host_gpu;
|
|
void update_for_result(double seconds_filled);
|
|
void insert_no_work_message(const USER_MESSAGE&);
|
|
void get_job_limits();
|
|
};
|
|
|
|
// Describes one sticky file present on the host.
//
struct FILE_INFO {
    char name[256];

    // defined outside this header
    int parse(FILE*);
};
|
|
|
|
// A message received from a host: a "variety" tag plus the message text.
//
struct MSG_FROM_HOST_DESC {
    char variety[256];
    std::string msg_text;

    // defined outside this header
    int parse(FILE*);
};
|
|
|
|
// an app version from an anonymous-platform client
|
|
//
|
|
struct CLIENT_APP_VERSION {
|
|
char app_name[256];
|
|
char platform[256];
|
|
int version_num;
|
|
char plan_class[256];
|
|
HOST_USAGE host_usage;
|
|
|
|
int parse(FILE*);
|
|
};
|
|
|
|
// keep track of the best app_version for each app for this host
|
|
//
|
|
struct BEST_APP_VERSION {
|
|
int appid;
|
|
|
|
bool present;
|
|
|
|
// populated if anonymous platform:
|
|
CLIENT_APP_VERSION* cavp;
|
|
|
|
// populated otherwise:
|
|
APP_VERSION* avp;
|
|
|
|
// populated in either case:
|
|
HOST_USAGE host_usage;
|
|
|
|
BEST_APP_VERSION() {
|
|
present = false;
|
|
cavp = NULL;
|
|
avp = NULL;
|
|
}
|
|
};
|
|
|
|
// The subset of global preferences that the scheduler uses.
//
struct GLOBAL_PREFS {
    double mod_time;
    double disk_max_used_gb;
    double disk_max_used_pct;
    double disk_min_free_gb;
    double work_buf_min_days;
    double ram_max_used_busy_frac;
    double ram_max_used_idle_frac;
    double max_ncpus_pct;

    // defined outside this header
    void parse(const char* buf, const char* venue);
    void defaults();

    // work_buf_min_days converted to seconds (86400 seconds per day).
    // const so it can be called through a const reference or pointer.
    //
    double work_buf_min() const {
        return work_buf_min_days*86400;
    }
};
|
|
|
|
struct GUI_URLS {
|
|
char* text;
|
|
void init();
|
|
void get_gui_urls(USER& user, HOST& host, TEAM& team, char*);
|
|
};
|
|
|
|
// Holds the project-files text.
// NOTE(review): ownership and lifetime of `text` are not visible here;
// presumably set up by init() - confirm against the implementation.
//
struct PROJECT_FILES {
    char* text;

    // defined outside this header
    void init();
};
|
|
|
|
// A result from this project that the client currently has.
// The request message carries a list of these.
// The reply message may list some of them to be aborted,
// or aborted if not started.
//
struct OTHER_RESULT {
    char name[256];
    char plan_class[64];
    bool have_plan_class;
    bool abort;
    bool abort_if_not_started;
    int reason;
        // one of the ABORT_REASON_* codes below

    // defined outside this header
    int parse(FILE*);
};

// values for OTHER_RESULT::reason
//
#define ABORT_REASON_NOT_FOUND      1
#define ABORT_REASON_WU_CANCELLED   2
#define ABORT_REASON_ASSIMILATED    3
#define ABORT_REASON_TIMED_OUT      4
|
|
|
|
// A platform name as sent by the client.
//
struct CLIENT_PLATFORM {
    char name[256];

    // defined outside this header
    int parse(FILE*);
};
|
|
|
|
struct PLATFORM_LIST {
|
|
std::vector<PLATFORM*> list;
|
|
};
|
|
|
|
struct SCHEDULER_REQUEST {
|
|
char authenticator[256];
|
|
CLIENT_PLATFORM platform;
|
|
std::vector<CLIENT_PLATFORM> alt_platforms;
|
|
PLATFORM_LIST platforms;
|
|
char cross_project_id[256];
|
|
int hostid; // zero if first RPC
|
|
int core_client_major_version;
|
|
int core_client_minor_version;
|
|
int core_client_release;
|
|
int core_client_version; // 100*major + minor
|
|
int rpc_seqno;
|
|
double work_req_seconds;
|
|
// in "normalized CPU seconds" (see work_req.php)
|
|
double cpu_req_secs;
|
|
double cpu_req_instances;
|
|
double resource_share_fraction;
|
|
// this project's fraction of total resource share
|
|
double rrs_fraction;
|
|
// ... of runnable resource share
|
|
double prrs_fraction;
|
|
// ... of potentially runnable resource share
|
|
double cpu_estimated_delay;
|
|
// currently queued jobs saturate the CPU for this long;
|
|
// used for crude deadline check
|
|
double duration_correction_factor;
|
|
char global_prefs_xml[BLOB_SIZE];
|
|
char working_global_prefs_xml[BLOB_SIZE];
|
|
char code_sign_key[4096];
|
|
|
|
bool anonymous_platform;
|
|
std::vector<CLIENT_APP_VERSION> client_app_versions;
|
|
GLOBAL_PREFS global_prefs;
|
|
char global_prefs_source_email_hash[MD5_LEN];
|
|
|
|
HOST host; // request message is parsed into here.
|
|
// does NOT contain the full host record.
|
|
COPROCS coprocs;
|
|
COPROC_CUDA* coproc_cuda;
|
|
std::vector<RESULT> results;
|
|
// completed results being reported
|
|
std::vector<MSG_FROM_HOST_DESC> msgs_from_host;
|
|
std::vector<FILE_INFO> file_infos;
|
|
// sticky files reported by host for locality scheduling
|
|
std::vector<FILE_INFO> file_delete_candidates;
|
|
// sticky files reported by host, deletion candidates
|
|
std::vector<FILE_INFO> files_not_needed;
|
|
// sticky files reported by host, no longer needed
|
|
std::vector<OTHER_RESULT> other_results;
|
|
// in-progress results from this project
|
|
std::vector<IP_RESULT> ip_results;
|
|
// in-progress results from all projects
|
|
bool have_other_results_list;
|
|
bool have_ip_results_list;
|
|
bool have_time_stats_log;
|
|
bool client_cap_plan_class;
|
|
int sandbox; // -1 = don't know
|
|
|
|
SCHEDULER_REQUEST();
|
|
~SCHEDULER_REQUEST();
|
|
const char* parse(FILE*);
|
|
int write(FILE*); // write request info to file: not complete
|
|
};
|
|
|
|
// Tracks which disk preference is the bottleneck.
// NOTE(review): the fields presumably mirror the disk_max_used /
// disk_max_used_pct / disk_min_free preferences - confirm units with callers.
//
struct DISK_LIMITS {
    double max_used;
    double max_frac;
    double min_free;
};
|
|
|
|
// NOTE: if any field requires initialization,
|
|
// you must do it in the constructor. Nothing is zeroed by default.
|
|
//
|
|
struct SCHEDULER_REPLY {
|
|
WORK_REQ wreq;
|
|
DISK_LIMITS disk_limits;
|
|
double request_delay; // don't request again until this time elapses
|
|
std::vector<USER_MESSAGE> messages;
|
|
int hostid;
|
|
// nonzero only if a new host record was created.
|
|
// this tells client to reset rpc_seqno
|
|
int lockfile_fd; // file descriptor of lockfile, or -1 if no lock.
|
|
bool send_global_prefs;
|
|
bool nucleus_only; // send only message
|
|
USER user;
|
|
char email_hash[MD5_LEN];
|
|
HOST host; // after validation, contains full host rec
|
|
TEAM team;
|
|
std::vector<APP> apps;
|
|
std::vector<APP_VERSION> app_versions;
|
|
std::vector<WORKUNIT>wus;
|
|
std::vector<RESULT>results;
|
|
std::vector<std::string>result_acks;
|
|
std::vector<std::string>result_aborts;
|
|
std::vector<std::string>result_abort_if_not_starteds;
|
|
std::vector<MSG_TO_HOST>msgs_to_host;
|
|
std::vector<FILE_INFO>file_deletes;
|
|
char code_sign_key[4096];
|
|
char code_sign_key_signature[4096];
|
|
bool send_msg_ack;
|
|
bool project_is_down;
|
|
|
|
SCHEDULER_REPLY();
|
|
~SCHEDULER_REPLY();
|
|
int write(FILE*, SCHEDULER_REQUEST&);
|
|
void insert_app_unique(APP&);
|
|
void insert_app_version_unique(APP_VERSION&);
|
|
void insert_workunit_unique(WORKUNIT&);
|
|
void insert_result(RESULT&);
|
|
void insert_message(const USER_MESSAGE&);
|
|
void set_delay(double);
|
|
};
|
|
|
|
extern SCHEDULER_REQUEST* g_request;
|
|
extern SCHEDULER_REPLY* g_reply;
|
|
extern WORK_REQ* g_wreq;
|
|
|
|
#endif
|