- scheduler: fix memory leak (free BEST_APP_VERSION objects)

svn path=/trunk/boinc/; revision=21597
2010-05-21 21:49:54 +00:00 · 2010-05-21 21:49:54 +00:00 · ca239d913a
parent fa66519441
commit ca239d913a
3 changed files with 155 additions and 140 deletions
--- a/7
+++ b/7
@ -3830,3 +3830,10 @@ David  20 May 2010
    sched/
        sched_customize.cpp
        sched_version.cpp
 David  20 May 2010
    - scheduler: fix memory leak (free BEST_APP_VERSION objects)
    sched/
        sched_types.h
        sched_version.cpp
--- a/sched/sched_types.h
+++ b/sched/sched_types.h
@ -105,146 +105,6 @@ struct HOST_USAGE {
    }
 };
 // summary of a client's request for work, and our response to it
 // Note: this is zeroed out in SCHEDULER_REPLY constructor
 //
 struct WORK_REQ {
    bool anonymous_platform;
    // Flags used by old-style scheduling,
    // while making multiple passes through the work array
    bool infeasible_only;
    bool reliable_only;
    bool user_apps_only;
    bool beta_only;
    // user preferences
    bool no_cuda;
    bool no_ati;
    bool no_cpu;
 	bool allow_non_preferred_apps;
 	bool allow_beta_work;
 	std::vector<APP_INFO> preferred_apps;
    bool has_reliable_version;
        // whether the host has a reliable app version
    int effective_ncpus;
    int effective_ngpus;
    // 6.7+ clients send separate requests for different resource types:
    //
    double cpu_req_secs;        // instance-seconds requested
    double cpu_req_instances;   // number of idle instances, use if possible
    double cuda_req_secs;
    double cuda_req_instances;
    double ati_req_secs;
    double ati_req_instances;
    inline bool need_cpu() {
        return (cpu_req_secs>0) || (cpu_req_instances>0);
    }
    inline bool need_cuda() {
        return (cuda_req_secs>0) || (cuda_req_instances>0);
    }
    inline bool need_ati() {
        return (ati_req_secs>0) || (ati_req_instances>0);
    }
    inline void clear_cpu_req() {
        cpu_req_secs = 0;
        cpu_req_instances = 0;
    }
    inline void clear_gpu_req() {
        cuda_req_secs = 0;
        cuda_req_instances = 0;
        ati_req_secs = 0;
        ati_req_instances = 0;
    }
    // older clients send send a single number, the requested duration of jobs
    //
    double seconds_to_fill;
    // true if new-type request
    //
    bool rsc_spec_request;
    double disk_available;
    double ram, usable_ram;
    double running_frac;
    int njobs_sent;
    // The following keep track of the "easiest" job that was rejected
    // by EDF simulation.
    // Any jobs harder than this can be rejected without doing the simulation.
    //
    double edf_reject_min_cpu;
    int edf_reject_max_delay_bound;
    bool have_edf_reject;
    void edf_reject(double cpu, int delay_bound) {
        if (have_edf_reject) {
            if (cpu < edf_reject_min_cpu) edf_reject_min_cpu = cpu;
            if (delay_bound> edf_reject_max_delay_bound) edf_reject_max_delay_bound = delay_bound;
        } else {
            edf_reject_min_cpu = cpu;
            edf_reject_max_delay_bound = delay_bound;
            have_edf_reject = true;
        }
    }
    bool edf_reject_test(double cpu, int delay_bound) {
        if (!have_edf_reject) return false;
        if (cpu < edf_reject_min_cpu) return false;
        if (delay_bound > edf_reject_max_delay_bound) return false;
        return true;
    }
    RESOURCE disk;
    RESOURCE mem;
    RESOURCE speed;
    RESOURCE bandwidth;
    std::vector<USER_MESSAGE> no_work_messages;
    std::vector<BEST_APP_VERSION*> best_app_versions;
    std::vector<DB_HOST_APP_VERSION> host_app_versions;
    std::vector<DB_HOST_APP_VERSION> host_app_versions_orig;
    // various reasons for not sending jobs (used to explain why)
    //
    bool no_allowed_apps_available;
    bool excessive_work_buf;
    bool hr_reject_temp;
    bool hr_reject_perm;
    bool outdated_client;
    bool no_cuda_prefs;
    bool no_ati_prefs;
    bool no_cpu_prefs;
    bool max_jobs_on_host_exceeded;
    bool max_jobs_on_host_cpu_exceeded;
    bool max_jobs_on_host_gpu_exceeded;
    bool no_jobs_available;     // project has no work right now
    //int max_jobs_per_day;
        // host.max_results_day * (NCPUS + NGPUS*gpu_multiplier)
    int max_jobs_per_rpc;
    int njobs_on_host;
        // How many jobs from this project are in progress on the host.
        // Initially this is the number of "other_results"
        // reported in the request message.
        // If the resend_lost_results option is used,
        // it's set to the number of outstanding results taken from the DB
        // (those that were lost are resent).
        // As new results are sent, it's incremented.
    int njobs_on_host_cpu;
        // same, but just CPU jobs.
    int njobs_on_host_gpu;
        // same, but just GPU jobs.
    int max_jobs_on_host;
    int max_jobs_on_host_cpu;
    int max_jobs_on_host_gpu;
    void update_for_result(double seconds_filled);
    void add_no_work_message(const char*);
    void get_job_limits();
 };
 // a description of a sticky file on host.
 //
 struct FILE_INFO {
@ -441,6 +301,153 @@ struct DISK_LIMITS {
    double min_free;
 };
 // summary of a client's request for work, and our response to it
 // Note: this is zeroed out in SCHEDULER_REPLY constructor
 //
 struct WORK_REQ {
    bool anonymous_platform;
    // Flags used by old-style scheduling,
    // while making multiple passes through the work array
    bool infeasible_only;
    bool reliable_only;
    bool user_apps_only;
    bool beta_only;
    // user preferences
    bool no_cuda;
    bool no_ati;
    bool no_cpu;
 	bool allow_non_preferred_apps;
 	bool allow_beta_work;
 	std::vector<APP_INFO> preferred_apps;
    bool has_reliable_version;
        // whether the host has a reliable app version
    int effective_ncpus;
    int effective_ngpus;
    // 6.7+ clients send separate requests for different resource types:
    //
    double cpu_req_secs;        // instance-seconds requested
    double cpu_req_instances;   // number of idle instances, use if possible
    double cuda_req_secs;
    double cuda_req_instances;
    double ati_req_secs;
    double ati_req_instances;
    inline bool need_cpu() {
        return (cpu_req_secs>0) || (cpu_req_instances>0);
    }
    inline bool need_cuda() {
        return (cuda_req_secs>0) || (cuda_req_instances>0);
    }
    inline bool need_ati() {
        return (ati_req_secs>0) || (ati_req_instances>0);
    }
    inline void clear_cpu_req() {
        cpu_req_secs = 0;
        cpu_req_instances = 0;
    }
    inline void clear_gpu_req() {
        cuda_req_secs = 0;
        cuda_req_instances = 0;
        ati_req_secs = 0;
        ati_req_instances = 0;
    }
    // older clients send send a single number, the requested duration of jobs
    //
    double seconds_to_fill;
    // true if new-type request
    //
    bool rsc_spec_request;
    double disk_available;
    double ram, usable_ram;
    double running_frac;
    int njobs_sent;
    // The following keep track of the "easiest" job that was rejected
    // by EDF simulation.
    // Any jobs harder than this can be rejected without doing the simulation.
    //
    double edf_reject_min_cpu;
    int edf_reject_max_delay_bound;
    bool have_edf_reject;
    void edf_reject(double cpu, int delay_bound) {
        if (have_edf_reject) {
            if (cpu < edf_reject_min_cpu) edf_reject_min_cpu = cpu;
            if (delay_bound> edf_reject_max_delay_bound) edf_reject_max_delay_bound = delay_bound;
        } else {
            edf_reject_min_cpu = cpu;
            edf_reject_max_delay_bound = delay_bound;
            have_edf_reject = true;
        }
    }
    bool edf_reject_test(double cpu, int delay_bound) {
        if (!have_edf_reject) return false;
        if (cpu < edf_reject_min_cpu) return false;
        if (delay_bound > edf_reject_max_delay_bound) return false;
        return true;
    }
    RESOURCE disk;
    RESOURCE mem;
    RESOURCE speed;
    RESOURCE bandwidth;
    std::vector<USER_MESSAGE> no_work_messages;
    std::vector<BEST_APP_VERSION*> best_app_versions;
    std::vector<BEST_APP_VERSION*> all_best_app_versions;
    std::vector<DB_HOST_APP_VERSION> host_app_versions;
    std::vector<DB_HOST_APP_VERSION> host_app_versions_orig;
    // various reasons for not sending jobs (used to explain why)
    //
    bool no_allowed_apps_available;
    bool excessive_work_buf;
    bool hr_reject_temp;
    bool hr_reject_perm;
    bool outdated_client;
    bool no_cuda_prefs;
    bool no_ati_prefs;
    bool no_cpu_prefs;
    bool max_jobs_on_host_exceeded;
    bool max_jobs_on_host_cpu_exceeded;
    bool max_jobs_on_host_gpu_exceeded;
    bool no_jobs_available;     // project has no work right now
    //int max_jobs_per_day;
        // host.max_results_day * (NCPUS + NGPUS*gpu_multiplier)
    int max_jobs_per_rpc;
    int njobs_on_host;
        // How many jobs from this project are in progress on the host.
        // Initially this is the number of "other_results"
        // reported in the request message.
        // If the resend_lost_results option is used,
        // it's set to the number of outstanding results taken from the DB
        // (those that were lost are resent).
        // As new results are sent, it's incremented.
    int njobs_on_host_cpu;
        // same, but just CPU jobs.
    int njobs_on_host_gpu;
        // same, but just GPU jobs.
    int max_jobs_on_host;
    int max_jobs_on_host_cpu;
    int max_jobs_on_host_gpu;
    void update_for_result(double seconds_filled);
    void add_no_work_message(const char*);
    void get_job_limits();
    ~WORK_REQ() {
        for (unsigned int i=0; i<all_best_app_versions.size(); i++) {
            delete all_best_app_versions[i];
        }
    }
 };
 // NOTE: if any field requires initialization,
 // you must do it in the constructor.  Nothing is zeroed by default.
 //
--- a/sched/sched_version.cpp
+++ b/sched/sched_version.cpp
@ -405,6 +405,7 @@ BEST_APP_VERSION* get_app_version(
            bavp->trusted = app_version_is_trusted(gavid);
        }
        g_wreq->best_app_versions.push_back(bavp);
        g_wreq->all_best_app_versions.push_back(bavp);
        if (!bavp->present) return NULL;
        return bavp;
    }