Skip to content
Snippets Groups Projects
Commit f8ef1f4d authored by Marcin Kirsz's avatar Marcin Kirsz
Browse files

Update

parent 945e74d5
No related branches found
No related tags found
No related merge requests found
Pipeline #47130 passed
Pipeline: Tadah.MLIP

#47133

    ...@@ -295,12 +295,12 @@ class MPI_Trainer: public Trainer { ...@@ -295,12 +295,12 @@ class MPI_Trainer: public Trainer {
    } }
    }; };
    class MPI_Trainer_HOST: public MPI_Trainer { class TrainerHost: public MPI_Trainer {
    private: private:
    std::vector<std::tuple<std::string,int,int>> wpckgs; std::vector<std::tuple<std::string,int,int>> wpckgs;
    public: public:
    MPI_Trainer_HOST(Config &c, int &rank, int &ncpu): TrainerHost(Config &c, int &rank, int &ncpu):
    MPI_Trainer(c, rank, ncpu) MPI_Trainer(c, rank, ncpu)
    {} {}
    ...@@ -421,12 +421,45 @@ class MPI_Trainer_HOST: public MPI_Trainer { ...@@ -421,12 +421,45 @@ class MPI_Trainer_HOST: public MPI_Trainer {
    MPI_Send (&ready, 1, MPI_INT, worker, MPI_Send (&ready, 1, MPI_INT, worker,
    MPI_Trainer::CONFIG_TAG, MPI_COMM_WORLD); MPI_Trainer::CONFIG_TAG, MPI_COMM_WORLD);
    } }
    void run() {
    prep_wpckgs();
    // Process requests from workers
    while (true) {
    // Exit loop if there are no more packages
    if (!has_packages()) break;
    // Probe for incoming requests from any worker
    probe();
    // Handle requests based on their tags
    if (tag == MPI_Trainer::WORK_TAG) {
    work_tag();
    } else if (tag == MPI_Trainer::DATA_TAG) {
    data_tag();
    } else {
    throw std::runtime_error("HOST: Unexpected request from "
    + std::to_string(worker));
    }
    }
    // Collect remaining data and release all workers
    int count = 1;
    while (true) {
    probe();
    if (tag == MPI_Trainer::DATA_TAG) {
    data_tag();
    } else {
    release_tag(count);
    }
    if (count == ncpu) break; // Exit when all workers are released
    }
    }
    }; };
    class Trainer_WORKER: public MPI_Trainer { class TrainerWorker: public MPI_Trainer {
    public: public:
    Trainer_WORKER(Config &c, int &rank, int &ncpu): TrainerWorker(Config &c, int &rank, int &ncpu):
    MPI_Trainer(c, rank, ncpu) MPI_Trainer(c, rank, ncpu)
    {} {}
    ......
    0% Loading or .
    You are about to add 0 people to the discussion. Proceed with caution.
    Finish editing this message first!
    Please register or to comment