ag_gen/src/mpi/tasks.cpp

#include <omp.h>
#include <string.h>
#include <sys/time.h>

#include <algorithm>
#include <chrono>
#include <iostream>
#include <map>
#include <tuple>
#include <unordered_map>
#include <utility>
#include <vector>

#include <boost/mpi/collectives.hpp>
#include <boost/archive/tmpdir.hpp>
#include <boost/archive/text_iarchive.hpp>
#include <boost/archive/text_oarchive.hpp>

#include <boost/serialization/base_object.hpp>
#include <boost/serialization/utility.hpp>
#include <boost/serialization/list.hpp>
#include <boost/serialization/assume_abstract.hpp>
#include <boost/serialization/string.hpp>
#include <boost/serialization/vector.hpp>

#include <boost/mpi.hpp>
#include <boost/mpi/environment.hpp>
#include <boost/mpi/communicator.hpp>
#include <boost/mpi/collectives.hpp>
#include <boost/serialization/is_bitwise_serializable.hpp>

#include "../util/db_functions.h"
#include "../util/avail_mem.h"
#include "../util/odometer.h"

#include "serialize_tuple.h"
#include "../ag_gen/ag_gen.h"
#include "tasks.h"

namespace mpi = boost::mpi;

/**
 * Task 0: refill the local frontier from the store of unexplored states.
 *
 * States are pulled one at a time with fetch_unexplored() and pushed onto the
 * front of localFrontier. Fetching stops once the estimated frontier footprint
 * (number of states * size of the state at the back, relative to total system
 * memory) exceeds 70% of mem_threshold, or once unex_empty() reports that
 * nothing is left. At least one state is always fetched.
 *
 * @param instance       Generator instance; its `facts` are passed to fetch_unexplored().
 * @param localFrontier  Frontier deque that receives the fetched states.
 * @param mem_threshold  Memory budget expressed as a fraction of total system memory.
 */
void task_zero(AGGenInstance &instance, std::deque<NetworkState> &localFrontier, double mem_threshold)
{
    const auto tot_sys_mem = getTotalSystemMemory();

    //Leave a 30% buffer in alpha so later insertions do not immediately hit the threshold
    const double refill_limit = mem_threshold * 0.7;
    double f_alpha = 0.0;

    //TODO: One (or a few) larger queries to pull in new states, rather than single queries that pull states one-by-one
    do {
        //Construct the frontier entry directly from the fetched state instead of copying a named temporary
        localFrontier.emplace_front(fetch_unexplored(instance.facts));
        f_alpha = (static_cast<double>(localFrontier.size()) * (localFrontier.back().get_size()))/tot_sys_mem;
    }
    while((f_alpha <= refill_limit) && !unex_empty());
}

/**
 * Task 1: find every (exploit, asset group) pair applicable to current_state.
 *
 * Work is split round-robin over the exploits: the node with task-local rank r
 * handles exploits i where i % alloc == r. For each exploit, every asset
 * permutation in od_map[num_params] is turned into an AssetGroup of hypothetical
 * qualities/topologies; the group is applicable when all of them are found in
 * the current state's factbase.
 *
 * When more nodes are allocated to Task 1 than to Task 2 (alloc > two_alloc),
 * the node with world rank `alloc` (task-local rank alloc-1) has no Task 2
 * partner, so it splits its results as evenly as possible across the other
 * Task 1 nodes before they forward their lists.
 *
 * Finally each forwarding node sends its applicable-exploit list (tag 30) and
 * the current state (tag 40) to the rank chosen by send_check().
 *
 * @param instance       Generator instance; its `facts` are used to build preconditions.
 * @param current_state  State whose factbase is tested against the preconditions.
 * @param exploit_list   All exploits to evaluate.
 * @param od_map         Asset permutations keyed by exploit parameter count.
 * @param alloc          Number of nodes allocated to Task 1.
 * @param two_alloc      Number of nodes allocated to Task 2.
 * @param reduc_factor   Unused in this function.
 * @param num_tasks      Unused in this function.
 * @param world          World communicator.
 * @param tcomm          Communicator restricted to the Task 1 nodes.
 */
void task_one(AGGenInstance &instance, NetworkState &current_state,
 std::vector<Exploit> &exploit_list, std::unordered_map<size_t, PermSet<size_t>> &od_map,
 int alloc, int two_alloc, int reduc_factor, int num_tasks, mpi::communicator &world,
 mpi::communicator &tcomm){

    using ApplExploit = std::tuple<Exploit, AssetGroup>;
    using Offset = std::vector<ApplExploit>::difference_type;

    std::cout << "Process rank " << world.rank() << " with " << alloc << " node(s) allocated has started Task 1." << std::endl;

    std::vector<ApplExploit> appl_exploits;
    const size_t esize = exploit_list.size();
    const size_t stride = static_cast<size_t>(alloc);
    const size_t my_slot = static_cast<size_t>(tcomm.rank());

    //The factbase does not change while this task runs, so fetch it once
    auto &&factbase = current_state.get_factbase();

    //Distribute work to all nodes: each node takes every alloc-th exploit
    for (size_t i = 0; i < esize; i++) {
        if (i % stride != my_slot)
            continue;

        auto &e = exploit_list.at(i);
        const size_t num_params = e.get_num_params();
        auto preconds_q = e.precond_list_q();
        auto preconds_t = e.precond_list_t();
        auto &perms = od_map[num_params];

        //Instantiate the exploit's preconditions for every asset permutation
        std::vector<AssetGroup> asset_groups;
        for (auto perm : perms) {
            std::vector<Quality> asset_group_quals;
            std::vector<Topology> asset_group_topos;
            asset_group_quals.reserve(preconds_q.size());
            asset_group_topos.reserve(preconds_t.size());

            for (auto &precond : preconds_q) {
                asset_group_quals.emplace_back(
                    perm[precond.get_param_num()], precond.name, precond.op,
                    precond.value, instance.facts);
            }
            for (auto &precond : preconds_t) {
                auto dir = precond.get_dir();
                auto prop = precond.get_property();
                auto op = precond.get_operation();
                auto val = precond.get_value();
                asset_group_topos.emplace_back(
                    perm[precond.get_from_param()],
                    perm[precond.get_to_param()], dir, prop, op, val, instance.facts);
            }
            asset_groups.emplace_back(asset_group_quals, asset_group_topos, perm);
        }

        //Keep the groups whose hypothetical facts all hold in the current state
        for (auto &asset_group : asset_groups) {
            bool applicable = true;

            for (auto &quality : asset_group.get_hypo_quals()) {
                if (!factbase.find_quality(quality)) {
                    applicable = false;
                    break;
                }
            }
            if (applicable) {
                for (auto &topology : asset_group.get_hypo_topos()) {
                    if (!factbase.find_topology(topology)) {
                        applicable = false;
                        break;
                    }
                }
            }
            if (applicable)
                appl_exploits.push_back(std::make_tuple(e, asset_group));
        }
    }

    //Less nodes allocated to task 2 than task 1.
    //Distribute the appl_exploit list from the extra node in task 1 to all other nodes in this task
    if (alloc > two_alloc){
        //Convert world.rank() of alloc to tcomm rank by -1
        const int root = alloc - 1;
        const bool is_surplus_node = (world.rank() == alloc);
        const int num_peers = tcomm.size() - 1;

        //Broadcast how many entries the surplus node holds. Every rank can then
        //derive exactly which peers get a slice, so receivers post a blocking
        //recv instead of guessing with iprobe (a barrier does not guarantee that
        //a previously sent message is already visible to a probe).
        int surplus_count = 0;
        if (is_surplus_node)
            surplus_count = static_cast<int>(appl_exploits.size());
        mpi::broadcast(tcomm, surplus_count, root);

        //Also guards the single-node case (num_peers == 0), which would otherwise divide by zero
        const int num_receivers = std::min(num_peers, surplus_count);

        if (num_receivers > 0){
            if (is_surplus_node){
                const size_t num_data = appl_exploits.size() / static_cast<size_t>(num_peers);
                size_t remain = appl_exploits.size() % static_cast<size_t>(num_peers);

                //Build every slice first; the first `remain` peers get one extra entry
                std::vector<std::vector<ApplExploit>> sub_partials;
                sub_partials.reserve(static_cast<size_t>(num_receivers));
                size_t begin = 0;
                for (int i = 0; i < num_receivers; ++i){
                    size_t len = num_data;
                    if (remain > 0){
                        ++len;
                        --remain;
                    }
                    sub_partials.emplace_back(appl_exploits.begin() + static_cast<Offset>(begin),
                                              appl_exploits.begin() + static_cast<Offset>(begin + len));
                    begin += len;
                }

                //Post all sends before waiting so no send blocks on a peer that is
                //itself still waiting for an earlier send to complete
                std::vector<mpi::request> pending;
                pending.reserve(static_cast<size_t>(num_receivers));
                for (int i = 0; i < num_receivers; ++i){
                    pending.push_back(tcomm.isend(i, 21, sub_partials.at(i)));
                    std::cout << "PROCESS " << world.rank() << " SENDING APPL EXPLOIT LIST OF SIZE " << sub_partials.at(i).size() << "TO TCOMM RANK " << i << " ORIGINAL LIST WAS SIZE " << appl_exploits.size() <<  std::endl;
                }
                mpi::wait_all(pending.begin(), pending.end());
            }
            else if (world.rank() < alloc && tcomm.rank() < num_receivers){
                std::vector<ApplExploit> partial_appl_exploits;
                tcomm.recv(root, 21, partial_appl_exploits);
                std::cout << "PROCESS " << world.rank() << " RECEIVED APPL EXPLOIT LIST OF SIZE " << partial_appl_exploits.size() << " IN TASK 1" << std::endl;
                appl_exploits.insert(std::end(appl_exploits), std::begin(partial_appl_exploits), std::end(partial_appl_exploits));
            }

            //Keep the task-local nodes in step before they forward to Task 2
            tcomm.barrier();
        }
    }

    //Send Applicable Exploit List
    //When the surplus node exists it has already handed its work off, so it does not forward
    const int skip_greatest = (alloc > two_alloc) ? 1 : 0;
    if(world.rank() <= (alloc - skip_greatest)){
        const int dest = send_check(world, world.rank() + alloc -1);
        std::cout << "Process " << world.rank() << " sending applicable exploit list of size " << appl_exploits.size() <<
        " to Process " << dest << std::endl;
        mpi::request appl_req = world.isend(dest, 30, appl_exploits);
        mpi::request cs_req = world.isend(dest, 40, current_state);
        appl_req.wait();
        cs_req.wait();
    }
}

/**
 * Task 2: apply the applicable exploits received from Task 1 to the current
 * state and hand every resulting new state to Task 3.
 *
 * Steps:
 *  1. Receive the applicable-exploit list (tag 30) and the current state
 *     (tag 40) from the same Task 1 node.
 *  2. Collect exploits that belong to a synchronous-fire group (group name other
 *     than "null"). Non-root Task 2 nodes remove them from their own list and
 *     ship them to task-local rank 0, which fires each group as a whole.
 *  3. For each remaining entry, apply the postconditions to a copy of the
 *     current state. Newly created "+=" fact strings are registered in
 *     instance.facts and announced to every other world rank (tags 3 and 4).
 *  4. A state whose hash differs from the current state's is sent to world rank
 *     0 (tags 5, 6, 10, 11), or passed to task_three() directly when this node
 *     is world rank 0.
 *
 * @param instance       Generator instance (facts, assets, accumulated graph data).
 * @param alloc          Number of nodes allocated to Task 1.
 * @param two_alloc      Number of nodes allocated to Task 2.
 * @param world          World communicator.
 * @param localFrontier  Local frontier, forwarded to task_three().
 * @param mem_threshold  Memory threshold, forwarded to task_three().
 * @param ttwo_comm      Communicator restricted to the Task 2 nodes.
 * @param ex_groups      Names of the synchronous-fire exploit groups.
 * @param hash_map       Known state hashes mapped to state ids, forwarded to task_three().
 */
void task_two(AGGenInstance &instance, int alloc, int two_alloc, boost::mpi::communicator &world,
    std::deque<NetworkState> &localFrontier, double mem_threshold, boost::mpi::communicator &ttwo_comm,
    std::vector<std::string> ex_groups, std::unordered_map<size_t, int> &hash_map){

    using ApplExploit = std::tuple<Exploit, AssetGroup>;
    using SyncBundle = std::tuple<std::string, std::vector<ApplExploit>>;

    std::cout << "Process rank " << world.rank() << " with " << two_alloc <<
     " node(s) allocated has started Task 2 with local communicator rank of " << ttwo_comm.rank() << std::endl;

    //Check for new fact and new state that caused an update in the hash table and facts.
    //The state (tag 3) and fact (tag 4) are always sent as a pair, so both are
    //received from the sender that was probed; receiving each from any_source
    //could pair a state from one node with a fact from another.
    auto drain_fact_updates = [&world, &instance]() {
        for (;;) {
            auto pending = world.iprobe(mpi::any_source, 3);
            if (!pending)
                pending = world.iprobe(mpi::any_source, 4);
            if (!pending)
                break;

            const int sender = pending->source();
            NetworkState update_state;
            Quality update_fact;
            world.recv(sender, 3, update_state);
            world.recv(sender, 4, update_fact);

            //NOTE(review): assumes compound_assign() is a pure query, so it is evaluated once
            const auto key = update_state.compound_assign(update_fact);

            //Several nodes can announce the same fact; register it only once so
            //an index that is already in use is not overwritten
            if (instance.facts.hash_table.find(key) == instance.facts.hash_table.end()) {
                instance.facts.hash_table[key] = instance.facts.size();
                instance.facts.length++;
                instance.facts.str_vector.push_back(key);
            }
        }
    };

    NetworkState current_state;
    std::vector<ApplExploit> appl_exploits;

    //Take the state from the same node that supplied the exploit list
    const mpi::status task_one_msg = world.recv(mpi::any_source, 30, appl_exploits);
    world.recv(task_one_msg.source(), 40, current_state);

    std::cout << "Process " << world.rank() << " received Task 1 data with Appl exploit size " << appl_exploits.size() << std::endl;

    drain_fact_updates();

    auto current_hash = current_state.get_hash(instance.facts);

    std::map<std::string, int> group_fired; //Map to hold fired status per group
    std::map<std::string, std::vector<ApplExploit>> sync_vectors; //Map to hold all group exploits

    for (const auto &map_group : ex_groups)
        group_fired.emplace(map_group, 0);

    const bool is_root = (ttwo_comm.rank() == 0);
    std::string egroup;

    //Build up the map of synchronous fire exploits. Rank 0 keeps its grouped
    //exploits in its own list; every other rank strips them out (single pass
    //instead of repeated vector::erase).
    {
        std::vector<ApplExploit> kept;
        kept.reserve(appl_exploits.size());
        for (auto &entry : appl_exploits) {
            egroup = std::get<0>(entry).get_group();
            if (egroup != "null") {
                sync_vectors[egroup].push_back(entry);
                if (!is_root) {
                    std::cout << "NODE " << world.rank() << " HAD A SYNC EXPLOIT " << std::endl;
                    continue;
                }
            }
            kept.push_back(std::move(entry));
        }
        appl_exploits.swap(kept);
    }

    //Ship grouped exploits to rank 0. Every non-root rank sends exactly one
    //message (possibly empty), so rank 0 knows how many blocking receives to
    //post and cannot miss a message that a probe would not have seen yet.
    if (ttwo_comm.size() > 1) {
        if (!is_root) {
            std::vector<SyncBundle> outgoing;
            for (const auto &map_group : ex_groups) {
                auto found = sync_vectors.find(map_group);
                if (found == sync_vectors.end() || found->second.empty())
                    continue;
                std::cout << "NODE " << world.rank() << " SENDING SYNC APPL SIZE OF " << found->second.size() << std::endl;
                outgoing.emplace_back(map_group, std::move(found->second));
                found->second.clear();
            }
            ttwo_comm.send(0, 9, outgoing);
        }
        else {
            for (int peer = 1; peer < ttwo_comm.size(); ++peer) {
                std::vector<SyncBundle> incoming;
                ttwo_comm.recv(mpi::any_source, 9, incoming);
                for (auto &bundle : incoming) {
                    const std::string &group = std::get<0>(bundle);
                    const std::vector<ApplExploit> &received = std::get<1>(bundle);

                    appl_exploits.insert(std::end(appl_exploits), std::begin(received), std::end(received));
                    std::cout << "TTWO COMM RANK 0 HAS RECEIVED AN APPL EXPLOIT LIST SIZE OF " << received.size() << " RESULTING IN A TOTAL SIZE OF " << appl_exploits.size() << std::endl;

                    auto &group_vec = sync_vectors[group];
                    group_vec.insert(std::end(group_vec), std::begin(received), std::end(received));
                }
            }
        }
    }
    ttwo_comm.barrier();

    //loop through the vector
    for (auto itr = appl_exploits.begin(); itr != appl_exploits.end(); ++itr) {

        drain_fact_updates();

        auto e = *itr;
        auto exploit = std::get<0>(e);
        auto assetGroup = std::get<1>(e);

        egroup = exploit.get_group();

        //A grouped exploit whose group has already fired ends processing.
        //NOTE(review): this abandons every remaining entry, including ungrouped
        //ones that follow - confirm that `break` rather than `continue` is intended.
        if (egroup != "null" && group_fired[egroup] != 0) {
            std::cout << "Breaking." << std::endl;
            break;
        }

        NetworkState new_state{current_state};
        std::vector<ApplExploit> sync_exploits;

        if (egroup == "null") {
            sync_exploits.push_back(e);
        }
        else {
            sync_exploits = sync_vectors[egroup];

            //TODO: Does not work if only some assets belong to a group. This only works if
            //all assets are in the group
            //NOTE(review): like the break above, this also skips all remaining entries.
            if (sync_exploits.size() < instance.assets.size()) {
                break;
            }
        }
        std::cout << "Sync exploit size " << sync_exploits.size() << " at Node " << world.rank() << " out of a total of " << appl_exploits.size() << std::endl;

        //Fire every exploit of the group (or the single ungrouped exploit) on the same new state.
        //exploit/assetGroup keep the values of the last fired entry; they label the edge below.
        for (auto sync_itr = sync_exploits.begin(); sync_itr != sync_exploits.end(); ++sync_itr) {
            e = *sync_itr;
            exploit = std::get<0>(e);
            egroup = exploit.get_group();
            assetGroup = std::get<1>(e);
            group_fired[egroup] = 1;

            auto postconditions = createPostConditions(e, instance.facts);
            auto qualities = std::get<0>(postconditions);
            auto topologies = std::get<1>(postconditions);

            for (auto &qual : qualities) {
                auto action = std::get<0>(qual);
                auto fact = std::get<1>(qual);
                switch (action) {
                    case ADD_T:
                        new_state.add_quality(fact);
                        break;
                    case UPDATE_T:
                        new_state.update_quality(fact);

                        //TODO: if fact!= "="" call new_state function, passing fact and instance.facts. Update the quality, and insert it into the hash_table instead of this convoluted mess
                        if (fact.get_op() == "+=") {
                            //NOTE(review): assumes compound_assign() is a pure query, so it is evaluated once
                            const auto key = new_state.compound_assign(fact);

                            //If the value is not already in the hash_table, insert it.
                            //Since the compound operators include a value that is not in the original Keyvalue object, the unordered map does not include it
                            //As a result, you have to manually add it.
                            if (instance.facts.hash_table.find(key) == instance.facts.hash_table.end()) {
                                instance.facts.hash_table[key] = instance.facts.size();
                                instance.facts.length++;
                                instance.facts.str_vector.push_back(key);

                                //Update ALL nodes (include ttwo_comm nodes) with new data
                                for (int w = 0; w < world.size(); w++) {
                                    if (w == world.rank())
                                        continue;
                                    mpi::request ns_req = world.isend(w, 3, new_state);
                                    mpi::request fact_req = world.isend(w, 4, fact);
                                    ns_req.wait();
                                    fact_req.wait();
                                }
                            }
                        }
                        break;
                    case DELETE_T:
                        new_state.delete_quality(fact);
                        break;
                }
            }

            for (auto &topo : topologies) {
                auto action = std::get<0>(topo);
                auto fact = std::get<1>(topo);
                switch (action) {
                    case ADD_T:
                        new_state.add_topology(fact);
                        break;
                    case UPDATE_T:
                        new_state.update_topology(fact);
                        break;
                    case DELETE_T:
                        new_state.delete_topology(fact);
                        break;
                }
            }
        }//Sync. Fire for

        auto hash_num = new_state.get_hash(instance.facts);

        //Firing changed nothing: no new state and no edge
        if (hash_num == current_hash) {
            std::cout << "Same hash." << std::endl;
            continue;
        }

        //<6 Node Edge Case Prevention: Node 0 unable to execute task 3
        if (world.rank() != 0) {
            std::cout << "Node " << world.rank() << " sending new state data to Node 0" << std::endl;
            mpi::request ns_req = world.isend(0, 5, new_state);
            mpi::request cs_req = world.isend(0, 6, current_state);
            mpi::request ex_req = world.isend(0, 10, exploit);
            mpi::request ag_req = world.isend(0, 11, assetGroup);
            ns_req.wait();
            cs_req.wait();
            ex_req.wait();
            ag_req.wait();
        }
        else {
            task_three(instance, new_state, localFrontier, mem_threshold, world,
                alloc, two_alloc, current_state, exploit, assetGroup, hash_map);
        }
    }
}

/**
 * Task 3: record the outcome of firing an exploit.
 *
 * If the new state's hash is not yet in hash_map, the state is assigned an id,
 * registered in the instance (factbase_items, factbases) and in hash_map, and
 * then either queued on the local frontier or sent (tag 50) to the rank chosen
 * by send_check(world, alloc+two_alloc+1). When the estimated instance
 * footprint reaches half of mem_threshold, the accumulated factbases (tag 7)
 * and edges (tag 8) are sent to the rank chosen by
 * send_check(world, alloc+two_alloc) and the local vectors are released.
 *
 * In both cases an edge from current_state to the (new or previously known)
 * state is appended to instance.edges.
 *
 * @param instance       Generator instance that accumulates factbases and edges.
 * @param new_state      State produced by firing the exploit; receives an id when it is new.
 * @param localFrontier  Local frontier of states still to be explored.
 * @param mem_threshold  Memory budget expressed as a fraction of total system memory.
 * @param world          World communicator.
 * @param alloc          Number of nodes allocated to Task 1.
 * @param two_alloc      Number of nodes allocated to Task 2.
 * @param current_state  State the exploit was applied to (edge source).
 * @param exploit        Exploit recorded on the edge.
 * @param assetGroup     Asset group recorded on the edge.
 * @param hash_map       Known state hashes mapped to state ids.
 */
void task_three(AGGenInstance &instance, NetworkState &new_state, std::deque<NetworkState> &localFrontier,
    double mem_threshold, boost::mpi::communicator &world, int alloc, int two_alloc, NetworkState &current_state,
    Exploit &exploit, AssetGroup &assetGroup, std::unordered_map<size_t, int> &hash_map){

    std::cout << "Started Task 3." << std::endl;
    const auto hash_num = new_state.get_hash(instance.facts);

    int target_id = 0;
    const auto known = hash_map.find(hash_num);

    if (known != hash_map.end()) {
        //State already known: only the edge is new
        target_id = known->second;
    }
    else {
        //although local frontier is updated, the global hash is also updated to avoid testing on explored states.
        new_state.set_id();
        auto facts_tuple = new_state.get_factbase().get_facts_tuple();
        FactbaseItems new_items = std::make_tuple(facts_tuple, new_state.get_id());
        instance.factbase_items.push_back(new_items);
        instance.factbases.push_back(new_state.get_factbase());
        hash_map.emplace(hash_num, new_state.get_id());

        //See memory usage. If it exceeds the threshold, store new states in the DB
        //Get the most recent Factbase's size * total number of factbases, rough approximation of *2 to account for factbase_items
        const double i_usage = instance.factbases.back().get_size() * instance.factbases.size() * 2 + sizeof(instance.edges[0]) * instance.edges.size();

        const auto tot_sys_mem = getTotalSystemMemory();
        const double i_alpha = i_usage/tot_sys_mem;

        double f_alpha = 0.0;
        if (!localFrontier.empty())
            f_alpha = (static_cast<double>(localFrontier.size()) * (localFrontier.back().get_size()))/tot_sys_mem;

        //Send the state away when the frontier is too large, or when unexplored
        //states are already stored externally (to ensure proper ordering of the
        //FIFO queue). Otherwise, we can just store in memory.
        if (f_alpha >= (mem_threshold/2) || !unex_empty()) {
            mpi::request ns_req = world.isend(send_check(world, alloc+two_alloc+1), 50, new_state);
            ns_req.wait();
        }
        else {
            localFrontier.emplace_front(new_state);
        }

        if (i_alpha >= mem_threshold/2){
            mpi::request fb_req = world.isend(send_check(world, alloc+two_alloc), 7, instance.factbases);
            mpi::request ed_req = world.isend(send_check(world, alloc+two_alloc), 8, instance.edges);
            fb_req.wait();
            ed_req.wait();

            //Clear vectors and free memory (swap with an empty vector releases capacity)
            std::vector<Factbase>().swap(instance.factbases);
            std::vector<FactbaseItems>().swap(instance.factbase_items);
            std::vector<Edge>().swap(instance.edges);
        }

        target_id = new_state.get_id();
    }

    Edge ed(current_state.get_id(), target_id, exploit, assetGroup);
    ed.set_id();
    instance.edges.push_back(ed);
}


/**
 * Return the rank that follows curr_node in the world communicator.
 *
 * @param world      Communicator whose size bounds the valid ranks.
 * @param curr_node  Rank to step from.
 * @return curr_node + 1, or 0 when curr_node is the last rank or beyond it.
 */
int send_check(boost::mpi::communicator &world, int curr_node){
    const int last_rank = world.size() - 1;
    return (curr_node < last_rank) ? (curr_node + 1) : 0;
}