src/chunk_pool.cpp

/* MIT License
 *
 * Copyright (c) 2018 Sam Kovaka <skovaka@gmail.com>
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in all
 * copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */

#include <thread>
#include <chrono>
#include "chunk_pool.hpp"
#include "mapper.hpp"


ChunkPool::ChunkPool(const UncalledOpts &opts) {
    for (u16 t = 0; t < opts.threads_; t++) {
        threads_.emplace_back(mappers_);
    }
    
    //mappers_.reserve(nchannels);
    channel_active_.reserve(opts.num_channels_);
    chunk_buffer_.resize(opts.num_channels_);
    buffer_queue_.reserve(opts.num_channels_);
    for (u16 i = 0; i < opts.num_channels_; i++) {
        mappers_.push_back(Mapper(opts));
        channel_active_.push_back(false);
    }

    for (u16 t = 0; t < opts.threads_; t++) {
        threads_[t].start();
    }
}

//ChunkPool::~ChunkPool() {
//
//}

void ChunkPool::buffer_chunk(Chunk &c) {
    u16 ch = c.get_channel();
    if (chunk_buffer_[ch].empty()) {
        buffer_queue_.push_back(ch);
    } else {
        //TODO: handle backlog
        chunk_buffer_[ch].clear();
    }
    chunk_buffer_[ch].swap(c);
}

//Add chunk to master buffer
bool ChunkPool::add_chunk(Chunk &c) {
    u16 ch = c.get_channel();

    //Check if previous read is still aligning
    //If so, tell thread to reset, store chunk in pool buffer
    if (mappers_[ch].prev_unfinished(c.get_number())) {
        mappers_[ch].request_reset();
        buffer_chunk(c);
        //std::cout << "# requesting reset\n";
        return true;
    }

    //Previous alignment finished but mapper hasn't reset
    //Happens if update hasn't been called yet
    if (mappers_[ch].finished()) {
        if (mappers_[ch].get_read().number_ != c.get_number()){ 
            buffer_chunk(c);
        }
        return true;
    }

    //Mapper inactive - need to reset graph and assign to thread
    if (mappers_[ch].get_state() == Mapper::State::INACTIVE) {
        mappers_[ch].new_read(c);
        active_queue_.push_back(ch);
        return true;
    } else if (mappers_[ch].swap_chunk(c)) {
        return true;
    } 
    
    //TODO: something about it

    return false;
}

void ChunkPool::end_read(u16 ch, u32 number) {
    mappers_[ch].end_read(number);
}

std::vector<MapResult> ChunkPool::update() {

    std::vector< u16 > read_counts(threads_.size());
    u16 active_count = 0;

    std::vector<MapResult> ret;
    //Get alignment outputs
    //TODO: redo this
    for (u16 t = 0; t < threads_.size(); t++) {
        if (!threads_[t].out_chs_.empty()) {

            //Store and empty thread output buffer
            threads_[t].out_mtx_.lock();
            out_chs_.swap(threads_[t].out_chs_);
            threads_[t].out_mtx_.unlock();

            //Loop over alignments
            for (auto ch : out_chs_) {
                ReadBuffer &r = mappers_[ch].get_read();
                ret.emplace_back(r.channel_, r.number_, r.loc_);
                mappers_[ch].deactivate();
            }
            out_chs_.clear();
        }

        //Count reads aligning in each thread
        read_counts[t] = threads_[t].read_count();
        active_count += read_counts[t];
    }

    //std::cout << "# " << active_count << " active\n";
    //std::cout.flush();

    for (u16 i = buffer_queue_.size()-1; i < buffer_queue_.size(); i--) {
        u16 ch = buffer_queue_[i];//TODO: store chunks in queue
        Chunk &c = chunk_buffer_[ch];

        bool added;

        if (mappers_[ch].get_state() == Mapper::State::INACTIVE) {
            mappers_[ch].new_read(c);
            active_queue_.push_back(ch);
            added = true;
        } else {
            added = mappers_[ch].swap_chunk(c);
        } 

        if (added) {
            if (i != buffer_queue_.size()-1) {
                buffer_queue_[i] = buffer_queue_.back();
            }
            buffer_queue_.pop_back();
        }
    }

    //Estimate how much to fill each thread
    u16 target = active_queue_.size() + active_count,
        per_thread = target / threads_.size() + (target % threads_.size() > 0);

    for (u16 t = 0; t < threads_.size(); t++) {

        //If thread not full
        if (read_counts[t] < per_thread) {

            //Fill thread till full
            //TODO: compute number exactly, only lock while adding
            threads_[t].in_mtx_.lock();
            while (!active_queue_.empty() && read_counts[t] < per_thread) {
                u16 ch = active_queue_.back(); 
                active_queue_.pop_back();
                threads_[t].in_chs_.push_back(ch);
                //std::cout << "# activated " << ch << " " << t << "\n";
                read_counts[t]++;
            }
            threads_[t].in_mtx_.unlock();
        }
    }

    return ret;
}

bool ChunkPool::all_finished() {
    //TODO: think about this
    if (!buffer_queue_.empty()) return false;

    for (MapperThread &t : threads_) {
        if (t.read_count() > 0 || !t.out_chs_.empty()) return false;
    }

    return true;
}

void ChunkPool::stop_all() {
    for (MapperThread &t : threads_) {
        t.running_ = false;
        t.thread_.join();
    }
}

u16 ChunkPool::MapperThread::num_threads = 0;

ChunkPool::MapperThread::MapperThread(std::vector<Mapper> &mappers)
    : tid_(num_threads++),
      mappers_(mappers),
      running_(true) {}

ChunkPool::MapperThread::MapperThread(MapperThread &&mt) 
    : tid_(mt.tid_),
      mappers_(mt.mappers_),
      running_(mt.running_),                                             
      thread_(std::move(mt.thread_)) {}

void ChunkPool::MapperThread::start() {
    thread_ = std::thread(&ChunkPool::MapperThread::run, this);
}


u16 ChunkPool::MapperThread::read_count() const {
    return in_chs_.size() + active_chs_.size();
}

void ChunkPool::MapperThread::run() {
    std::string fast5_id;
    std::vector<float> fast5_signal;

    std::vector<u16> finished;

    while (running_) {
        if (read_count() == 0) {
            std::this_thread::sleep_for(std::chrono::milliseconds(100));
            continue;
        }

        //Read inputs (pop, lock, and swap it)
        if (!in_chs_.empty()) {
            in_mtx_.lock();
            in_tmp_.swap(in_chs_);
            in_mtx_.unlock();

            for (auto ch : in_tmp_) {
                active_chs_.push_back(ch);
            }
            //std::cout << "# " << tid_ << " controlling";
            //for (auto ch : active_chs_) std::cout << " " << ch;
            //std::cout << "\n";

            in_tmp_.clear(); //(pop)
        }


        //Map chunks
        for (u16 i = 0; i < active_chs_.size() && running_; i++) {
            u16 ch = active_chs_[i];
            mappers_[ch].process_chunk();
            //std::cout << "# mapping " << ch << "\n";
            if (mappers_[ch].map_chunk()) {
                out_tmp_.push_back(i);
                //std::cout << "# finishch " << ch << "\n";
            }
        }

        //Add finished to output
        if (!out_tmp_.empty()) {
            //std::cout << "# " << tid_ << " has " << out_chs_.size() << " pending\n";
            out_mtx_.lock();
            for (auto i : out_tmp_) out_chs_.push_back(active_chs_[i]);
            out_mtx_.unlock();

            std::sort(out_tmp_.begin(), out_tmp_.end(),
                      [](u32 a, u32 b) { return a > b; });
            //std::cout << "# popping";
            for (auto i : out_tmp_) {
                //std::cout << " " << i;
                active_chs_[i] = active_chs_.back();
                active_chs_.pop_back();
            }
            //std::cout << "\n";
            out_tmp_.clear();
        }
    }
}