tenncor_docs/ccur_2session_8hpp_source.html

 #include <atomic>

 #include <boost/asio/thread_pool.hpp>
 #include <boost/asio/post.hpp>

 #include "eteq/session.hpp"

 #include "ccur/partition.hpp"

 #ifndef CCUR_SESS_HPP
 #define CCUR_SESS_HPP

 namespace ccur
 {

 /// Vector of functors, each paired with a count (Session::track stores
 /// the functor's number of unique non-leaf children as the count)
 using SessReqsT = std::vector<std::pair<teq::iOperableFunc*,size_t>>;

 /// Same as SessReqsT except as a list
 using LSessReqsT = std::list<std::pair<teq::iOperableFunc*,size_t>>;

 /// Map of functor to an atomic counter (Session uses the counter to tally
 /// how many of the functor's children are already updated or ignored)
 using AtomicFulfilMapT = std::unordered_map<
     teq::iOperableFunc*,std::atomic<long>>;

 /// Session that splits the tracked graphs into groups using k_partition
 /// and updates every group in its own thread pool task
 struct Session final : public eteq::iSession
 {
     /// @param nthreads number of groups requested from k_partition
     /// @param weights  weights forwarded to k_partition
     Session (size_t nthreads = 2, OpWeightT weights = OpWeightT()) :
         nthreads_(nthreads), weights_(weights) {}

     /// Implementation of iSession
     /// Add roots to the tracked set, then rebuild the per-group
     /// requirements and the set of functors, and extend the parent map
     void track (teq::TensptrsT roots) override
     {
         tracked_.insert(roots.begin(), roots.end());

         // stats are gathered over everything tracked so far
         teq::GraphStat stat;
         for (auto& trac : tracked_)
         {
             trac->accept(stat);
         }
         // parents are only looked up for the new roots,
         // parents_ keeps the entries of earlier calls
         teq::ParentFinder pfinder;
         for (teq::TensptrT& root : roots)
         {
             root->accept(pfinder);
         }

         teq::TensptrsT trackvecs(tracked_.begin(), tracked_.end());
         PartGroupsT groups = k_partition(trackvecs, nthreads_, weights_);
         requirements_.clear();
         requirements_.reserve(groups.size());
         for (auto& group : groups)
         {
             // build the group's requirements in place
             requirements_.emplace_back();
             SessReqsT& reqs = requirements_.back();
             reqs.reserve(group.size());
             for (teq::iFunctor* func : group)
             {
                 auto& args = func->get_children();
                 teq::TensSetT unique_children;
                 for (const teq::FuncArg& arg : args)
                 {
                     auto tens = arg.get_tensor().get();
                     if (0 < stat.graphsize_[tens].upper_) // ignore leaves
                     {
                         unique_children.emplace(tens);
                     }
                 }
                 // a functor is fulfilled once this many children are done
                 reqs.push_back({
                     static_cast<teq::iOperableFunc*>(func),
                     unique_children.size()
                 });
             }
         }

         for (auto& assocs : pfinder.parents_)
         {
             auto& known_parents = parents_[assocs.first];
             for (auto& parent_pair : assocs.second)
             {
                 known_parents.emplace(
                     static_cast<teq::iOperableFunc*>(parent_pair.first));
             }
         }

         // every tensor with a non-zero upper graphsize is kept as a functor
         ops_.clear();
         for (auto& tpair : stat.graphsize_)
         {
             if (tpair.second.upper_ > 0)
             {
                 ops_.emplace(static_cast<teq::iOperableFunc*>(tpair.first));
             }
         }
     }

     /// Implementation of iSession
     /// Update the functors under every tracked root, except the ignored
     void update (teq::TensSetT ignored = {}) override
     {
         teq::TensSetT targets;
         targets.reserve(tracked_.size());
         for (const teq::TensptrT& root : tracked_)
         {
             targets.emplace(root.get());
         }
         update_from(targets, ignored);
     }

     /// Implementation of iSession
     /// Update the functors under the target tensors, except the ignored
     void update_target (teq::TensSetT target,
         teq::TensSetT ignored = {}) override
     {
         update_from(target, ignored);
     }

     /// Apply input optimization rules using opt module, then re-track
     /// NOTE(review): the value returned by opt::optimize is discarded and
     /// the pre-existing roots are re-tracked; confirm this is intended
     void optimize (const opt::OptCtx& rules)
     {
         teq::TensptrsT tracked(tracked_.begin(), tracked_.end());
         opt::optimize(tracked, rules);
         parents_.clear();
         track(tracked);
     }

     /// Set of all tensors input through the track function
     teq::TensptrSetT tracked_;

     /// Map of tensor to the set of the tensor's parents
     std::unordered_map<teq::iTensor*,
         std::unordered_set<teq::iOperableFunc*>> parents_;

     /// One list per group of functors paired with the number of
     /// unique non-leaf children of the functor
     std::vector<SessReqsT> requirements_;

 private:
     /// Shared implementation of update and update_target:
     /// for every group, select the functors reachable from targets
     /// (never descending through ignored), then run each group's selection
     /// as one thread pool task that updates a functor once its fulfilment
     /// count equals its requirement
     void update_from (const teq::TensSetT& targets,
         const teq::TensSetT& ignored)
     {
         size_t ngroups = requirements_.size();
         if (0 == ngroups)
         {
             // nothing was partitioned, so there is nothing to run
             return;
         }

         std::vector<LSessReqsT> indep_requirements(ngroups);
         for (size_t i = 0; i < ngroups; ++i)
         {
             const SessReqsT& reqs = requirements_[i];
             LSessReqsT& indep_reqs = indep_requirements[i];
             // every group starts from the same targets
             // and grows its own copy while walking
             teq::TensSetT acceptable = targets;
             // ignored tensors will never populate reqs
             // walk backwards and push to the front to keep the group order
             for (auto rit = reqs.rbegin(), ret = reqs.rend();
                 rit != ret; ++rit)
             {
                 teq::iOperableFunc* op = rit->first;
                 if (estd::has(acceptable, op) &&
                     false == estd::has(ignored, op))
                 {
                     indep_reqs.push_front({op, rit->second});
                     auto& children = op->get_children();
                     for (auto& child : children)
                     {
                         acceptable.emplace(child.get_tensor().get());
                     }
                 }
             }
         }

         // the map is fully populated here, tasks only look entries up
         AtomicFulfilMapT fulfilments;
         fulfilments.reserve(ops_.size());
         for (teq::iOperableFunc* op : ops_)
         {
             fulfilments.emplace(op, 0);
         }

         // ignored tensors count as already done for their parents
         for (teq::iTensor* ig : ignored)
         {
             auto pit = parents_.find(ig);
             if (parents_.end() != pit)
             {
                 for (teq::iOperableFunc* op_parent : pit->second)
                 {
                     ++fulfilments.at(op_parent);
                 }
             }
         }

         // for each req in requirements distribute to thread
         // NOTE(review): a task visits each functor of its list once,
         // a functor that is not yet fulfilled at that moment is skipped
         // and not revisited; confirm k_partition makes this safe
         boost::asio::thread_pool pool(ngroups);
         for (LSessReqsT& reqs : indep_requirements)
         {
             boost::asio::post(pool,
             [this, &reqs, &fulfilments]()
             {
                 for (auto& req : reqs)
                 {
                     teq::iOperableFunc* op = req.first;
                     std::atomic<long>& ff = fulfilments.at(op);
                     // claim the functor in one atomic step:
                     // only when the count equals the requirement is it
                     // bumped past the requirement, so no other task
                     // ever observes a temporary count
                     long required = static_cast<long>(req.second);
                     if (ff.compare_exchange_strong(required, required + 1))
                     {
                         op->update();
                         auto pit = parents_.find(op);
                         if (parents_.end() != pit)
                         {
                             for (teq::iOperableFunc* op_parent : pit->second)
                             {
                                 ++fulfilments.at(op_parent);
                             }
                         }
                     }
                 }
             });
         }
         pool.join();
     }

     /// Number of groups requested from k_partition
     size_t nthreads_;

     /// Weights forwarded to k_partition
     OpWeightT weights_;

     /// Set of functors found under the tracked tensors
     std::unordered_set<teq::iOperableFunc*> ops_;
 };

 }

 #endif // CCUR_SESS_HPP
csv_to_png.args
args
Definition: csv_to_png.py:105

teq::TensSetT
std::unordered_set< teq::iTensor * > TensSetT
Hash set of raw tensor pointers.
Definition: itensor.hpp:63

teq::GraphStat::graphsize_
std::unordered_map< iTensor *, estd::NumRange< size_t > > graphsize_
Definition: traveler.hpp:105

teq::iOperableFunc
A functor node with direct access to evaluated data.
Definition: iopfunc.hpp:20

ccur::SessReqsT
std::vector< std::pair< teq::iOperableFunc *, size_t > > SessReqsT
Definition: session.hpp:27

ccur::PartGroupsT
std::vector< std::vector< teq::iFunctor * > > PartGroupsT
Groups of functors.
Definition: partition.hpp:20

ccur::Session::nthreads_
size_t nthreads_
Definition: session.hpp:295

teq::iFunctor
Interface of iOperation-defined operation node.
Definition: ifunctor.hpp:28

teq::TensptrSetT
std::unordered_set< teq::TensptrT > TensptrSetT
Hash set of tensor smart pointers.
Definition: itensor.hpp:66

teq::ParentFinder::parents_
std::unordered_map< iTensor *, ParentMapT > parents_
Definition: traveler.hpp:189

opt::optimize
teq::TensptrsT optimize(teq::TensptrsT roots, const OptCtx &opts)

eteq::iSession
Session interface that tracks and rapidly updates subgraphs.
Definition: session.hpp:27

ccur::Session::tracked_
teq::TensptrSetT tracked_
Definition: session.hpp:284

ccur::AtomicFulfilMapT
std::unordered_map< teq::iOperableFunc *, std::atomic< long > > AtomicFulfilMapT
Definition: session.hpp:35

ccur::Session::ops_
std::unordered_set< teq::iOperableFunc * > ops_
Definition: session.hpp:299

session.hpp

teq::ParentFinder
Traveler that for each child tracks the relationship to all parents.
Definition: traveler.hpp:162

teq::FuncArg
Coordinate mapper and tensor pair.
Definition: funcarg.hpp:21

opt::OptCtx
Encapsulation of all conversion rules.
Definition: optimize.hpp:23

teq::GraphStat
Traveler that maps each tensor to its subtree's maximum depth.
Definition: traveler.hpp:57

ccur::Session
Definition: session.hpp:39

ccur
Definition: partition.hpp:16

ccur::Session::parents_
std::unordered_map< teq::iTensor *, std::unordered_set< teq::iOperableFunc * > > parents_
Map of tensor to the set of the tensor's parents.
Definition: session.hpp:288

ccur::k_partition
PartGroupsT k_partition(teq::TensptrsT roots, size_t k, OpWeightT weights=OpWeightT())
Return k groups of graphs under roots given some weight.

ccur::Session::update_target
void update_target(teq::TensSetT target, teq::TensSetT ignored={}) override
Implementation of iSession.
Definition: session.hpp:190

ccur::OpWeightT
std::unordered_map< size_t, double > OpWeightT
Map functor opcode to the operation's weight value.
Definition: partition.hpp:23

teq::TensptrT
std::shared_ptr< iTensor > TensptrT
Tensor smart pointer.
Definition: itensor.hpp:51

teq::TensptrsT
std::vector< TensptrT > TensptrsT
Vector of tensor smart pointers.
Definition: itensor.hpp:60

teq::iTensor
Interface of traversible and differentiable nodes with shape information.
Definition: itensor.hpp:36

ccur::Session::track
void track(teq::TensptrsT roots) override
Implementation of iSession.
Definition: session.hpp:45

partition.hpp

ccur::Session::update
void update(teq::TensSetT ignored={}) override
Implementation of iSession.
Definition: session.hpp:107

ccur::LSessReqsT
std::list< std::pair< teq::iOperableFunc *, size_t > > LSessReqsT
Same as SessReqsT except as a list.
Definition: session.hpp:30

ccur::Session::weights_
OpWeightT weights_
Definition: session.hpp:297

ccur::Session::requirements_
std::vector< SessReqsT > requirements_
Definition: session.hpp:292

ccur::Session::optimize
void optimize(const opt::OptCtx &rules)
Apply input optimization rules using opt module, then re-track.
Definition: session.hpp:274

ccur::Session::Session
Session(size_t nthreads=2, OpWeightT weights=OpWeightT())
Definition: session.hpp:41