d4/d36/_advanced_physical_node_factory_8cc_source.html

 /*****************************************************************************

  *                                                                           *

  *  Copyright 2018 Rice University                                           *

  *                                                                           *

  *  Licensed under the Apache License, Version 2.0 (the "License");          *

  *  you may not use this file except in compliance with the License.         *

  *  You may obtain a copy of the License at                                  *

  *                                                                           *

  *      http://www.apache.org/licenses/LICENSE-2.0                           *

  *                                                                           *

  *  Unless required by applicable law or agreed to in writing, software      *

  *  distributed under the License is distributed on an "AS IS" BASIS,        *

  *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. *

  *  See the License for the specific language governing permissions and      *

  *  limitations under the License.                                           *

  *                                                                           *

  *****************************************************************************/


 #include "AdvancedPhysicalOptimizer/AdvancedPhysicalNodeFactory.h"

 #include "AdvancedPhysicalOptimizer/Pipes/AdvancedPhysicalAggregationPipe.h"

 #include "AdvancedPhysicalOptimizer/Pipes/AdvancedPhysicalJoinSidePipe.h"

 #include "AdvancedPhysicalOptimizer/Pipes/AdvancedPhysicalStraightPipe.h"


 namespace pdb {


 /**
  * Creates a node factory for one job.
  *
  * @param jobId       identifier of the job; copied into the jobId member
  * @param computePlan compute plan handed on to the AbstractPhysicalNodeFactory base constructor
  * @param conf        configuration pointer; copied into the conf member
  *
  * The running node index (currentNodeIndex) starts at zero.
  */
 AdvancedPhysicalNodeFactory::AdvancedPhysicalNodeFactory(const string &jobId,
                                                          const Handle<ComputePlan> &computePlan,
                                                          const ConfigurationPtr &conf)
     : AbstractPhysicalNodeFactory(computePlan),
       jobId(jobId),
       conf(conf),
       currentNodeIndex(0) {
 }


 /**
  * Builds the physical pipeline graph reachable from the given source computations.
  *
  * For every (source, direct consumer) pair the current pipe is seeded with both
  * computations and the graph is then walked from the consumer onwards by
  * transverseTCAPGraph. Once all sources are processed the generated pipes are
  * linked to each other by connectThePipes.
  *
  * @param sources the atomic computations to start from
  * @return the physicalSourceNodes member as it stands after the traversal
  */
 vector<AbstractPhysicalNodePtr> AdvancedPhysicalNodeFactory::generateAnalyzerGraph(std::vector<AtomicComputationPtr> sources) {

   for(const AtomicComputationPtr &sourceComputation : sources) {

     // print the type of the source we are about to process
     std::cout << sourceComputation->getAtomicComputationType() << std::endl;

     // everything that directly reads the output of this source
     const auto &directConsumers = computationGraph.getConsumingAtomicComputations(sourceComputation->getOutputName());

     for(const auto &firstConsumer : directConsumers) {

       // every pipe that hangs off a source begins with the source itself followed by its consumer
       currentPipe.push_back(sourceComputation);
       currentPipe.push_back(firstConsumer);

       // walk the rest of the graph starting at that consumer
       transverseTCAPGraph(firstConsumer);
     }
   }

   // wire the generated pipes to the pipes that consume them
   connectThePipes();

   // hand back the source nodes that were generated
   return this->physicalSourceNodes;
 }


 /**
  * Recursively walks the TCAP graph from curNode and cuts it into pipelines.
  *
  * The caller is expected to have already appended curNode to currentPipe.
  * Depending on the type of curNode the pipe collected so far is turned into a
  * physical pipeline (through createPhysicalPipeline, defined elsewhere) and
  * currentPipe is emptied:
  *   - HashOne / HashLeft / HashRight -> AdvancedPhysicalJoinSidePipe
  *   - ApplyAgg                       -> AdvancedPhysicalAggregationPipe
  *   - WriteSet                       -> AdvancedPhysicalStraightPipe, unless the
  *                                       write set is the only thing in the pipe,
  *                                       in which case the pipe is dropped
  *   - any node with more than one consumer while the pipe is not empty
  *                                    -> AdvancedPhysicalStraightPipe
  *
  * A node that was already visited ends the walk and discards the current pipe.
  *
  * @param curNode the atomic computation to process
  */
 void AdvancedPhysicalNodeFactory::transverseTCAPGraph(AtomicComputationPtr curNode) {

   // mark the node as visited; insert() reports through .second whether it was new,
   // so a node we have seen before is detected with a single lookup
   if(!visitedNodes.insert(curNode).second) {

     // already handled from another path, drop whatever we collected and stop
     currentPipe.clear();
     return;
   }

   // check whether the type of this node makes it a pipeline breaker
   switch (curNode->getAtomicComputationTypeID()) {

     case HashOneTypeID:
     case HashLeftTypeID:
     case HashRightTypeID: {

       // we got a hash operation, create a join side pipe
       createPhysicalPipeline<AdvancedPhysicalJoinSidePipe>();
       currentPipe.clear();
       break;
     }
     case ApplyAggTypeID: {

       // we got an aggregation, so we need to create an aggregation pipe
       createPhysicalPipeline<AdvancedPhysicalAggregationPipe>();
       currentPipe.clear();
       break;
     }
     case WriteSetTypeID: {

       // a pipe that consists of nothing but this write set (e.g. a write set that
       // directly follows an aggregation) is skipped, no pipe is created for it
       if(currentPipe.size() == 1) {
         currentPipe.clear();
         return;
       }

       // otherwise the write set is where the pipe ends
       createPhysicalPipeline<AdvancedPhysicalStraightPipe>();
       currentPipe.clear();

       // explicit break: do not rely on falling through into the default label
       break;
     }
     default: {

       // every other type is not a pipeline breaker by itself
       break;
     }
   }

   // grab all the consumers; the accessor returns a reference, so this is a private copy
   // that stays stable while the recursion below performs further lookups
   auto consumers = computationGraph.getConsumingAtomicComputations(curNode->getOutputName());

   // a node with several consumers breaks the pipe if there is still something in it
   if(consumers.size() > 1 && !currentPipe.empty()) {
     createPhysicalPipeline<AdvancedPhysicalStraightPipe>();
     currentPipe.clear();
   }

   // continue the walk through every consumer, each one is appended to the pipe first
   for(const auto &consumer : consumers) {
     currentPipe.push_back(consumer);
     transverseTCAPGraph(consumer);
   }
 }


 /**
  * Records which atomic computations consume the output of the given pipe.
  *
  * The consumers are looked up for the last computation in currentPipe. Their
  * output names are stored in consumedBy under the identifier of the node.
  * Consumers that are write sets are not recorded; their output name is printed
  * instead. Nothing is stored when no consumer remains.
  *
  * @param node the pipe whose identifier is used as the key in consumedBy
  */
 void AdvancedPhysicalNodeFactory::setConsumers(shared_ptr<AdvancedPhysicalAbstractPipe> node) {

   // output names of the computations that read from the end of the current pipe
   std::vector<std::string> downstreamNames;

   // the computation the current pipe ends with
   const auto &pipeTail = this->currentPipe.back();

   for(const auto &next : computationGraph.getConsumingAtomicComputations(pipeTail->getOutputName())) {

     // anything that is not a write set is a real consumer of this pipe
     if(next->getAtomicComputationTypeID() != WriteSetTypeID) {
       downstreamNames.push_back(next->getOutputName());
       continue;
     }

     // a pipe that would begin with a write set is ignored, this usually happens when
     // an aggregation is connected to a write set; we just print its name
     std::cout << next->getOutputName() << std::endl;
   }

   // nothing to remember if there are no consumers
   if(downstreamNames.empty()) {
     return;
   }

   this->consumedBy[node->getNodeIdentifier()] = downstreamNames;
 }


 /**
  * Links every generated pipe to the pipes that consume its output.
  *
  * For each entry in physicalNodes the names recorded in consumedBy are resolved
  * through startsWith to the pipe registered under that name, and that pipe is
  * added as a consumer of the node. Each (producer output, consumer name) pair is
  * printed while doing so.
  *
  * Both maps are queried with find(), so a pipe without recorded consumers or a
  * consumer name without a registered pipe does not insert an empty entry into
  * the maps, and no null pipe is ever handed to addConsumer.
  */
 void AdvancedPhysicalNodeFactory::connectThePipes() {

   // iterate by reference, copying the entry would copy the key and the shared pointer every time
   for(const auto &node : physicalNodes) {

     // get all the consumers of this pipe, pipes without consumers have no entry
     const auto consumersIt = consumedBy.find(node.second->getNodeIdentifier());
     if(consumersIt == consumedBy.end()) {
       continue;
     }

     // go through each atomic computation that consumes this pipe
     for(const auto &atomicComputation : consumersIt->second) {

       std::cout << node.second->getPipeComputations().back()->getOutputName() << ":" << atomicComputation << std::endl;

       // get the consuming pipeline, skip the name if no pipeline is registered for it
       const auto pipeIt = startsWith.find(atomicComputation);
       if(pipeIt == startsWith.end()) {
         continue;
       }

       // add the consuming node of this pipe
       node.second->addConsumer(pipeIt->second);
     }
   }
 }


 }

pdb::AdvancedPhysicalNodeFactory::physicalSourceNodes
std::vector< AbstractPhysicalNodePtr > physicalSourceNodes
Definition: AdvancedPhysicalNodeFactory.h:135

HashLeftTypeID
Definition: AtomicComputation.h:42

AdvancedPhysicalJoinSidePipe.h

pdb::AdvancedPhysicalNodeFactory::consumedBy
std::map< std::string, std::vector< std::string > > consumedBy
Definition: AdvancedPhysicalNodeFactory.h:146

pdb::AdvancedPhysicalNodeFactory::connectThePipes
void connectThePipes()
Definition: AdvancedPhysicalNodeFactory.cc:159

pdb::AdvancedPhysicalNodeFactory::AdvancedPhysicalNodeFactory
AdvancedPhysicalNodeFactory(const string &jobId, const Handle< ComputePlan > &computePlan, const ConfigurationPtr &conf)
Definition: AdvancedPhysicalNodeFactory.cc:26

pdb::AdvancedPhysicalNodeFactory::physicalNodes
std::map< std::string, AdvancedPhysicalPipelineNodePtr > physicalNodes
Definition: AdvancedPhysicalNodeFactory.h:130

pdb::AbstractPhysicalNodeFactory
Definition: AbstractPhysicalNodeFactory.h:30

pdb::AdvancedPhysicalNodeFactory::startsWith
std::map< std::string, AdvancedPhysicalPipelineNodePtr > startsWith
Definition: AdvancedPhysicalNodeFactory.h:141

pdb::AdvancedPhysicalNodeFactory::visitedNodes
std::set< AtomicComputationPtr > visitedNodes
Definition: AdvancedPhysicalNodeFactory.h:120

AdvancedPhysicalAggregationPipe.h

pdb::AdvancedPhysicalNodeFactory::transverseTCAPGraph
void transverseTCAPGraph(AtomicComputationPtr curNode)
Definition: AdvancedPhysicalNodeFactory.cc:60

ApplyAggTypeID
Definition: AtomicComputation.h:47

pdb::AdvancedPhysicalNodeFactory::currentPipe
std::vector< AtomicComputationPtr > currentPipe
Definition: AdvancedPhysicalNodeFactory.h:125

WriteSetTypeID
Definition: AtomicComputation.h:49

AdvancedPhysicalStraightPipe.h

AtomicComputationList::getConsumingAtomicComputations
std::vector< AtomicComputationPtr > & getConsumingAtomicComputations(std::string inputName)
Definition: AtomicComputationList.cc:36

pdb::AdvancedPhysicalNodeFactory::setConsumers
void setConsumers(shared_ptr< AdvancedPhysicalAbstractPipe > node)
Definition: AdvancedPhysicalNodeFactory.cc:134

pdb::AdvancedPhysicalNodeFactory::generateAnalyzerGraph
vector< AbstractPhysicalNodePtr > generateAnalyzerGraph(std::vector< AtomicComputationPtr > sources) override
Definition: AdvancedPhysicalNodeFactory.cc:32

pdb::AbstractPhysicalNodeFactory::computationGraph
AtomicComputationList computationGraph
Definition: AbstractPhysicalNodeFactory.h:61

ConfigurationPtr
shared_ptr< Configuration > ConfigurationPtr
Definition: Configuration.h:89

AtomicComputationPtr
std::shared_ptr< struct AtomicComputation > AtomicComputationPtr
Definition: AtomicComputation.h:36

HashOneTypeID
Definition: AtomicComputation.h:44

AdvancedPhysicalNodeFactory.h

HashRightTypeID
Definition: AtomicComputation.h:43

pdb::Handle
Definition: Allocator.h:399