Exemplo n.º 1
0
  private void setPartitionConstraintsDFS(
      OperatorDescriptorId opId,
      Map<IConnectorDescriptor, TargetConstraint> tgtConstraints,
      IOperatorDescriptor parentOp) {
    List<IConnectorDescriptor> opInputs = jobSpec.getOperatorInputMap().get(opId);
    AlgebricksPartitionConstraint opConstraint = null;
    IOperatorDescriptor opDesc = jobSpec.getOperatorMap().get(opId);
    if (opInputs != null) {
      for (IConnectorDescriptor conn : opInputs) {
        ConnectorDescriptorId cid = conn.getConnectorId();
        org.apache.commons.lang3.tuple.Pair<
                org.apache.commons.lang3.tuple.Pair<IOperatorDescriptor, Integer>,
                org.apache.commons.lang3.tuple.Pair<IOperatorDescriptor, Integer>>
            p = jobSpec.getConnectorOperatorMap().get(cid);
        IOperatorDescriptor src = p.getLeft().getLeft();
        // DFS
        setPartitionConstraintsDFS(src.getOperatorId(), tgtConstraints, opDesc);

        TargetConstraint constraint = tgtConstraints.get(conn);
        if (constraint != null) {
          switch (constraint) {
            case ONE:
              {
                opConstraint = new AlgebricksCountPartitionConstraint(1);
                break;
              }
            case SAME_COUNT:
              {
                opConstraint = partitionConstraintMap.get(src);
                break;
              }
          }
        }
      }
    }
    if (partitionConstraintMap.get(opDesc) == null) {
      if (opConstraint == null) {
        if (parentOp != null) {
          AlgebricksPartitionConstraint pc = partitionConstraintMap.get(parentOp);
          if (pc != null) {
            opConstraint = pc;
          } else if (opInputs == null || opInputs.size() == 0) {
            opConstraint = new AlgebricksCountPartitionConstraint(1);
          }
        }
        if (opConstraint == null) {
          opConstraint = clusterLocations;
        }
      }
      partitionConstraintMap.put(opDesc, opConstraint);
      AlgebricksPartitionConstraintHelper.setPartitionConstraintInJobSpec(
          jobSpec, opDesc, opConstraint);
    }
  }
  /**
   * rewrite an activity cluster internally
   *
   * @param ac the activity cluster to be rewritten
   */
  private void rewriteIntraActivityCluster(
      ActivityCluster ac, Map<IActivity, SuperActivity> invertedActivitySuperActivityMap) {
    Map<ActivityId, IActivity> activities = ac.getActivityMap();
    Map<ActivityId, List<IConnectorDescriptor>> activityInputMap = ac.getActivityInputMap();
    Map<ActivityId, List<IConnectorDescriptor>> activityOutputMap = ac.getActivityOutputMap();
    Map<ConnectorDescriptorId, Pair<Pair<IActivity, Integer>, Pair<IActivity, Integer>>>
        connectorActivityMap = ac.getConnectorActivityMap();
    ActivityClusterGraph acg = ac.getActivityClusterGraph();
    Map<ActivityId, IActivity> startActivities = new HashMap<ActivityId, IActivity>();
    Map<ActivityId, SuperActivity> superActivities = new HashMap<ActivityId, SuperActivity>();
    Map<ActivityId, Queue<IActivity>> toBeExpendedMap = new HashMap<ActivityId, Queue<IActivity>>();

    /** Build the initial super activities */
    for (Entry<ActivityId, IActivity> entry : activities.entrySet()) {
      ActivityId activityId = entry.getKey();
      IActivity activity = entry.getValue();
      if (activityInputMap.get(activityId) == null) {
        startActivities.put(activityId, activity);
        /** use the start activity's id as the id of the super activity */
        createNewSuperActivity(
            ac,
            superActivities,
            toBeExpendedMap,
            invertedActivitySuperActivityMap,
            activityId,
            activity);
      }
    }

    /**
     * expand one-to-one connected activity cluster by the BFS order. after the while-loop, the
     * original activities are partitioned into equivalent classes, one-per-super-activity.
     */
    Map<ActivityId, SuperActivity> clonedSuperActivities = new HashMap<ActivityId, SuperActivity>();
    while (toBeExpendedMap.size() > 0) {
      clonedSuperActivities.clear();
      clonedSuperActivities.putAll(superActivities);
      for (Entry<ActivityId, SuperActivity> entry : clonedSuperActivities.entrySet()) {
        ActivityId superActivityId = entry.getKey();
        SuperActivity superActivity = entry.getValue();

        /** for the case where the super activity has already been swallowed */
        if (superActivities.get(superActivityId) == null) {
          continue;
        }

        /** expend the super activity */
        Queue<IActivity> toBeExpended = toBeExpendedMap.get(superActivityId);
        if (toBeExpended == null) {
          /** Nothing to expand */
          continue;
        }
        IActivity expendingActivity = toBeExpended.poll();
        List<IConnectorDescriptor> outputConnectors =
            activityOutputMap.get(expendingActivity.getActivityId());
        if (outputConnectors != null) {
          for (IConnectorDescriptor outputConn : outputConnectors) {
            Pair<Pair<IActivity, Integer>, Pair<IActivity, Integer>> endPoints =
                connectorActivityMap.get(outputConn.getConnectorId());
            IActivity newActivity = endPoints.getRight().getLeft();
            SuperActivity existingSuperActivity = invertedActivitySuperActivityMap.get(newActivity);
            if (outputConn.getClass().getName().contains(ONE_TO_ONE_CONNECTOR)) {
              /** expend the super activity cluster on an one-to-one out-bound connection */
              if (existingSuperActivity == null) {
                superActivity.addActivity(newActivity);
                toBeExpended.add(newActivity);
                invertedActivitySuperActivityMap.put(newActivity, superActivity);
              } else {
                /** the two activities already in the same super activity */
                if (existingSuperActivity == superActivity) {
                  continue;
                }
                /** swallow an existing super activity */
                swallowExistingSuperActivity(
                    superActivities,
                    toBeExpendedMap,
                    invertedActivitySuperActivityMap,
                    superActivity,
                    superActivityId,
                    existingSuperActivity);
              }
            } else {
              if (existingSuperActivity == null) {
                /** create new activity */
                createNewSuperActivity(
                    ac,
                    superActivities,
                    toBeExpendedMap,
                    invertedActivitySuperActivityMap,
                    newActivity.getActivityId(),
                    newActivity);
              }
            }
          }
        }

        /** remove the to-be-expended queue if it is empty */
        if (toBeExpended.size() == 0) {
          toBeExpendedMap.remove(superActivityId);
        }
      }
    }

    Map<ConnectorDescriptorId, IConnectorDescriptor> connMap = ac.getConnectorMap();
    Map<ConnectorDescriptorId, RecordDescriptor> connRecordDesc =
        ac.getConnectorRecordDescriptorMap();
    Map<SuperActivity, Integer> superActivityProducerPort = new HashMap<SuperActivity, Integer>();
    Map<SuperActivity, Integer> superActivityConsumerPort = new HashMap<SuperActivity, Integer>();
    for (Entry<ActivityId, SuperActivity> entry : superActivities.entrySet()) {
      superActivityProducerPort.put(entry.getValue(), 0);
      superActivityConsumerPort.put(entry.getValue(), 0);
    }

    /** create a new activity cluster to replace the old activity cluster */
    ActivityCluster newActivityCluster = new ActivityCluster(acg, ac.getId());
    newActivityCluster.setConnectorPolicyAssignmentPolicy(ac.getConnectorPolicyAssignmentPolicy());
    for (Entry<ActivityId, SuperActivity> entry : superActivities.entrySet()) {
      newActivityCluster.addActivity(entry.getValue());
      acg.getActivityMap().put(entry.getKey(), newActivityCluster);
    }

    /** Setup connectors: either inside a super activity or among super activities */
    for (Entry<ConnectorDescriptorId, Pair<Pair<IActivity, Integer>, Pair<IActivity, Integer>>>
        entry : connectorActivityMap.entrySet()) {
      ConnectorDescriptorId connectorId = entry.getKey();
      Pair<Pair<IActivity, Integer>, Pair<IActivity, Integer>> endPoints = entry.getValue();
      IActivity producerActivity = endPoints.getLeft().getLeft();
      IActivity consumerActivity = endPoints.getRight().getLeft();
      int producerPort = endPoints.getLeft().getRight();
      int consumerPort = endPoints.getRight().getRight();
      RecordDescriptor recordDescriptor = connRecordDesc.get(connectorId);
      IConnectorDescriptor conn = connMap.get(connectorId);
      if (conn.getClass().getName().contains(ONE_TO_ONE_CONNECTOR)) {
        /** connection edge between inner activities */
        SuperActivity residingSuperActivity =
            invertedActivitySuperActivityMap.get(producerActivity);
        residingSuperActivity.connect(
            conn, producerActivity, producerPort, consumerActivity, consumerPort, recordDescriptor);
      } else {
        /** connection edge between super activities */
        SuperActivity producerSuperActivity =
            invertedActivitySuperActivityMap.get(producerActivity);
        SuperActivity consumerSuperActivity =
            invertedActivitySuperActivityMap.get(consumerActivity);
        int producerSAPort = superActivityProducerPort.get(producerSuperActivity);
        int consumerSAPort = superActivityConsumerPort.get(consumerSuperActivity);
        newActivityCluster.addConnector(conn);
        newActivityCluster.connect(
            conn,
            producerSuperActivity,
            producerSAPort,
            consumerSuperActivity,
            consumerSAPort,
            recordDescriptor);

        /** bridge the port */
        producerSuperActivity.setClusterOutputIndex(
            producerSAPort, producerActivity.getActivityId(), producerPort);
        consumerSuperActivity.setClusterInputIndex(
            consumerSAPort, consumerActivity.getActivityId(), consumerPort);
        acg.getConnectorMap().put(connectorId, newActivityCluster);

        /** increasing the port number for the producer and consumer */
        superActivityProducerPort.put(producerSuperActivity, ++producerSAPort);
        superActivityConsumerPort.put(consumerSuperActivity, ++consumerSAPort);
      }
    }

    /** Set up the roots of the new activity cluster */
    for (Entry<ActivityId, SuperActivity> entry : superActivities.entrySet()) {
      List<IConnectorDescriptor> connIds =
          newActivityCluster.getActivityOutputMap().get(entry.getKey());
      if (connIds == null || connIds.size() == 0) {
        newActivityCluster.addRoot(entry.getValue());
      }
    }

    /**
     * set up the blocked2Blocker mapping, which will be updated in the rewriteInterActivityCluster
     * call
     */
    newActivityCluster.getBlocked2BlockerMap().putAll(ac.getBlocked2BlockerMap());

    /** replace the old activity cluster with the new activity cluster */
    acg.getActivityClusterMap().put(ac.getId(), newActivityCluster);
  }