コード例 #1
0
  /**
   * Translates this distinct operation into a {@code GroupReduceOperatorBase} that applies a
   * {@code DistinctFunction} to the given input.
   *
   * <p>For expression keys the operator is built directly on the logical key positions, marked
   * combinable, and (when {@code getType()} is a tuple type) annotated so that every key field is
   * declared as forwarded to the same position. For selector-function keys the construction is
   * delegated to {@code translateSelectorFunctionDistinct}.
   *
   * @param input the operator whose output is consumed by the distinct operator
   * @return the operator implementing the distinct operation
   * @throws UnsupportedOperationException if the keys are neither expression keys nor
   *     selector-function keys
   */
  @Override
  protected org.apache.flink.api.common.operators.base.GroupReduceOperatorBase<?, T, ?>
      translateToDataFlow(Operator<T> input) {

    final RichGroupReduceFunction<T, T> function = new DistinctFunction<T>();

    // an explicitly set name wins over the generated "Distinct at ..." name
    String name = getName() != null ? getName() : "Distinct at " + distinctLocationName;

    if (keys instanceof Keys.ExpressionKeys) {

      // computed once and reused below for the forwarded-field annotations
      int[] logicalKeyPositions = keys.computeLogicalKeyPositions();
      UnaryOperatorInformation<T, T> operatorInfo =
          new UnaryOperatorInformation<T, T>(getInputType(), getResultType());
      GroupReduceOperatorBase<T, T, GroupReduceFunction<T, T>> po =
          new GroupReduceOperatorBase<T, T, GroupReduceFunction<T, T>>(
              function, operatorInfo, logicalKeyPositions, name);

      po.setCombinable(true);
      po.setInput(input);
      po.setDegreeOfParallelism(getParallelism());

      // make sure that distinct preserves the partitioning for the fields on which they operate
      if (getType().isTupleType()) {
        SingleInputSemanticProperties sProps = new SingleInputSemanticProperties();

        // each key field is forwarded unchanged to the same position in the output
        for (int field : logicalKeyPositions) {
          sProps.addForwardedField(field, field);
        }

        po.setSemanticProperties(sProps);
      }

      return po;
    } else if (keys instanceof Keys.SelectorFunctionKeys) {

      @SuppressWarnings("unchecked")
      Keys.SelectorFunctionKeys<T, ?> selectorKeys = (Keys.SelectorFunctionKeys<T, ?>) keys;

      PlanUnwrappingReduceGroupOperator<T, T, ?> po =
          translateSelectorFunctionDistinct(
              selectorKeys, function, getInputType(), getResultType(), name, input);

      po.setDegreeOfParallelism(this.getParallelism());

      return po;
    } else {
      throw new UnsupportedOperationException("Unrecognized key type.");
    }
  }
コード例 #2
0
  /**
   * Translates this partition operation into the corresponding common-API operator.
   *
   * <p>{@code REBALANCE} yields a key-less {@code PartitionOperatorBase}. {@code HASH} and
   * {@code CUSTOM} yield either a {@code PartitionOperatorBase} on the logical key positions
   * (expression keys) or the operator produced by {@code translateSelectorFunctionPartitioner}
   * (selector-function keys). Every other partition method is rejected.
   *
   * @param input the operator whose output is to be partitioned
   * @return the operator implementing the partitioning
   * @throws UnsupportedOperationException if the partition method is {@code RANGE} or otherwise
   *     unsupported, or if the key type is not recognized
   */
  protected org.apache.flink.api.common.operators.SingleInputOperator<?, T, ?> translateToDataFlow(
      Operator<T> input) {

    final String operatorName = "Partition at " + partitionLocationName;

    // rebalancing does not need any key information
    if (pMethod == PartitionMethod.REBALANCE) {
      final UnaryOperatorInformation<T, T> typeInfo =
          new UnaryOperatorInformation<T, T>(getType(), getType());
      final PartitionOperatorBase<T> rebalancer =
          new PartitionOperatorBase<T>(typeInfo, pMethod, operatorName);

      rebalancer.setInput(input);
      rebalancer.setParallelism(getParallelism());
      return rebalancer;
    }

    // reject everything that is not key-based (hash or custom) partitioning
    if (pMethod == PartitionMethod.RANGE) {
      throw new UnsupportedOperationException("Range partitioning not yet supported");
    }
    if (pMethod != PartitionMethod.HASH && pMethod != PartitionMethod.CUSTOM) {
      throw new UnsupportedOperationException("Unsupported partitioning method: " + pMethod.name());
    }

    // key-based partitioning on field positions
    if (pKeys instanceof Keys.ExpressionKeys) {
      final int[] keyPositions = pKeys.computeLogicalKeyPositions();
      final UnaryOperatorInformation<T, T> typeInfo =
          new UnaryOperatorInformation<T, T>(getType(), getType());
      final PartitionOperatorBase<T> keyedPartitioner =
          new PartitionOperatorBase<T>(typeInfo, pMethod, keyPositions, operatorName);

      keyedPartitioner.setInput(input);
      keyedPartitioner.setParallelism(getParallelism());
      keyedPartitioner.setCustomPartitioner(customPartitioner);
      return keyedPartitioner;
    }

    // key-based partitioning through a key selector function
    if (pKeys instanceof Keys.SelectorFunctionKeys) {
      @SuppressWarnings("unchecked")
      final Keys.SelectorFunctionKeys<T, ?> keyExtractor =
          (Keys.SelectorFunctionKeys<T, ?>) pKeys;
      final MapOperatorBase<?, T, ?> wrappedPartitioner =
          translateSelectorFunctionPartitioner(
              keyExtractor,
              pMethod,
              getType(),
              operatorName,
              input,
              getParallelism(),
              customPartitioner);
      return wrappedPartitioner;
    }

    throw new UnsupportedOperationException("Unrecognized key type.");
  }