/**
 * Drops the references to the in-memory lookup structures held by the {@code data} field and
 * then delegates to the superclass.
 *
 * <p>NOTE(review): the closing brace of this method is not present in this view of the file;
 * the code lines below are reproduced unchanged.
 *
 * @param smi step metadata, passed through to {@code super.dispose}
 * @param sdi step data, passed through to {@code super.dispose}
 */
public void dispose(StepMetaInterface smi, StepDataInterface sdi) {
    // Recover memory immediately, allow in-memory data to be garbage collected
    // These are the four containers that addToCache() writes to.
    data.look = null;
    data.list = null;
    data.hashIndex = null;
    data.longIndex = null;

    // Note: the fields cleared above belong to the `data` member, not to the `sdi` argument.
    super.dispose(smi, sdi);
  /**
   * Stores one key/value pair read from the lookup stream in the container selected by the step
   * settings. Judging by the indentation (several closing braces are missing from this view),
   * the branches are:
   *
   * <ul>
   *   <li>memory preservation active, sorted list: binary-search {@code data.list} and either
   *       insert at the insertion point or overwrite the existing equal entry;
   *   <li>memory preservation active, integer pair: store the single key and single value as
   *       {@code Long}s in {@code data.longIndex}, after a one-time metadata check;
   *   <li>memory preservation active, otherwise: {@code data.hashIndex}, created on first use;
   *   <li>memory preservation inactive: {@code data.look}, keyed by a {@code RowMetaAndData}
   *       wrapper around the key row.
   * </ul>
   *
   * <p>NOTE(review): the message-lookup call inside the {@code throw} and the call that writes
   * into {@code data.hashIndex} are truncated in this view; only their argument lists remain.
   *
   * @param keyMeta metadata describing {@code keyData}
   * @param keyData the key values of the lookup row
   * @param valueMeta metadata describing {@code valueData}
   * @param valueData the values to return when the key is found
   * @throws KettleValueException when the integer-pair algorithm is selected but key or value is
   *     not exactly one integer field
   */
  private void addToCache(
      RowMetaInterface keyMeta, Object[] keyData, RowMetaInterface valueMeta, Object[] valueData)
      throws KettleValueException {
    if (meta.isMemoryPreservationActive()) {
      if (meta.isUsingSortedList()) {
        KeyValue keyValue = new KeyValue(keyData, valueData);
        // A negative result from binarySearch encodes the insertion point as (-(point) - 1).
        int idx = Collections.binarySearch(data.list, keyValue, data.comparator);
        if (idx < 0) {
          int index = -idx - 1; // this is the insertion point
          data.list.add(index, keyValue); // insert to keep sorted.
        } else {
          data.list.set(idx, keyValue); // Overwrite to simulate Hashtable behaviour
      } else {
        if (meta.isUsingIntegerPair()) {
          // The flag is set before the check, so the verification is attempted only once.
          if (!data.metadataVerifiedIntegerPair) {
            data.metadataVerifiedIntegerPair = true;
            // Requires exactly one integer key field and exactly one integer value field.
            if (keyMeta.size() != 1
                || valueMeta.size() != 1
                || !keyMeta.getValueMeta(0).isInteger()
                || !valueMeta.getValueMeta(0).isInteger()) {

              throw new KettleValueException(
                      PKG, "StreamLookup.Exception.CanNotUseIntegerPairAlgorithm"));

          Long key = keyMeta.getInteger(keyData, 0);
          Long value = valueMeta.getInteger(valueData, 0);
          data.longIndex.put(key, value);
        } else {
          // Lazily create the hash index from the key metadata of the first row stored.
          if (data.hashIndex == null) {
            data.hashIndex = new ByteArrayHashIndex(keyMeta);
              RowMeta.extractData(keyMeta, keyData), RowMeta.extractData(valueMeta, valueData));
    } else {
      // We can't just put Object[] in the map
      // The compare function is not in it.
      // We need to wrap in and use that.
      // Let's use RowMetaAndData for this one.
      data.look.put(new RowMetaAndData(keyMeta, keyData), valueData);
  /**
   * Stores the cast step metadata and step data in the {@code meta} and {@code data} fields and,
   * when the superclass initialises successfully, flags that the lookup values still have to be
   * read.
   *
   * <p>NOTE(review): the closing braces of the {@code if} and of the method are not present in
   * this view; {@code return false} is presumably the path taken when {@code super.init} fails.
   *
   * @param smi step metadata; cast to {@code StreamLookupMeta}
   * @param sdi step data; cast to {@code StreamLookupData}
   * @return {@code true} when {@code super.init} succeeds
   */
  public boolean init(StepMetaInterface smi, StepDataInterface sdi) {
    meta = (StreamLookupMeta) smi;
    data = (StreamLookupData) sdi;

    if (super.init(smi, sdi)) {
      // processRow() checks this flag and loads the lookup stream when it is set.
      data.readLookupValues = true;

      return true;
    return false;
  /**
   * Builds {@code data.nullIf}, the array of default values that {@code lookupValues} appends
   * to a row when no lookup match is found. One entry is produced per configured return value
   * by converting the default string from the step metadata to the configured default type.
   *
   * <p>Visible conversions: STRING (empty string becomes {@code null}), DATE, NUMBER, INTEGER,
   * BOOLEAN ({@code "TRUE"} or {@code "Y"}, case-insensitive, give {@code Boolean.TRUE}) and
   * BIGNUMBER. The trailing section throws a {@code RuntimeException} when a non-blank default
   * is given for a type with no conversion, and otherwise stores {@code null}.
   *
   * <p>NOTE(review): the {@code catch} bodies, any {@code break} statements, the
   * {@code default:} label and all closing braces are missing from this view. What happens
   * after a failed parse, and whether cases fall through, cannot be determined from here.
   */
  private void handleNullIf() {
    data.nullIf = new Object[meta.getValue().length];

    for (int i = 0; i < meta.getValue().length; i++) {
      // A negative type code is replaced by TYPE_STRING. Note that this writes back into the
      // array returned by meta.getValueDefaultType().
      if (meta.getValueDefaultType()[i] < 0) {
        // logError("unknown default value type: "+dtype+" for value "+value[i]+", default to type:
        // String!");
        meta.getValueDefaultType()[i] = ValueMetaInterface.TYPE_STRING;
      data.nullIf[i] = null;
      switch (meta.getValueDefaultType()[i]) {
        case ValueMetaInterface.TYPE_STRING:
          if (Const.isEmpty(meta.getValueDefault()[i])) {
            data.nullIf[i] = null;
          } else {
            data.nullIf[i] = meta.getValueDefault()[i];
        case ValueMetaInterface.TYPE_DATE:
          // NOTE(review): DateFormat.getInstance() is the JDK's default short date/time
          // formatter, so the accepted input format presumably depends on the JVM default
          // locale - confirm this is intended.
          try {
            data.nullIf[i] = DateFormat.getInstance().parse(meta.getValueDefault()[i]);
          } catch (Exception e) {
        case ValueMetaInterface.TYPE_NUMBER:
          // NOTE(review): the Double(double) constructor is deprecated in recent JDKs;
          // Double.valueOf would be the replacement.
          try {
            data.nullIf[i] = new Double(Double.parseDouble(meta.getValueDefault()[i]));
          } catch (Exception e) {
        case ValueMetaInterface.TYPE_INTEGER:
          // NOTE(review): the Long(long) constructor is deprecated in recent JDKs;
          // Long.valueOf would be the replacement.
          try {
            data.nullIf[i] = new Long(Long.parseLong(meta.getValueDefault()[i]));
          } catch (Exception e) {
        case ValueMetaInterface.TYPE_BOOLEAN:
          // Any default other than "TRUE"/"Y" (including null) yields Boolean.FALSE.
          if ("TRUE".equalsIgnoreCase(meta.getValueDefault()[i])
              || //$NON-NLS-1$
              "Y".equalsIgnoreCase(meta.getValueDefault()[i])) // $NON-NLS-1$
          data.nullIf[i] = Boolean.TRUE;
          else data.nullIf[i] = Boolean.FALSE;
        case ValueMetaInterface.TYPE_BIGNUMBER:
          try {
            data.nullIf[i] = new BigDecimal(meta.getValueDefault()[i]);
          } catch (Exception e) {
          // if a default value is given and no conversion is implemented throw an error
          if (meta.getValueDefault()[i] != null && meta.getValueDefault()[i].trim().length() > 0) {
            throw new RuntimeException(
                BaseMessages.getString(PKG, "StreamLookup.Exception.ConversionNotImplemented")
                    + " "
                    + ValueMeta.getTypeDesc(meta.getValueDefaultType()[i]));
          } else {
            // no default value given: just set it to null
            data.nullIf[i] = null;
  /**
   * Processes one unit of work for the step.
   *
   * <p>As far as this view shows, a call does one of two things:
   *
   * <ol>
   *   <li>While {@code data.readLookupValues} is set, it clears the flag, loads the lookup
   *       stream through {@code readLookupValues()} and returns without reading an input row.
   *   <li>Otherwise it reads one input row, resolves the key field positions on the first row,
   *       performs the lookup through {@code lookupValues} and writes the result with
   *       {@code putRow}.
   * </ol>
   *
   * <p>NOTE(review): many statements in this method are truncated in this view (the heads of
   * logging and throw statements, the right-hand side of the {@code convertKeysToNative}
   * assignment, the call that extends {@code data.outputRowMeta}, the bodies of the two
   * metadata loops and all closing braces). The comments below describe only what is visible.
   *
   * @param smi step metadata; cast to {@code StreamLookupMeta}
   * @param sdi step data; cast to {@code StreamLookupData}
   * @return {@code false} when the lookup stream could not be read, when no input row is left,
   *     or when {@code lookupValues} returns {@code null}; {@code true} otherwise
   * @throws KettleException declared by the signature; a {@code KettleStepException} is raised
   *     here when a key field is not found in the input row
   */
  public boolean processRow(StepMetaInterface smi, StepDataInterface sdi) throws KettleException {
    meta = (StreamLookupMeta) smi;
    data = (StreamLookupData) sdi;

    // Phase 1: load the lookup stream. The flag is set in init().
    if (data.readLookupValues) {
      data.readLookupValues = false;

      if (!readLookupValues()) // Read values in lookup table (look)
                PKG, "StreamLookup.Log.UnableToReadDataFromLookupStream")); // $NON-NLS-1$
        return false;

      // At this point, all the values in the cache are of normal storage data type...
      // We should reflect this in the metadata...
      if (data.keyMeta != null) { // null when no rows coming from lookup stream
        for (ValueMetaInterface valueMeta : data.keyMeta.getValueMetaList()) {
      if (data.valueMeta != null) { // null when no rows coming from lookup stream
        for (ValueMetaInterface valueMeta : data.valueMeta.getValueMetaList()) {

      // By indentation this return belongs to phase 1: input rows are handled on later calls.
      return true;

    // Phase 2: handle one row of the main input stream.
    Object[] r = getRow(); // Get row from input rowset & set row busy!
    if (r == null) // no more input to be expected...
      if (log.isDetailed())
                getLinesRead() + "")); // $NON-NLS-1$ //$NON-NLS-2$
      return false;

    // One-time setup, done when the first input row arrives.
    if (first) {
      first = false;

      // read the lookup values!
      data.keynrs = new int[meta.getKeystream().length];
      data.lookupMeta = new RowMeta();
      data.convertKeysToNative = new boolean[meta.getKeystream().length];

      for (int i = 0; i < meta.getKeystream().length; i++) {
        // Find the keynr in the row (only once)
        data.keynrs[i] = getInputRowMeta().indexOfValue(meta.getKeystream()[i]);
        if (data.keynrs[i] < 0) {
          throw new KettleStepException(
                  "" + getInputRowMeta().getString(r))); // $NON-NLS-1$ //$NON-NLS-2$ //$NON-NLS-3$
        } else {
          if (log.isDetailed())
                    "" + data.keynrs[i])); // $NON-NLS-1$ //$NON-NLS-2$ //$NON-NLS-3$


        // If we have binary storage data coming in, we convert it to normal data storage.
        // The storage in the lookup data store is also normal data storage. TODO: enforce normal
        // data storage??
        data.convertKeysToNative[i] =

      // Output metadata starts as a copy of the input metadata.
      data.outputRowMeta = getInputRowMeta().clone();
          data.outputRowMeta, getStepname(), new RowMetaInterface[] {data.infoMeta}, null, this);

      // Handle the NULL values (not found...)

    Object[] outputRow =
        lookupValues(getInputRowMeta(), r); // Do the actual lookup in the hashtable.
    // lookupValues returns null when the step has been stopped.
    if (outputRow == null) {
      setOutputDone(); // signal end to receiver(s)
      return false;

    putRow(data.outputRowMeta, outputRow); // copy row to output rowset(s);

    if (checkFeedback(getLinesRead())) {
      if (log.isBasic())
            BaseMessages.getString(PKG, "StreamLookup.Log.LineNumber")
                + getLinesRead()); //$NON-NLS-1$

    return true;
  /**
   * Looks up the key fields of one input row and returns the row extended with either the
   * values found or the defaults in {@code data.nullIf}.
   *
   * <p>Steps visible in this view:
   *
   * <ol>
   *   <li>Return {@code null} immediately when the step has been stopped.
   *   <li>On first use, resolve the position of every {@code data.lookupMeta} field in
   *       {@code rowMeta} and cache the positions in {@code data.lookupColumnIndex}.
   *   <li>Copy the key values out of the row, converting binary-string storage to the native
   *       type where {@code data.convertKeysToNative} says so.
   *   <li>When {@code data.keyTypes} is known, convert each key whose type differs from the
   *       type stored in the lookup cache.
   *   <li>When lookup rows exist, fetch the values with {@code getFromCache}.
   *   <li>Fall back to {@code data.nullIf} when nothing was found.
   * </ol>
   *
   * <p>NOTE(review): closing braces and the receiver of the
   * {@code convertBinaryStringToNativeType} call are missing from this view.
   *
   * @param rowMeta metadata of {@code row}
   * @param row the input row
   * @return the input row with the looked-up (or default) values appended after position
   *     {@code rowMeta.size()}, or {@code null} when the step is stopped
   * @throws KettleException declared by the signature; {@code KettleStepException} is raised
   *     here for a missing lookup column, a failed type conversion, or a failed cache lookup
   */
  private Object[] lookupValues(RowMetaInterface rowMeta, Object[] row) throws KettleException {
    // See if we need to stop.
    if (isStopped()) return null;

    // Resolve the lookup column positions once and keep them for later rows.
    if (data.lookupColumnIndex == null) {
      String names[] = data.lookupMeta.getFieldNames();
      data.lookupColumnIndex = new int[names.length];

      for (int i = 0; i < names.length; i++) {
        data.lookupColumnIndex[i] = rowMeta.indexOfValue(names[i]);
        if (data.lookupColumnIndex[i] < 0) {
          // we should not get here
          throw new KettleStepException("The lookup column '" + names[i] + "' could not be found");

    // Copy value references to lookup table.
    Object[] lu = new Object[data.keynrs.length];
    for (int i = 0; i < data.keynrs.length; i++) {
      // If the input is binary storage data, we convert it to normal storage.
      if (data.convertKeysToNative[i]) {
        lu[i] =
                .convertBinaryStringToNativeType((byte[]) row[data.keynrs[i]]);
      } else {
        lu[i] = row[data.keynrs[i]];

    // Handle conflicting types (Number-Integer-String conversion to lookup type in hashtable)
    // data.keyTypes is assigned in readLookupValues() when the first lookup row is read.
    if (data.keyTypes != null) {
      for (int i = 0; i < data.lookupMeta.size(); i++) {
        ValueMetaInterface inputValue = data.lookupMeta.getValueMeta(i);
        ValueMetaInterface lookupValue = data.keyTypes.getValueMeta(i);
        if (inputValue.getType() != lookupValue.getType()) {
          try {
            // Change the input value to match the lookup value
            lu[i] = lookupValue.convertDataCompatible(inputValue, lu[i]);
          } catch (KettleValueException e) {
            throw new KettleStepException("Error converting data while looking up value", e);

    Object[] add = null;

    // data.hasLookupRows is set by readLookupValues() once a lookup row has been read.
    if (data.hasLookupRows) {
      try {
        if (meta.getKeystream().length > 0) {
          add = getFromCache(data.keyTypes, lu);
        } else {
          // Just take the first element in the hashtable...
          // NOTE(review): the comment above does not match the code, which throws instead of
          // returning an element. Presumably the enclosing catch re-wraps this exception.
          throw new KettleStepException(
              BaseMessages.getString(PKG, "StreamLookup.Log.GotRowWithoutKeys")); // $NON-NLS-1$
      } catch (Exception e) {
        throw new KettleStepException(e);

    if (add == null) // nothing was found, unknown code: add the specified default value...
      add = data.nullIf;

    return RowDataUtil.addRowData(row, rowMeta.size(), add);
  /**
   * Reads every row from the info (lookup) stream and stores its key and value fields through
   * {@code addToCache}.
   *
   * <p>On the first row it records the stream metadata in {@code data.infoMeta}, creates
   * {@code data.keyMeta} and {@code data.valueMeta}, resolves the positions of the configured
   * key and value fields, and saves a copy of the key metadata in {@code data.keyTypes} if
   * that is not set yet. {@code data.hasLookupRows} is set only when at least one row arrives.
   *
   * <p>NOTE(review): this view is missing closing braces, the heads of several logging and
   * throw statements, the statements that populate {@code data.keyMeta} and
   * {@code data.valueMeta}, the body of the loop over {@code keyNrs}, and the conversion calls
   * that assign {@code keyData[i]} and {@code valueData[i]}. The comments below describe only
   * what is visible.
   *
   * @return {@code false} when the info stream has no step attached; {@code true} once all
   *     lookup rows have been read
   * @throws KettleException declared by the signature; a {@code KettleStepException} is raised
   *     here when a configured key or value field is not present in the lookup stream
   */
  private boolean readLookupValues() throws KettleException {
    data.infoStream = meta.getStepIOMeta().getInfoStreams().get(0);
    if (data.infoStream.getStepMeta() == null) {
          BaseMessages.getString(PKG, "StreamLookup.Log.NoLookupStepSpecified")); // $NON-NLS-1$
      return false;
    if (log.isDetailed())
          BaseMessages.getString(PKG, "StreamLookup.Log.ReadingFromStream")
              + data.infoStream.getStepname()
              + "]"); //$NON-NLS-1$ //$NON-NLS-2$

    // Positions of the key and value fields within a lookup-stream row.
    int[] keyNrs = new int[meta.getKeylookup().length];
    int[] valueNrs = new int[meta.getValue().length];
    boolean firstRun = true;

    // Which row set do we read from?
    RowSet rowSet = findInputRowSet(data.infoStream.getStepname());
    Object[] rowData = getRowFrom(rowSet); // rows are originating from "lookup_from"
    while (rowData != null) {
      if (log.isRowLevel())
            BaseMessages.getString(PKG, "StreamLookup.Log.ReadLookupRow")
                + rowSet.getRowMeta().getString(rowData)); // $NON-NLS-1$

      // One-time setup on the first lookup row.
      if (firstRun) {
        firstRun = false;
        data.hasLookupRows = true;

        data.infoMeta = rowSet.getRowMeta().clone();
        data.keyMeta = new RowMeta();
        data.valueMeta = new RowMeta();

        // Look up the keys in the source rows
        for (int i = 0; i < meta.getKeylookup().length; i++) {
          keyNrs[i] = rowSet.getRowMeta().indexOfValue(meta.getKeylookup()[i]);
          if (keyNrs[i] < 0) {
            throw new KettleStepException(
                    meta.getKeylookup()[i])); // $NON-NLS-1$ //$NON-NLS-2$
        // Save the data types of the keys to optionally convert input rows later on...
        if (data.keyTypes == null) {
          data.keyTypes = data.keyMeta.clone();
        // set the meta data for the keys also to STORAGE_TYPE_NORMAL, otherwise it will conflict
        // later on
        // for the data it is already set to STORAGE_TYPE_NORMAL in StreamLookupMeta.getFields()
        // all values in the cache are of this storage type (see convertToNormalStorageType below)
        // position here after keyTypes are stored (needed below for correct
        // convertToNormalStorageType)
        for (int i = 0; i < keyNrs.length; i++) {

        for (int v = 0; v < meta.getValue().length; v++) {
          valueNrs[v] = rowSet.getRowMeta().indexOfValue(meta.getValue()[v]);
          if (valueNrs[v] < 0) {
            throw new KettleStepException(
                    meta.getValue()[v])); // $NON-NLS-1$ //$NON-NLS-2$

      // Extract the key fields of this row.
      Object[] keyData = new Object[keyNrs.length];
      for (int i = 0; i < keyNrs.length; i++) {
        ValueMetaInterface keyMeta = data.keyTypes.getValueMeta(i);
        keyData[i] =
                rowData[keyNrs[i]]); // Make sure only normal storage goes in
                .STORAGE_TYPE_NORMAL); // now we need to change keyMeta/keyTypes also to normal

      // Extract the value fields of this row.
      Object[] valueData = new Object[valueNrs.length];
      for (int i = 0; i < valueNrs.length; i++) {
        ValueMetaInterface valueMeta = data.valueMeta.getValueMeta(i);
        valueData[i] =
                rowData[valueNrs[i]]); // make sure only normal storage goes in

      addToCache(data.keyMeta, keyData, data.valueMeta, valueData);

      rowData = getRowFrom(rowSet);

    return true;