private void combineParts( MultiMap<Part, ColumnKey> needed, MultiMap<ColumnKey, Part> classified, List<ExpressionNode> andexprs, List<Part> andparts) { Part p = needed.keySet().iterator().next(); Collection<ColumnKey> missing = needed.get(p); if (missing == null || missing.isEmpty()) { andexprs.add((ExpressionNode) p.getParent()); needed.remove(p); andparts.add(p); return; } ListSet<Part> containingMissing = new ListSet<Part>(); boolean first = true; for (ColumnKey ck : missing) { Collection<Part> matching = classified.get(ck); if (matching == null || matching.isEmpty()) continue; if (first) containingMissing.addAll(matching); else { containingMissing.retainAll(matching); } } if (containingMissing.isEmpty()) { andexprs.add((ExpressionNode) p.getParent()); andparts.add(p); needed.remove(p); } else { ListSet<Part> toCombine = new ListSet<Part>(); toCombine.add(p); toCombine.addAll(containingMissing); ListSet<Part> toRemove = new ListSet<Part>(); toRemove.addAll(toCombine); Part clhs = choosePartForAndCombo(toCombine); toCombine.remove(clhs); while (!toCombine.isEmpty()) { Part crhs = choosePartForAndCombo(toCombine); toCombine.remove(crhs); clhs = combineParts(clhs, crhs); } for (Part rp : toRemove) { needed.remove(rp); ArrayList<ColumnKey> classKeys = new ArrayList<ColumnKey>(classified.keySet()); for (ColumnKey ck : classKeys) { Collection<Part> sub = classified.get(ck); if (sub == null || sub.isEmpty()) continue; if (sub.contains(rp)) classified.remove(ck, rp); } } andexprs.add((ExpressionNode) clhs.getParent()); andparts.add(clhs); } }
public static SelectStatement filterEntryProjection(SelectStatement in, PartitionEntry jre) throws PEException { PartitionEntry actual = jre.getActualEntry(); SelectStatement expecting = null; if (actual instanceof OriginalPartitionEntry) expecting = ((OriginalPartitionEntry) actual).getChildCopy(); else expecting = actual.getJoinQuery(null); ListSet<ColumnKey> ec = new ListSet<ColumnKey>(); for (ExpressionNode en : expecting.getProjection()) { ExpressionNode targ = ExpressionUtils.getTarget(en); if (targ instanceof ColumnInstance) { ColumnKey was = ((ColumnInstance) targ).getColumnKey(); ColumnKey isnow = in.getMapper().copyColumnKeyForward(was); if (isnow == null) { throw new SchemaException(Pass.PLANNER, "Lost column during lookup table join"); } ec.add(isnow); } else if (targ instanceof FunctionCall) { ExpressionNode exn = targ; RewriteKey rk = in.getMapper().mapExpressionToColumn(exn); while (rk == null && (exn.getParent() instanceof ExpressionNode)) { exn = (ExpressionNode) exn.getParent(); rk = in.getMapper().mapExpressionToColumn(exn); } if (rk != null) { ec.add((ColumnKey) rk); } } } for (Iterator<ExpressionNode> iter = in.getProjectionEdge().iterator(); iter.hasNext(); ) { ExpressionNode en = ExpressionUtils.getTarget(iter.next()); if (en instanceof ColumnInstance) { ColumnKey ck = ((ColumnInstance) en).getColumnKey(); if (!ec.contains(ck)) iter.remove(); } } return in; }
protected ListSet<Part> getCompletedParts() { if (stopped) return null; ListSet<Part> cols = new ListSet<Part>(); for (Part p : completedParts) { if (p instanceof OredParts) cols.add(p); } completedParts.removeAll(cols); for (Part p : cols) { for (Part sp : p.getParts()) { completedParts.remove(sp); } } completedParts.addAll(cols); return completedParts; }
// we have the temp table on the temp group for the constrained side // we need to build the bcast temp table on the pers group public static RedistFeatureStep buildLookupTableRedist( PlannerContext pc, PartitionEntry srcEntry, RedistFeatureStep constrainedOnTempGroup, JoinEntry rje, PEStorageGroup targetGroup, boolean indexJoinColumns) throws PEException { ProjectingFeatureStep selectDistinct = constrainedOnTempGroup.buildNewProjectingStep( pc, rje.getFeaturePlanner(), null, DMLExplainReason.LOOKUP_JOIN_LOOKUP_TABLE.makeRecord()); SelectStatement ss = (SelectStatement) selectDistinct.getPlannedStatement(); DistributionVector distVect = constrainedOnTempGroup.getTargetTempTable().getDistributionVector(pc.getContext()); ListSet<ColumnKey> mappedColumnsInJoin = null; if (rje.getJoin().getJoin() != null) { ListSet<ColumnKey> columnsInJoin = ColumnInstanceCollector.getColumnKeys( ColumnInstanceCollector.getColumnInstances(rje.getJoin().getJoin().getJoinOn())); // build the set of columns in the src entry projection ListSet<ColumnKey> srcColumns = new ListSet<ColumnKey>(); for (BufferEntry be : srcEntry.getBufferEntries()) { ExpressionNode targ = ExpressionUtils.getTarget(be.getTarget()); if (targ instanceof ColumnInstance) { ColumnInstance ci = (ColumnInstance) targ; srcColumns.add(ci.getColumnKey()); } } columnsInJoin.retainAll(srcColumns); mappedColumnsInJoin = new ListSet<ColumnKey>(); for (ColumnKey ck : columnsInJoin) { mappedColumnsInJoin.add(ss.getMapper().copyColumnKeyForward(ck)); } } for (Iterator<ExpressionNode> iter = ss.getProjectionEdge().iterator(); iter.hasNext(); ) { ExpressionNode en = iter.next(); if (en instanceof ColumnInstance) { ColumnInstance ci = (ColumnInstance) en; PEColumn pec = ci.getPEColumn(); if (!distVect.contains(srcEntry.getSchemaContext(), pec) && (mappedColumnsInJoin == null || !mappedColumnsInJoin.contains(ci.getColumnKey()))) iter.remove(); } } ss.setSetQuantifier(SetQuantifier.DISTINCT); ss.normalize(srcEntry.getSchemaContext()); // now that we have the select distinct set up // redistribute it bcast back onto the pers group RedistFeatureStep out = selectDistinct.redist( pc, rje.getFeaturePlanner(), new TempTableCreateOptions(Model.BROADCAST, targetGroup), null, DMLExplainReason.LOOKUP_JOIN_LOOKUP_TABLE.makeRecord()); if (indexJoinColumns) out.getTargetTempTable() .noteJoinedColumns(pc.getContext(), out.getTargetTempTable().getColumns(pc.getContext())); return out; }
@Override public ListSet<Part> getParts() { ListSet<Part> me = new ListSet<Part>(); me.add(this); return me; }
private void setComplete(Part p) { p.setComplete(); completedParts.add(p); }
protected ListSet<ColumnKey> buildKeyColumns(TableKey tk, Collection<PEColumn> cols) { ListSet<ColumnKey> out = new ListSet<ColumnKey>(); for (PEColumn c : cols) out.add(new ColumnKey(tk, c)); return out; }