use of org.apache.sysml.hops.codegen.cplan.CNode in project systemml by apache.
the class CPlanOpRewriter method rFindAndRemoveBinaryMS.
private static void rFindAndRemoveBinaryMS(CNode node, CNodeData mainInput, BinType type, String lit, String replace) {
for (int i = 0; i < node.getInput().size(); i++) {
CNode tmp = node.getInput().get(i);
if (TemplateUtils.isBinary(tmp, type) && tmp.getInput().get(1).isLiteral() && tmp.getInput().get(1).getVarname().equals(lit) && tmp.getInput().get(0) instanceof CNodeData && ((CNodeData) tmp.getInput().get(0)).getHopID() == mainInput.getHopID()) {
CNodeData cnode = new CNodeData(new LiteralOp(replace));
cnode.setLiteral(true);
node.getInput().set(i, cnode);
} else
rFindAndRemoveBinaryMS(tmp, mainInput, type, lit, replace);
}
}
use of org.apache.sysml.hops.codegen.cplan.CNode in project systemml by apache.
the class TemplateMultiAgg method constructCplan.
@Override
public Pair<Hop[], CNodeTpl> constructCplan(Hop hop, CPlanMemoTable memo, boolean compileLiterals) {
// get all root nodes for multi aggregation
MemoTableEntry multiAgg = memo.getBest(hop.getHopID(), TemplateType.MAGG);
ArrayList<Hop> roots = new ArrayList<>();
for (int i = 0; i < 3; i++) if (multiAgg.isPlanRef(i))
roots.add(memo._hopRefs.get(multiAgg.input(i)));
Hop.resetVisitStatus(roots);
// recursively process required cplan outputs
HashSet<Hop> inHops = new HashSet<>();
HashMap<Long, CNode> tmp = new HashMap<>();
for (// use celltpl cplan construction
Hop root : // use celltpl cplan construction
roots) super.rConstructCplan(root, memo, tmp, inHops, compileLiterals);
Hop.resetVisitStatus(roots);
// reorder inputs (ensure matrices/vectors come first) and prune literals
// note: we order by number of cells and subsequently sparsity to ensure
// that sparse inputs are used as the main input w/o unnecessary conversion
Hop shared = getSparseSafeSharedInput(roots, inHops);
Hop[] sinHops = inHops.stream().filter(h -> !(h.getDataType().isScalar() && tmp.get(h.getHopID()).isLiteral())).sorted(new HopInputComparator(shared)).toArray(Hop[]::new);
// construct template node
ArrayList<CNode> inputs = new ArrayList<>();
for (Hop in : sinHops) inputs.add(tmp.get(in.getHopID()));
ArrayList<CNode> outputs = new ArrayList<>();
ArrayList<AggOp> aggOps = new ArrayList<>();
for (Hop root : roots) {
CNode node = tmp.get(root.getHopID());
if (// add indexing ops for sideways data inputs
node instanceof CNodeData && ((CNodeData) inputs.get(0)).getHopID() != ((CNodeData) node).getHopID())
node = new CNodeUnary(node, (roots.get(0).getDim2() == 1) ? UnaryType.LOOKUP_R : UnaryType.LOOKUP_RC);
outputs.add(node);
aggOps.add(TemplateUtils.getAggOp(root));
}
CNodeMultiAgg tpl = new CNodeMultiAgg(inputs, outputs);
tpl.setAggOps(aggOps);
tpl.setSparseSafe(isSparseSafe(roots, sinHops[0], tpl.getOutputs(), tpl.getAggOps(), true));
tpl.setRootNodes(roots);
tpl.setBeginLine(hop.getBeginLine());
// return cplan instance
return new Pair<>(sinHops, tpl);
}
use of org.apache.sysml.hops.codegen.cplan.CNode in project systemml by apache.
the class TemplateOuterProduct method constructCplan.
@Override
public Pair<Hop[], CNodeTpl> constructCplan(Hop hop, CPlanMemoTable memo, boolean compileLiterals) {
// recursively process required cplan output
HashSet<Hop> inHops = new HashSet<>();
HashMap<String, Hop> inHops2 = new HashMap<>();
HashMap<Long, CNode> tmp = new HashMap<>();
hop.resetVisitStatus();
rConstructCplan(hop, memo, tmp, inHops, inHops2, compileLiterals);
hop.resetVisitStatus();
// reorder inputs (ensure matrix is first input)
Hop X = inHops2.get("_X");
Hop U = inHops2.get("_U");
Hop V = inHops2.get("_V");
LinkedList<Hop> sinHops = new LinkedList<>(inHops);
sinHops.remove(V);
sinHops.addFirst(V);
sinHops.remove(U);
sinHops.addFirst(U);
sinHops.remove(X);
sinHops.addFirst(X);
// construct template node
ArrayList<CNode> inputs = new ArrayList<>();
for (Hop in : sinHops) if (in != null)
inputs.add(tmp.get(in.getHopID()));
CNode output = tmp.get(hop.getHopID());
CNodeOuterProduct tpl = new CNodeOuterProduct(inputs, output);
tpl.setOutProdType(TemplateUtils.getOuterProductType(X, U, V, hop));
tpl.setTransposeOutput(!HopRewriteUtils.isTransposeOperation(hop) && tpl.getOutProdType() == OutProdType.LEFT_OUTER_PRODUCT);
tpl.setBeginLine(hop.getBeginLine());
return new Pair<>(sinHops.toArray(new Hop[0]), tpl);
}
use of org.apache.sysml.hops.codegen.cplan.CNode in project systemml by apache.
the class SpoofCompiler method cleanupCPlans.
/**
* Cleanup generated cplans in order to remove unnecessary inputs created
* during incremental construction. This is important as it avoids unnecessary
* redundant computation.
*
* @param memo memoization table
* @param cplans set of cplans
*/
private static HashMap<Long, Pair<Hop[], CNodeTpl>> cleanupCPlans(CPlanMemoTable memo, HashMap<Long, Pair<Hop[], CNodeTpl>> cplans) {
HashMap<Long, Pair<Hop[], CNodeTpl>> cplans2 = new HashMap<>();
CPlanOpRewriter rewriter = new CPlanOpRewriter();
CPlanCSERewriter cse = new CPlanCSERewriter();
for (Entry<Long, Pair<Hop[], CNodeTpl>> e : cplans.entrySet()) {
CNodeTpl tpl = e.getValue().getValue();
Hop[] inHops = e.getValue().getKey();
// remove invalid plans with null inputs
if (Arrays.stream(inHops).anyMatch(h -> (h == null)))
continue;
// perform simplifications and cse rewrites
tpl = rewriter.simplifyCPlan(tpl);
tpl = cse.eliminateCommonSubexpressions(tpl);
// update input hops (order-preserving)
HashSet<Long> inputHopIDs = tpl.getInputHopIDs(false);
inHops = Arrays.stream(inHops).filter(p -> p != null && inputHopIDs.contains(p.getHopID())).toArray(Hop[]::new);
cplans2.put(e.getKey(), new Pair<>(inHops, tpl));
// remove invalid plans with column indexing on main input
if (tpl instanceof CNodeCell || tpl instanceof CNodeRow) {
CNodeData in1 = (CNodeData) tpl.getInput().get(0);
boolean inclRC1 = !(tpl instanceof CNodeRow);
if (rHasLookupRC1(tpl.getOutput(), in1, inclRC1) || isLookupRC1(tpl.getOutput(), in1, inclRC1)) {
cplans2.remove(e.getKey());
if (LOG.isTraceEnabled())
LOG.trace("Removed cplan due to invalid rc1 indexing on main input.");
}
} else if (tpl instanceof CNodeMultiAgg) {
CNodeData in1 = (CNodeData) tpl.getInput().get(0);
for (CNode output : ((CNodeMultiAgg) tpl).getOutputs()) if (rHasLookupRC1(output, in1, true) || isLookupRC1(output, in1, true)) {
cplans2.remove(e.getKey());
if (LOG.isTraceEnabled())
LOG.trace("Removed cplan due to invalid rc1 indexing on main input.");
}
}
// remove invalid lookups on main input (all templates)
CNodeData in1 = (CNodeData) tpl.getInput().get(0);
if (tpl instanceof CNodeMultiAgg)
rFindAndRemoveLookupMultiAgg((CNodeMultiAgg) tpl, in1);
else
rFindAndRemoveLookup(tpl.getOutput(), in1, !(tpl instanceof CNodeRow));
// remove invalid row templates (e.g., unsatisfied blocksize constraint)
if (tpl instanceof CNodeRow) {
// check for invalid row cplan over column vector
if (((CNodeRow) tpl).getRowType() == RowType.NO_AGG && tpl.getOutput().getDataType().isScalar()) {
cplans2.remove(e.getKey());
if (LOG.isTraceEnabled())
LOG.trace("Removed invalid row cplan w/o agg on column vector.");
} else if (OptimizerUtils.isSparkExecutionMode()) {
Hop hop = memo.getHopRefs().get(e.getKey());
boolean isSpark = DMLScript.rtplatform == RUNTIME_PLATFORM.SPARK || OptimizerUtils.getTotalMemEstimate(inHops, hop, true) > OptimizerUtils.getLocalMemBudget();
boolean invalidNcol = hop.getDataType().isMatrix() && (HopRewriteUtils.isTransposeOperation(hop) ? hop.getDim1() > hop.getRowsInBlock() : hop.getDim2() > hop.getColsInBlock());
for (Hop in : inHops) invalidNcol |= (in.getDataType().isMatrix() && in.getDim2() > in.getColsInBlock());
if (isSpark && invalidNcol) {
cplans2.remove(e.getKey());
if (LOG.isTraceEnabled())
LOG.trace("Removed invalid row cplan w/ ncol>ncolpb.");
}
}
}
// remove cplan w/ single op and w/o agg
if ((tpl instanceof CNodeCell && ((CNodeCell) tpl).getCellType() == CellType.NO_AGG && TemplateUtils.hasSingleOperation(tpl)) || (tpl instanceof CNodeRow && (((CNodeRow) tpl).getRowType() == RowType.NO_AGG || ((CNodeRow) tpl).getRowType() == RowType.NO_AGG_B1 || ((CNodeRow) tpl).getRowType() == RowType.ROW_AGG) && TemplateUtils.hasSingleOperation(tpl)) || TemplateUtils.hasNoOperation(tpl)) {
cplans2.remove(e.getKey());
if (LOG.isTraceEnabled())
LOG.trace("Removed cplan with single operation.");
}
// remove cplan if empty
if (tpl.getOutput() instanceof CNodeData) {
cplans2.remove(e.getKey());
if (LOG.isTraceEnabled())
LOG.trace("Removed empty cplan.");
}
// rename inputs (for codegen and plan caching)
tpl.renameInputs();
}
return cplans2;
}
use of org.apache.sysml.hops.codegen.cplan.CNode in project systemml by apache.
the class CPlanComparisonTest method testEqualBinaryNodes.
@Test
public void testEqualBinaryNodes() {
CNode c1 = createCNodeData(DataType.MATRIX);
CNode c2 = createCNodeData(DataType.SCALAR);
CNode bin1 = new CNodeBinary(c1, c2, BinType.PLUS);
CNode bin2 = new CNodeBinary(c1, c2, BinType.PLUS);
Assert.assertEquals(bin1.hashCode(), bin2.hashCode());
Assert.assertEquals(bin1, bin2);
}
Aggregations