use of com.tencent.angel.ml.math2.storage.LongLongVectorStorage in project angel by Tencent.
the class SimpleBinaryOutNonZAExecutor method apply.
/**
 * Applies the binary operator {@code op} to {@code v1} and {@code v2} and returns the result as a
 * new {@link LongLongVector} that carries v1's matrix id, row id, clock and dimension.
 *
 * <p>The result storage is obtained from {@code StorageSwitch.apply(v1, v2, op)} and then filled
 * according to the storage kinds of the two operands (sparse or sorted). Indices that appear only
 * in v2 are combined as {@code op.apply(0, v2Value)} in the sorted/sorted case, and as
 * {@code op.apply(v1.get(idx), v2Value)} in the cases where v1 is sparse.
 *
 * @param v1 left operand; must be sparse or sorted
 * @param v2 right operand; must be sparse or sorted
 * @param op operator to apply; {@code op.isKeepStorage()} selects between writing a sorted
 *           index/value array pair and writing through {@code set(idx, value)}
 * @return a new vector wrapping the filled storage
 * @throws AngelException if the storage kinds of v1 and v2 match none of the handled combinations
 */
public static Vector apply(LongLongVector v1, LongLongVector v2, Binary op) {
  LongLongVectorStorage newStorage = (LongLongVectorStorage) StorageSwitch.apply(v1, v2, op);
  if (v1.isSparse() && v2.isSparse()) {
    if (shouldSeedFromSparseV1(v1, v2)) {
      copySparseEntries(v1, newStorage);
    }
    applySparseOperand(v1, v2, op, newStorage);
  } else if (v1.isSparse() && v2.isSorted()) {
    if (shouldSeedFromSparseV1(v1, v2)) {
      copySparseEntries(v1, newStorage);
    }
    applySortedOperand(v1, v2, op, newStorage);
  } else if (v1.isSorted() && v2.isSparse()) {
    // The original code branched on a density threshold here, but both arms were identical,
    // so only the keep-storage decision matters.
    if (op.isKeepStorage()) {
      newStorage = unionSortedWithSparse(v1, v2, op);
    } else {
      copySortedEntries(v1, newStorage);
      foldSparseOperandInPlace(v2, op, newStorage);
    }
  } else if (v1.isSorted() && v2.isSorted()) {
    // As above: the density threshold selected between two identical arms.
    if (op.isKeepStorage()) {
      mergeSortedIntoArrays(v1, v2, op, newStorage);
    } else {
      mergeSortedIntoStorage(v1, v2, op, newStorage);
    }
  } else {
    throw new AngelException("The operation is not support!");
  }
  return new LongLongVector(v1.getMatrixId(), v1.getRowId(), v1.getClock(), v1.getDim(), newStorage);
}

/**
 * Decides, for a sparse v1, whether v1's entries must be written into the result storage before
 * v2 is applied.
 *
 * <p>Returns {@code false} when v1 is much larger than v2 and the combined size stays under the
 * sparse/dense threshold (the original author's rationale: v2's indices are guessed to be a
 * subset of v1, or the overlap is very large). Returns {@code true} when the combined size
 * reaches the threshold (rationale: dense storage is guessed to be more efficient). Otherwise the
 * decision is based on a hash-capacity estimate meant to avoid repeated rehashing.
 * NOTE(review): when this returns false nothing copies v1 here, so the storage returned by
 * StorageSwitch presumably already holds v1's entries -- confirm against StorageSwitch.
 */
private static boolean shouldSeedFromSparseV1(LongLongVector v1, LongLongVector v2) {
  long v1Size = v1.size();
  long v2Size = v2.size();
  if (v1Size >= v2Size * Constant.sparseThreshold && (v1Size + v2Size) * Constant.intersectionCoeff <= Constant.sparseDenseStorageThreshold * v1.dim()) {
    return false;
  }
  if ((v1Size + v2Size) * Constant.intersectionCoeff >= Constant.sparseDenseStorageThreshold * v1.dim()) {
    return true;
  }
  // Smallest power of two strictly above v1.size() / 0.75; used as the estimated table capacity.
  int capacity = 1 << (32 - Integer.numberOfLeadingZeros((int) (v1.size() / 0.75)));
  // Within 1.5x of that capacity: no rehash, or only one, is expected, so no seeding is done.
  return !(v1.size() + v2.size() <= 1.5 * capacity);
}

/** Writes every (index, value) entry of the sparse vector {@code src} into {@code dst}. */
private static void copySparseEntries(LongLongVector src, LongLongVectorStorage dst) {
  ObjectIterator<Long2LongMap.Entry> entries = src.getStorage().entryIterator();
  while (entries.hasNext()) {
    Long2LongMap.Entry entry = entries.next();
    dst.set(entry.getLongKey(), entry.getLongValue());
  }
}

/** Writes the first {@code src.size()} index/value pairs of the sorted vector {@code src} into {@code dst}. */
private static void copySortedEntries(LongLongVector src, LongLongVectorStorage dst) {
  long[] srcIndices = src.getStorage().getIndices();
  long[] srcValues = src.getStorage().getValues();
  long count = src.size();
  for (int i = 0; i < count; i++) {
    dst.set(srcIndices[i], srcValues[i]);
  }
}

/** For each entry of the sparse v2, stores {@code op.apply(v1.get(idx), v2Value)} at idx in {@code dst}. */
private static void applySparseOperand(LongLongVector v1, LongLongVector v2, Binary op, LongLongVectorStorage dst) {
  ObjectIterator<Long2LongMap.Entry> entries = v2.getStorage().entryIterator();
  while (entries.hasNext()) {
    Long2LongMap.Entry entry = entries.next();
    long idx = entry.getLongKey();
    dst.set(idx, op.apply(v1.get(idx), entry.getLongValue()));
  }
}

/** For each of the first {@code v2.size()} pairs of the sorted v2, stores {@code op.apply(v1.get(idx), v2Value)} in {@code dst}. */
private static void applySortedOperand(LongLongVector v1, LongLongVector v2, Binary op, LongLongVectorStorage dst) {
  long[] v2Indices = v2.getStorage().getIndices();
  long[] v2Values = v2.getStorage().getValues();
  long count = v2.size();
  for (int i = 0; i < count; i++) {
    long idx = v2Indices[i];
    dst.set(idx, op.apply(v1.get(idx), v2Values[i]));
  }
}

/**
 * For each entry of the sparse v2, replaces the value currently held by {@code dst} at that index
 * with {@code op.apply(currentValue, v2Value)}. The left operand is read back from {@code dst},
 * not from v1.
 */
private static void foldSparseOperandInPlace(LongLongVector v2, Binary op, LongLongVectorStorage dst) {
  ObjectIterator<Long2LongMap.Entry> entries = v2.getStorage().entryIterator();
  while (entries.hasNext()) {
    Long2LongMap.Entry entry = entries.next();
    long idx = entry.getLongKey();
    dst.set(idx, op.apply(dst.get(idx), entry.getLongValue()));
  }
}

/**
 * Builds a new sorted storage over the union of the indices of a sorted v1 and a sparse v2, with
 * {@code op.apply(v1.get(idx), v2.get(idx))} as the value at each index.
 */
private static LongLongVectorStorage unionSortedWithSparse(LongLongVector v1, LongLongVector v2, Binary op) {
  long v1Size = v1.size();
  long v2Size = v2.size();
  long[] v1Indices = v1.getStorage().getIndices();
  long[] v2Keys = v2.getStorage().indexIterator().toLongArray();
  long[] indices = new long[(int) (v1Size + v2Size)];
  System.arraycopy(v1Indices, 0, indices, 0, (int) v1.size());
  System.arraycopy(v2Keys, 0, indices, (int) v1.size(), (int) v2.size());
  // The tree set removes duplicates and yields the indices in ascending order.
  LongAVLTreeSet avl = new LongAVLTreeSet(indices);
  LongBidirectionalIterator iter = avl.iterator();
  long[] values = new long[indices.length];
  int filled = 0;
  // The concatenated array is reused as the output index array.
  while (iter.hasNext()) {
    long idx = iter.nextLong();
    indices[filled] = idx;
    values[filled] = op.apply(v1.get(idx), v2.get(idx));
    filled++;
  }
  // Zero the slots beyond the union; the storage is told its logical size separately.
  while (filled < indices.length) {
    indices[filled] = 0;
    filled++;
  }
  return new LongLongSortedVectorStorage(v1.getDim(), (int) avl.size(), indices, values);
}

/**
 * Two-pointer merge of two sorted vectors, written directly into the index and value arrays of
 * {@code dst}. Equal indices are combined with {@code op}; an index only in v1 keeps v1's value;
 * an index only in v2 gets {@code op.apply(0, v2Value)}.
 */
private static void mergeSortedIntoArrays(LongLongVector v1, LongLongVector v2, Binary op, LongLongVectorStorage dst) {
  long size1 = v1.size();
  long size2 = v2.size();
  long[] v1Indices = v1.getStorage().getIndices();
  long[] v1Values = v1.getStorage().getValues();
  long[] v2Indices = v2.getStorage().getIndices();
  long[] v2Values = v2.getStorage().getValues();
  long[] resIndices = dst.getIndices();
  long[] resValues = dst.getValues();
  int p1 = 0;
  int p2 = 0;
  int out = 0;
  // NOTE(review): this loop stops as soon as either input is exhausted, so remaining entries of
  // the other input are not written here, and the number of merged entries is not recorded on
  // dst in this method. Behaviour is kept as in the original; confirm against StorageSwitch
  // whether the tail is expected to be handled elsewhere.
  while (p1 < size1 && p2 < size2) {
    if (v1Indices[p1] == v2Indices[p2]) {
      resIndices[out] = v1Indices[p1];
      resValues[out] = op.apply(v1Values[p1], v2Values[p2]);
      p1++;
      p2++;
    } else if (v1Indices[p1] < v2Indices[p2]) {
      resIndices[out] = v1Indices[p1];
      resValues[out] = v1Values[p1];
      p1++;
    } else {
      // v1Indices[p1] > v2Indices[p2]
      resIndices[out] = v2Indices[p2];
      resValues[out] = op.apply(0, v2Values[p2]);
      p2++;
    }
    out++;
  }
}

/**
 * Two-pointer merge of two sorted vectors, written through {@code dst.set}. Unlike the array
 * variant, this loop runs until both inputs are exhausted.
 */
private static void mergeSortedIntoStorage(LongLongVector v1, LongLongVector v2, Binary op, LongLongVectorStorage dst) {
  long size1 = v1.size();
  long size2 = v2.size();
  long[] v1Indices = v1.getStorage().getIndices();
  long[] v1Values = v1.getStorage().getValues();
  long[] v2Indices = v2.getStorage().getIndices();
  long[] v2Values = v2.getStorage().getValues();
  int p1 = 0;
  int p2 = 0;
  while (p1 < size1 || p2 < size2) {
    boolean has1 = p1 < size1;
    boolean has2 = p2 < size2;
    if (has1 && has2 && v1Indices[p1] == v2Indices[p2]) {
      dst.set(v1Indices[p1], op.apply(v1Values[p1], v2Values[p2]));
      p1++;
      p2++;
    } else if (has1 && (!has2 || v1Indices[p1] < v2Indices[p2])) {
      // Index present only in v1 (or v2 is exhausted): keep v1's value.
      dst.set(v1Indices[p1], v1Values[p1]);
      p1++;
    } else {
      // Index present only in v2 (or v1 is exhausted).
      dst.set(v2Indices[p2], op.apply(0, v2Values[p2]));
      p2++;
    }
  }
}
use of com.tencent.angel.ml.math2.storage.LongLongVectorStorage in project angel by Tencent.
the class RangeRouterUtils method splitLongLongVector.
/**
 * Splits a long-key / long-value vector into key-value parts by delegating to
 * {@code split(matrixMeta, rowId, keys, values, sorted)}.
 *
 * @param matrixMeta matrix metadata forwarded to {@code split}
 * @param vector vector whose index and value arrays are split
 * @return the parts produced by {@code split}; the last argument passed to it is {@code false}
 *         for sparse storage and {@code true} otherwise
 */
public static KeyValuePart[] splitLongLongVector(MatrixMeta matrixMeta, LongLongVector vector) {
  LongLongVectorStorage storage = vector.getStorage();
  if (!storage.isSparse()) {
    // Non-sparse storage is treated as a sorted key/value array pair.
    LongLongSortedVectorStorage sorted = (LongLongSortedVectorStorage) storage;
    long[] sortedKeys = sorted.getIndices();
    long[] sortedValues = sorted.getValues();
    return split(matrixMeta, vector.getRowId(), sortedKeys, sortedValues, true);
  }
  // Sparse storage: take its keys and values as arrays.
  LongLongSparseVectorStorage sparse = (LongLongSparseVectorStorage) storage;
  long[] sparseKeys = sparse.getIndices();
  long[] sparseValues = sparse.getValues();
  return split(matrixMeta, vector.getRowId(), sparseKeys, sparseValues, false);
}
use of com.tencent.angel.ml.math2.storage.LongLongVectorStorage in project angel by Tencent.
the class HashRouterUtils method splitLongLongVector.
/**
 * Distributes the entries of a long-key / long-value vector over {@code dataParts} by key hash.
 *
 * <p>The target part of a key is {@code computeHashCode(hasher, key) & (n - 1)} when the number
 * of parts {@code n} is a power of two, and {@code computeHashCode(hasher, key) % n} otherwise.
 * Each entry is appended to the chosen part, which is cast to {@link HashLongKeysLongValuesPart}.
 *
 * @param hasher hash function passed to {@code computeHashCode}
 * @param matrixMeta matrix metadata (not used by this method)
 * @param vector vector whose entries are distributed
 * @param dataParts destination parts; every element must be a {@link HashLongKeysLongValuesPart}
 */
public static void splitLongLongVector(KeyHash hasher, MatrixMeta matrixMeta, LongLongVector vector, KeyValuePart[] dataParts) {
  int dataPartNum = dataParts.length;
  int dataPartNumMinus1 = dataPartNum - 1;
  boolean maskable = isPow2(dataPartNum);
  LongLongVectorStorage storage = vector.getStorage();
  if (storage.isSparse()) {
    // Use iterator
    LongLongSparseVectorStorage sparseStorage = (LongLongSparseVectorStorage) storage;
    ObjectIterator<Long2LongMap.Entry> iter = sparseStorage.entryIterator();
    while (iter.hasNext()) {
      Long2LongMap.Entry keyValue = iter.next();
      int hash = computeHashCode(hasher, keyValue.getLongKey());
      // NOTE(review): '%' yields a negative index if computeHashCode can return a negative
      // value -- confirm its range.
      int partId = maskable ? (hash & dataPartNumMinus1) : (hash % dataPartNum);
      ((HashLongKeysLongValuesPart) dataParts[partId]).add(keyValue.getLongKey(), keyValue.getLongValue());
    }
  } else {
    // Key and value array pair
    LongLongSortedVectorStorage sortStorage = (LongLongSortedVectorStorage) storage;
    long[] keys = sortStorage.getIndices();
    long[] values = sortStorage.getValues();
    // A sorted storage's arrays can be longer than its logical size (unused slots are padding),
    // so only the first vector.size() pairs are routed instead of the whole array.
    long validCount = Math.min(keys.length, vector.size());
    for (int i = 0; i < validCount; i++) {
      int hash = computeHashCode(hasher, keys[i]);
      int partId = maskable ? (hash & dataPartNumMinus1) : (hash % dataPartNum);
      ((HashLongKeysLongValuesPart) dataParts[partId]).add(keys[i], values[i]);
    }
  }
}
use of com.tencent.angel.ml.math2.storage.LongLongVectorStorage in project angel by Tencent.
the class ColumnFormat method saveLongLongRows.
/**
 * Writes the given long-valued server rows column by column.
 *
 * <p>The set of columns to write is taken from the vector of {@code rows[0]}. For every such
 * column, one value is read from each row and the resulting column is passed to
 * {@code save(col, output)}.
 * <ul>
 *   <li>Int-keyed dense storage: every column id from {@code rows[0].getStartCol()} (inclusive)
 *       to {@code rows[0].getEndCol()} (exclusive) is written.</li>
 *   <li>Any other storage: the stored indices of the first row are written, each shifted by the
 *       partition's start column; they are sorted first when {@code saveContext.sortFirst()}
 *       is true, otherwise they are visited in the storage's entry-iterator order.</li>
 * </ul>
 *
 * @param part partition being saved; its partition key supplies the index offset
 * @param rows rows of the partition; {@code rows[0]} must exist and every element must be a
 *             {@link ServerLongLongRow}
 * @param partMeta partition metadata (not used by this method)
 * @param saveContext save options; only {@code sortFirst()} is consulted
 * @param output stream the columns are written to
 * @throws IOException if writing a column fails
 */
private void saveLongLongRows(ServerPartition part, ServerRow[] rows, MatrixPartitionMeta partMeta, PSMatrixSaveContext saveContext, DataOutputStream output) throws IOException {
  Vector vec = ServerRowUtils.getVector((ServerLongLongRow) rows[0]);
  long indexOffset = part.getPartitionKey().getStartCol();
  // One reusable column buffer holding a value per row.
  LongLongsCol col = new LongLongsCol(0, new long[rows.length]);
  if (vec instanceof IntLongVector) {
    IntLongVectorStorage storage = ((IntLongVector) vec).getStorage();
    long startCol = rows[0].getStartCol();
    long endCol = rows[0].getEndCol();
    if (storage.isDense()) {
      for (long colId = startCol; colId < endCol; colId++) {
        saveLongLongColumn(col, colId, rows, output);
      }
    } else if (saveContext.sortFirst()) {
      int[] indices = storage.getIndices();
      Sort.quickSort(indices, 0, indices.length - 1);
      for (int i = 0; i < indices.length; i++) {
        saveLongLongColumn(col, indices[i] + indexOffset, rows, output);
      }
    } else {
      ObjectIterator<Int2LongMap.Entry> iter = storage.entryIterator();
      while (iter.hasNext()) {
        saveLongLongColumn(col, iter.next().getIntKey() + indexOffset, rows, output);
      }
    }
  } else {
    LongLongVectorStorage storage = ((LongLongVector) vec).getStorage();
    if (saveContext.sortFirst()) {
      long[] indices = storage.getIndices();
      Sort.quickSort(indices, 0, indices.length - 1);
      for (int i = 0; i < indices.length; i++) {
        saveLongLongColumn(col, indices[i] + indexOffset, rows, output);
      }
    } else {
      ObjectIterator<Long2LongMap.Entry> iter = storage.entryIterator();
      while (iter.hasNext()) {
        saveLongLongColumn(col, iter.next().getLongKey() + indexOffset, rows, output);
      }
    }
  }
}

/** Sets the column id on {@code col}, fills it with that column's value from every row, and saves it. */
private void saveLongLongColumn(LongLongsCol col, long colId, ServerRow[] rows, DataOutputStream output) throws IOException {
  col.colId = colId;
  for (int j = 0; j < rows.length; j++) {
    col.colElems[j] = ((ServerLongLongRow) (rows[j])).get(col.colId);
  }
  save(col, output);
}
use of com.tencent.angel.ml.math2.storage.LongLongVectorStorage in project angel by Tencent.
the class MixedBinaryInAllExecutor method apply.
/**
 * Applies {@code op} between every element of the composite vector {@code v1} and the matching
 * element of the dummy vector {@code v2}, then installs the resulting partitions on {@code v1}.
 *
 * <p>Every index in {@code [0, v1.getDim())} is visited; global index {@code i} maps to partition
 * {@code i / subDim} and offset {@code i % subDim}, where {@code subDim} is the dimension divided
 * by the partition count, rounded up.
 *
 * @param v1 composite vector; its partitions are replaced and it is returned
 * @param v2 right operand, read through {@code v2.get(i)}
 * @param op operator to apply; when {@code op.isKeepStorage()} is false, partitions held in
 *           sorted storage get a sparse result storage built from their indices and values
 * @return {@code v1}, after its partitions have been replaced
 */
private static Vector apply(CompLongLongVector v1, LongDummyVector v2, Binary op) {
  LongLongVector[] parts = v1.getPartitions();
  Storage[] resParts = StorageSwitch.applyComp(v1, v2, op);
  if (!op.isKeepStorage()) {
    for (int p = 0; p < parts.length; p++) {
      if (parts[p].getStorage() instanceof LongLongSortedVectorStorage) {
        resParts[p] = new LongLongSparseVectorStorage(parts[p].getDim(), parts[p].getStorage().getIndices(), parts[p].getStorage().getValues());
      }
    }
  }
  long dim = v1.getDim();
  long subDim = (dim + v1.getNumPartitions() - 1) / v1.getNumPartitions();
  // The counter is a long: an int counter would overflow before reaching a dimension above
  // Integer.MAX_VALUE and the loop would never terminate correctly.
  for (long i = 0; i < dim; i++) {
    int pidx = (int) (i / subDim);
    long subidx = i % subDim;
    ((LongLongVectorStorage) resParts[pidx]).set(subidx, op.apply(parts[pidx].get(subidx), v2.get(i)));
  }
  // Wrap each result storage in a vector that keeps the original partition's metadata.
  LongLongVector[] res = new LongLongVector[parts.length];
  for (int p = 0; p < parts.length; p++) {
    LongLongVector part = parts[p];
    res[p] = new LongLongVector(part.getMatrixId(), part.getRowId(), part.getClock(), part.getDim(), (LongLongVectorStorage) resParts[p]);
  }
  v1.setPartitions(res);
  return v1;
}
Aggregations