use of org.apache.hadoop.hive.serde2.objectinspector.PrimitiveObjectInspector.PrimitiveCategory in project hive by apache.
the class VectorUDFDateDiffColCol method toDateArray.
private LongColumnVector toDateArray(VectorizedRowBatch batch, TypeInfo typeInfo, ColumnVector inputColVector, LongColumnVector dateVector) {
PrimitiveCategory primitiveCategory = ((PrimitiveTypeInfo) typeInfo).getPrimitiveCategory();
int size = batch.size;
if (primitiveCategory == PrimitiveCategory.DATE) {
return (LongColumnVector) inputColVector;
}
if (size > dateVector.vector.length) {
if (dateVector1 == dateVector) {
dateVector1 = new LongColumnVector(size * 2);
dateVector = dateVector1;
} else {
dateVector2 = new LongColumnVector(size * 2);
dateVector = dateVector2;
}
}
switch(primitiveCategory) {
case TIMESTAMP:
TimestampColumnVector tcv = (TimestampColumnVector) inputColVector;
copySelected(tcv, batch.selectedInUse, batch.selected, batch.size, dateVector);
return dateVector;
case STRING:
case CHAR:
case VARCHAR:
BytesColumnVector bcv = (BytesColumnVector) inputColVector;
copySelected(bcv, batch.selectedInUse, batch.selected, batch.size, dateVector);
return dateVector;
default:
throw new Error("Unsupported input type " + primitiveCategory.name());
}
}
use of org.apache.hadoop.hive.serde2.objectinspector.PrimitiveObjectInspector.PrimitiveCategory in project hive by apache.
the class VectorUDFDateDiffScalarCol method evaluate.
@Override
public void evaluate(VectorizedRowBatch batch) {
if (childExpressions != null) {
super.evaluateChildren(batch);
}
LongColumnVector outputColVector = (LongColumnVector) batch.cols[outputColumnNum];
ColumnVector inputCol = batch.cols[this.colNum];
/* every line below this is identical for evaluateLong & evaluateString */
final int n = inputCol.isRepeating ? 1 : batch.size;
int[] sel = batch.selected;
final boolean selectedInUse = (inputCol.isRepeating == false) && batch.selectedInUse;
boolean[] outputIsNull = outputColVector.isNull;
if (batch.size == 0) {
/* n != batch.size when isRepeating */
return;
}
// We do not need to do a column reset since we are carefully changing the output.
outputColVector.isRepeating = false;
PrimitiveCategory primitiveCategory0 = ((PrimitiveTypeInfo) inputTypeInfos[0]).getPrimitiveCategory();
switch(primitiveCategory0) {
case DATE:
baseDate = (int) longValue;
break;
case TIMESTAMP:
date.setTime(timestampValue.getTime());
baseDate = DateWritable.dateToDays(date);
break;
case STRING:
case CHAR:
case VARCHAR:
try {
date.setTime(formatter.parse(new String(stringValue, "UTF-8")).getTime());
baseDate = DateWritable.dateToDays(date);
break;
} catch (Exception e) {
outputColVector.noNulls = false;
if (selectedInUse) {
for (int j = 0; j < n; j++) {
int i = sel[j];
outputColVector.isNull[i] = true;
}
} else {
for (int i = 0; i < n; i++) {
outputColVector.isNull[i] = true;
}
}
return;
}
default:
throw new Error("Unsupported input type " + primitiveCategory0.name());
}
PrimitiveCategory primitiveCategory1 = ((PrimitiveTypeInfo) inputTypeInfos[1]).getPrimitiveCategory();
switch(primitiveCategory1) {
case DATE:
if (inputCol.isRepeating) {
if (inputCol.noNulls || !inputCol.isNull[0]) {
outputColVector.isNull[0] = false;
outputColVector.vector[0] = evaluateDate(inputCol, 0);
} else {
outputColVector.isNull[0] = true;
outputColVector.noNulls = false;
}
outputColVector.isRepeating = true;
} else if (inputCol.noNulls) {
if (batch.selectedInUse) {
if (!outputColVector.noNulls) {
for (int j = 0; j != n; j++) {
final int i = sel[j];
// Set isNull before call in case it changes it mind.
outputIsNull[i] = false;
outputColVector.vector[i] = evaluateDate(inputCol, i);
}
} else {
for (int j = 0; j != n; j++) {
final int i = sel[j];
outputColVector.vector[i] = evaluateDate(inputCol, i);
}
}
} else {
if (!outputColVector.noNulls) {
// Assume it is almost always a performance win to fill all of isNull so we can
// safely reset noNulls.
Arrays.fill(outputIsNull, false);
outputColVector.noNulls = true;
}
for (int i = 0; i != n; i++) {
outputColVector.vector[i] = evaluateDate(inputCol, i);
}
}
} else /* there are NULLs in the inputColVector */
{
// Carefully handle NULLs..
// Handle case with nulls. Don't do function if the value is null, to save time,
// because calling the function can be expensive.
outputColVector.noNulls = false;
if (selectedInUse) {
for (int j = 0; j < n; j++) {
int i = sel[j];
outputColVector.isNull[i] = inputCol.isNull[i];
if (!inputCol.isNull[i]) {
outputColVector.vector[i] = evaluateDate(inputCol, i);
}
}
} else {
for (int i = 0; i < n; i++) {
outputColVector.isNull[i] = inputCol.isNull[i];
if (!inputCol.isNull[i]) {
outputColVector.vector[i] = evaluateDate(inputCol, i);
}
}
}
}
break;
case TIMESTAMP:
if (inputCol.isRepeating) {
if (inputCol.noNulls || !inputCol.isNull[0]) {
outputColVector.isNull[0] = false;
outputColVector.vector[0] = evaluateTimestamp(inputCol, 0);
} else {
outputColVector.isNull[0] = true;
outputColVector.noNulls = false;
}
outputColVector.isRepeating = true;
} else if (inputCol.noNulls) {
if (batch.selectedInUse) {
if (!outputColVector.noNulls) {
for (int j = 0; j != n; j++) {
final int i = sel[j];
// Set isNull before call in case it changes it mind.
outputIsNull[i] = false;
outputColVector.vector[i] = evaluateTimestamp(inputCol, i);
}
} else {
for (int j = 0; j != n; j++) {
final int i = sel[j];
outputColVector.vector[i] = evaluateTimestamp(inputCol, i);
}
}
} else {
if (!outputColVector.noNulls) {
// Assume it is almost always a performance win to fill all of isNull so we can
// safely reset noNulls.
Arrays.fill(outputIsNull, false);
outputColVector.noNulls = true;
}
for (int i = 0; i != n; i++) {
outputColVector.vector[i] = evaluateTimestamp(inputCol, i);
}
}
} else /* there are nulls in the inputColVector */
{
// Carefully handle NULLs..
// Handle case with nulls. Don't do function if the value is null, to save time,
// because calling the function can be expensive.
outputColVector.noNulls = false;
if (selectedInUse) {
for (int j = 0; j < n; j++) {
int i = sel[j];
outputColVector.isNull[i] = inputCol.isNull[i];
if (!inputCol.isNull[i]) {
outputColVector.vector[i] = evaluateTimestamp(inputCol, i);
}
}
} else {
for (int i = 0; i < n; i++) {
outputColVector.isNull[i] = inputCol.isNull[i];
if (!inputCol.isNull[i]) {
outputColVector.vector[i] = evaluateTimestamp(inputCol, i);
}
}
}
}
break;
case STRING:
case CHAR:
case VARCHAR:
if (inputCol.isRepeating) {
if (inputCol.noNulls || !inputCol.isNull[0]) {
outputColVector.isNull[0] = false;
evaluateString(inputCol, outputColVector, 0);
} else {
outputColVector.isNull[0] = true;
outputColVector.noNulls = false;
}
outputColVector.isRepeating = true;
} else if (inputCol.noNulls) {
if (batch.selectedInUse) {
if (!outputColVector.noNulls) {
for (int j = 0; j != n; j++) {
final int i = sel[j];
// Set isNull before call in case it changes it mind.
outputIsNull[i] = false;
evaluateString(inputCol, outputColVector, i);
}
} else {
for (int j = 0; j != n; j++) {
final int i = sel[j];
evaluateString(inputCol, outputColVector, i);
}
}
} else {
if (!outputColVector.noNulls) {
// Assume it is almost always a performance win to fill all of isNull so we can
// safely reset noNulls.
Arrays.fill(outputIsNull, false);
outputColVector.noNulls = true;
}
for (int i = 0; i != n; i++) {
evaluateString(inputCol, outputColVector, i);
}
}
} else /* there are nulls in the inputColVector */
{
// Carefully handle NULLs..
// Handle case with nulls. Don't do function if the value is null, to save time,
// because calling the function can be expensive.
outputColVector.noNulls = false;
if (selectedInUse) {
for (int j = 0; j < n; j++) {
int i = sel[j];
outputColVector.isNull[i] = inputCol.isNull[i];
if (!inputCol.isNull[i]) {
evaluateString(inputCol, outputColVector, i);
}
}
} else {
for (int i = 0; i < n; i++) {
outputColVector.isNull[i] = inputCol.isNull[i];
if (!inputCol.isNull[i]) {
evaluateString(inputCol, outputColVector, i);
}
}
}
}
break;
default:
throw new Error("Unsupported input type " + primitiveCategory1.name());
}
}
use of org.apache.hadoop.hive.serde2.objectinspector.PrimitiveObjectInspector.PrimitiveCategory in project hive by apache.
the class CastLongToDate method evaluate.
@Override
public void evaluate(VectorizedRowBatch batch) {
if (childExpressions != null) {
super.evaluateChildren(batch);
}
LongColumnVector inV = (LongColumnVector) batch.cols[inputColumn];
int[] sel = batch.selected;
int n = batch.size;
LongColumnVector outV = (LongColumnVector) batch.cols[outputColumnNum];
if (n == 0) {
// Nothing to do
return;
}
PrimitiveCategory primitiveCategory = ((PrimitiveTypeInfo) inputTypeInfos[0]).getPrimitiveCategory();
switch(primitiveCategory) {
case DATE:
inV.copySelected(batch.selectedInUse, batch.selected, batch.size, outV);
break;
default:
throw new Error("Unsupported input type " + primitiveCategory.name());
}
}
use of org.apache.hadoop.hive.serde2.objectinspector.PrimitiveObjectInspector.PrimitiveCategory in project hive by apache.
the class TestVectorGenericDateExpressions method testDateSubColScalar.
@Test
public void testDateSubColScalar() throws HiveException {
for (PrimitiveCategory colType1 : dateTimestampStringTypes) testDateAddColScalar(colType1, false);
VectorExpression udf = new VectorUDFDateSubColScalar(0, 0, 1);
udf.setInputTypeInfos(new TypeInfo[] { TypeInfoFactory.stringTypeInfo, TypeInfoFactory.timestampTypeInfo });
udf.transientInit();
VectorizedRowBatch batch = new VectorizedRowBatch(2, 1);
batch.cols[0] = new BytesColumnVector(1);
batch.cols[1] = new LongColumnVector(1);
BytesColumnVector bcv = (BytesColumnVector) batch.cols[0];
byte[] bytes = "error".getBytes(utf8);
bcv.vector[0] = bytes;
bcv.start[0] = 0;
bcv.length[0] = bytes.length;
udf.evaluate(batch);
Assert.assertEquals(batch.cols[1].isNull[0], true);
}
use of org.apache.hadoop.hive.serde2.objectinspector.PrimitiveObjectInspector.PrimitiveCategory in project hive by apache.
the class TestVectorGenericDateExpressions method testDateSubScalarCol.
@Test
public void testDateSubScalarCol() throws HiveException {
for (PrimitiveCategory scalarType1 : dateTimestampStringTypes) testDateAddScalarCol(scalarType1, false);
VectorExpression udf = new VectorUDFDateSubScalarCol("error".getBytes(utf8), 0, 1);
udf.setInputTypeInfos(new TypeInfo[] { TypeInfoFactory.stringTypeInfo, TypeInfoFactory.timestampTypeInfo });
udf.transientInit();
VectorizedRowBatch batch = new VectorizedRowBatch(2, 1);
batch.cols[0] = new LongColumnVector(1);
batch.cols[1] = new LongColumnVector(1);
udf.evaluate(batch);
Assert.assertEquals(batch.cols[1].isNull[0], true);
}
Aggregations