use of com.yahoo.document.annotation.SpanList in project vespa by vespa-engine.
the class StringTestCase method annotate.
public Document annotate(Document document, DocumentTypeManager manager) {
AnnotationTypeRegistry registry = manager.getAnnotationTypeRegistry();
AnnotationType company = registry.getType("company");
AnnotationType industry = registry.getType("industry");
AnnotationType person = registry.getType("person");
AnnotationType location = registry.getType("location");
Map<String, AnnotationType> m = registry.getTypes();
for (String key : m.keySet()) {
System.out.println("Key: " + key);
AnnotationType val = m.get(key);
parseAnnotationType(val);
}
SpanTree tree = new SpanTree("testannotations");
SpanList root = (SpanList) tree.getRoot();
SpanNode companySpan = new Span(0, 5);
SpanNode industrySpan = new Span(5, 10);
SpanNode personSpan = new Span(10, 15);
SpanNode locationSpan = new Span(15, 20);
root.add(companySpan);
root.add(industrySpan);
root.add(personSpan);
root.add(locationSpan);
Struct companyValue = (Struct) company.getDataType().createFieldValue();
companyValue.setFieldValue("name", new StringFieldValue("Sun"));
companyValue.setFieldValue("ceo", new StringFieldValue("Scott Mcnealy"));
companyValue.setFieldValue("lat", new DoubleFieldValue(37.7));
companyValue.setFieldValue("lon", new DoubleFieldValue(-122.44));
companyValue.setFieldValue("vertical", new StringFieldValue("software"));
Annotation compAn = new Annotation(company, companyValue);
tree.annotate(companySpan, compAn);
Struct personValue = new Struct(manager.getDataType("annotation.person"));
personValue.setFieldValue("name", new StringFieldValue("Richard Bair"));
Annotation personAn = new Annotation(person, personValue);
tree.annotate(personSpan, personAn);
Struct locValue = new Struct(manager.getDataType("annotation.location"));
locValue.setFieldValue("name", new StringFieldValue("Prinsens Gate"));
Annotation loc = new Annotation(location, locValue);
tree.annotate(locationSpan, loc);
Struct locValue2 = new Struct(manager.getDataType("annotation.location"));
locValue2.setFieldValue("name", new StringFieldValue("Kongens Gate"));
Annotation locAn = new Annotation(location, locValue2);
tree.annotate(locationSpan, locAn);
SpanList branch = new SpanList();
SpanNode span1 = new Span(0, 3);
SpanNode span2 = new Span(1, 9);
SpanNode span3 = new Span(12, 10);
branch.add(span1);
branch.add(span3);
branch.add(span2);
Struct industryValue = new Struct(manager.getDataType("annotation.industry"));
industryValue.setFieldValue("vertical", new StringFieldValue("Manufacturing"));
Annotation ind = new Annotation(industry, industryValue);
tree.annotate(span1, ind);
Struct pValue = new Struct(manager.getDataType("annotation.person"));
pValue.setFieldValue("name", new StringFieldValue("Praveen Mohan"));
Annotation pAn = new Annotation(person, pValue);
tree.annotate(span2, pAn);
Struct lValue = new Struct(manager.getDataType("annotation.location"));
lValue.setFieldValue("name", new StringFieldValue("Embassy Golf Links"));
Annotation locn = new Annotation(location, lValue);
tree.annotate(span3, locn);
Struct cValue = (Struct) company.getDataType().createFieldValue();
cValue.setFieldValue("name", new StringFieldValue("Yahoo"));
cValue.setFieldValue("ceo", new StringFieldValue("Carol Bartz"));
cValue.setFieldValue("lat", new DoubleFieldValue(127.7));
cValue.setFieldValue("lon", new DoubleFieldValue(-42.44));
cValue.setFieldValue("vertical", new StringFieldValue("search"));
Annotation cAn = new Annotation(company, cValue);
tree.annotate(branch, cAn);
Struct pVal = new Struct(manager.getDataType("annotation.person"));
pVal.setFieldValue("name", new StringFieldValue("Kim Omar"));
Annotation an = new Annotation(person, pVal);
tree.annotate(root, an);
root.add(branch);
StringFieldValue body = (StringFieldValue) document.getFieldValue(document.getDataType().getField("body"));
root.remove(branch);
tree.cleanup();
System.out.println("No. Of Annotations: " + tree.numAnnotations());
body.setSpanTree(tree);
document.setFieldValue(document.getField("body"), body);
return document;
}
use of com.yahoo.document.annotation.SpanList in project vespa by vespa-engine.
the class StringTestCase method consumeAnnotations.
public void consumeAnnotations(SpanTree tree, SpanList root) {
System.out.println("\n\nSpanList: " + root + " num Children: " + root.numChildren());
System.out.println("-------------------");
Iterator<SpanNode> childIterator = root.childIterator();
while (childIterator.hasNext()) {
SpanNode node = childIterator.next();
// + " Span Text: " + node.getText(fieldValStr));
System.out.println("Span Node: " + node);
if (node instanceof SpanList) {
System.out.println("Encountered another span list");
SpanList spl = (SpanList) node;
ListIterator<SpanNode> lli = spl.childIterator();
while (lli.hasNext()) {
System.out.print(" " + lli.next() + " ");
}
consumeAnnotations(tree, (SpanList) node);
} else {
System.out.println("\nGetting annotations for this span node: " + node);
getAnnotationsForNode(tree, node);
}
}
System.out.println("\nGetting annotations for the SpanList itself : " + root);
getAnnotationsForNode(tree, root);
}
use of com.yahoo.document.annotation.SpanList in project vespa by vespa-engine.
the class StringTestCase method testNestedSpanTreeBug4187377.
@Test
public void testNestedSpanTreeBug4187377() {
AnnotationType type = new AnnotationType("ann", DataType.STRING);
StringFieldValue outerString = new StringFieldValue("Ballooo");
SpanTree outerTree = new SpanTree("outer");
outerString.setSpanTree(outerTree);
SpanList outerRoot = (SpanList) outerTree.getRoot();
Span outerSpan = new Span(0, 1);
outerRoot.add(outerSpan);
StringFieldValue innerString = new StringFieldValue("innerBalloooo");
outerTree.annotate(outerSpan, new Annotation(type, innerString));
SpanTree innerTree = new SpanTree("inner");
innerString.setSpanTree(innerTree);
SpanList innerRoot = (SpanList) innerTree.getRoot();
Span innerSpan = new Span(0, 1);
innerRoot.add(innerSpan);
innerTree.annotate(innerSpan, new Annotation(type));
GrowableByteBuffer buffer = new GrowableByteBuffer(1024);
DocumentSerializer serializer = DocumentSerializerFactory.create42(buffer);
try {
serializer.write(null, outerString);
fail("Should have failed, nested span trees are not supported.");
} catch (SerializationException se) {
// OK!
}
}
use of com.yahoo.document.annotation.SpanList in project vespa by vespa-engine.
the class VespaDocumentDeserializer42 method readSpanNode.
private SpanNode readSpanNode() {
byte type = buf.get();
buf.position(buf.position() - 1);
SpanNode retval;
if ((type & Span.ID) == Span.ID) {
retval = new Span();
if (spanNodes != null) {
spanNodes.add(retval);
}
read((Span) retval);
} else if ((type & SpanList.ID) == SpanList.ID) {
retval = new SpanList();
if (spanNodes != null) {
spanNodes.add(retval);
}
read((SpanList) retval);
} else if ((type & AlternateSpanList.ID) == AlternateSpanList.ID) {
retval = new AlternateSpanList();
if (spanNodes != null) {
spanNodes.add(retval);
}
read((AlternateSpanList) retval);
} else {
throw new DeserializationException("Cannot read SpanNode of type " + type);
}
return retval;
}
Aggregations