Search in sources :

Example 1 with TextStyleType

use of eu.transkribus.core.model.beans.pagecontent.TextStyleType in project TranskribusCore by Transkribus.

the class TextStyleTag method reset.

@Override
protected void reset(boolean withIndices) {
    super.reset(withIndices);
    ts = new TextStyleType();
}
Also used : TextStyleType(eu.transkribus.core.model.beans.pagecontent.TextStyleType)

Example 2 with TextStyleType

use of eu.transkribus.core.model.beans.pagecontent.TextStyleType in project TranskribusCore by Transkribus.

the class BeanCopyUtils method copyTextStyleType.

public static TextStyleType copyTextStyleType(TextStyleType style) {
    if (style == null)
        return null;
    TextStyleType copy = new TextStyleType();
    TextStyleTypeUtils.copyTextStyleTypeFields(style, copy);
    return copy;
}
Also used : TextStyleType(eu.transkribus.core.model.beans.pagecontent.TextStyleType)

Example 3 with TextStyleType

use of eu.transkribus.core.model.beans.pagecontent.TextStyleType in project TranskribusCore by Transkribus.

the class TextStyleTypeUtilsTest method testMergeEqualTextStyleTypeFields.

// @Test public void testTrue() {
// Assert.assertTrue("yeah!", true==true);
// }
@Test
public void testMergeEqualTextStyleTypeFields() {
    TextStyleType ts1 = new TextStyleType();
    ts1.setFontFamily("hello");
    TextStyleType ts2 = new TextStyleType();
    ts2.setBold(true);
    TextStyleType mergedTs = TextStyleTypeUtils.mergeEqualTextStyleTypeFields(ts1, ts2);
    TextStyleType mergedCheck = new TextStyleType();
    logger.debug("merged = " + mergedTs);
    Assert.assertTrue("merged should be empty", TextStyleTypeUtils.equalsInEffectiveValues(mergedCheck, mergedTs));
}
Also used : TextStyleType(eu.transkribus.core.model.beans.pagecontent.TextStyleType) Test(org.junit.Test)

Example 4 with TextStyleType

use of eu.transkribus.core.model.beans.pagecontent.TextStyleType in project TranskribusCore by Transkribus.

the class DocxBuilder method getFormattedTextForShapeElement.

private static void getFormattedTextForShapeElement(ITrpShapeType element, P p, MainDocumentPart mdp) throws Exception {
    ArrayList<R> listOfallRuns = new ArrayList<R>();
    String textStr = element.getUnicodeText();
    CustomTagList cl = element.getCustomTagList();
    if (textStr == null || cl == null)
        throw new IOException("Element has no text or custom tag list: " + element + ", class: " + element.getClass().getName());
    if (textStr.isEmpty()) {
        return;
    }
    boolean rtl = false;
    // from right to left
    if (Character.getDirectionality(textStr.charAt(0)) == Character.DIRECTIONALITY_RIGHT_TO_LEFT || Character.getDirectionality(textStr.charAt(0)) == Character.DIRECTIONALITY_RIGHT_TO_LEFT_ARABIC || Character.getDirectionality(textStr.charAt(0)) == Character.DIRECTIONALITY_RIGHT_TO_LEFT_EMBEDDING || Character.getDirectionality(textStr.charAt(0)) == Character.DIRECTIONALITY_RIGHT_TO_LEFT_OVERRIDE) {
        logger.debug("&&&&&&&& STRING IS RTL : ");
        deleteCharAtIndex(0, textStr);
        rtl = true;
    }
    // format according to tags:CustomTagList
    for (CustomTag nonIndexedTag : cl.getNonIndexedTags()) {
        // exchange chars with * if wished to be blackened
        if (doBlackening && nonIndexedTag.getTagName().equals(RegionTypeUtil.BLACKENING_REGION.toLowerCase())) {
            // logger.debug("nonindexed tag found ");
            textStr = ExportUtils.blackenString(nonIndexedTag, textStr);
        }
        /*
			 * for gap and comment: remember their position to find and add them to their corresponding 'run' later on 
			 * 
			 */
        if (nonIndexedTag.getTagName().equals("gap")) {
            GapTag gap = (GapTag) nonIndexedTag;
            gapList.put(nonIndexedTag.getOffset(), gap);
        }
    // unclear and comments can not be non-indexed
    // if (nonIndexedTag.getTagName().equals("comment")){
    // logger.debug("nonindexed comment tag found ");
    // CommentTag ct = (CommentTag) nonIndexedTag;
    // commentList.put(nonIndexedTag.getEnd()-1, ct.getComment());
    // }
    // if(nonIndexedTag.getTagName().equals("unclear")){
    // logger.debug("unclear tag found ");
    // unclearList.put(nonIndexedTag.getOffset(), nonIndexedTag.getOffset()+nonIndexedTag.getLength());
    // }
    }
    for (CustomTag indexedTag : cl.getIndexedTags()) {
        if (doBlackening && indexedTag.getTagName().equals(RegionTypeUtil.BLACKENING_REGION.toLowerCase())) {
            textStr = ExportUtils.blackenString(indexedTag, textStr);
        }
        /*
			 * find all gaps and store the offset
			 */
        if (indexedTag.getTagName().equals("gap")) {
            GapTag gap = (GapTag) indexedTag;
            gapList.put(indexedTag.getOffset(), gap);
        }
        if (indexedTag.getTagName().equals("comment")) {
            // logger.debug("indexed comment tag found at pos " + (indexedTag.getEnd()-1));
            CommentTag ct = (CommentTag) indexedTag;
            commentList.put(indexedTag.getEnd() - 1, ct.getComment());
        }
        // if(exportTags){
        if (markUnclearWords && indexedTag.getTagName().equals("unclear")) {
            // logger.debug("unclear tag found ");
            // logger.debug("unclear start is: " + indexedTag.getOffset());
            // logger.debug("unclear end is: " + (indexedTag.getEnd()-1));
            unclearList.put(indexedTag.getOffset(), indexedTag.getEnd() - 1);
        }
        if (expandAbbrevs && indexedTag.getTagName().equals("abbrev")) {
            logger.debug("abbrev tag found ");
            AbbrevTag at = (AbbrevTag) indexedTag;
            String expansion = at.getExpansion();
            // only add if an expansion was typed
            if (!expansion.equals("")) {
                expandAbbrevList.put(indexedTag.getEnd(), at.getExpansion());
            }
        }
        if (substituteAbbrevs && indexedTag.getTagName().equals("abbrev")) {
            // logger.debug("abbrev tag found ");
            AbbrevTag at = (AbbrevTag) indexedTag;
            String expansion = at.getExpansion();
            // key is the start of the abbrev
            if (!expansion.equals("")) {
                substituteAbbrevList.put(indexedTag.getOffset(), at);
            }
        }
        if (showSuppliedWithBrackets && indexedTag.getTagName().equals("supplied")) {
            // logger.debug("supplied tag found ");
            SuppliedTag at = (SuppliedTag) indexedTag;
            String text = at.getContainedText();
            // only add if an expansion was typed
            if (!text.equals("")) {
                showSuppliedList.put(indexedTag.getOffset(), text);
            }
        }
        if (ignoreSupplied && indexedTag.getTagName().equals("supplied")) {
            // logger.debug("supplied tag found ");
            SuppliedTag at = (SuppliedTag) indexedTag;
            String text = at.getContainedText();
            // only add if an expansion was typed
            if (!text.equals("")) {
                ignoreSuppliedList.put(indexedTag.getOffset(), text);
            }
        }
        // create index for all choosen tagnames
        if (exportTags && tagnames.contains(indexedTag.getTagName()) && !indexedTag.getTagName().equals("gap")) {
            // logger.debug("export tag as idx entry " + indexedTag.getOffset());
            addValuesToIdxList(idxList, indexedTag.getEnd(), indexedTag);
        }
    // }
    }
    List<TextStyleTag> textStylesTags = element.getTextStyleTags();
    // ArrayList<R> runs = new ArrayList<R>();
    boolean shapeEnded = false;
    for (int i = 0; i <= textStr.length(); ++i) {
        // use of abbrevIdx: this is necessary for the appearance at the end of a textline
        // otherwise the abbrev expansion would not appear at the end of a line because then the index i would be too small
        shapeEnded = (i + 1 >= textStr.length() ? true : false);
        /*
			 * is this case the abbrev gets totally replaced by its expansion
			 * so if the start of the abbrev was found the expansion is written and we can break the writing of the abbrev
			 */
        if (substituteAbbrevList.containsKey(i)) {
            String exp = substituteAbbrevList.get(i).getExpansion();
            if (rtl) {
                exp = reverseString(exp);
            }
            org.docx4j.wml.Text abbrevText = factory.createText();
            abbrevText.setValue(exp);
            org.docx4j.wml.R abbrevRun = factory.createR();
            // p.getContent().add(abbrevRun);
            abbrevRun.getContent().add(abbrevText);
            listOfallRuns.add(abbrevRun);
            // go to end of the abbreviation and proceed with remaining text
            i += substituteAbbrevList.get(i).getLength();
            shapeEnded = (i == textStr.length() ? true : false);
        }
        /*
			 * add expansion in brackets behind the abbrev		
			 * the abbrev list contains as key the end index of the abbrev	
			 */
        if (expandAbbrevList.containsKey(i)) {
            String exp = expandAbbrevList.get(i);
            if (rtl) {
                exp = reverseString(exp);
            }
            org.docx4j.wml.Text abbrevText = factory.createText();
            abbrevText.setValue("[" + exp + "]");
            org.docx4j.wml.R abbrevRun = factory.createR();
            // p.getContent().add(abbrevRun);
            abbrevRun.getContent().add(abbrevText);
            listOfallRuns.add(abbrevRun);
        }
        /*
			 * in this case the supplied tag is expanded either with or without brackets
			 * 
			 */
        if (showSuppliedList.containsKey(i)) {
            String exp = showSuppliedList.get(i);
            if (rtl) {
                exp = reverseString(exp);
            }
            org.docx4j.wml.Text suppliedText = factory.createText();
            suppliedText.setValue("[" + exp + "]");
            org.docx4j.wml.R suppliedRun = factory.createR();
            suppliedRun.getContent().add(suppliedText);
            listOfallRuns.add(suppliedRun);
            // supplied is handled now - so set i to the end of supplied
            i += showSuppliedList.get(i).length();
            shapeEnded = (i == textStr.length() ? true : false);
        }
        /*
			 * in this case the supplied tag gets ignored
			 * this means that index i must be incremented by the length of this supplied tag text
			 */
        if (ignoreSuppliedList.containsKey(i)) {
            i += ignoreSuppliedList.get(i).length();
            shapeEnded = (i == textStr.length() ? true : false);
        }
        /*
			 * gap is at this position
			 * hence create extra run with [...] as value and then go on
			 * of if suppied attribute is set handle supplied as set in the export settings
			 */
        if (gapList.containsKey(i)) {
            org.docx4j.wml.Text t = factory.createText();
            // if (!rtl)
            // t.setValue("[...] ");
            // else
            // t.setValue(" [...]");
            GapTag gt = gapList.get(i);
            String cta = (String) gt.getAttributeValue("supplied");
            // attribute supplied is set in the gap tag -> handle supplied as wanted
            if (cta != null && !cta.equals("")) {
                // may the gap with supplied attribute gets ignored
                if (!ignoreSupplied) {
                    if (showSuppliedWithBrackets) {
                        t.setValue("[" + cta + "]");
                    }
                // do not show supplied attribute by default!?
                // else{
                // t.setValue(cta);
                // }
                }
            } else // nothing supplied, so show [...] for the gap tag
            {
                t.setValue("[...]");
                t.setSpace("preserve");
            }
            org.docx4j.wml.R run = factory.createR();
            // p.getContent().add(run);
            run.getContent().add(t);
            listOfallRuns.add(run);
        }
        // begin of unclear word should be marked with [ and end with ]
        if (unclearList.containsKey(i)) {
            org.docx4j.wml.Text t = factory.createText();
            if (!rtl)
                t.setValue("[");
            else
                t.setValue("]");
            org.docx4j.wml.R run = factory.createR();
            // p.getContent().add(run);
            run.getContent().add(t);
            listOfallRuns.add(run);
        }
        /*
			 * if so we create an index entry for this text string in the docx
			 */
        if (idxList.containsKey(i)) {
            addIndexEntry(i, p, textStr, rtl);
        }
        String currText = "";
        if (i + 1 <= textStr.length()) {
            currText = textStr.substring(i, i + 1);
        // logger.debug("&&&&&&&& current single char : " + currText);
        }
        /*
			 * 2nd is (should be) soft hyphen with Unicode U+00AD
			 * First arg is not sign and was initially used for soft hyphen by Diggitexx
			 * need to be at the line end - otherwise 
			 * 
			 */
        if ((currText.equals("¬") || currText.equals("­") || currText.equals("-")) && !preserveLineBreaks && shapeEnded) {
            break;
        }
        org.docx4j.wml.Text t = factory.createText();
        t.setValue(currText);
        t.setSpace("preserve");
        org.docx4j.wml.R run = factory.createR();
        // p.getContent().add(run);
        run.getContent().add(t);
        listOfallRuns.add(run);
        // end of unclear tag
        if (unclearList.containsValue(i)) {
            org.docx4j.wml.Text unclearEnd = factory.createText();
            if (!rtl)
                unclearEnd.setValue("]");
            else
                unclearEnd.setValue("[");
            org.docx4j.wml.R unclearRun = factory.createR();
            // p.getContent().add(unclearRun);
            unclearRun.getContent().add(unclearEnd);
            listOfallRuns.add(unclearRun);
        }
        // the properties of this text section
        org.docx4j.wml.RPr rpr = factory.createRPr();
        /*
			 * format according to custom style tag - check for each char in the text if a special style should be set
			 */
        for (TextStyleTag styleTag : textStylesTags) {
            if (i >= styleTag.getOffset() && i < (styleTag.getOffset() + styleTag.getLength())) {
                org.docx4j.wml.BooleanDefaultTrue b = new org.docx4j.wml.BooleanDefaultTrue();
                b.setVal(true);
                TextStyleType ts = styleTag.getTextStyle();
                if (ts == null)
                    continue;
                if (CoreUtils.val(ts.isBold())) {
                    rpr.setB(b);
                }
                if (CoreUtils.val(ts.isItalic())) {
                    rpr.setI(b);
                }
                if (CoreUtils.val(ts.isLetterSpaced())) {
                // ????
                }
                if (CoreUtils.val(ts.isMonospace())) {
                // ????
                }
                if (CoreUtils.val(ts.isReverseVideo())) {
                // ????
                }
                if (CoreUtils.val(ts.isSerif())) {
                // ????
                }
                if (CoreUtils.val(ts.isSmallCaps())) {
                    rpr.setSmallCaps(b);
                }
                if (CoreUtils.val(ts.isStrikethrough())) {
                    rpr.setStrike(b);
                }
                if (CoreUtils.val(ts.isSubscript())) {
                    org.docx4j.wml.CTVerticalAlignRun al = factory.createCTVerticalAlignRun();
                    al.setVal(STVerticalAlignRun.SUBSCRIPT);
                    rpr.setVertAlign(al);
                }
                if (CoreUtils.val(ts.isSuperscript())) {
                    org.docx4j.wml.CTVerticalAlignRun al = factory.createCTVerticalAlignRun();
                    al.setVal(STVerticalAlignRun.SUPERSCRIPT);
                    rpr.setVertAlign(al);
                }
                if (CoreUtils.val(ts.isUnderlined())) {
                    U u = factory.createU();
                    u.setVal(UnderlineEnumeration.SINGLE);
                    rpr.setU(u);
                }
            // BooleanDefaultTrue bdt = Context.getWmlObjectFactory().createBooleanDefaultTrue();
            // bdt.setVal(Boolean.TRUE);
            // rpr.setRtl(bdt);
            // rpr.setHighlight(new Highlight());
            }
        }
        // at the run properties (= text styles) to the run
        run.setRPr(rpr);
        // find position of footnote/comment
        if (commentList.containsKey(i)) {
            // logger.debug("position of comment: " + i);
            // logger.debug("value of comment: " + commentList.get(i));
            // creates the footnote at the end of the wished text - this position was found at the beginning of this method
            org.docx4j.wml.R fnRun = factory.createR();
            // p.getContent().add(fnRun);
            createFootnote(commentList.get(i), fnRun, mdp);
            listOfallRuns.add(fnRun);
        }
        /*
			 * add space at end of line if line breaks are not preserved
			 */
        if (!preserveLineBreaks && shapeEnded) {
            org.docx4j.wml.Text space = factory.createText();
            space.setValue(" ");
            space.setSpace("preserve");
            org.docx4j.wml.R runSpace = factory.createR();
            // p.getContent().add(runSpace);
            runSpace.getContent().add(space);
            listOfallRuns.add(runSpace);
        }
    // runs.add(run);
    }
    if (rtl) {
        PPr paragraphProperties = factory.createPPr();
        Jc justification = factory.createJc();
        justification.setVal(JcEnumeration.RIGHT);
        paragraphProperties.setJc(justification);
        p.setPPr(paragraphProperties);
    }
    for (int i = listOfallRuns.size() - 1; i >= 0; i--) {
        if (rtl) {
            p.getContent().add(listOfallRuns.get(i));
        } else {
            p.getContent().addAll(listOfallRuns);
            break;
        }
    }
    clearAllLists();
}
Also used : ArrayList(java.util.ArrayList) CustomTag(eu.transkribus.core.model.beans.customtags.CustomTag) RPr(org.docx4j.wml.RPr) R(org.docx4j.wml.R) U(org.docx4j.wml.U) R(org.docx4j.wml.R) Jc(org.docx4j.wml.Jc) Text(org.docx4j.wml.Text) TextStyleType(eu.transkribus.core.model.beans.pagecontent.TextStyleType) SuppliedTag(eu.transkribus.core.model.beans.customtags.SuppliedTag) CustomTagList(eu.transkribus.core.model.beans.customtags.CustomTagList) IOException(java.io.IOException) CommentTag(eu.transkribus.core.model.beans.customtags.CommentTag) TextStyleTag(eu.transkribus.core.model.beans.customtags.TextStyleTag) PPr(org.docx4j.wml.PPr) GapTag(eu.transkribus.core.model.beans.customtags.GapTag) AbbrevTag(eu.transkribus.core.model.beans.customtags.AbbrevTag)

Example 5 with TextStyleType

use of eu.transkribus.core.model.beans.pagecontent.TextStyleType in project TranskribusCore by Transkribus.

the class TextStyleTag method mergeEqualAttributes.

@Override
public void mergeEqualAttributes(CustomTag src, boolean withIndices) {
    super.mergeEqualAttributes(src, withIndices);
    if (src instanceof TextStyleTag) {
        TextStyleTag tst = (TextStyleTag) src;
        TextStyleType mergedTs = TextStyleTypeUtils.mergeEqualTextStyleTypeFields(this.ts, tst.ts);
        this.ts = mergedTs;
    }
}
Also used : TextStyleType(eu.transkribus.core.model.beans.pagecontent.TextStyleType)

Aggregations

TextStyleType (eu.transkribus.core.model.beans.pagecontent.TextStyleType)5 AbbrevTag (eu.transkribus.core.model.beans.customtags.AbbrevTag)1 CommentTag (eu.transkribus.core.model.beans.customtags.CommentTag)1 CustomTag (eu.transkribus.core.model.beans.customtags.CustomTag)1 CustomTagList (eu.transkribus.core.model.beans.customtags.CustomTagList)1 GapTag (eu.transkribus.core.model.beans.customtags.GapTag)1 SuppliedTag (eu.transkribus.core.model.beans.customtags.SuppliedTag)1 TextStyleTag (eu.transkribus.core.model.beans.customtags.TextStyleTag)1 IOException (java.io.IOException)1 ArrayList (java.util.ArrayList)1 Jc (org.docx4j.wml.Jc)1 PPr (org.docx4j.wml.PPr)1 R (org.docx4j.wml.R)1 RPr (org.docx4j.wml.RPr)1 Text (org.docx4j.wml.Text)1 U (org.docx4j.wml.U)1 Test (org.junit.Test)1