Search in sources :

Example 16 with PDDocument

use of com.tom_roush.pdfbox.pdmodel.PDDocument in project PdfBox-Android by TomRoush.

the class TestFontEmbedding method testCIDFontType2VerticalSubsetProportional.

/**
 * Embed a proportional TTF as vertical CIDFontType2 with subsetting.
 *
 * @throws IOException
 */
@Test
public void testCIDFontType2VerticalSubsetProportional() throws IOException {
    String text = "「ABC」";
    String expectedExtractedtext = "「\nA\nB\nC\n」";
    File pdf = new File(OUT_DIR, "CIDFontType2VP.pdf");
    PDDocument document = new PDDocument();
    PDPage page = new PDPage(PDRectangle.A4);
    document.addPage(page);
    File ipafont = new File("target/fonts/ipagp00303", "ipagp.ttf");
    assumeTrue(ipafont.exists());
    PDType0Font vfont = PDType0Font.loadVertical(document, ipafont);
    PDPageContentStream contentStream = new PDPageContentStream(document, page);
    contentStream.beginText();
    contentStream.setFont(vfont, 20);
    contentStream.newLineAtOffset(50, 700);
    contentStream.showText(text);
    contentStream.endText();
    contentStream.close();
    // Check the font substitution
    byte[] encode = vfont.encode(text);
    int cid = ((encode[0] & 0xFF) << 8) + (encode[1] & 0xFF);
    // it's 12461 without substitution
    assertEquals(12607, cid);
    // Check the dictionaries
    COSDictionary fontDict = vfont.getCOSObject();
    assertEquals(COSName.IDENTITY_V, fontDict.getDictionaryObject(COSName.ENCODING));
    document.save(pdf);
    // Vertical metrics are fixed during subsetting, so do this after calling save()
    COSDictionary descFontDict = vfont.getDescendantFont().getCOSObject();
    COSArray dw2 = (COSArray) descFontDict.getDictionaryObject(COSName.DW2);
    // This font uses default values for DW2
    assertNull(dw2);
    // c [ w1_1y v_1x v_1y ... w1_ny v_nx v_ny ]
    COSArray w2 = (COSArray) descFontDict.getDictionaryObject(COSName.W2);
    assertEquals(2, w2.size());
    // Start CID
    assertEquals(12607, w2.getInt(0));
    COSArray metrics = (COSArray) w2.getObject(1);
    int i = 0;
    for (int n : new int[] { -570, 500, 450, -570, 500, 880 }) {
        assertEquals(n, metrics.getInt(i++));
    }
    document.close();
    // Check text extraction
    String extracted = getUnicodeText(pdf);
    assertEquals(expectedExtractedtext, extracted.replaceAll("\r", "").trim());
}
Also used : PDPage(com.tom_roush.pdfbox.pdmodel.PDPage) COSDictionary(com.tom_roush.pdfbox.cos.COSDictionary) COSArray(com.tom_roush.pdfbox.cos.COSArray) PDDocument(com.tom_roush.pdfbox.pdmodel.PDDocument) PDPageContentStream(com.tom_roush.pdfbox.pdmodel.PDPageContentStream) File(java.io.File) Test(org.junit.Test)

Example 17 with PDDocument

use of com.tom_roush.pdfbox.pdmodel.PDDocument in project PdfBox-Android by TomRoush.

the class TestFontEmbedding method testCIDFontType2VerticalSubsetMonospace.

/**
 * Embed a monospace TTF as vertical CIDFontType2 with subsetting.
 *
 * @throws IOException
 */
@Test
public void testCIDFontType2VerticalSubsetMonospace() throws IOException {
    String text = "「ABC」";
    String expectedExtractedtext = "「\nA\nB\nC\n」";
    File pdf = new File(OUT_DIR, "CIDFontType2VM.pdf");
    PDDocument document = new PDDocument();
    PDPage page = new PDPage(PDRectangle.A4);
    document.addPage(page);
    File ipafont = new File("target/fonts/ipag00303", "ipag.ttf");
    assumeTrue(ipafont.exists());
    PDType0Font vfont = PDType0Font.loadVertical(document, ipafont);
    PDPageContentStream contentStream = new PDPageContentStream(document, page);
    contentStream.beginText();
    contentStream.setFont(vfont, 20);
    contentStream.newLineAtOffset(50, 700);
    contentStream.showText(text);
    contentStream.endText();
    contentStream.close();
    // Check the font substitution
    byte[] encode = vfont.encode(text);
    int cid = ((encode[0] & 0xFF) << 8) + (encode[1] & 0xFF);
    // it's 441 without substitution
    assertEquals(7392, cid);
    // Check the dictionaries
    COSDictionary fontDict = vfont.getCOSObject();
    assertEquals(COSName.IDENTITY_V, fontDict.getDictionaryObject(COSName.ENCODING));
    document.save(pdf);
    // Vertical metrics are fixed during subsetting, so do this after calling save()
    COSDictionary descFontDict = vfont.getDescendantFont().getCOSObject();
    COSArray dw2 = (COSArray) descFontDict.getDictionaryObject(COSName.DW2);
    // This font uses default values for DW2
    assertNull(dw2);
    COSArray w2 = (COSArray) descFontDict.getDictionaryObject(COSName.W2);
    // Monospaced font has no entries
    assertEquals(0, w2.size());
    document.close();
    // Check text extraction
    String extracted = getUnicodeText(pdf);
    assertEquals(expectedExtractedtext, extracted.replaceAll("\r", "").trim());
}
Also used : PDPage(com.tom_roush.pdfbox.pdmodel.PDPage) COSDictionary(com.tom_roush.pdfbox.cos.COSDictionary) COSArray(com.tom_roush.pdfbox.cos.COSArray) PDDocument(com.tom_roush.pdfbox.pdmodel.PDDocument) PDPageContentStream(com.tom_roush.pdfbox.pdmodel.PDPageContentStream) File(java.io.File) Test(org.junit.Test)

Example 18 with PDDocument

use of com.tom_roush.pdfbox.pdmodel.PDDocument in project PdfBox-Android by TomRoush.

the class TestFontEmbedding method getUnicodeText.

private String getUnicodeText(File file) throws IOException {
    PDDocument document = PDDocument.load(file);
    PDFTextStripper stripper = new PDFTextStripper();
    return stripper.getText(document);
}
Also used : PDDocument(com.tom_roush.pdfbox.pdmodel.PDDocument) PDFTextStripper(com.tom_roush.pdfbox.text.PDFTextStripper)

Example 19 with PDDocument

use of com.tom_roush.pdfbox.pdmodel.PDDocument in project PdfBox-Android by TomRoush.

the class TestFontEmbedding method validateCIDFontType2.

private void validateCIDFontType2(boolean useSubset) throws Exception {
    PDDocument document = new PDDocument();
    PDPage page = new PDPage(PDRectangle.A4);
    document.addPage(page);
    InputStream input = PDFont.class.getResourceAsStream("/com/tom_roush/pdfbox/resources/ttf/LiberationSans-Regular.ttf");
    PDType0Font font = PDType0Font.load(document, input, useSubset);
    PDPageContentStream stream = new PDPageContentStream(document, page);
    stream.beginText();
    stream.setFont(font, 12);
    String text = "Unicode русский язык Tiếng Việt";
    stream.newLineAtOffset(50, 600);
    stream.showText(text);
    stream.endText();
    stream.close();
    File file = new File(OUT_DIR, "CIDFontType2.pdf");
    document.save(file);
    document.close();
    // check that the extracted text matches what we wrote
    String extracted = getUnicodeText(file);
    assertEquals(text, extracted.trim());
}
Also used : PDPage(com.tom_roush.pdfbox.pdmodel.PDPage) InputStream(java.io.InputStream) PDDocument(com.tom_roush.pdfbox.pdmodel.PDDocument) PDPageContentStream(com.tom_roush.pdfbox.pdmodel.PDPageContentStream) File(java.io.File)

Example 20 with PDDocument

use of com.tom_roush.pdfbox.pdmodel.PDDocument in project PdfBox-Android by TomRoush.

the class PDTextFieldTest method setUp.

@Before
public void setUp() {
    document = new PDDocument();
    acroForm = new PDAcroForm(document);
}
Also used : PDDocument(com.tom_roush.pdfbox.pdmodel.PDDocument) Before(org.junit.Before)

Aggregations

PDDocument (com.tom_roush.pdfbox.pdmodel.PDDocument)137 File (java.io.File)80 Test (org.junit.Test)69 PDPage (com.tom_roush.pdfbox.pdmodel.PDPage)37 PDPageContentStream (com.tom_roush.pdfbox.pdmodel.PDPageContentStream)22 InputStream (java.io.InputStream)21 Bitmap (android.graphics.Bitmap)18 IOException (java.io.IOException)14 PDResources (com.tom_roush.pdfbox.pdmodel.PDResources)11 PDFRenderer (com.tom_roush.pdfbox.rendering.PDFRenderer)11 ArrayList (java.util.ArrayList)11 PDDocumentCatalog (com.tom_roush.pdfbox.pdmodel.PDDocumentCatalog)10 ByteArrayOutputStream (java.io.ByteArrayOutputStream)9 FileInputStream (java.io.FileInputStream)9 FileOutputStream (java.io.FileOutputStream)9 COSArray (com.tom_roush.pdfbox.cos.COSArray)8 PDEmbeddedFile (com.tom_roush.pdfbox.pdmodel.common.filespecification.PDEmbeddedFile)8 PDFont (com.tom_roush.pdfbox.pdmodel.font.PDFont)8 COSDictionary (com.tom_roush.pdfbox.cos.COSDictionary)7 Paint (android.graphics.Paint)6