public class DocumentSource
extends java.lang.Object
Modifier and Type | Field and Description |
---|---|
static int |
PDFTOXML_FILES_AMOUNT_LIMIT |
Modifier and Type | Method and Description |
---|---|
void |
close(boolean cleanImages,
boolean cleanAnnotations,
boolean cleanOutline) |
static void |
close(DocumentSource source,
boolean cleanImages,
boolean cleanAnnotations,
boolean cleanOutline) |
static DocumentSource |
fromPdf(java.io.File pdfFile) |
static DocumentSource |
fromPdf(java.io.File pdfFile,
int startPage,
int endPage)
By default, the XML extracted from the PDF does not include images (to avoid flooding the grobid-home/tmp directory),
but it does include the extra annotation file and the outline.
|
static DocumentSource |
fromPdf(java.io.File pdfFile,
int startPage,
int endPage,
boolean withImages,
boolean withAnnotations,
boolean withOutline) |
java.io.File |
getPdfFile() |
java.io.File |
getXmlFile() |
java.io.File |
pdf2xml(java.lang.Integer timeout,
boolean force,
int startPage,
int endPage,
java.io.File pdfPath,
java.io.File tmpPath,
boolean withImages,
boolean withAnnotations,
boolean withOutline)
Creates an XML representation of a PDF file.
|
void |
setPdfFile(java.io.File pdfFile) |
void |
setXmlFile(java.io.File xmlFile) |
public static final int PDFTOXML_FILES_AMOUNT_LIMIT
public static DocumentSource fromPdf(java.io.File pdfFile)
public static DocumentSource fromPdf(java.io.File pdfFile, int startPage, int endPage)
public static DocumentSource fromPdf(java.io.File pdfFile, int startPage, int endPage, boolean withImages, boolean withAnnotations, boolean withOutline)
public java.io.File pdf2xml(java.lang.Integer timeout, boolean force, int startPage, int endPage, java.io.File pdfPath, java.io.File tmpPath, boolean withImages, boolean withAnnotations, boolean withOutline)
public void close(boolean cleanImages, boolean cleanAnnotations, boolean cleanOutline)
public static void close(DocumentSource source, boolean cleanImages, boolean cleanAnnotations, boolean cleanOutline)
public java.io.File getPdfFile()
public void setPdfFile(java.io.File pdfFile)
public java.io.File getXmlFile()
public void setXmlFile(java.io.File xmlFile)