Platform Explorer / Nuxeo Platform LTS 2017 9.10

Operation PDF.ExtractText (PDF: Extract Text)

Description

Extracts raw text from a PDF. If the PDF is encrypted, a password is required.
Operation id PDF.ExtractText
Category Document
Label PDF: Extract Text
Requires
Since

Parameters

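| Name | Description | Type | Required | Default value |
| --- | --- | --- | --- | --- |
| password | | string | no | |
| patterntofind | | string | no | |
| pdfxpath | | string | no | |
| removepatternfromresult | | boolean | no | |
| save | | boolean | no | |
| targetxpath | | string | no | |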

Signature

Inputs document, documents
Outputs document, documents

Implementation Information

JSON Definition

{
  "id" : "PDF.ExtractText",
  "label" : "PDF: Extract Text",
  "category" : "Document",
  "requires" : null,
  "description" : "Extracts raw text from a PDF. If the PDF is encrypted, a password is required.",
  "url" : "PDF.ExtractText",
  "signature" : [ "document", "document", "documents", "documents" ],
  "params" : [ {
    "name" : "password",
    "description" : null,
    "type" : "string",
    "required" : false,
    "widget" : null,
    "order" : 0,
    "values" : [ ]
  }, {
    "name" : "patterntofind",
    "description" : null,
    "type" : "string",
    "required" : false,
    "widget" : null,
    "order" : 0,
    "values" : [ ]
  }, {
    "name" : "pdfxpath",
    "description" : null,
    "type" : "string",
    "required" : false,
    "widget" : null,
    "order" : 0,
    "values" : [ ]
  }, {
    "name" : "removepatternfromresult",
    "description" : null,
    "type" : "boolean",
    "required" : false,
    "widget" : null,
    "order" : 0,
    "values" : [ ]
  }, {
    "name" : "save",
    "description" : null,
    "type" : "boolean",
    "required" : false,
    "widget" : null,
    "order" : 0,
    "values" : [ ]
  }, {
    "name" : "targetxpath",
    "description" : null,
    "type" : "string",
    "required" : false,
    "widget" : null,
    "order" : 0,
    "values" : [ ]
  } ]
}