API documentation for textract (v2.1.2)

Extracting text from files of various types, including html, pdf, doc, docx, xls, xlsx, csv, pptx, png, jpg, gif, rtf, text/*, and various OpenOffice formats.

table of contents

  1. module textract
    1. function textract.fromBufferWithMime ( type, bufferContent, options, cb, withPath )
    2. function textract.fromBufferWithName ( filePath, bufferContent, options, cb )
    3. function textract.fromFileWithMimeAndPath ( type, filePath, options, cb )
    4. function textract.fromFileWithPath ( filePath, options, cb )
    5. function textract.fromUrl ( url, options, cb )
    6. object textract.docx
    7. object textract.dxf
    8. object textract.html
    9. object textract.images
    10. object textract.md
    11. object textract.odt
    12. object textract.pdf
    13. object textract.ppt
    14. object textract.pptx
    15. object textract.rtf
    16. object textract.text
    17. object textract.util
    18. object textract.xls
  2. module textract.docx
    1. function textract.docx.extract ( filePath, options, cb )
    2. object textract.docx.types
  3. module textract.dxf
    1. function textract.dxf.extract ( filePath, options, cb )
    2. function textract.dxf.test ( options, cb )
    3. object textract.dxf.types
  4. module textract.html
    1. function textract.html.extract ( filePath, options, cb )
    2. function textract.html.extractFromText ( data, cb )
    3. object textract.html.types
  5. module textract.images
    1. function textract.images.extract ( filePath, options, cb )
    2. function textract.images.test ( options, cb )
    3. object textract.images.types
  6. module textract.md
    1. function textract.md.extract ( filePath, options, cb )
    2. object textract.md.types
  7. module textract.odt
    1. function textract.odt.extract ( filePath, options, cb )
    2. object textract.odt.types
  8. module textract.pdf
    1. function textract.pdf.extract ( filePath, options, cb )
    2. function textract.pdf.test ( options, cb )
    3. object textract.pdf.types
  9. module textract.ppt
    1. function textract.ppt.extract ( filePath, options, cb )
    2. object textract.ppt.types
  10. module textract.pptx
    1. function textract.pptx.extract ( filePath, options, cb )
    2. object textract.pptx.types
  11. module textract.rtf
    1. function textract.rtf.extract ( filePath, options, cb )
    2. function textract.rtf.test ( options, cb )
    3. object textract.rtf.types
  12. module textract.text
    1. function textract.text.extract ( filePath, options, cb )
    2. object textract.text.types
  13. module textract.util
    1. function textract.util.createExecOptions ( type, options )
    2. function textract.util.getTextFromZipFile ( zipfile, entry, cb )
    3. function textract.util.replaceBadCharacters ( text )
    4. function textract.util.runExecIntoFile ( label, filePath, options, execOptions, genCommand, cb )
    5. function textract.util.unzipCheck ( type, cb )
    6. function textract.util.yauzlError ( err, cb )
  14. module textract.xls
    1. function textract.xls.extract ( filePath, options, cb )
    2. object textract.xls.types

module textract

function textract.fromBufferWithMime ( type, bufferContent, options, cb, withPath )

function textract.fromBufferWithName ( filePath, bufferContent, options, cb )

function textract.fromFileWithMimeAndPath ( type, filePath, options, cb )

function textract.fromFileWithPath ( filePath, options, cb )

function textract.fromUrl ( url, options, cb )

module textract.docx

function textract.docx.extract ( filePath, options, cb )

module textract.dxf

function textract.dxf.extract ( filePath, options, cb )

function textract.dxf.test ( options, cb )

module textract.html

function textract.html.extract ( filePath, options, cb )

function textract.html.extractFromText ( data, cb )

module textract.images

function textract.images.extract ( filePath, options, cb )

function textract.images.test ( options, cb )

module textract.md

function textract.md.extract ( filePath, options, cb )

module textract.odt

function textract.odt.extract ( filePath, options, cb )

module textract.pdf

function textract.pdf.extract ( filePath, options, cb )

function textract.pdf.test ( options, cb )

module textract.ppt

function textract.ppt.extract ( filePath, options, cb )

module textract.pptx

function textract.pptx.extract ( filePath, options, cb )

module textract.rtf

function textract.rtf.extract ( filePath, options, cb )

function textract.rtf.test ( options, cb )

module textract.text

function textract.text.extract ( filePath, options, cb )

module textract.util

function textract.util.createExecOptions ( type, options )

function textract.util.getTextFromZipFile ( zipfile, entry, cb )

function textract.util.replaceBadCharacters ( text )

function textract.util.runExecIntoFile ( label, filePath, options, execOptions, genCommand, cb )

function textract.util.unzipCheck ( type, cb )

function textract.util.yauzlError ( err, cb )

module textract.xls

function textract.xls.extract ( filePath, options, cb )

[ this document was created with utility2 ]