// tesseract.js/src/common/options.js

const { OEM, PSM } = require('./types');

module.exports = {
  defaultOptions: {
    /*
     * default path for downloading *.traineddata, this URL basically
     * points to a github page, not using jsDelivr as there is is limitation
     * of 20 MB.
     */
    langPath: 'https://tessdata.projectnaptha.com/4.0.0',
  },
  /*
   * default params for recognize()
   */
  defaultParams: {
    tessedit_ocr_engine_mode: OEM.LSTM_ONLY,
    tessedit_pageseg_mode: PSM.SINGLE_BLOCK,
    tessedit_char_whiltelist: '',
    tessedit_create_pdf: '0',
    tessedit_create_hocr: '1',
    tessedit_create_tsv: '1',
    tessedit_create_box: '0',
    tessedit_create_unlv: '0',
    tessedit_create_osd: '0',
    textonly_pdf: '0',
    pdf_name: 'tesseract.js-ocr-result',
    pdf_title: 'Tesseract.js OCR Result',
    pdf_auto_download: true,
    pdf_bin: false,
  },
};
Add pdf output feature and rename oem params 6 years ago			`const { OEM, PSM } = require('./types');`

Minor refactor 7 years ago			`module.exports = {`
			`defaultOptions: {`
Add comments and remove unused files 6 years ago			`/*`
			`* default path for downloading *.traineddata, this URL basically`
			`* points to a github page, not using jsDelivr as there is is limitation`
			`* of 20 MB.`
			`*/`
Minor refactor 7 years ago			`langPath: 'https://tessdata.projectnaptha.com/4.0.0',`
			`},`
Add pdf output feature and rename oem params 6 years ago			`/*`
			`* default params for recognize()`
			`*/`
			`defaultParams: {`
Change default OCR engine mode to LSTM_ONLY 6 years ago			`tessedit_ocr_engine_mode: OEM.LSTM_ONLY,`
Add pdf output feature and rename oem params 6 years ago			`tessedit_pageseg_mode: PSM.SINGLE_BLOCK,`
			`tessedit_char_whiltelist: '',`
			`tessedit_create_pdf: '0',`
Make output of hocr, tsv, box, unlv, osd to be optional 6 years ago			`tessedit_create_hocr: '1',`
			`tessedit_create_tsv: '1',`
			`tessedit_create_box: '0',`
			`tessedit_create_unlv: '0',`
			`tessedit_create_osd: '0',`
Add pdf output feature and rename oem params 6 years ago			`textonly_pdf: '0',`
			`pdf_name: 'tesseract.js-ocr-result',`
			`pdf_title: 'Tesseract.js OCR Result',`
Update tesseract_parameters.md and export pdf bin data in result object 6 years ago			`pdf_auto_download: true,`
			`pdf_bin: false,`
Add pdf output feature and rename oem params 6 years ago			`},`
Minor refactor 7 years ago			`};`