diff --git a/README.md b/README.md index 656af3a..7e7a795 100644 --- a/README.md +++ b/README.md @@ -39,7 +39,7 @@ Tesseract.js works with a ` + ``` After including your scripts, the `Tesseract` variable will be defined globally! diff --git a/docs/faq.md b/docs/faq.md index 1698ff3..ca1ddd7 100644 --- a/docs/faq.md +++ b/docs/faq.md @@ -24,7 +24,11 @@ const { TesseractWorker } = Tesseract; const worker = new TesseractWorker(); worker - .recognize('https://tesseract.projectnaptha.com/img/eng_bw.png') + .recognize('https://tesseract.projectnaptha.com/img/eng_bw.png', 'eng', { + tessedit_create_box: '1', + tessedit_create_unlv: '1', + tessedit_create_osd: '1', + }) .then((result) => { console.log(result.text); console.log(result.hocr); diff --git a/docs/local-installation.md b/docs/local-installation.md index 0bdcda4..bbe72c9 100644 --- a/docs/local-installation.md +++ b/docs/local-installation.md @@ -1,6 +1,6 @@ ## Local Installation -Check here for an example: https://github.com/jeromewu/tesseract.js-offline +Check here for examples: https://github.com/naptha/tesseract.js/blob/master/docs/examples.md In browser environment, `tesseract.js` simply provides the API layer. Internally, it opens a WebWorker to handle requests. That worker itself loads code from the Emscripten-built `tesseract.js-core` which itself is hosted on a CDN. Then it dynamically loads language files hosted on another CDN. @@ -10,7 +10,7 @@ In Node.js environment, the only path you may want to customize is languages/lan ```javascript const worker = Tesseract.TesseractWorker({ - workerPath: 'https://unpkg.com/tesseract.js@v2.0.0-alpha.8/dist/worker.min.js', + workerPath: 'https://unpkg.com/tesseract.js@v2.0.0-alpha.10/dist/worker.min.js', langPath: 'https://tessdata.projectnaptha.com/4.0.0', corePath: 'https://unpkg.com/tesseract.js-core@v2.0.0-beta.10/tesseract-core.wasm.js', }); @@ -23,6 +23,6 @@ A string specifying the location of the [worker.js](./dist/worker.min.js) file. 
A string specifying the location of the tesseract language files, with default value 'https://tessdata.projectnaptha.com/4.0.0'. Language file URLs are calculated according to the formula `langPath + langCode + '.traineddata.gz'`. ### corePath -A string specifying the location of the [tesseract.js-core library](https://github.com/naptha/tesseract.js-core), with default value 'https://unpkg.com/tesseract.js-core@v2.0.0-beta.8/tesseract-core.wasm.js' (fallback to tesseract-core.asm.js when WebAssembly is not available). +A string specifying the location of the [tesseract.js-core library](https://github.com/naptha/tesseract.js-core), with default value 'https://unpkg.com/tesseract.js-core@v2.0.0-beta.10/tesseract-core.wasm.js' (falls back to tesseract-core.asm.js when WebAssembly is not available). -Another WASM option is 'https://unpkg.com/tesseract.js-core@v2.0.0-beta.8/tesseract-core.js' which is a script that loads 'https://unpkg.com/tesseract.js-core@v2.0.0-beta.8/tesseract-core.wasm'. But it fails to fetch at this moment. +Another WASM option is 'https://unpkg.com/tesseract.js-core@v2.0.0-beta.10/tesseract-core.js', which is a script that loads 'https://unpkg.com/tesseract.js-core@v2.0.0-beta.10/tesseract-core.wasm'. However, it currently fails to fetch. diff --git a/package-lock.json b/package-lock.json index dd7e176..cc8485b 100644 --- a/package-lock.json +++ b/package-lock.json @@ -1,6 +1,6 @@ { "name": "tesseract.js", - "version": "2.0.0-alpha.9", + "version": "2.0.0-alpha.10", "lockfileVersion": 1, "requires": true, "dependencies": { diff --git a/package.json b/package.json index c6d3205..34ee08e 100644 --- a/package.json +++ b/package.json @@ -1,6 +1,6 @@ { "name": "tesseract.js", - "version": "2.0.0-alpha.9", + "version": "2.0.0-alpha.10", "description": "Pure Javascript Multilingual OCR", "main": "src/index.js", "scripts": {