Use OCR to identify page content

This commit is contained in:
Lei PAN
2023-05-19 21:00:38 +02:00
parent 7717a04b43
commit 076a5195b7
4 changed files with 81 additions and 20 deletions
+46
View File
@@ -0,0 +1,46 @@
const {v4: uuidv4} = require("uuid");
const tesseract = require("node-tesseract-ocr");
/**
 * Pause for a given amount of time.
 *
 * @param {number} delayInMs - How long to wait, in milliseconds.
 * @returns {Promise<number>} Promise that fulfills with the constant 2 once
 *   the timer fires.
 */
function delay(delayInMs) {
  // setTimeout forwards its extra arguments to the callback, so the promise
  // settles with 2 after the timer elapses.
  return new Promise((settle) => setTimeout(settle, delayInMs, 2));
}
// Options handed to tesseract.recognize() for every screenshot.
// Per the Tesseract CLI docs, oem selects the OCR engine mode and psm the
// page segmentation mode; lang is the recognition language.
const config = {lang: "eng", oem: 1, psm: 3};
/**
 * Captures a screenshot through a device handle and runs OCR on it.
 */
class OCRChecker {
  /**
   * @param {object} device - Object exposing an async `screenshot({path})`
   *   method (presumably a browser/page automation handle; confirm with caller).
   * @param {object} contact - Object whose `passportNumber` is used as the
   *   screenshot file-name prefix.
   */
  constructor(device, contact) {
    this.device = device;
    this.contact = contact;
  }

  /**
   * Build a unique PNG file name of the form `<passportNumber>_<uuid>.png`.
   *
   * @returns {string} A fresh file name; a new UUID is generated per call.
   */
  get_file_name() {
    const uuid = uuidv4();
    return `${this.contact.passportNumber}_${uuid}.png`;
  }

  /**
   * Take a screenshot, run Tesseract OCR on it and log the recognized text.
   *
   * @returns {Promise<string>} The value produced by `tesseract.recognize`
   *   (previously this was only logged and never handed back to the caller).
   */
  async get_result() {
    const fileName = await this.take_screen_shot();
    const result = await tesseract.recognize(fileName, config);
    console.log(result);
    return result;
  }

  /**
   * Save a screenshot of the device under a freshly generated file name.
   *
   * @returns {Promise<string>} The path the screenshot was written to.
   */
  async take_screen_shot() {
    const name = this.get_file_name();
    await this.device.screenshot({path: name});
    // Fixed 1 s pause after the capture; presumably gives the file time to
    // be fully written before OCR reads it. TODO confirm it is still needed.
    await delay(1000);
    return name;
  }
}
// CommonJS export: the module's sole export is the OCRChecker class.
module.exports = OCRChecker