当前位置：首页 > ops >正文

纯前端实现图文识别 OCR

ops 2025/8/20 20:02:08

Tesseract.js

Tesseract.js 是一个基于 Google Tesseract OCR 引擎的 JavaScript 库，利用 WebAssembly 技术将的 OCR 引擎带到了浏览器中。它完全运行在客户端，无需依赖服务器，适合处理中小型图片的文字识别。

基本使用

以下示例展示了如何使用 Tesseract.js 从图片中提取文字：
在这里插入图片描述

demo

HTML单文件：

<!DOCTYPE html>
<html lang="en"><head><meta charset="UTF-8"><title>OCR 图文识别</title><!-- <script src="https://unpkg.com/tesseract.js@2.1.1/dist/tesseract.min.js"></script> --><script src="https://unpkg.com/tesseract.js@v2.1.0/dist/tesseract.min.js"></script></head><body><h1>OCR 图文识别</h1><input type="file" id="imageFile" accept="image/*" /><br /><button onclick="recognizeImg()">识别图像</button><br /><h2>识别结果：</h2><div id="result">???</div><script>const worker = Tesseract.createWorker({logger: function (m) {console.log(m);},});async function recognizeImg() {const fileInput = document.getElementById("imageFile");const selectedFile = fileInput.files[0];console.log(selectedFile);await worker.load();await worker.loadLanguage(["eng", "chi_sim"]);await worker.initialize(["eng", "chi_sim"]);const ret = await worker.recognize(selectedFile||'https://tesseract.projectnaptha.com/img/eng_bw.png');console.log(ret.data.text);handleOCRResponse(ret.data);// 或者使用 FileReader方式// handleFileFn(selectedFile);}function handleFileFn(file) {// 使用 FileReader 读取图像文件内容const reader = new FileReader();reader.onload = function (e) {const imageDataURL = e.target.result;// 上传图像文件至 OCR APIuploadImageToOCR(imageDataURL);};reader.readAsDataURL(file);}async function uploadImageToOCR(imageDataURL) {await worker.load();await worker.loadLanguage(["eng", "chi_sim"]);await worker.initialize(["eng", "chi_sim"]);const ret = await worker.recognize(imageDataURL);console.log(ret.data.text);if (ret.data) {handleOCRResponse(ret.data);}}function handleOCRResponse(data) {const resultDiv = document.getElementById("result");if (data && data.text) {resultDiv.textContent = data.text;} else {resultDiv.textContent = "未能识别文本。";}}</script></body>
</html>