1.安装依赖的leptonica库
wget http://www.leptonica.org/source/leptonica-1.78.0.tar.gz
tar -xzvf leptonica-1.78.0.tar.gz
cd leptonica-1.78.0
./configure
make && make install
2.安装Tesseract-OCR
wget https://codeload.github.com/tesseract-ocr/tesseract/tar.gz/4.1.0
tar -xvf 4.1.0
cd tesseract-4.1.0/
./autogen.sh
./configure
make && make install
sudo ldconfig
3.安装openssl
// 下载
wget https://www.openssl.org/source/openssl-1.1.1g.tar.gz
// 安装
tar -zxvf openssl-1.1.1g.tar.gz
cd openssl-1.1.1g
# 如果此步骤报错,需要安装perl以及gcc包
./config --prefix=/usr/local/openssl
make && make install
mv /usr/bin/openssl /usr/bin/openssl.bak
ln -sf /usr/local/openssl/bin/openssl /usr/bin/openssl
echo "/usr/local/openssl/lib" >> /etc/ld.so.conf
# 设置生效
ldconfig -v
4.语言包
#获取所有语言包
git clone https://github.com/tesseract-ocr/tessdata.git
下载地址:https://github.com/tesseract-ocr/tessdata
wget --no-check-certificate https://github.com/tesseract-ocr/tessdata/raw/master/eng.traineddata
chi_sim.traineddata 中文
eng.traineddata 英文
enm.traineddata 数字
5.执行命令
sudo tesseract 444.jpg 444 -l chi_sim+eng --psm 7
centos7 python安装opencv图片处理+tesseract-ocr识别
python-3.10.13
pip 23.2.1
1.python安装opencv-python
pip3 install opencv-python
2.安装leptonica
安装依赖
yum install autoconf automake libtool libjpeg-devel libpng-devel libtiff-devel zlib-devel
cd /home
wget http://www.leptonica.org/source/leptonica-1.83.0.tar.gz
tar -zxvf leptonica-1.83.0.tar.gz
cd leptonica-1.83.0
./autogen.sh
mkdir /usr/local/leptonica
./configure --prefix=/usr/local/leptonica
make
make install
配置一下 leptonica 的环境变量
vi /etc/profile
文本最后添加
export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:/usr/local/leptonica/lib
export LIBLEPT_HEADERSDIR=/usr/local/leptonica/include
export PKG_CONFIG_PATH=/usr/local/leptonica/lib/pkgconfig
应用配置
source /etc/profile
3.安装 tesseract
异常处理 :Your compiler does not have the necessary C++17 support! Cannot proceed
升级gcc 版本
yum install -y centos-release-scl
yum install devtoolset-8-gcc*
mv /usr/bin/gcc /usr/bin/gcc-4.8.5
ln -s /opt/rh/devtoolset-8/root/bin/gcc /usr/bin/gcc
mv /usr/bin/g++ /usr/bin/g++-4.8.5
ln -s /opt/rh/devtoolset-8/root/bin/g++ /usr/bin/g++
gcc -v 查看版本
tesseract 下载地址:https://github.com/tesseract-ocr/tesseract/releases
wget https://codeload.github.com/tesseract-ocr/tesseract/tar.gz/refs/tags/5.3.2
tar -zxvf 5.3.2
cd tesseract-5.3.2
./autogen.sh
mkdir /usr/local/tesseract
./configure --prefix=/usr/local/tesseract
make && make install
ln -s /usr/local/tesseract/bin/tesseract /bin/tesseract
tesseract --version
下载字符集
下载地址:https://tesseract-ocr.github.io/tessdoc/Data-Files.html
下载好的字符放入目录:/usr/local/tesseract/share/tessdata
安装pytesseract
pip3 install pytesseract