-
大小: 44.3MB文件類型: .rar金幣: 1下載: 0 次發布日期: 2024-01-28
- 語言: C#
- 標簽: OCR  Tesseract  Tesseract-OCR
資源簡介
使用詳見我的博客:https://blog.csdn.net/HorseRoll/article/details/83310677
代碼片段和文件信息
using?System;
using?System.Collections.Generic;
using?System.ComponentModel;
using?System.Data;
using?System.Drawing;
using?System.Drawing.Drawing2D;
using?System.Drawing.Imaging;
using?System.Linq;
using?System.Text;
using?System.Threading.Tasks;
using?System.Windows.Forms;
using?Tesseract;
namespace?Tesseract_OCR識別
{
????public?partial?class?Form1?:?Form
????{
????????TesseractEngine?ocr;
????????public?Form1()
????????{
????????????InitializeComponent();
????????????//ocr?=?new?TesseractEngine(“./tessdata“?“eng“?EngineMode.TesseractAndCube);//設置語言???英文
????????????//ocr?=?new?TesseractEngine(“./tessdata“?“chi_sim“);//設置語言???中文
????????????ocr?=?new?TesseractEngine(“./tessdata“?“jpn“);//設置語言???日語
????????}
????????private?void?button1_Click(object?sender?EventArgs?e)
????????{
????????????OpenFileDialog?filename?=?new?OpenFileDialog();
????????????filename.Filter?=?“All?files(*.*)|*.*|image?files(*.bmp)|*.bmp;?*.jpg;?*.gif;?*.jpeg;*.png“;
????????????filename.FilterIndex?=?2;
????????????if?(filename.ShowDialog()?==?DialogResult.OK)
????????????{
????????????????Bitmap?bit?=?new?Bitmap(Image.FromFile(filename.FileName.ToString()));
????????????????//bit?=?PreprocesImage(bit);//進行圖像處理如果識別率低可試試
????????????????Page?page?=?ocr.Process(bit);
????????????????string?str?=?page.GetText();//識別后的內容
????????????????page.Dispose();
????????????????pictureBox1.Image?=?bit;
????????????????richTextBox1.AppendText(str);
????????????}
????????}
????????///?
????????///?圖片顏色區分,剩下白色和黑色
????????///?
????????///?
????????///?
????????private?Bitmap?PreprocesImage(Bitmap?image)
????????{
????????????//You?can?change?your?new?color?here.?RedGreenLawnGreen?any..
????????????Color?actualColor;
????????????//make?an?empty?bitmap?the?same?size?as?scrBitmap
????????????image?=?ResizeImage(image?image.Width?*?5?image.Height?*?5);
????????????//image.Save(@“D:\UpWork\OCR_WinForm\Preprocess_Resize.jpg“);
????????????Bitmap?newBitmap?=?new?Bitmap(image.Width?image.Height);
????????????for?(int?i?=?0;?i?????????????{
????????????????for?(int?j?=?0;?j?????????????????{
????????????????????//get?the?pixel?from?the?scrBitmap?image
????????????????????actualColor?=?image.GetPixel(i?j);
????????????????????//?>?150?because..?Images?edges?can?be?of?low?pixel?colr.?if?we?set?all?pixel?color?to?new?then?there?will?be?no?smoothness?left.
????????????????????if?(actualColor.R?>?23?||?actualColor.G?>?23?||?actualColor.B?>?23)//在這里設置RGB
????????????????????????newBitmap.SetPixel(i?j?Color.White);
????????????????????else
????????????????????????newBitmap.SetPixel(i?j?Color.Black);
????????????????}
????????????}
????????????return?newBitmap;
????????}
????????///?
????????///?調整圖片大小和對比度
????????///?
????????///?
????????///?
?屬性????????????大小?????日期????時間???名稱
-----------?---------??----------?-----??----
?????文件????????187??2018-10-23?16:47??Tesseract-OCR識別\App.config
?????文件???39973777??2012-10-17?22:55??Tesseract-OCR識別\bin\Debug\tessdata\chi_sim.traineddata
?????文件?????171918??2012-10-17?22:55??Tesseract-OCR識別\bin\Debug\tessdata\eng.cube.bigrams
?????文件?????????38??2012-10-17?22:55??Tesseract-OCR識別\bin\Debug\tessdata\eng.cube.fold
?????文件????????181??2012-10-17?22:55??Tesseract-OCR識別\bin\Debug\tessdata\eng.cube.lm
?????文件?????857304??2012-10-17?22:55??Tesseract-OCR識別\bin\Debug\tessdata\eng.cube.nn
?????文件????????254??2012-10-17?22:55??Tesseract-OCR識別\bin\Debug\tessdata\eng.cube.params
?????文件???13020078??2012-10-17?22:55??Tesseract-OCR識別\bin\Debug\tessdata\eng.cube.size
?????文件????2444187??2012-10-17?22:55??Tesseract-OCR識別\bin\Debug\tessdata\eng.cube.word-freq
?????文件????????996??2012-10-17?22:55??Tesseract-OCR識別\bin\Debug\tessdata\eng.tesseract_cube.nn
?????文件???21876572??2012-10-17?22:55??Tesseract-OCR識別\bin\Debug\tessdata\eng.traineddata
?????文件???30901222??2012-10-17?22:55??Tesseract-OCR識別\bin\Debug\tessdata\jpn.traineddata
?????文件??????10752??2018-10-23?17:54??Tesseract-OCR識別\bin\Debug\Tesseract-OCR識別.exe
?????文件????????187??2018-10-23?16:47??Tesseract-OCR識別\bin\Debug\Tesseract-OCR識別.exe.config
?????文件??????22016??2018-10-23?17:54??Tesseract-OCR識別\bin\Debug\Tesseract-OCR識別.pdb
?????文件?????114688??2016-02-12?20:52??Tesseract-OCR識別\bin\Debug\Tesseract.dll
?????文件??????92369??2016-02-12?20:52??Tesseract-OCR識別\bin\Debug\Tesseract.xml
?????文件????3207680??2018-10-23?17:00??Tesseract-OCR識別\bin\Debug\x64\liblept172.dll
?????文件????2743808??2018-10-23?17:00??Tesseract-OCR識別\bin\Debug\x64\libtesseract304.dll
?????文件????2459648??2018-10-23?17:00??Tesseract-OCR識別\bin\Debug\x86\liblept172.dll
?????文件????2138624??2018-10-23?17:00??Tesseract-OCR識別\bin\Debug\x86\libtesseract304.dll
?????文件???????4425??2018-10-23?17:54??Tesseract-OCR識別\Form1.cs
?????文件???????3555??2018-10-23?17:52??Tesseract-OCR識別\Form1.Designer.cs
?????文件???????5817??2018-10-23?17:52??Tesseract-OCR識別\Form1.resx
?????文件????????827??2018-10-23?16:47??Tesseract-OCR識別\obj\Debug\DesignTimeResolveAssemblyReferences.cache
?????文件???????7719??2018-10-23?17:00??Tesseract-OCR識別\obj\Debug\DesignTimeResolveAssemblyReferencesInput.cache
?????文件??????????0??2018-10-23?16:47??Tesseract-OCR識別\obj\Debug\TemporaryGeneratedFile_036C0B5B-1481-4323-8D20-8F5ADCB23D92.cs
?????文件??????????0??2018-10-23?16:47??Tesseract-OCR識別\obj\Debug\TemporaryGeneratedFile_5937a670-0e60-4077-877b-f7221da3dda1.cs
?????文件??????????0??2018-10-23?16:47??Tesseract-OCR識別\obj\Debug\TemporaryGeneratedFile_E7A71F73-0F8D-4B9B-B56E-8E70B10BC5D3.cs
?????文件??????????0??2018-10-23?17:54??Tesseract-OCR識別\obj\Debug\Tesseract-OCR識別.csproj.CopyComplete
............此處省略36個文件信息
評論
共有 條評論