zoukankan      html  css  js  c++  java
  • csharp: Emgu.CV.OCR and Tesseract.OCR Optical Character Recognition

    using System;
    using System.Collections.Generic;
    using System.ComponentModel;
    using System.Data;
    using System.Drawing;
    using System.Linq;
    using System.Text;
    using System.Threading.Tasks;
    using System.Windows.Forms;
    using Emgu.CV;  //3.2.02
    using Emgu.CV.VideoStab;
    using Emgu.CV.ML;
    using Emgu.CV.OCR;
    using Emgu.CV.Structure;
    //https://github.com/iobrains/OpenCV
    
    
    namespace CharacterRecognition
    {
    
        /// <summary>
        /// geovindu edit
        /// </summary>
        public partial class MainWnd : Form
        {
            string path;
            public MainWnd()
            {
                InitializeComponent();
            }
            /// <summary>
            /// 
            /// </summary>
            /// <param name="sender"></param>
            /// <param name="e"></param>
            private void loadImageToolStripMenuItem_Click(object sender, EventArgs e)
            {
                rtbOcrResult.Clear();
    
                OpenFileDialog ofd = new OpenFileDialog();
                ofd.Title = "Select an image";
                ofd.Filter = "Image Files(*.png; *.jpg; *.bmp; *.gif)|*.png; *.jpg; *.bmp; *.gif";
                if (ofd.ShowDialog() == DialogResult.OK)
                {
                    path = System.IO.Path.GetFullPath(ofd.FileName);
                    picBox.Image = new Bitmap(path);
                    picBox.SizeMode = PictureBoxSizeMode.Zoom;
                    statusLabelOCR.Text = path + " loaded.";
                }
            }
            /// <summary>
            /// 
            /// </summary>
            /// <param name="sender"></param>
            /// <param name="e"></param>
            private void exitToolStripMenuItem_Click(object sender, EventArgs e)
            {
                Close();
            }
            /// <summary>
            /// 
            /// </summary>
            /// <param name="sender"></param>
            /// <param name="e"></param>
            private void btnAnalyzeImage_Click(object sender, EventArgs e)
            {
                if(picBox.Image == null)
                {
                    MessageBox.Show("Load an image first!");
                }
                else
                {
                    statusLabelOCR.Text = "Analyzing invoice image...";
                    Task.Run(() =>
                    {
                        using (var img = new Image<Bgr, byte>(path))
                        {
                            //https://github.com/tesseract-ocr/tessdata/
                            //Environment.GetEnvironmentVariable("EMGU_ROOT") +
                            string tessdata = @"D:open sourceface	essdata";
                            using (var ocrProvider = new Tesseract(tessdata, "eng", OcrEngineMode.TesseractOnly))  //TesseractCubeCombined
                            {
                                ocrProvider.SetImage(img); //Recognize
                                string text = ocrProvider.GetUTF8Text().TrimEnd(); //GetText
                                rtbOcrResult.Invoke((MethodInvoker)delegate
                                                   {
                                                       statusLabelOCR.Text = "Analysis completed.";
                                                       rtbOcrResult.AppendText(text);
                                                   });
                                
                            }
                        }
                    });
                    
                }
            }
            /// <summary>
            /// 
            /// </summary>
            /// <param name="sender"></param>
            /// <param name="e"></param>
            private void MainWnd_Load(object sender, EventArgs e)
            {
    
            }
        }
    }
    

      

  • 相关阅读:
    linux c dlopen加载动态链接库
    c++锁 测试 (gcc test.cpp -o test -lpthread)
    shell 清理目录下 超过一段时间的数据。
    大话存储学习笔记
    python总结
    正则表达式使用
    #linux shell#模拟日志生成过程
    深入理解Java虚拟机
    Nginx修改access.log日志时间格式
    mfcs100d.lib(dllmodul.obj) : error LNK2005: _DllMain@12 already defined
  • 原文地址:https://www.cnblogs.com/geovindu/p/13255964.html
Copyright © 2011-2022 走看看