rlabrecque · December 31, 2016 08:53
diff --git a/KNN_Character_Recognition_Emgu_CV_3_CS b/KNN_Character_Recognition_Emgu_CV_3_CS
 // GenData
 using System;
 using System.Collections.Generic;
 using System.Drawing;
 using System.Windows.Forms;

 using System.Xml;
 using System.Xml.Serialization; //these imports are for writing Matrix objects to file, see end of program
 using System.IO;

 using Emgu.CV;
 using Emgu.CV.CvEnum;
 using Emgu.CV.Structure;
 using Emgu.CV.Util;
 using Emgu.CV.UI;

 namespace SomeNamspace {
 	/// <summary>
 	/// Form that lets the user label the characters found in a training image and
 	/// writes the labels and the flattened character images to
 	/// "classifications.xml" and "images.xml".
 	/// </summary>
 	public partial class GenData : Form {
 		// contours whose area is not above this value are ignored
 		const int MIN_CONTOUR_AREA = 100;

 		// every character image is resized to this size before it is stored
 		const int RESIZED_IMAGE_WIDTH = 20;
 		const int RESIZED_IMAGE_HEIGHT = 30;

 		// key code compared against CvInvoke.WaitKey's result to detect the Esc key
 		const int ESC_KEY_CODE = 27;

 		/// <summary>Creates the form and initializes its designer-generated components.</summary>
 		public GenData() {
 			InitializeComponent();
 		}

 		/// <summary>
 		/// Lets the user pick a training image, shows each sufficiently large external
 		/// contour in turn and waits for a key press to label it. Pressing Esc aborts
 		/// without saving. Only contours labelled with 0-9 or A-Z are kept; once all
 		/// contours have been visited the labels and flattened images are serialized to XML.
 		/// </summary>
 		/// <param name="sender">Event source (unused).</param>
 		/// <param name="e">Event data (unused).</param>
 		private void btnOpenTrainingImage_Click(object sender, EventArgs e) {
 			DialogResult drChosenFile = ofdOpenFile.ShowDialog(); // open file dialog

 			if (drChosenFile != DialogResult.OK || ofdOpenFile.FileName == "") { // user chose Cancel or filename is blank
 				lblChosenFile.Text = "file not chosen";
 				return;
 			}

 			Mat imgTrainingNumbers;

 			try {
 				imgTrainingNumbers = new Mat(ofdOpenFile.FileName);
 			}
 			catch (Exception ex) {
 				lblChosenFile.Text = "unable to open image, error: " + ex.Message;
 				return;
 			}

 			// a constructed Mat is never null, so also check that it actually holds pixel data
 			if (imgTrainingNumbers == null || imgTrainingNumbers.IsEmpty) {
 				lblChosenFile.Text = "unable to open image";
 				return;
 			}

 			lblChosenFile.Text = ofdOpenFile.FileName; // update label with file name

 			Mat imgGrayscale = new Mat();
 			Mat imgBlurred = new Mat();
 			Mat imgThresh = new Mat();
 			VectorOfVectorOfPoint contours = new VectorOfVectorOfPoint();

 			// chars we are interested in: digits 0 through 9 and capital letters A through Z
 			var intValidChars = new List<int>(new int[] {
 				'0', '1', '2', '3', '4', '5', '6', '7', '8', '9',
 				'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I', 'J',
 				'K', 'L', 'M', 'N', 'O', 'P', 'Q', 'R', 'S', 'T',
 				'U', 'V', 'W', 'X', 'Y', 'Z' });

 			CvInvoke.CvtColor(imgTrainingNumbers, imgGrayscale, ColorConversion.Bgr2Gray); // convert to grayscale
 			CvInvoke.GaussianBlur(imgGrayscale, imgBlurred, new Size(5, 5), 0);            // blur

 			// threshold image from grayscale to black and white
 			CvInvoke.AdaptiveThreshold(imgBlurred, imgThresh, 255.0, AdaptiveThresholdType.GaussianC, ThresholdType.BinaryInv, 11, 2);
 			CvInvoke.Imshow("imgThresh", imgThresh); // show threshold image for reference

 			// find contours on a copy so imgThresh stays intact for the ROI extraction below
 			Mat imgThreshCopy = imgThresh.Clone();

 			// get external contours only
 			CvInvoke.FindContours(imgThreshCopy, contours, null, RetrType.External, ChainApproxMethod.ChainApproxSimple);

 			// Samples are collected in lists first: only contours the user actually labels
 			// become rows, so the saved matrices contain no unused all-zero rows.
 			List<Single> classifications = new List<Single>();
 			List<Single[]> flattenedImages = new List<Single[]>();

 			for (int i = 0; i < contours.Size; ++i) { // for each contour
 				VectorOfPoint contour = contours[i];

 				if (CvInvoke.ContourArea(contour) <= MIN_CONTOUR_AREA) { // contour is too small to consider
 					continue;
 				}

 				Rectangle boundingRect = CvInvoke.BoundingRectangle(contour);
 				CvInvoke.Rectangle(imgTrainingNumbers, boundingRect, new MCvScalar(0.0, 0.0, 255.0), 2); // draw red rectangle around each contour as we ask user for input

 				using (Mat imgROItoBeCloned = new Mat(imgThresh, boundingRect)) // ROI image of current char
 				using (Mat imgROI = imgROItoBeCloned.Clone())                   // copy so we do not change the ROI area of the original image
 				using (Mat imgROIResized = new Mat()) {
 					// resize image, this is necessary for recognition and storage
 					CvInvoke.Resize(imgROI, imgROIResized, new Size(RESIZED_IMAGE_WIDTH, RESIZED_IMAGE_HEIGHT));

 					CvInvoke.Imshow("imgROI", imgROI);                         // show ROI image for reference
 					CvInvoke.Imshow("imgROIResized", imgROIResized);           // show resized ROI image for reference
 					CvInvoke.Imshow("imgTrainingNumbers", imgTrainingNumbers); // training image, now with red rectangles drawn on it

 					int intChar = CvInvoke.WaitKey(0); // get key press

 					if (intChar == ESC_KEY_CODE) { // Esc aborts the whole session without saving
 						CvInvoke.DestroyAllWindows();
 						return;
 					}

 					if (intValidChars.Contains(intChar)) { // the key is one of the chars we are looking for
 						classifications.Add(Convert.ToSingle(intChar));
 						flattenedImages.Add(FlattenToRow(imgROIResized));
 					}
 				}
 			}

 			int intNumberOfTrainingSamples = classifications.Count;

 			if (intNumberOfTrainingSamples == 0) { // nothing was labelled, so there is nothing worth writing
 				txtInfo.Text = txtInfo.Text + "no characters were labelled, nothing to save" + "\n" + "\n";
 				return;
 			}

 			// each sample corresponds to one row in both the classifications XML file
 			// and the training images XML file
 			Matrix<Single> mtxClassifications = new Matrix<Single>(intNumberOfTrainingSamples, 1);
 			Matrix<Single> mtxTrainingImages = new Matrix<Single>(intNumberOfTrainingSamples, RESIZED_IMAGE_WIDTH * RESIZED_IMAGE_HEIGHT);

 			for (int intRow = 0; intRow < intNumberOfTrainingSamples; ++intRow) {
 				mtxClassifications[intRow, 0] = classifications[intRow];

 				Single[] flattenedImage = flattenedImages[intRow];
 				for (int intCol = 0; intCol < flattenedImage.Length; ++intCol) {
 					mtxTrainingImages[intRow, intCol] = flattenedImage[intCol];
 				}
 			}

 			txtInfo.Text = txtInfo.Text + "training complete !!" + "\n" + "\n";

 			if (!TrySaveMatrix(mtxClassifications, "classifications.xml")) { // save classifications to file
 				return;
 			}

 			if (!TrySaveMatrix(mtxTrainingImages, "images.xml")) { // save training images to file
 				return;
 			}

 			txtInfo.Text = "\n" + txtInfo.Text + "file writing done" + "\n";
 			MessageBox.Show("Training complete, file writing done !!");
 		}

 		/// <summary>
 		/// Converts a resized character image to 32-bit floats and flattens it, row by row,
 		/// into a single array of RESIZED_IMAGE_WIDTH * RESIZED_IMAGE_HEIGHT values.
 		/// </summary>
 		/// <param name="imgROIResized">Character image already resized to RESIZED_IMAGE_WIDTH x RESIZED_IMAGE_HEIGHT.</param>
 		/// <returns>The pixel values in row-major order.</returns>
 		private static Single[] FlattenToRow(Mat imgROIResized) {
 			Single[] flattened = new Single[RESIZED_IMAGE_WIDTH * RESIZED_IMAGE_HEIGHT];

 			// the original comments state that Single values are needed for the later KNearest training call
 			using (Matrix<Single> mtxTemp = new Matrix<Single>(imgROIResized.Size)) {
 				imgROIResized.ConvertTo(mtxTemp, DepthType.Cv32F);

 				for (int intRow = 0; intRow < RESIZED_IMAGE_HEIGHT; ++intRow) {
 					for (int intCol = 0; intCol < RESIZED_IMAGE_WIDTH; ++intCol) {
 						flattened[(intRow * RESIZED_IMAGE_WIDTH) + intCol] = mtxTemp[intRow, intCol];
 					}
 				}
 			}

 			return flattened;
 		}

 		/// <summary>
 		/// Serializes a matrix to an XML file. If the file cannot be opened the error is
 		/// shown in txtInfo and false is returned; the writer is always closed, even when
 		/// serialization throws.
 		/// </summary>
 		/// <param name="matrix">Matrix to serialize.</param>
 		/// <param name="fileName">Path of the XML file to write.</param>
 		/// <returns>true if the file was written, false if it could not be opened.</returns>
 		private bool TrySaveMatrix(Matrix<Single> matrix, string fileName) {
 			StreamWriter streamWriter;

 			try {
 				streamWriter = new StreamWriter(fileName); // attempt to open the output file
 			}
 			catch (Exception ex) { // if error is encountered, show error and report failure
 				txtInfo.Text = "\n" + txtInfo.Text + "unable to open '" + fileName + "', error:" + "\n";
 				txtInfo.Text = txtInfo.Text + ex.Message + "\n" + "\n";
 				return false;
 			}

 			using (streamWriter) {
 				XmlSerializer xmlSerializer = new XmlSerializer(matrix.GetType());
 				xmlSerializer.Serialize(streamWriter, matrix);
 			}

 			return true;
 		}
 	}
 }
	// GenData
	using System;
	using System.Collections.Generic;
	using System.Drawing;
	using System.Windows.Forms;

	using System.Xml;
	using System.Xml.Serialization; //these imports are for writing Matrix objects to file, see end of program
	using System.IO;

	using Emgu.CV;
	using Emgu.CV.CvEnum;
	using Emgu.CV.Structure;
	using Emgu.CV.Util;
	using Emgu.CV.UI;

	namespace SomeNamspace {
	/// <summary>
	/// Form that lets the user label the characters found in a training image and
	/// writes the labels and the flattened character images to
	/// "classifications.xml" and "images.xml".
	/// </summary>
	public partial class GenData : Form {
		// contours whose area is not above this value are ignored
		const int MIN_CONTOUR_AREA = 100;

		// every character image is resized to this size before it is stored
		const int RESIZED_IMAGE_WIDTH = 20;
		const int RESIZED_IMAGE_HEIGHT = 30;

		// key code compared against CvInvoke.WaitKey's result to detect the Esc key
		const int ESC_KEY_CODE = 27;

		/// <summary>Creates the form and initializes its designer-generated components.</summary>
		public GenData() {
			InitializeComponent();
		}

		/// <summary>
		/// Lets the user pick a training image, shows each sufficiently large external
		/// contour in turn and waits for a key press to label it. Pressing Esc aborts
		/// without saving. Only contours labelled with 0-9 or A-Z are kept; once all
		/// contours have been visited the labels and flattened images are serialized to XML.
		/// </summary>
		/// <param name="sender">Event source (unused).</param>
		/// <param name="e">Event data (unused).</param>
		private void btnOpenTrainingImage_Click(object sender, EventArgs e) {
			DialogResult drChosenFile = ofdOpenFile.ShowDialog(); // open file dialog

			if (drChosenFile != DialogResult.OK || ofdOpenFile.FileName == "") { // user chose Cancel or filename is blank
				lblChosenFile.Text = "file not chosen";
				return;
			}

			Mat imgTrainingNumbers;

			try {
				imgTrainingNumbers = new Mat(ofdOpenFile.FileName);
			}
			catch (Exception ex) {
				lblChosenFile.Text = "unable to open image, error: " + ex.Message;
				return;
			}

			// a constructed Mat is never null, so also check that it actually holds pixel data
			if (imgTrainingNumbers == null || imgTrainingNumbers.IsEmpty) {
				lblChosenFile.Text = "unable to open image";
				return;
			}

			lblChosenFile.Text = ofdOpenFile.FileName; // update label with file name

			Mat imgGrayscale = new Mat();
			Mat imgBlurred = new Mat();
			Mat imgThresh = new Mat();
			VectorOfVectorOfPoint contours = new VectorOfVectorOfPoint();

			// chars we are interested in: digits 0 through 9 and capital letters A through Z
			var intValidChars = new List<int>(new int[] {
				'0', '1', '2', '3', '4', '5', '6', '7', '8', '9',
				'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I', 'J',
				'K', 'L', 'M', 'N', 'O', 'P', 'Q', 'R', 'S', 'T',
				'U', 'V', 'W', 'X', 'Y', 'Z' });

			CvInvoke.CvtColor(imgTrainingNumbers, imgGrayscale, ColorConversion.Bgr2Gray); // convert to grayscale
			CvInvoke.GaussianBlur(imgGrayscale, imgBlurred, new Size(5, 5), 0);            // blur

			// threshold image from grayscale to black and white
			CvInvoke.AdaptiveThreshold(imgBlurred, imgThresh, 255.0, AdaptiveThresholdType.GaussianC, ThresholdType.BinaryInv, 11, 2);
			CvInvoke.Imshow("imgThresh", imgThresh); // show threshold image for reference

			// find contours on a copy so imgThresh stays intact for the ROI extraction below
			Mat imgThreshCopy = imgThresh.Clone();

			// get external contours only
			CvInvoke.FindContours(imgThreshCopy, contours, null, RetrType.External, ChainApproxMethod.ChainApproxSimple);

			// Samples are collected in lists first: only contours the user actually labels
			// become rows, so the saved matrices contain no unused all-zero rows.
			List<Single> classifications = new List<Single>();
			List<Single[]> flattenedImages = new List<Single[]>();

			for (int i = 0; i < contours.Size; ++i) { // for each contour
				VectorOfPoint contour = contours[i];

				if (CvInvoke.ContourArea(contour) <= MIN_CONTOUR_AREA) { // contour is too small to consider
					continue;
				}

				Rectangle boundingRect = CvInvoke.BoundingRectangle(contour);
				CvInvoke.Rectangle(imgTrainingNumbers, boundingRect, new MCvScalar(0.0, 0.0, 255.0), 2); // draw red rectangle around each contour as we ask user for input

				using (Mat imgROItoBeCloned = new Mat(imgThresh, boundingRect)) // ROI image of current char
				using (Mat imgROI = imgROItoBeCloned.Clone())                   // copy so we do not change the ROI area of the original image
				using (Mat imgROIResized = new Mat()) {
					// resize image, this is necessary for recognition and storage
					CvInvoke.Resize(imgROI, imgROIResized, new Size(RESIZED_IMAGE_WIDTH, RESIZED_IMAGE_HEIGHT));

					CvInvoke.Imshow("imgROI", imgROI);                         // show ROI image for reference
					CvInvoke.Imshow("imgROIResized", imgROIResized);           // show resized ROI image for reference
					CvInvoke.Imshow("imgTrainingNumbers", imgTrainingNumbers); // training image, now with red rectangles drawn on it

					int intChar = CvInvoke.WaitKey(0); // get key press

					if (intChar == ESC_KEY_CODE) { // Esc aborts the whole session without saving
						CvInvoke.DestroyAllWindows();
						return;
					}

					if (intValidChars.Contains(intChar)) { // the key is one of the chars we are looking for
						classifications.Add(Convert.ToSingle(intChar));
						flattenedImages.Add(FlattenToRow(imgROIResized));
					}
				}
			}

			int intNumberOfTrainingSamples = classifications.Count;

			if (intNumberOfTrainingSamples == 0) { // nothing was labelled, so there is nothing worth writing
				txtInfo.Text = txtInfo.Text + "no characters were labelled, nothing to save" + "\n" + "\n";
				return;
			}

			// each sample corresponds to one row in both the classifications XML file
			// and the training images XML file
			Matrix<Single> mtxClassifications = new Matrix<Single>(intNumberOfTrainingSamples, 1);
			Matrix<Single> mtxTrainingImages = new Matrix<Single>(intNumberOfTrainingSamples, RESIZED_IMAGE_WIDTH * RESIZED_IMAGE_HEIGHT);

			for (int intRow = 0; intRow < intNumberOfTrainingSamples; ++intRow) {
				mtxClassifications[intRow, 0] = classifications[intRow];

				Single[] flattenedImage = flattenedImages[intRow];
				for (int intCol = 0; intCol < flattenedImage.Length; ++intCol) {
					mtxTrainingImages[intRow, intCol] = flattenedImage[intCol];
				}
			}

			txtInfo.Text = txtInfo.Text + "training complete !!" + "\n" + "\n";

			if (!TrySaveMatrix(mtxClassifications, "classifications.xml")) { // save classifications to file
				return;
			}

			if (!TrySaveMatrix(mtxTrainingImages, "images.xml")) { // save training images to file
				return;
			}

			txtInfo.Text = "\n" + txtInfo.Text + "file writing done" + "\n";
			MessageBox.Show("Training complete, file writing done !!");
		}

		/// <summary>
		/// Converts a resized character image to 32-bit floats and flattens it, row by row,
		/// into a single array of RESIZED_IMAGE_WIDTH * RESIZED_IMAGE_HEIGHT values.
		/// </summary>
		/// <param name="imgROIResized">Character image already resized to RESIZED_IMAGE_WIDTH x RESIZED_IMAGE_HEIGHT.</param>
		/// <returns>The pixel values in row-major order.</returns>
		private static Single[] FlattenToRow(Mat imgROIResized) {
			Single[] flattened = new Single[RESIZED_IMAGE_WIDTH * RESIZED_IMAGE_HEIGHT];

			// the original comments state that Single values are needed for the later KNearest training call
			using (Matrix<Single> mtxTemp = new Matrix<Single>(imgROIResized.Size)) {
				imgROIResized.ConvertTo(mtxTemp, DepthType.Cv32F);

				for (int intRow = 0; intRow < RESIZED_IMAGE_HEIGHT; ++intRow) {
					for (int intCol = 0; intCol < RESIZED_IMAGE_WIDTH; ++intCol) {
						flattened[(intRow * RESIZED_IMAGE_WIDTH) + intCol] = mtxTemp[intRow, intCol];
					}
				}
			}

			return flattened;
		}

		/// <summary>
		/// Serializes a matrix to an XML file. If the file cannot be opened the error is
		/// shown in txtInfo and false is returned; the writer is always closed, even when
		/// serialization throws.
		/// </summary>
		/// <param name="matrix">Matrix to serialize.</param>
		/// <param name="fileName">Path of the XML file to write.</param>
		/// <returns>true if the file was written, false if it could not be opened.</returns>
		private bool TrySaveMatrix(Matrix<Single> matrix, string fileName) {
			StreamWriter streamWriter;

			try {
				streamWriter = new StreamWriter(fileName); // attempt to open the output file
			}
			catch (Exception ex) { // if error is encountered, show error and report failure
				txtInfo.Text = "\n" + txtInfo.Text + "unable to open '" + fileName + "', error:" + "\n";
				txtInfo.Text = txtInfo.Text + ex.Message + "\n" + "\n";
				return false;
			}

			using (streamWriter) {
				XmlSerializer xmlSerializer = new XmlSerializer(matrix.GetType());
				xmlSerializer.Serialize(streamWriter, matrix);
			}

			return true;
		}
	}
	}