Python3實(shí)現(xiàn)簡單可學(xué)習(xí)的手寫體識別(實(shí)例講解)
1.前言
版本:Python3.6.1 + PyQt5 + SQL Server 2012
以前一直覺得,機(jī)器學(xué)習(xí)、手寫體識別這種程序都是很高大上很難的,直到偶然看到了這個視頻,聽了老師講的思路后,瞬間覺得原來這個并不是那么的難,原來我還是有可能做到的。
于是我開始順著思路打算用Python、PyQt、SQLServer做一個出來,看看能不能行。然而中間遇到了太多的問題,數(shù)據(jù)庫方面的問題有十幾個,PyQt方面的問題有接近一百個,還有數(shù)十個Python基礎(chǔ)語法的問題。但好在,通過不斷的Google,終于湊出了這么一個成品來。
最終還是把都湊在一個函數(shù)里的代碼重構(gòu)了一下,改寫成了4個模塊:
main.py、Learning.py、LearningDB.py、LearningUI.py
其中LearningDB實(shí)現(xiàn)python與數(shù)據(jù)庫的交互,LearningUI實(shí)現(xiàn)界面的交互,Learning繼承LearningUI類添加上了與LearningDB數(shù)據(jù)庫類的交互,最后通過main主函數(shù)模塊運(yùn)行程序。
其中涉及數(shù)據(jù)庫的知識可參考之前的文章:Python3操作SQL Server數(shù)據(jù)庫(實(shí)例講解),
涉及PyQt的知識可參考:Python3使用PyQt5制作簡單的畫板/手寫板
手寫體識別的主要思路是將手寫的字,用一個列表記錄其所經(jīng)過的點(diǎn),劃分為一個九宮格,然后數(shù)每個格子中點(diǎn)的數(shù)目,將數(shù)目轉(zhuǎn)化為所占總點(diǎn)數(shù)的百分比。然后兩兩保存的九維數(shù),求他們之間的距離,距離越近代表越接近。
2.通過pymssql與數(shù)據(jù)庫的交互
因?yàn)槭褂贸绦蛑跋刃枰ū?,建表我就直接使用SQL語句執(zhí)行了:
create database PyLearningDB drop table table0 create table table0 (dim0 int not null, dim1 int not null, dim2 int not null, dim3 int not null, dim4 int not null, dim5 int not null, dim6 int not null, dim7 int not null, dim8 int not null) drop table table1 create table table1 (dim0 int not null, dim1 int not null, dim2 int not null, dim3 int not null, dim4 int not null, dim5 int not null, dim6 int not null, dim7 int not null, dim8 int not null) drop table table2 create table table2 (dim0 int not null, dim1 int not null, dim2 int not null, dim3 int not null, dim4 int not null, dim5 int not null, dim6 int not null, dim7 int not null, dim8 int not null) drop table table3 create table table3 (dim0 int not null, dim1 int not null, dim2 int not null, dim3 int not null, dim4 int not null, dim5 int not null, dim6 int not null, dim7 int not null, dim8 int not null) drop table table4 create table table4 (dim0 int not null, dim1 int not null, dim2 int not null, dim3 int not null, dim4 int not null, dim5 int not null, dim6 int not null, dim7 int not null, dim8 int not null) drop table table5 create table table5 (dim0 int not null, dim1 int not null, dim2 int not null, dim3 int not null, dim4 int not null, dim5 int not null, dim6 int not null, dim7 int not null, dim8 int not null) drop table table6 create table table6 (dim0 int not null, dim1 int not null, dim2 int not null, dim3 int not null, dim4 int not null, dim5 int not null, dim6 int not null, dim7 int not null, dim8 int not null) drop table table7 create table table7 (dim0 int not null, dim1 int not null, dim2 int not null, dim3 int not null, dim4 int not null, dim5 int not null, dim6 int not null, dim7 int not null, dim8 int not null) drop table table8 create table table8 (dim0 int not null, dim1 int not null, dim2 int not null, dim3 int not null, dim4 int not null, dim5 int not null, dim6 int not null, dim7 int not null, dim8 int not null) drop table table9 create table table9 (dim0 int not null, dim1 int not null, dim2 int not null, dim3 int not null, dim4 int not null, dim5 int not null, dim6 int not null, dim7 int not null, dim8 int not null)
LearningDB.py程序如下:
'''
LearningDB類
功能:定義數(shù)據(jù)庫類,包含一個學(xué)習(xí)函數(shù)learn_data和一個識別函數(shù)identify_data
作者:PyLearn
博客: http://www.cnblogs.com/PyLearn/
最后修改日期: 2017/10/18
'''
import math
import pymssql
class LearningDB():
def __init__(self):
self.conn = pymssql.connect(host='127.0.0.1',
user='sa',
password='123',
database='PyLearningDB',
charset='utf8')
self.cursor = self.conn.cursor()
self.sql = ''
self.distance = 0.0
self.conn.close()
def learn_data(self, table, dim):
'''
學(xué)習(xí)數(shù)據(jù),將數(shù)據(jù)存到對應(yīng)的數(shù)據(jù)庫
table指定哪個表,dim是維度數(shù)組
'''
learn_result = False
try:
if table < 0 or table > 9:
raise Exception("錯誤!table的值為%d!" % table)
for num in dim:
if num < 0:
raise Exception("錯誤!dim的值不能小于0!")
self.conn = pymssql.connect(host='127.0.0.1',
user='sa',
password='123',
database='PyLearningDB',
charset='utf8')
self.cursor = self.conn.cursor()
self.sql = 'insert into table%d values(%d, %d, %d, %d, %d, %d, %d, %d, %d)' %(
table, dim[0], dim[1], dim[2], dim[3], dim[4], dim[5], dim[6], dim[7], dim[8])
self.cursor.execute(self.sql)
self.conn.commit()
learn_result = True
except Exception as ex_learn:
self.conn.rollback()
raise ex_learn
finally:
self.conn.close()
return learn_result
def identify_data(self, test_data):
'''
識別數(shù)據(jù),將數(shù)據(jù)一一對比,返回最接近的近似值
'''
try:
table_data = []
for i in range(10):
table_data.append(self.__get_data(i, test_data))
#返回table_data中最小值的索引
return table_data.index(min(table_data))
except Exception as ex_identify:
raise ex_identify
def __get_data(self, table, test_data):
'''
取出table表中所有數(shù)據(jù)
并與測試數(shù)據(jù)進(jìn)行比較,返回最小值
如果table表中無數(shù)據(jù),則全部取0
'''
try:
if table < 0 or table > 9:
raise Exception("錯誤!table的值不能為%d!" % table)
self.conn = pymssql.connect(host='127.0.0.1',
user='sa',
password='123',
database='PyLearningDB',
charset='utf8')
self.cursor = self.conn.cursor()
self.sql = 'select * from table%d' % table
self.cursor.execute(self.sql)
receive_sql = self.cursor.fetchall()
if not receive_sql:
new_receive_sql = [(0, 0, 0, 0, 0, 0, 0, 0, 0)]
else:
new_receive_sql = receive_sql
finally:
self.conn.close()
#計(jì)算最小值
dim_data = []
for receive_data in new_receive_sql:
dim_data.append(self.__distance_data(test_data, receive_data))
#返回dimData中最小值
return min(dim_data)
def __distance_data(self, test_data, table_data):
'''
求九維空間中兩點(diǎn)之間的距離
'''
self.distance = 0.0
for i in range(9):
self.distance += (test_data[i] - table_data[i]) ** 2
return math.sqrt(self.distance)
3.通過pyqt與界面的交互
LearningUI.py程序如下:
'''
LearningUI類
功能:生成UI界面,以及定義事件處理方法
作者:PyLearn
博客: http://www.cnblogs.com/PyLearn/
最后修改日期: 2017/10/18
'''
from PyQt5.QtWidgets import (QWidget, QPushButton, QLabel, QComboBox, QDesktopWidget)
from PyQt5.QtGui import (QPainter, QPen, QFont)
from PyQt5.QtCore import Qt
class LearningUI(QWidget):
def __init__(self):
super(LearningUI, self).__init__()
self.__init_ui()
#設(shè)置只有鼠標(biāo)按下時才跟蹤移動,否則不按的時候也在畫畫
self.setMouseTracking(False)
#self.pos_xy保存所有繪畫的點(diǎn)
self.pos_xy = []
#設(shè)置pos_x、pos_y方便計(jì)算
self.pos_x = []
self.pos_y = []
#設(shè)置關(guān)聯(lián)事件
self.btn_learn.clicked.connect(self.btn_learn_on_clicked)
self.btn_recognize.clicked.connect(self.btn_recognize_on_clicked)
self.btn_clear.clicked.connect(self.btn_clear_on_clicked)
def __init_ui(self):
'''
定義UI界面:
三個按鈕:學(xué)習(xí)、識別、清屏
btn_learn、btn_recognize、btn_clear
一個組合框:選擇0-9
combo_table
兩條標(biāo)簽:請?jiān)谄聊豢瞻滋幱檬髽?biāo)輸入0-9中的某一個數(shù)字進(jìn)行識別!
2017/10/10 by PyLearn
一條輸出識別結(jié)果的標(biāo)簽
label_output
'''
#添加三個按鈕,分別是學(xué)習(xí)、識別、清屏
self.btn_learn = QPushButton("學(xué)習(xí)", self)
self.btn_learn.setGeometry(50, 400, 70, 40)
self.btn_recognize = QPushButton("識別", self)
self.btn_recognize.setGeometry(320, 400, 70, 40)
self.btn_clear = QPushButton("清屏", self)
self.btn_clear.setGeometry(420, 400, 70, 40)
#添加一個組合框,選擇0-9
self.combo_table = QComboBox(self)
for i in range(10):
self.combo_table.addItem("%d" % i)
self.combo_table.setGeometry(150, 400, 70, 40)
#添加兩條標(biāo)簽
self.label_head = QLabel('請?jiān)谄聊豢瞻滋幱檬髽?biāo)輸入0-9中的某一個數(shù)字進(jìn)行識別!', self)
self.label_head.move(75, 50)
self.label_end = QLabel('2017/10/10 by PyLearn', self)
self.label_end.move(375, 470)
#添加一條輸出識別結(jié)果的標(biāo)簽
'''
setStyleSheet設(shè)置邊框大小、顏色
setFont設(shè)置字體大小、形狀、加粗
setAlignment設(shè)置文本居中
'''
self.label_output = QLabel('', self)
self.label_output.setGeometry(50, 100, 150, 250)
self.label_output.setStyleSheet("QLabel{border:1px solid black;}")
self.label_output.setFont(QFont("Roman times", 100, QFont.Bold))
self.label_output.setAlignment(Qt.AlignCenter)
'''
setFixedSize()固定了窗體的寬度與高度
self.center()將窗體居中顯示
setWindowTitle()設(shè)置窗體的標(biāo)題
'''
self.setFixedSize(550, 500)
self.center()
self.setWindowTitle('0-9手寫體識別(機(jī)器學(xué)習(xí)中的"HelloWorld!")')
def center(self):
'''
窗口居中顯示
'''
qt_center = self.frameGeometry()
desktop_center = QDesktopWidget().availableGeometry().center()
qt_center.moveCenter(desktop_center)
self.move(qt_center.topLeft())
def paintEvent(self, event):
'''
首先判斷pos_xy列表中是不是至少有兩個點(diǎn)了
然后將pos_xy中第一個點(diǎn)賦值給point_start
利用中間變量pos_tmp遍歷整個pos_xy列表
point_end = pos_tmp
判斷point_end是否是斷點(diǎn),如果是
point_start賦值為斷點(diǎn)
continue
判斷point_start是否是斷點(diǎn),如果是
point_start賦值為point_end
continue
畫point_start到point_end之間的線
point_start = point_end
這樣,不斷地將相鄰兩個點(diǎn)之間畫線,就能留下鼠標(biāo)移動軌跡了
'''
painter = QPainter()
painter.begin(self)
pen = QPen(Qt.black, 2, Qt.SolidLine)
painter.setPen(pen)
if len(self.pos_xy) > 1:
point_start = self.pos_xy[0]
for pos_tmp in self.pos_xy:
point_end = pos_tmp
if point_end == (-1, -1):
point_start = point_end
continue
if point_start == (-1, -1):
point_start = point_end
continue
painter.drawLine(point_start[0], point_start[1], point_end[0], point_end[1])
point_start = point_end
painter.end()
def mouseReleaseEvent(self, event):
'''
重寫鼠標(biāo)按住后松開的事件
在每次松開后向pos_xy列表中添加一個斷點(diǎn)(-1, -1)
然后在繪畫時判斷一下是不是斷點(diǎn)就行了
是斷點(diǎn)的話就跳過去,不與之前的連續(xù)
'''
pos_test = (-1, -1)
self.pos_xy.append(pos_test)
self.update()
def mouseMoveEvent(self, event):
'''
按住鼠標(biāo)移動:將移動的點(diǎn)加入self.pos_xy列表
'''
#self.pos_x和self.pos_y總是比self.pos_xy少一到兩個點(diǎn),還不知道原因在哪
self.pos_x.append(event.pos().x())
self.pos_y.append(event.pos().y())
#中間變量pos_tmp提取當(dāng)前點(diǎn)
pos_tmp = (event.pos().x(), event.pos().y())
#pos_tmp添加到self.pos_xy中
self.pos_xy.append(pos_tmp)
self.update()
def btn_learn_on_clicked(self):
'''
需要用到數(shù)據(jù)庫,因此在在子類中實(shí)現(xiàn)
'''
pass
def btn_recognize_on_clicked(self):
'''
需要用到數(shù)據(jù)庫,因此在在子類中實(shí)現(xiàn)
'''
pass
def btn_clear_on_clicked(self):
'''
按下清屏按鈕:
將列表賦值為空
將輸出識別結(jié)果的標(biāo)簽賦值為空
然后刷新界面,重新繪畫即可清屏
'''
self.pos_xy = []
self.pos_x = []
self.pos_y = []
self.label_output.setText('')
self.update()
def get_pos_xy(self):
'''
將手寫體在平面上分為9個格子
計(jì)算每個格子里點(diǎn)的數(shù)量
然后點(diǎn)的數(shù)量轉(zhuǎn)化為占總點(diǎn)數(shù)的百分比
接著返回一個數(shù)組dim[9]
橫軸依次是min_x、min2_x、max2_x、max_x
縱軸依次是min_y、min2_y、max2_y、max_y
'''
if not self.pos_xy:
return None
pos_count = len(self.pos_x)
max_x = max(self.pos_x)
max_y = max(self.pos_y)
min_x = min(self.pos_x)
min_y = min(self.pos_y)
dim = [0, 0, 0, 0, 0, 0, 0, 0, 0]
dis_x = (max_x - min_x) // 3
dis_y = (max_y - min_y) // 3
min2_x = min_x + dis_x
min2_y = min_y + dis_y
max2_x = max_x - dis_x
max2_y = max_y - dis_y
for i in range(len(self.pos_x)):
if self.pos_y[i] >= min_y and self.pos_y[i] < min2_y:
if self.pos_x[i] >= min_x and self.pos_x[i] < min2_x:
dim[0] += 1
continue
if self.pos_x[i] >= min2_x and self.pos_x[i] < max2_x:
dim[1] += 1
continue
if self.pos_x[i] >= max2_x and self.pos_x[i] <= max_x:
dim[2] += 1
continue
elif self.pos_y[i] >= min2_y and self.pos_y[i] < max2_y:
if self.pos_x[i] >= min_x and self.pos_x[i] < min2_x:
dim[3] += 1
continue
if self.pos_x[i] >= min2_x and self.pos_x[i] < max2_x:
dim[4] += 1
continue
if self.pos_x[i] >= max2_x and self.pos_x[i] <= max_x:
dim[5] += 1
continue
elif self.pos_y[i] >= max2_y and self.pos_y[i] <= max_y:
if self.pos_x[i] >= min_x and self.pos_x[i] < min2_x:
dim[6] += 1
continue
if self.pos_x[i] >= min2_x and self.pos_x[i] < max2_x:
dim[7] += 1
continue
if self.pos_x[i] >= max2_x and self.pos_x[i] <= max_x:
dim[8] += 1
continue
else:
pos_count -= 1
continue
#將數(shù)量轉(zhuǎn)化為所占百分比
for num in dim:
num = num * 100 // pos_count
return dim
4.UI與數(shù)據(jù)庫的交互
Learning.py程序如下:
'''
Learning類
功能:重寫LearningUI類中的兩個用到了數(shù)據(jù)庫的方法:
類中添加一個LearningDB類對象的數(shù)據(jù)成員self.learn_db
作者:PyLearn
博客: http://www.cnblogs.com/PyLearn/
最后修改日期: 2017/10/18
'''
from PyQt5.QtWidgets import QMessageBox
from LearningUI import LearningUI
from LearningDB import LearningDB
class Learning(LearningUI):
'''
Learning實(shí)現(xiàn)btn_learn_on_clicked和btn_recognize_on_clicked兩個方法
'''
def __init__(self):
super(Learning, self).__init__()
#學(xué)習(xí)函數(shù)learn_data(table, dim)和一個識別函數(shù)identify_data(test_data)
self.learn_db = LearningDB()
def btn_learn_on_clicked(self):
if not self.pos_xy:
QMessageBox.critical(self, "注意", "請先寫入您要學(xué)習(xí)的數(shù)字!")
return None
#獲取要學(xué)習(xí)的數(shù)字learn_num
learn_num = self.combo_table.currentIndex()
#彈出確認(rèn)對話框
qbox = QMessageBox()
qbox.setIcon(QMessageBox.Information)
qbox.setWindowTitle("請確認(rèn)")
qbox.setText("學(xué)習(xí)數(shù)字 %d ?" % learn_num)
qbox.setStandardButtons(QMessageBox.Yes | QMessageBox.No)
qbox.setDefaultButton(QMessageBox.No)
qbox.button(QMessageBox.Yes).setText("是")
qbox.button(QMessageBox.No).setText("否")
reply = qbox.exec()
#判斷對話框結(jié)果,執(zhí)行程序
if reply == QMessageBox.Yes:
learn_result = False
learn_dim = self.get_pos_xy()
if learn_dim:
learn_result = self.learn_db.learn_data(learn_num, learn_dim)
else:
print('get_pos_xy()函數(shù)返回空值')
return None
if learn_result:
QMessageBox.about(self, "提示", "學(xué)習(xí)成功!")
else:
QMessageBox.about(self, "提示", "學(xué)習(xí)失??!")
else:
return None
def btn_recognize_on_clicked(self):
#如果沒有進(jìn)行繪畫,警告后退出
if not self.pos_xy:
QMessageBox.critical(self, "注意", "請先寫入您要識別的數(shù)字!")
return None
else:
recognize_num = 0
recognize_dim = self.get_pos_xy()
if recognize_dim:
recognize_num = self.learn_db.identify_data(recognize_dim)
else:
print('recognize_dim為空')
return None
self.label_output.setText('%d' % recognize_num)
5.最后的main主函數(shù)
''' 主函數(shù)main 功能:生成Learning對象,進(jìn)入主循環(huán) 作者:PyLearn 最后修改日期: 2017/10/18 ''' import sys from PyQt5.QtWidgets import QApplication from Learning import Learning if __name__ == '__main__': app = QApplication(sys.argv) py_learning = Learning() py_learning.show() sys.exit(app.exec_())
將以上4個程序放在同一個目錄下,直接執(zhí)行main.py就行了。
運(yùn)行界面如下:

學(xué)習(xí)數(shù)字4:

第一次運(yùn)行需要全部學(xué)習(xí)至少一次才能有一點(diǎn)正確率。
識別3:

以上這篇Python3實(shí)現(xiàn)簡單可學(xué)習(xí)的手寫體識別(實(shí)例講解)就是小編分享給大家的全部內(nèi)容了,希望能給大家一個參考,也希望大家多多支持腳本之家。
相關(guān)文章
Python函數(shù)isalnum用法示例小結(jié)
isalnum()函數(shù)是Python中的一個內(nèi)置函數(shù),用于判斷字符串是否只由數(shù)字和字母組成,其內(nèi)部實(shí)現(xiàn)原理比較簡單,只需遍歷字符串中的每一個字符即可,這篇文章主要介紹了Python函數(shù)isalnum用法介紹,需要的朋友可以參考下2024-01-01
Python實(shí)現(xiàn)PS濾鏡功能之波浪特效示例
這篇文章主要介紹了Python實(shí)現(xiàn)PS濾鏡功能之波浪特效,結(jié)合實(shí)例形式分析了Python實(shí)現(xiàn)PS濾鏡波浪特效的原理與相關(guān)操作技巧,需要的朋友可以參考下2018-01-01
Win8.1下安裝Python3.6提示0x80240017錯誤的解決方法
使用Python Fast API發(fā)布API服務(wù)的過程詳解
基于Python實(shí)現(xiàn)牛牛套圈小游戲的示例代碼
在vscode中啟動conda虛擬環(huán)境的思路詳解

