Data Science/Session 4 > Machine Learning¶
Class Notes¶
Goals for the Week¶
- AI > emulate intelligence
- Machine Learning (ML) > use data to teach an ML model
- Deep Learning (DL) > use a Deep Neural Network model to learn from data
Neural Network¶
Neural Networks are modelled after the function of the human brain, with perceptrons playing the role of neurons.
A single Input Layer with multiple Input Nodes feeds values into multiple Hidden Layers. Each Hidden Layer has multiple nodes, and every node receives all the outputs of the Input Layer nodes or of all the nodes of the preceding Hidden Layer. Each connection between nodes carries a significance weight, and each Hidden Layer node is triggered based on a specific Activation Function (threshold). The last Hidden Layer feeds into a fixed number of Output Nodes, with each node corresponding to one of the possible outcomes being solved for by the model.
From what I could understand, the power of the Neural Network model as an outcome prediction tool is that it is Non-Linear in its decision making process (applying "non-linear activation functions"), thanks to the way the model is structured, with cross-linked nodes as pictured in the image above.
From Neil's notes, the following was written: "Exponential expressive power of network depth vs breadth". I asked ChatGPT for an explanation and received the following: "This phrase appears often in deep learning theory. It describes why deeper neural networks can represent certain functions MUCH more efficiently than wide, shallow networks." I was confused by the use of the words "expressive", "breadth", "width", "deep" and "shallow" in this context, so I asked for further clarity. ChatGPT offered the following definitions:
- Expressive = the ability to model more complex shapes, more combinations of features, more nonlinear problems
- Breadth = width; means many neurons (previously described as nodes) in a single layer, but fewer layers...would try to solve everything in one huge step
- Depth = many layers (each with maybe fewer neurons)...would try to solve the problem with many (cumulative) smaller steps...and gives "exponential expressive power" to a model
- Deep vs Shallow = a deep network can represent certain functions with a small number of neurons, while a shallow network would need an exponentially large number of neurons to match it
Thus deep Neural Networks are exponentially more expressive than shallow ones.
Other terms defined by ChatGPT:
Activation Function = turns a neuron's linear output into a non-linear signal, giving a neural network the power to learn complex patterns. It is a small mathematical function applied to every neuron in a Neural Network: it takes the neuron's input and decides what the neuron outputs. This 'decision' ability distinguishes it from a normal linear equation and allows Neural Networks to 'learn'. Activation functions introduce 'non-linearity', and real-world data (speech, images, handwriting, etc.) is non-linear.
Each neuron computes > z = weights · inputs + bias
...then the Activation Function σ is applied to that result > a = σ(z)
ReLU (if the input is negative, output zero; otherwise output the input unchanged) is the most common activation function. Other activation functions include Sigmoid (good for binary classification), Tanh (good for positive and negative outcomes), and Softmax (turns a vector into a probability distribution, good for multi-class (multiple possible outcome) classification).
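To make these definitions concrete, here is a minimal NumPy sketch of the activation functions named above and of one hidden-layer computation. The layer sizes and input values are made up for illustration; nothing here comes from Neil's notes or the tutorial.

# Activation functions sketch (illustrative sizes and values)
import numpy as np

def relu(z):
    return np.maximum(0, z)  # negative inputs become zero; positive inputs pass through unchanged

def sigmoid(z):
    return 1 / (1 + np.exp(-z))  # squashes any input into (0, 1); good for binary classification

def softmax(z):
    e = np.exp(z - z.max())  # subtract the max for numerical stability
    return e / e.sum()  # turns a vector into a probability distribution that sums to 1

# One hidden layer: z = weights @ inputs + bias, then a = activation(z)
rng = np.random.default_rng(0)
x = rng.normal(size=3)  # 3 input nodes
W = rng.normal(size=(4, 3))  # 4 hidden neurons, each connected to all 3 inputs
b = np.zeros(4)  # one bias per neuron
a = relu(W @ x + b)  # non-linear output of the hidden layer
print(a)

(Tanh needs no helper; NumPy already provides it as np.tanh.)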
Loss Function = measures how wrong the model's predictions are. Compares the prediction with the correct answer. Returns an error value that should be minimized. Used in training a Neural Network model...to make it more effective.
Training¶
Neil goes through a huge list of concepts and terminology to explain Neural Network model training. The ones that stuck with me as very important include:
- Back Propagation = feeding back errors into the model to adjust and improve neuron weights...and hopefully prediction accuracy
- Gradient Descent = a specific mathematical procedure to reduce loss or errors
- Learning Rate = how small the adjustments made during gradient descent are
- Stochastic Gradient Descent = doing GD on a small random subset of the big data set to increase speed and reduce memory demands (see the sketch after this list)
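Here is the minimal sketch mentioned above: gradient descent on a one-weight model, with made-up data. It also shows the Loss Function from earlier doing its job; all names and numbers are illustrative, not from Neil's notes.

# Gradient descent sketch (made-up data roughly following y = 3x)
import numpy as np

x = np.array([1.0, 2.0, 3.0, 4.0])
y = np.array([3.1, 5.9, 9.2, 11.8])

w = 0.0  # the single weight to learn
learning_rate = 0.01  # how small each adjustment is

for step in range(200):
    pred = w * x  # the model's predictions
    loss = ((pred - y) ** 2).mean()  # loss function: mean squared error
    grad = (2 * (pred - y) * x).mean()  # gradient of the loss with respect to w
    w -= learning_rate * grad  # the gradient descent step

print(w, loss)  # w should land close to 3

Stochastic Gradient Descent would compute grad on a random subset of x and y at each step instead of the full arrays, and back propagation is how a real network obtains the equivalent of grad for every weight at once.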
Models¶
Models can be built from scratch or be modified from existing ones available on Hugging Face, Kaggle, etc.
Frameworks¶
Python extensions to help with Machine Learning models include scikit-learn, JAX, PyTorch, and TensorFlow.
Research > Machine Learning¶
Assignment¶
Python & Machine Learning¶
I found this tutorial series on YouTube that is similar to Neil's example from class.
- Use MS Paint to generate characters for recognition. The video recommends the use of a "black" background (use the 'fill' tool) and the "oil brush".
In the 2nd Tutorial Video we are taught how to collect images from MS Paint. The procedure involves four steps:
- Screen Capture
- Generate dataset and load it
- Fit the model using SVC and calculate accuracy
- Prediction of image drawn in paint
Screen Capture¶
Two libraries are needed to make screen capture possible using Python code, 'pyscreenshot' and 'time'. The second is part of Python's standard library; the first requires a pip install.
! pip install pyscreenshot
! pip install Pillow
! pip install mss
! pip install pyautogui
! pip install wxPython
# Screen Capture
# Needed Libraries
import pyscreenshot as ImageGrab
import time
Folders need to be created to store screen capture images for the characters to be recognized. A "captured_images" folder is created inside my "images" directory. Inside the "captured_images" folder, the tutorial says that individual folders for each character to be recognized should be created. I created a folder for each number from zero to nine.
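The ten digit folders can also be created in code rather than by hand; a small sketch, assuming the "images/captured_images/" path described above:

# Create one folder per digit inside images/captured_images/
import os

for digit in range(10):
    os.makedirs("images/captured_images/" + str(digit), exist_ok=True)  # exist_ok avoids an error if the folder already exists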
Then in the code, the path to one of the character folders is specified and assigned to the variable "images_folder", followed by a for-loop that captures 5 images at 8-second intervals.
# Capture 5 images at 8-second intervals
images_folder = "images/auto_images/0/"
for i in range(0, 5):  # 5 images
    time.sleep(8)  # 8s interval
    im = ImageGrab.grab(bbox=(100, 360, 1000, 1100))  # location of top left of pc window...adjust as required
    print("saved.....", i)
    im.save(images_folder + str(i) + '.png')
    print("clear screen and redraw now...")
saved..... 0
---------------------------------------------------------------------------
FileNotFoundError                         Traceback (most recent call last)
Cell In[8], line 7
      5 im = ImageGrab.grab(bbox=(100,360,1000,1100)) #location of top left of pc window...adjust as required
      6 print("saved.....", i)
----> 7 im.save(images_folder+str(i)+'.png')
      8 print("clear screen and redraw now...")

File c:\Users\senna\AppData\Local\Programs\Python\Python313\Lib\site-packages\PIL\Image.py:2566, in Image.save(self, fp, format, **params)
   2564     fp = builtins.open(filename, "r+b")
   2565 else:
-> 2566     fp = builtins.open(filename, "w+b")
   2567 else:
   2568     fp = cast(IO[bytes], fp)

FileNotFoundError: [Errno 2] No such file or directory: 'images/auto_images/0/0.png'
Well, dang it. The code generates an error. The traceback itself just says the 'images/auto_images/0/' folder does not exist yet (the folder-creation snippet earlier would clear that). But I asked ChatGPT for an explanation, and the bigger upshot is...if I am running Jupyter Notebook on a Remote Server (I am)...the program CANNOT see my PC screen, so screen capture is not possible.
So much for the cool technique of having screenshots automatically recorded into my Jupyter Notebook folder. I will have to take screenshots by hand and just add them to my folders manually.
Good to know that if I run Jupyter Notebook locally, I can do screenshots! Maybe this is a good time for me to figure out how to run my Jupyter Notebook locally in VScode? Or is this a time sink?
On to Part 3 of the tutorial.
Training Data Generation¶
So I had to resort to drawing and saving characters (numbers 0 to 9) by hand in MS Paint. It didn't take that much time, and it was kind of relaxing. I generated 5 versions of each number, as was done in the tutorial, and saved the 5 images for each number into their respectively named folders in my Jupyter Notebook.
Since the Machine Learning process will be an image recognition exercise, it occurred to me that it is not necessary to use Arabic numerals (0-9). Any graphical shape with an explicit numerical meaning will do. So I decided to use Japanese Numerals.
The Automated Screen Capture code is turned into a function, in case I can figure out how to run my Jupyter Notebook locally in VScode.
# Automated Screen Capture Function
def screen_capture():
    import pyscreenshot as ImageGrab
    import time
    images_folder = "images/captured_images/0/"
    for i in range(0, 5):  # 5 images
        time.sleep(8)  # 8s interval
        im = ImageGrab.grab(bbox=(60, 170, 400, 500))  # location of top left of pc window...adjust as required
        print("saved.....", i)
        im.save(images_folder + str(i) + '.png')
        print("clear screen and redraw now...")
Generate Dataset from Character Images¶
The tutorial recommends installing 'opencv-python', 'scikit-learn' and 'pandas'. 'Pandas' is already installed, so as before, I pip install 'opencv-python' and 'scikit-learn'.
Now we move on to generating a dataset from the 200 character images. The objective is to create a dataframe (a spreadsheet) 785 cells wide by 201 cells tall: one header row plus one row per image, each row holding a label and 784 pixels of colour data. Each image is reduced to a 28 x 28 matrix, and each cell is filled with a value representing a colour in the greyscale range: 'black' is assigned the lowest value, zero, while 'white' is assigned the highest value, 255.
To build the dataframe the tutorial uses the following code, to which I made small modifications...
! pip install opencv-python
# Generate Dataset
import cv2
import csv
import glob

header = ["label"]
for i in range(0, 784):  # 784 because a 28 x 28 matrix is being created
    header.append("pixel" + str(i))  # add extra header labels along the top of the dataframe

# Open a file named "character_dataset.csv" in append mode ("a") and assign the file object to the variable "f".
# Note: because of append mode, re-running this cell writes another header row into the same file.
with open('datasets/character_dataset.csv', 'a') as f:
    writer = csv.writer(f)  # create a CSV writer object that writes to file f
    writer.writerow(header)  # write a single row of header labels to the CSV file

for label in range(10):  # from 10 folders
    dirList = glob.glob("images/captured_images/" + str(label) + "/*.png")
    for img_path in dirList:
        im = cv2.imread(img_path)  # read image data
        im_gray = cv2.cvtColor(im, cv2.COLOR_BGR2GRAY)  # convert image to greyscale from BGR
        im_gray = cv2.GaussianBlur(im_gray, (15, 15), 0)  # blur image with GaussianBlur to increase smoothness. (15,15) is the kernel size; 0 auto-calcs the sigma_x and sigma_y req'd to blur the image.
        roi = cv2.resize(im_gray, (28, 28), interpolation=cv2.INTER_AREA)  # resize image to 28px x 28px with one method of interpolation; stored in variable 'roi' = region of interest
        data = []
        data.append(label)
        rows, cols = roi.shape
        # Add px one by one into data array
        for i in range(rows):
            for j in range(cols):
                k = roi[i, j]  # k is the greyscale value: zero is black, 255 is white. Threshold set at 100.
                if k > 100:
                    k = 1  # flatten bright pixels (the light strokes) to 1...
                else:
                    k = 0  # ...and dark background pixels to 0
                data.append(k)
        with open('datasets/character_dataset.csv', 'a') as f:  # opens the file in append mode
            writer = csv.writer(f)
            writer.writerow(data)  # writes one row per processed image
The code successfully creates a dataframe and saves it into the 'datasets' folder as "character_dataset.csv". Each row contains the data for one image: its label plus all 784 pixels. The number of rows equals the number of images, and the number of columns equals the number of datapoints per character image. In my case, with 320 character images, I have a dataframe with 320 rows and 785 columns (plus the header line in the CSV file).
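A quick sanity check that the CSV came out the expected size (a small sketch, assuming the path used above):

# Count the lines in the CSV: expect one header line plus one line per image
with open('datasets/character_dataset.csv') as f:
    print(sum(1 for line in f))  # 321 in my case: 1 header + 320 images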
Loading the Dataset¶
With the dataframe built, the next step is to prepare the dataset for machine learning testing by shuffling the data rows. Scikit-learn's shuffle utility is used.
The tutorial's code is as follows...
! pip install pandas
! pip install scikit-learn
# Load Dataset
import pandas as pd
from sklearn.utils import shuffle #shuffle to randomly order data instead of ordered from small to large
data = pd.read_csv("datasets/character_dataset.csv")
data = shuffle(data)
data
| | label | pixel0 | pixel1 | pixel2 | pixel3 | pixel4 | pixel5 | pixel6 | pixel7 | pixel8 | ... | pixel774 | pixel775 | pixel776 | pixel777 | pixel778 | pixel779 | pixel780 | pixel781 | pixel782 | pixel783 |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 308 | 9 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | ... | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
| 196 | 6 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | ... | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
| 12 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | ... | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
| 63 | 1 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | ... | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
| 309 | 9 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | ... | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
| ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
| 217 | 6 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | ... | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
| 139 | 4 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | ... | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
| 31 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | ... | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
| 173 | 5 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | ... | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
| 152 | 4 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | ... | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 |
320 rows × 785 columns
Row shuffling successfully completed.
Train the Model¶
The tutorial Part 3 suggests installing the matplotlib and joblib Python packages using pip. I opened the terminal and ran the commands, only to discover that they are both already installed.
The next step: separate the dependent and independent variables in the data. Remove the 'label' column and assign the rest to the variable x; assign the 'label' column to the variable y.
x = data.drop("label", axis=1) #remove the "label" column from the dataframe; axis=1 drops a column rather than a row
y = data["label"]
Then, as a test, we visualize one row of data (the data for a single image), selecting it by its index value and reshaping it from a single row into a 28 x 28 pixel square. Matplotlib plots the image.
! pip install matplotlib
# preview one image using Matplotlib
%matplotlib inline
import matplotlib.pyplot as plt
import cv2
idx = 319 #input a row index value...from the 1st column
img = x.loc[idx].values.reshape(28,28) #grab x-values for the index row and reshape into a 28 x 28
print(y[idx])
plt.imshow(img)
9
<matplotlib.image.AxesImage at 0xe13a59a17d90>
Success!! The hand-drawn images are turned into high-contrast, pixelized images. What was black is now purple, and what was white is now yellow (matplotlib's default colour map). Index 319 in the example is data for the number 9.
Separating into Training & Testing Data¶
- 20% of the available image data will be used for testing purposes
- 80% of the images are used for training purposes (more images should always be given for training purposes)
- Training images are used to create the model
- Testing images are used to calculate accuracy
Training: give both the pixel values and the label to the model. You must teach the model by providing pixel values together with the label for those pixel values.
Testing: give only pixel values to the trained model and ask it to return the label. "Accuracy" is the percentage of correct labels returned by the model.
# Test-Train Split
from sklearn.model_selection import train_test_split
train_x, test_x, train_y, test_y = train_test_split(x,y, test_size = 0.2) #0.2 = 20% of dataset images will be used for testing purposes
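A quick check that the 80/20 split came out as expected, using the variables just created:

# With 320 images, expect 256 training rows and 64 testing rows
print(len(train_x), len(test_x))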
Fit an SVM Model using SVC and Save the Model using Joblib¶
SVM is "Support vector machines (SVMs) are a set of supervised learning methods used for classification, regression and outliers detection." according to scikit-learn.org
SVC is "C-Support Vector Classification". Based on libsvm. "The fit time scales at least quadratically with the number of samples and may be impractical beyond tens of thousands of samples." The definition is from {Scikit-learn.org](https://scikit-learn.org/stable/modules/generated/sklearn.svm.SVC.html)
The following code from the tutorial creates a model with a fit function and saves it into the "model" folder. The SVC constructor is given a "linear" kernel type and a random_state of 6.
kernel = in the SVM context, a function that measures the similarity between two samples, implicitly mapping the data into a higher-dimensional space where a linear separation becomes possible. (The first definition I found, from geeksforgeeks.org, "the core part of an operating system", is a different sense of the word entirely.)
import joblib
from sklearn.svm import SVC
classifier = SVC(kernel="linear", random_state=6) #linear kernel; random_state fixed for repeatable runs
classifier.fit(train_x, train_y) #create model
joblib.dump(classifier, "model/digit_recognizer") #save model
['model/digit_recognizer']
Success!!
Calculate Accuracy¶
Use the metrics utility of Scikit-Learn to run accuracy calculations for the model.
from sklearn import metrics
predictions = classifier.predict(test_x) #using only x values, no need for y labels
print("Accuracy: ", metrics.accuracy_score(predictions, test_y)) #accuracy_score compares the model predictions with the data value label
Accuracy: 0.9375
With the initial dataset of 50 character images, my model had an 80% accuracy at recognizing the number suggested by the graphic. Not great. I think I still need more samples.
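Before adding samples, it is worth seeing which digits the model actually confuses. A small sketch using scikit-learn's confusion matrix, assuming the predictions and test_y objects from above:

# Rows are true labels 0-9, columns are predicted labels; off-diagonal counts are mistakes
from sklearn import metrics
print(metrics.confusion_matrix(test_y, predictions))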
Update 1: Dataset size increased to 200 image samples; model accuracy increases to 85%.
Update 2: Dataset size increased by 120 samples, now 320 total, and model accuracy has improved to 93.75%.
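Besides adding samples, the kernel is another knob worth turning. A hedged sketch (my own experiment, not from the tutorial) that refits the model with a few kernels on the same split; "rbf" is scikit-learn's default and may or may not beat "linear" on this data:

# Compare SVC kernels on the same train/test split
from sklearn import metrics
from sklearn.svm import SVC

for kernel in ["linear", "rbf", "poly"]:
    clf = SVC(kernel=kernel, random_state=6)
    clf.fit(train_x, train_y)
    print(kernel, metrics.accuracy_score(test_y, clf.predict(test_x)))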
Extra Work: Running Jupyter Notebook Locally¶
I really wanted to run the above ML model locally, since the tutorial suggested it could watch what I was drawing in the Paint program and then make predictions in real time. When I was running the code in the remote-server interface of Jupyter Notebook, the program could not see my Windows desktop. To use the program's full functionality, I need to run Jupyter Notebook locally in VScode.
Long story short, it took some doing, but now I am able to update my documentation locally in VScode and push to the server via git. It also seems that I can run Python code locally. The process took lots of effort and help from ChatGPT. In brief, I needed to:
- clone my repository from Gitlab (using SSH)
- create an SSH key on my PC and add the public key to Gitlab
- install the Jupyter extension in VScode
- install the Python extension in VScode
- create a Python virtual environment in VScode
- install ipykernel
Now to test the program...
Had to:
- update Pillow, a dependency of pyscreenshot, to a version compatible with the newest Python
Modifying the Screen Capture code...
# Screen Capture
# Needed Libraries
import pyscreenshot as ImageGrab
import time

images_folder = "images/auto_images/94"
for i in range(0, 10):  # 10 images
    time.sleep(8)  # 8s interval
    im = ImageGrab.grab(bbox=(150, 230, 900, 900))  # location of top left of pc window...adjust X1, Y1, X2, Y2 as required
    print("saved.....", i)
    im.save(images_folder + str(i) + '.png')
    print("clear screen and redraw now...")
OK! After a bit of tweaking, got the code to:
- capture images from the right place on the screen (where the drawing area of MS Paint is situated)
- name the saved files so that the last character of images_folder = "images/auto_images/0" acts as the prefix for the sequence of images that are shot and saved as PNG files.
The image database has been increased to 500 data points (50 samples for each numerical digit from 0 to 9). Let's move on to generating a new ML model using the bigger dataset...and see if the accuracy improves!
Generate a Dataframe from the Dataset
! pip install Numpy
! pip install opencv-python
Dang it. OpenCV cannot be installed...because NumPy, which OpenCV depends on, does not yet provide a build for the latest version of Python.
ChatGPT recommends > using an older (stable) version of Python, not the latest version (yet).
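A quick way to check what is actually installed when chasing this kind of compatibility problem (the version numbers will differ per machine):

# Print the interpreter and NumPy versions to check compatibility
import sys
print(sys.version)

import numpy
print(numpy.__version__)  # the import itself fails with ModuleNotFoundError if NumPy is absent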
# Generate Dataset
import cv2
import csv
import glob

header = ["label"]
for i in range(0, 784):
    header.append("pixel" + str(i))

with open('datasets/character_dataset.csv', 'a') as f:  # input correct dataset CSV file name
    writer = csv.writer(f)
    writer.writerow(header)

for label in range(10):
    dirList = glob.glob("images/captured_images/" + str(label) + "/*.png")  # specify the folder where training & testing images are stored
    for img_path in dirList:
        im = cv2.imread(img_path)
        im_gray = cv2.cvtColor(im, cv2.COLOR_BGR2GRAY)
        im_gray = cv2.GaussianBlur(im_gray, (15, 15), 0)
        roi = cv2.resize(im_gray, (28, 28), interpolation=cv2.INTER_AREA)
        data = []
        data.append(label)
        rows, cols = roi.shape
        # Add px one by one into data array
        for i in range(rows):
            for j in range(cols):
                k = roi[i, j]
                if k > 100:  # threshold value
                    k = 1
                else:
                    k = 0
                data.append(k)
        with open('datasets/character_dataset.csv', 'a') as f:  # opens the file in append mode
            writer = csv.writer(f)
            writer.writerow(data)  # writes one row per processed image
Shuffle the Dataframe rows
# Load Dataset
import pandas as pd
from sklearn.utils import shuffle #shuffle to randomly order data instead of ordered from small to large
data = pd.read_csv("datasets/character_dataset.csv")
data = shuffle(data)
data
Separate Dependent/Independent Variables & Remove Label
x = data.drop("label", axis=1) #remove the "label" column from the dataframe; axis=1 drops a column rather than a row
y = data["label"]
Preview Pixelated Image
# preview one image using Matplotlib
%matplotlib inline
import matplotlib.pyplot as plt
import cv2
idx = 319 #input a row index value...from the 1st column
img = x.loc[idx].values.reshape(28,28) #grab x-values for the index row and reshape into a 28 x 28
print(y[idx])
plt.imshow(img)
Split the Training Data > Training vs Testing
Test-Train Split¶
from sklearn.model_selection import train_test_split

train_x, test_x, train_y, test_y = train_test_split(x, y, test_size=0.2)  # 0.2 = 20% of dataset images will be used for testing purposes
Run the SVM Fitting Function on the Dataset
import joblib
from sklearn.svm import SVC
classifier = SVC(kernel="linear", random_state=6) #linear kernel; random_state fixed for repeatable runs
classifier.fit(train_x, train_y) #create model
joblib.dump(classifier, "model/digit_recognizer") #save model
Calculate Model Accuracy
from sklearn import metrics
predictions = classifier.predict(test_x) #using only x values, no need for y labels
print("Accuracy: ", metrics.accuracy_score(predictions, test_y)) #accuracy_score compares the model predictions with the data value label
(work incomplete...more to come)