In this project, we train a deep learning model to recognize four types of sports racquets - badminton, tennis, squash and pickleball. They may look similar, but telling them apart can actually be quite tricky! This blog post is based on a hands-on Jupyter Notebook, so you can follow along or try it out yourself. The link to the Jupyter Notebook is shared at the bottom of the page.
This end-to-end notebook walks through:
- Data collection (including automated image scraping),
- Model training and tuning using ResNet18,
- Interpreting loss and error metrics the fastai way,
- Testing on unseen images with manual labeling,
- And finally, saving the model for future use.
The goal isn't just to build a working classifier — it's to understand the process, reason through decisions and lay the foundation for more complex computer vision projects down the line.
Setup Instructions¶
Run the following commands in your terminal to install the necessary dependencies:
pip install fastai duckduckgo_search
- fastai is a high-level deep learning library built on top of PyTorch, which we will use to train and evaluate our racquet image classifier.
# Check for fastai dependencies
import sys

try:
    from fastai.vision.all import *
    print("fastai is installed.")
except ImportError:
    print("fastai not found. Please install it via: pip install fastai")
    sys.exit(1)
fastai is installed.
# Define racquet categories
# These names will be passed in the image search request and used to create folders for the images
sports = ["tennis racquet", "badminton racquet", "squash racquet", "pickleball racquet"]
# Base image directory
base_dir = Path("images")
Create folders where images will be downloaded¶
Note: Run the cell below only once; otherwise you will delete all the downloaded images and have to download them again.
from pathlib import Path
import shutil

# Clean up and create folders
for item in sports:
    sport_folder = item.split()[0].lower()  # Get 'tennis' from 'tennis racquet'
    folder = base_dir / sport_folder
    if folder.exists():
        shutil.rmtree(folder)
        print(f"Removed existing folder: {folder.resolve()}")
    folder.mkdir(parents=True, exist_ok=True)
    print(f"Created folder: {folder.resolve()}")
Downloading Racquet Images¶
In the next step, we will download 300 images for each racquet category using the duckduckgo_search library. Although the images are ultimately sourced from Bing, we're using the DuckDuckGo interface to bypass the bot protection, rate limiting, and API key restrictions that come with direct access to Bing or Google.
DuckDuckGo itself leverages Bing under the hood for image search results (reference: Hacker News). When you search for images on DuckDuckGo in a browser, the content is silently fetched from Bing, often proxied through DDG to enhance user privacy.
This approach is fine, at least for our small-scale, non-commercial project.
import time, requests
from pathlib import Path
from io import BytesIO

from duckduckgo_search import DDGS
from PIL import Image, ImageOps

MAX_SIZE = 400  # pixel size
DELAY = 0.5     # seconds

# Validate image bytes (not corrupted)
def is_valid_image(img_bytes):
    try:
        img = Image.open(BytesIO(img_bytes))
        img.verify()  # Check corruption
        # Re-open the image to access dimensions and file type
        # This is necessary because verify() doesn't load the image data
        # Refer: https://pillow.readthedocs.io/en/stable/reference/Image.html#PIL.Image.Image.verify
        img = Image.open(BytesIO(img_bytes))
        if img.width < 200 or img.height < 200:
            print(f"Image too small: {img.width}x{img.height}")
            return False
        return True
    except Exception:
        return False

# Main download function
def download_images_bing(query, folder_path, max_images):
    print(f"\n~~~ Searching for: {query}")
    count = 0
    with DDGS() as ddgs:
        results = ddgs.images(query, max_results=max_images)
        for result in results:
            url = result.get("image")
            if not url:
                continue
            try:
                response = requests.get(url, timeout=10)
                response.raise_for_status()
                img_bytes = response.content

                if not is_valid_image(img_bytes):
                    continue

                img = Image.open(BytesIO(img_bytes))
                file_ext = img.format.lower()
                if file_ext not in ["jpeg", "jpg", "png"]:
                    print(f"Unsupported image format: {file_ext}")
                    continue

                # Resize images larger than MAX_SIZE down to MAX_SIZE
                if img.width > MAX_SIZE or img.height > MAX_SIZE:
                    print(f"Resizing image: {img.width}x{img.height}")
                    img = ImageOps.contain(img, (MAX_SIZE, MAX_SIZE))  # Maintains aspect ratio
                    img_bytes_io = BytesIO()
                    img.save(img_bytes_io, format=file_ext)
                    img_bytes = img_bytes_io.getvalue()

                filename = f"{query.replace(' ', '_')}_{count:03d}.{file_ext}"
                filepath = Path(folder_path) / filename
                with open(filepath, "wb") as f:
                    f.write(img_bytes)
                count += 1
                print(f"Saved: {filepath}")
                time.sleep(DELAY)  # preventive measure for possible rate limiting on ddg
            except Exception as e:
                print(f"Error downloading {url}: {e}")
    print(f"Finished downloading {count} images for '{query}'")
In the above code, along with downloading and validating images, we also resize any image larger than 400 pixels (on its longer side) down to 400 pixels, while maintaining the aspect ratio. This is done because:
- Large images consume significantly more GPU, RAM, and disk space.
- They slow down data loading and training.
- For image classification tasks, a 400px resolution is typically sufficient and strikes a good balance between accuracy and efficiency.
Note: In production datasets, we should also apply data augmentation techniques, such as random cropping, flipping, rotation and brightness adjustments, to a random subset of images. This helps the model generalize better and become robust to variations in real-world inputs.
However, for this small-scale project, we’re intentionally skipping augmentations to keep the workflow focused and easy to understand.
# Download images for each racquet category
MAX_IMAGES = 300
for sport in sports:
    folder = Path("images") / sport.split()[0].lower()
    download_images_bing(sport, folder, MAX_IMAGES)
# Verify image downloads
for sport in sports:
    folder = Path("images") / sport.split()[0].lower()
    # Count all image files in the folder
    file_count = len(list(folder.glob("*.*")))
    if file_count == 0:
        print(f"No images found in {folder}.")
    else:
        print(f"{file_count} images found in {folder}.")
We requested 300 images per category, but the actual counts are:
- Tennis: 260 images
- Badminton: 191 images
- Squash: 176 images
- Pickleball: 272 images
Some images were skipped due to:
- Unsupported formats like .webp
- Dimensions smaller than 200×200 pixels
- Access issues (e.g., 403 Forbidden)
- Corrupted or invalid files
Our data is downloaded and validated!
Note: In production systems, image scraping, downloading, validation and preprocessing are never done within a training notebook or script. These tasks are treated as part of the data ingestion pipeline and are typically handled as separate jobs or services.
Let's proceed to train our model.¶
We'll first define a DataBlock.
A DataBlock is a high-level API in fastai for building datasets and DataLoaders. It allows us to define how to get our input items, how to label them, how to split the data and what transforms to apply.
You can refer to the official documentation here: https://docs.fast.ai/data.block.html#DataBlock
Below is the configuration we'll use for this project. Each line will be explained after the code block:
db = DataBlock(
    blocks=(ImageBlock, CategoryBlock),
    get_items=get_image_files,
    splitter=RandomSplitter(valid_pct=0.2, seed=42),
    get_y=parent_label,
    item_tfms=[Resize(192, method='pad')]
)
Explanation of the parameters in the code above:
- blocks: The inputs to our model are images, and the outputs are categories (in our case, "badminton", "squash", etc.).
- get_items: A function to retrieve raw items — in our case, image file paths.
- splitter: A function that returns training and validation indices. Here we use a random 80/20 split with a fixed seed for reproducibility.
- get_y: A function to extract the label from each item — we’re using the parent folder name as the label.
- item_tfms: Transformations applied to each item — here, resizing images to 192×192 by padding. Padding maintains the aspect ratio.
OK, so now we have defined the blueprint:
- What type of inputs/targets to expect
- How to get them
- How to split the dataset
- What transforms to apply
But no actual data is loaded or processed at this point.
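As an aside: earlier we said we're intentionally skipping data augmentation. For reference, adding fastai's built-in augmentations would only require one extra argument in the blueprint. This is a sketch and is not used in this project:

# Sketch only (not used in this project): the same DataBlock with batch-level augmentations
db_aug = DataBlock(
    blocks=(ImageBlock, CategoryBlock),
    get_items=get_image_files,
    splitter=RandomSplitter(valid_pct=0.2, seed=42),
    get_y=parent_label,
    item_tfms=[Resize(192, method='pad')],
    batch_tfms=aug_transforms()   # random flips, rotations, zooms, lighting changes
)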
Create the dataloader
dls = db.dataloaders(base_dir, bs=64)
What happened in the above cell?
The blueprint that we created in the previous step is applied to the actual data present under base_dir (in our case, the images/ folder).
The dataloaders() method scans the images/ directory, retrieves all image files that match the blueprint, splits them into training and validation sets, applies any item transforms (like resizing), and finally batches the data.
Batch Size (bs=64): This specifies that the DataLoaders object should create batches of 64 images. Each batch is a single, collective unit that’s fed into the model during training. Using a moderate batch size like 64 helps balance memory usage and training speed.
The returned dls object is an instance of the DataLoaders class. It encapsulates:
- dls.train: A DataLoader for the training set.
- dls.valid: A DataLoader for the validation set.
These sub-DataLoaders are built on top of PyTorch's DataLoader but with additional fastai functionalities. Read the official doc here: https://docs.fast.ai/data.load.html
This step has finalized our data ingestion pipeline. The created DataLoaders object (dls) serves as the interface between our dataset and our model during training.
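Before training, it's worth sanity-checking what the DataLoaders actually produced. For example:

# Quick sanity checks on the DataLoaders
dls.show_batch(max_n=9)   # display a grid of sample images with their labels
print(dls.vocab)          # the category names the model will learn to predict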
Training Our Model¶
We will begin by fine-tuning an existing, well-established computer vision model. Fine-tuning is the process of adapting a model that has already been trained on a large, general-purpose dataset to a new, more specific task. This saves time and cost for us.
For this project, we will be using ResNet18, a lightweight yet powerful convolutional neural network pretrained on the ImageNet dataset. It offers a great balance between speed and accuracy, making it ideal for rapid experimentation and limited compute environments. By fine-tuning ResNet18, we can adapt its learned representations to accurately classify images across our four racquet categories.
Here we go.
To train our model, we will use the vision_learner API from the fastai vision module, which is specifically designed to streamline transfer learning for computer vision tasks. This API encapsulates everything needed to set up a Learner - a core abstraction in fastai that binds together a model, the dataloaders (which we created above) and a loss function. You can read more about the Learner class here.
vision_learner simplifies the process of leveraging pretrained models (such as ResNet18) for classification. It automatically handles the necessary setup for transfer learning, including proper initialization of the model's final layers to suit our dataset.
Once the learner is configured, we invoke fine_tune(3), which trains the model for 3 epochs. This method first freezes the pretrained base to train only the new classification head, and then gradually unfreezes and fine-tunes the entire model. The official doc of fine_tune is available here.
learn = vision_learner(dls, resnet18, metrics=error_rate)
learn.fine_tune(3)
epoch | train_loss | valid_loss | error_rate | time |
---|---|---|---|---|
0 | 1.721788 | 0.769392 | 0.284916 | 00:26 |
/home/commando/python_envs/learn_ml/lib/python3.12/site-packages/PIL/Image.py:1045: UserWarning: Palette images with Transparency expressed in bytes should be converted to RGBA images warnings.warn(
epoch | train_loss | valid_loss | error_rate | time |
---|---|---|---|---|
0 | 0.716825 | 0.562591 | 0.212290 | 00:51 |
1 | 0.523383 | 0.567538 | 0.206704 | 00:47 |
2 | 0.400680 | 0.560361 | 0.195531 | 00:57 |
Training Results¶
The model was trained locally on my laptop, a standard machine with no dedicated GPU:
- CPU: Intel i7 13th Gen
- Memory: 16 GB
- GPU: Integrated Intel Graphics
Despite lacking a dedicated GPU, training was completed in a reasonable time of around 3 minutes for 3 epochs.
Here are the training results:
Initial Phase (frozen base layer)¶
epoch | train_loss | valid_loss | error_rate | time |
---|---|---|---|---|
0 | 1.823223 | 0.750006 | 0.240223 | 00:20 |
Fine-Tuning Phase (unfrozen model)¶
epoch | train_loss | valid_loss | error_rate | time |
---|---|---|---|---|
0 | 0.663238 | 0.580100 | 0.201117 | 00:53 |
1 | 0.510640 | 0.544243 | 0.173184 | 00:51 |
2 | 0.372500 | 0.517990 | 0.150838 | 00:52 |
As seen, the error rate steadily decreased with each epoch, indicating the model is learning to distinguish racquet types better over time. The final error rate of ~15% is quite decent for a first pass, especially considering our small dataset.
Before we start analyzing our results more deeply, it’s important to understand the two key components commonly found in modern deep learning workflows: the base model and the custom classifier.
The base model (also called the pretrained model, feature extractor or sometimes the backbone) is typically a convolutional neural network (eg ResNet18) that has already been trained on a large and diverse dataset (eg ImageNet). Its job is to extract general visual features (like edges, textures, and patterns) that are useful across many tasks.
The custom classifier (also referred to as the head or task-specific classifier) is a set of new layers added on top of the base model. These layers are trained specifically for our problem - in this case, classifying images of racquets into categories.
With this structure in mind, let's break down how our model was trained in two distinct phases:
Initial Phase (Frozen Base Model)¶
- Pretrained Base Model (ResNet18): We began with ResNet18, a convolutional neural network pretrained on ImageNet. This model has already learned to identify general visual patterns—such as edges, textures, and shapes—that are widely applicable across image classification tasks.
- Frozen Weights: In this stage, the base model's weights are frozen, meaning they are not updated during training. This preserves the valuable feature extraction capabilities the model has learned from the large and diverse ImageNet dataset.
- Custom Classifier (Task-Specific Layers): On top of this frozen base model, a custom classifier was added by fastai’s vision_learner function. This classifier is a set of fully connected layers specifically designed to map the extracted features to our target classes—different types of racquets in our case.

In this phase, only the custom classifier is trained. It learns how to interpret the high-level features produced by the base model and map them to the correct racquet class (tennis, badminton, squash or pickleball).

Why This Matters:
- It allows for quick adaptation to our domain-specific data with minimal training effort.
- It ensures that the general visual understanding built into the base model is not disturbed, giving us a solid foundation without requiring retraining from scratch.
Inspecting the Model¶
To view the details of the model, you can use:
learn.model #shows the complete architecture.
learn.model[0] #shows the base layer (ResNet18).
learn.model[1] #shows the head (custom classification layers).
Once our custom classifier (head) has learned to interpret the features extracted by the base model, we move to the next phase.
Fine-Tuning Phase¶
Unfreezing the Base Model¶
In this phase, we unfreeze the layers of the base model (ResNet18). This means all the convolutional layers—which were previously frozen to preserve their pretrained knowledge—are now allowed to update their weights during training.
Why unfreeze? Because the base model was originally trained on a generic dataset (ImageNet), and now it’s time to adapt those generic features to our specific task: recognizing different types of racquets.

For instance, ImageNet may have taught the model to recognize general features like curves, grips or mesh, but our racquet dataset may need a bit more tuning to differentiate between, say, a badminton racquet and a tennis racquet.
Now, both the base model and the custom classifier are trained together:
- The classifier continues to improve its ability to make task-specific predictions.
- The base model begins to adjust its filters to extract slightly more specialized features tailored to racquet identification.
Key Benefits¶
- This phase allows for deeper adaptation to our racquet dataset. This turns out to be helpful if our dataset is visually different from ImageNet.
- It helps the model refine feature extraction for better accuracy especially for edge cases.
This two-phase approach is the essence of transfer learning: it leverages the existing knowledge of ResNet18 and quickly adapts it to our specific task (classifying racquet images).
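For the curious, fine_tune bundles these two phases into a single call. A simplified sketch of what it roughly corresponds to (the real implementation also picks sensible learning rates for each phase):

# Roughly what learn.fine_tune(3) does, in simplified form
learn.freeze()            # Phase 1: only the new classification head is trainable
learn.fit_one_cycle(1)    # train the head for one epoch
learn.unfreeze()          # Phase 2: make the whole network trainable
learn.fit_one_cycle(3)    # fine-tune base model + head together for 3 epochs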
Detailed Explanation of Result Table Headers¶
Now let’s understand the meaning of each column in our training results and interpret the data.
Let's revisit the result of Phase 1:
epoch | train_loss | valid_loss | error_rate | time |
---|---|---|---|---|
0 | 1.823223 | 0.750006 | 0.240223 | 00:20 |
Here’s a detailed analysis of each column and what the numbers mean:
1. epoch¶
An epoch is one full pass over the entire training dataset. Multiple epochs allow the model to iteratively adjust its internal weights to better fit the data. So, if you train for 3 epochs, the model will see each training sample 3 times — potentially improving its predictions each time.
If you remember, a couple of cells above, while creating the dataloaders we configured the batch size to 64:
dls = db.dataloaders(base_dir, bs=64)
Let’s say we have a total of 800 images for all racquets combined. We split this dataset into 80% for training and 20% for validation. That gives us 640 training images.
Given a batch size of 64, the 640 training images are divided into 10 batches. The model is trained on each of these batches sequentially during one epoch. For each batch, it:
- performs a forward pass to make predictions,
- compares predictions with actual labels to compute training loss,
- performs backpropagation and weight updates.
After all 10 batches are processed, that completes 1 epoch. The training loss for the epoch is the average of the individual batch losses.
Once training for that epoch is complete, the model is evaluated on the validation dataset (160 images):
- It makes predictions on the validation set without updating the weights.
- From this, we get the validation loss and error rate.
In short:
- Epoch = One complete pass over the training data only
- Validation = Happens after each epoch, using the held-out validation set to assess generalization performance.
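Note that 800 images is just a round number used for illustration; our actual downloaded dataset is a bit smaller. If you want to verify this arithmetic on the real DataLoaders, something like this should work:

# Check the actual split and batch counts on our dls object
print(f"Training items:   {len(dls.train_ds)}")
print(f"Validation items: {len(dls.valid_ds)}")
print(f"Batch size:       {dls.train.bs}")
print(f"Batches per training epoch: {len(dls.train)}")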
2. train_loss (Training Loss)¶
During the training phase, the model learns by adjusting its internal parameters — the weights of the neural network — to minimize errors in its predictions. Training loss is the key metric that tells us how far off the model’s predictions were from the actual labels on the training data.
For each batch, the model does the following:
- Forward Pass – It makes predictions for all 64 images in the batch.
- Loss Calculation – It compares these predictions with the actual labels using a loss function (cross-entropy in our case).
- Backpropagation – Based on this loss, it computes gradients and updates the weights to reduce the error.
This gives us the training loss for this particular batch.
Once all 10 batches (1 epoch) are processed:
- The training losses from each batch are averaged to produce the epoch-level training loss.
- This value gives us a sense of how well the model is doing on the data it is actively learning from.
A lower training loss over time typically indicates that the model is learning.
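Conceptually, one batch step looks roughly like the following in plain PyTorch. This is only an illustrative sketch; fastai's Learner performs this loop (plus a lot of extras) for us, so we never write it ourselves in this project:

import torch.nn.functional as F

def train_one_batch(model, xb, yb, optimizer):
    preds = model(xb)                   # 1. forward pass: predictions for the batch
    loss = F.cross_entropy(preds, yb)   # 2. loss calculation against the true labels
    loss.backward()                     # 3. backpropagation: compute gradients
    optimizer.step()                    #    update the weights
    optimizer.zero_grad()               #    reset gradients for the next batch
    return loss.item()                  # this batch's training loss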
In our racquet classification project, the vision_learner function from fastai automatically selects an appropriate loss function based on the task. Since we are solving a multi-class classification problem, fastai uses CrossEntropyLoss.
You can confirm this by:
learn.loss_func
FlattenedLoss of CrossEntropyLoss()
3. valid_loss (Validation Loss)¶
While the training loss tells us how well the model is performing on the training data, the validation loss is our best indicator of how well the model is likely to perform on unseen data (like in a production environment).
Once the model completes one epoch, it’s time to evaluate how well it generalizes. This is where the validation set comes in — the 20% portion of the data we had held back and not used during training.
Here’s what happens step-by-step:
- The model makes predictions on the entire validation set.
- It compares those predictions with the actual labels (just like it does with the training data).
- Then it calculates the average loss over all validation samples using the same loss function (in our case, CrossEntropyLoss).
- This average is the validation loss.
4. error_rate¶
Error Rate tells us what percentage of predictions made by the model were incorrect. This gives us a more human-readable performance measure.
Here is how it is calculated:
After an epoch completes:
- The model is run on the validation dataset.
- For each image, the model outputs predicted probabilities for all classes (racquet types).
- The class with the highest probability is selected as the model's prediction.
- This predicted label is compared against the actual label.
If they match : Correct.
If they don't : Incorrect.
The Error Rate is then calculated as:
Error Rate = (Number of Incorrect Predictions)/(Total Number of Validation Samples)
You will often see some models reporting accuracy — which is simply:
Accuracy = 1 - Error Rate
So if, in our example, the Error Rate is 0.24 (~24%), the Accuracy will be 1 - 0.24 = 0.76 (76%).
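If you want to recompute these numbers yourself after training, fastai's learn.validate() runs the model over the validation set and returns the validation loss followed by the metrics we configured (here, just error_rate):

# Re-evaluate on the validation set outside of a training run
valid_loss, err = learn.validate()
print(f"valid_loss: {valid_loss:.4f}, error_rate: {err:.4f}, accuracy: {1 - err:.4f}")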
5. time¶
The elapsed time to complete one epoch. This metric helps gauge how quickly the model is training. It can be influenced by factors like dataset size, model complexity and hardware (e.g., CPU vs. GPU).
Summary¶
Header | Data Used | Purpose | Is Lower Better? |
---|---|---|---|
epoch | — | Indicates how many full passes the model has made over the training dataset. | — |
train_loss | Training set | Measures how well the model fits the training data; used to guide weight updates during training. | Yes |
valid_loss | Validation set | Evaluates how well the model generalizes to unseen data; key for detecting overfitting. | Yes |
error_rate | Validation set | Proportion of incorrect predictions on validation data (1 - accuracy). | Yes |
time | Whole epoch | Duration taken to complete one full epoch (training + validation). | — |
Validation Loss vs. Error Rate¶
A common confusion that some people may have (I certainly had in the beginning) is: what’s the difference between validation loss and error rate?
Though both are evaluated on the validation set, they measure very different things. Let’s break down the differences in the table below:
Aspect | Validation Loss | Error Rate |
---|---|---|
Definition | A numerical value from the loss function (e.g., cross-entropy) | The fraction of incorrect predictions |
What it Measures | How well the model's probability distribution matches the true labels | Whether the model's top predicted class is correct or not |
Type | Continuous — can range across real values (e.g., 0.543) | Discrete — typically between 0 and 1 (e.g., 0.17 means 17% wrong) |
Sensitivity | Sensitive to confidence in correct predictions | Only considers right vs wrong, regardless of confidence |
Output Basis | Calculated from all predicted probabilities | Calculated from final class labels after argmax |
Interpretability | More nuanced but harder to interpret directly | Very interpretable — “X% predictions were wrong” |
Goal | Minimize it to improve model confidence and accuracy | Minimize it to reduce outright classification errors |
Use Case | Guides training and optimization of the model | Helps judge real-world prediction performance |
Example:¶
Suppose for an image of a tennis racquet, our model predicts the following probabilities:
- Tennis: 0.55
- Badminton: 0.40
- Squash: 0.03
- Pickleball: 0.02
Here is how to interpret it:
- Prediction is correct, because tennis has the highest probability and matches the true label.
- However, the confidence (55%) is not very high—this means the model wasn’t very sure.
- Validation loss (e.g., cross-entropy loss) will still be moderately high, because it penalizes low confidence even when the prediction is correct.
- Error rate = 0, because the top predicted class is correct.
To Summarize:
- Use validation loss for model optimization and fine-tuning.
- Use error rate for a high-level, human-readable performance metric.
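To make the numbers in that example concrete, here's a tiny sketch that computes the cross-entropy loss and the error contribution for that single prediction (the probabilities are the hypothetical ones above):

import torch

# Hypothetical predicted probabilities: tennis, badminton, squash, pickleball
probs = torch.tensor([0.55, 0.40, 0.03, 0.02])
true_class = 0  # tennis

# Cross-entropy for one sample is -log(probability assigned to the true class)
loss = -torch.log(probs[true_class])
print(loss.item())  # ~0.60: a noticeable loss even though the prediction is correct

# Error rate contribution: 0, because the argmax class matches the true class
print(int(probs.argmax().item() != true_class))  # 0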
Interpreting Train Loss, Valid Loss and Error Rate¶
Jeremy Howard, co-founder of fastai and a respected authority in AI, emphasizes that overfitting in deep learning is widely misunderstood. Contrary to popular belief, a lower training loss compared to validation loss is not a sign of failure. It is expected and reflects a properly trained model. He says that overfitting is rare in modern deep learning and requires deliberate effort to induce, such as disabling safeguards like data augmentation, dropout or weight decay.
The true indicator of overfitting isn’t the loss gap but a rising validation error rate - the point where the model’s prediction accuracy on unseen data deteriorates despite improving training performance. He clarifies that we should focus on error rates (e.g., misclassifications) rather than obsessing over loss values. As long as error rate improves, longer training is beneficial, even if validation loss increases.
Summary:
- Error rate (not loss) determines overfitting.
- Modern models generalize well unless stripped of regularization tools.
- Continue training until error rate plateaus or starts increasing.
Testing the Trained Model on Unseen Images¶
Our model is now fully trained, and it's time to evaluate its performance on unseen images of racquets.
To do this, I downloaded a handful of racquet images from the internet and placed them in a separate folder named test_images, which resides at the same level as this Jupyter notebook file.
To make evaluation easier, I manually renamed each file by prefixing the filename with the first letter of the correct category:
e.g.:
- t_1.jpg → Tennis racquet
- b_3.png → Badminton racquet
- s_4.jpeg → Squash racquet
- p_2.jpg → Pickleball racquet
This convention allows us to automatically extract the correct label for each image and compare it with the model’s prediction.
# Set the test images path
test_images_folder = Path("test_images")

prefix_to_label = {
    'b': 'badminton',
    't': 'tennis',
    's': 'squash',
    'p': 'pickleball'
}
With the setup in place, we are now ready to test our model against the unseen racquet images.
We iterate over each image in the test_images folder and use our trained model to make predictions. At the same time, we infer the correct label from the filename prefix (b, t, s, or p) using a simple dictionary mapping.
total = 0
correct = 0

for img_file in test_images_folder.ls():
    if img_file.suffix.lower() in ['.jpg', '.png', '.jpeg']:
        first_letter = img_file.name[0].lower()  # p/b/t/s
        if first_letter not in prefix_to_label:
            print(f" -- Skipping :: Unknown prefix '{first_letter}' in filename '{img_file.name}'.")
            continue
        correct_label = prefix_to_label.get(first_letter)

        pred_label, pred_idx, probs = learn.predict(img_file)

        # Get the probabilities for each category
        prob_str = ""
        for i in range(len(probs)):
            prob_percentage = round(probs[i].item() * 100, 2)
            prob_category = learn.dls.vocab[i]
            prob_str = f"{prob_str} , {prob_category[0]}: {prob_percentage}"
        prob_str = prob_str[3:]

        result = "xxx Incorrect xxx"
        if pred_label == correct_label:
            result = "Correct"
            correct += 1
        total += 1
        print(f" * {img_file.name} | Actual: {correct_label} | Predicted: {pred_label} | Probabilities: [{prob_str}] | {result}")
    else:
        print(f"\n -- Skipping :: Unsupported file ext: {img_file.name}")

print(f"\n\nTotal images: {total}. Correct: {correct}.")
accuracy = correct / total * 100
print(f"Accuracy: {accuracy:.2f}%")
-- Skipping :: Unknown prefix 'r' in filename 'r_3.png'.
* p_2.jpeg | Actual: pickleball | Predicted: pickleball | Probabilities: [b: 0.0 , p: 99.91 , s: 0.01 , t: 0.08] | Correct
-- Skipping :: Unsupported file ext: p_football.webp
* b_broken_1.jpg | Actual: badminton | Predicted: badminton | Probabilities: [b: 80.58 , p: 0.04 , s: 1.09 , t: 18.3] | Correct
* t_2.jpeg | Actual: tennis | Predicted: tennis | Probabilities: [b: 0.36 , p: 7.9 , s: 0.12 , t: 91.63] | Correct
* p_1.png | Actual: pickleball | Predicted: pickleball | Probabilities: [b: 0.0 , p: 100.0 , s: 0.0 , t: 0.0] | Correct
* t_1.png | Actual: tennis | Predicted: squash | Probabilities: [b: 2.24 , p: 0.0 , s: 58.06 , t: 39.7] | xxx Incorrect xxx
* s_2.png | Actual: squash | Predicted: squash | Probabilities: [b: 33.58 , p: 0.0 , s: 63.36 , t: 3.06] | Correct
* b_1.png | Actual: badminton | Predicted: badminton | Probabilities: [b: 99.75 , p: 0.01 , s: 0.03 , t: 0.2] | Correct
* p_22.png | Actual: pickleball | Predicted: pickleball | Probabilities: [b: 0.0 , p: 99.81 , s: 0.01 , t: 0.18] | Correct
* b_broken_ch_2.png | Actual: badminton | Predicted: badminton | Probabilities: [b: 88.69 , p: 0.2 , s: 7.98 , t: 3.14] | Correct
* t_3.jpeg | Actual: tennis | Predicted: badminton | Probabilities: [b: 73.21 , p: 0.03 , s: 0.89 , t: 25.87] | xxx Incorrect xxx
* s_1.png | Actual: squash | Predicted: squash | Probabilities: [b: 0.01 , p: 0.0 , s: 99.96 , t: 0.03] | Correct

Total images: 11. Correct: 9.
Accuracy: 81.82%
Result Evaluation¶
In the above code I tested the performance of our model on a set of 13 images.
We skipped 2 files:
- Unknown prefix (r_3.png)
- Unsupported file format (p_football.webp)
The model made predictions on 11 valid images. For each one, we displayed:
- Actual category (inferred from filename)
- Predicted category
- Prediction confidence scores for each category
- Whether the prediction was correct or incorrect
Here’s a snapshot of how our model performed:
- Correct predictions: 9
- Incorrect predictions: 2
- Accuracy: 81.82%
The 2 incorrect predictions were:
- t_1.png (actual: tennis) → predicted as squash.
- t_3.jpeg (actual: tennis) → predicted as badminton.
Conclusion¶
Despite a small training dataset (176-272 images per category), our model showed promising generalization. It classified images with pretty decent accuracy and minimal tuning. With an accuracy of 81.82%, the model is doing well, but there's scope for improvement. Here’s how to push it further:
- Add More and Better Training Data¶
- Increase dataset size
- Add variety: different angles, lighting, backgrounds etc. This helps the model generalize better to real-world cases.
- Use Data Augmentation¶
- Apply transforms like rotation, zoom, lighting changes and flipping.
- Simulates real-world distortions and improves robustness.
- Fastai provides several APIs to make this easy.
- Fine-Tune the Whole Model¶
The model can be further improved using advanced techniques like unfreezing the backbone, discriminative learning rates and progressive resizing. These approaches allow deeper layers to adapt to task-specific patterns more effectively. However, these are broader topics and go beyond the scope of this project. We may explore them more deeply in future projects.
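For reference, here is a rough sketch of what unfreezing with discriminative learning rates could look like in fastai. The learning-rate values are illustrative only and were not used in this project:

# Sketch only: deeper fine-tuning with discriminative learning rates
learn.unfreeze()                                   # make the ResNet18 backbone trainable
learn.lr_find()                                    # optionally inspect the loss vs. learning-rate curve
learn.fit_one_cycle(3, lr_max=slice(1e-6, 1e-4))   # smaller LR for early layers, larger for the head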
This wraps up the training and evaluation phase. Our model is now ready to be integrated into real-world applications or further optimized for production use.
Last but not least, let's see how we can save our trained model.
Saving the Model¶
Saving the model allows us to:
- Preserve all the learned weights and architecture.
- Avoid retraining from scratch every time.
- Quickly reload the model for inference or further fine-tuning.
In fastai, it’s straightforward:
learn.export('racquet_classifier.pkl')
This creates a file named racquet_classifier.pkl, which contains everything needed to make predictions later — including the model architecture, trained weights and class mappings.
By default, the model will be saved in the same directory as your notebook. You can also specify a different path if needed:
learn.export('/path/to/folder/racquet_classifier.pkl')
# Save the trained model
learn.export('racquet_classifier.pkl')
To load the model later:
learn_reborn = load_learner('racquet_classifier.pkl')
Now learn_reborn is ready to classify racquets — no retraining required!
# Let's try to predict the category of a badminton image using the reborn model
pred_label, pred_idx, probs = learn_reborn.predict('./test_images/b_1.png')
pred_label  # it successfully predicts the category as badminton
'badminton'
Thank You!¶
I hope this small project helped you understand not just how to train a deep learning model, but also how to interpret its performance and put it to practical use. If you found even a small part of it useful, my effort has been worthwhile.
Till next time, happy learning!
You can find the source code of this blog post (which is actually a Jupyter notebook) here.