Initial commit
This commit is contained in:
4
.gitignore
vendored
Normal file
4
.gitignore
vendored
Normal file
@@ -0,0 +1,4 @@
|
||||
__pycache__/
|
||||
*.pyc
|
||||
*.png
|
||||
.DS_Store
|
||||
9
Dockerfile
Normal file
9
Dockerfile
Normal file
@@ -0,0 +1,9 @@
|
||||
# Runtime image for the shapeAI Flask app, served by gunicorn on port 3000.
FROM python:3.11

COPY ./app /source
RUN pip install --upgrade pip
RUN pip install --no-cache-dir -r /source/requirements.txt

EXPOSE 3000

# Drop root privileges before running the server.
RUN useradd app
USER app

# Use an absolute path: a relative WORKDIR resolves against the previous
# working directory, which is only implicitly "/" here.
WORKDIR /source
CMD ["gunicorn", "-b", "0.0.0.0:3000", "app:app"]
|
||||
52
README.md
Normal file
52
README.md
Normal file
@@ -0,0 +1,52 @@
|
||||
# shapeAI
|
||||
|
||||
_Forked from [@quentinbkk's shape ai](https://github.com/quentinbkk/shapeAI)_
|
||||
|
||||
Shape AI is a web app utilizing a classifier model to identify user drawn geometric shapes. Currently, the model can identify drawn squares, rectangles, circles, and triangles.
|
||||
|
||||
**[Try it live ✏️](https://shapeai.craisin.tech)**
|
||||
|
||||
## Running the App 🏃
|
||||
### Docker 🐋
|
||||
```bash
|
||||
git clone https://github.com/craisined/shapeAI
|
||||
cd shapeAI
|
||||
docker build -t shapeai .
docker run -p 3000:3000 shapeai
|
||||
```
|
||||
### Manually 🖥️
|
||||
```bash
|
||||
git clone https://github.com/craisined/shapeAI
|
||||
cd shapeAI
|
||||
python3 -m venv env
|
||||
source env/bin/activate
|
||||
cd app
|
||||
pip install -r requirements.txt
|
||||
gunicorn -b 0.0.0.0:3000 app:app
|
||||
```
|
||||
|
||||
## Model Training 💪
|
||||
OpenCV is used to synthetically generate training data in ```training/generate_shapes.py```.
|
||||
|
||||
Data is stored in ```training/data``` - add and modify the folder to add training cases.
|
||||
|
||||
Run ```training/train.py``` to train the model - exports to ```shape_model.keras```.
|
||||
|
||||
## Technical Overview 👨💻
|
||||
### Abilities
|
||||
1. High training accuracy - model consistently trains with accuracy > 99%
|
||||
2. Fast speed - model has sub 50ms response times
|
||||
3. Synthetic data and preprocessing - generates training data and sends the user's drawing from the website to the classifier model
|
||||
### Frameworks
|
||||
1. Model built with Tensorflow and Keras
|
||||
2. Image manipulation built using OpenCV and Pillow
|
||||
3. Backend built using Flask
|
||||
4. Frontend built using vanilla HTML, CSS, JS
|
||||
### Changes from original fork
|
||||
1. Web UI and Flask backend added
|
||||
2. Synthetic training data altered to produce a more human friendly model
|
||||
### WIP
|
||||
1. Low accuracy on certain cases - further improve synthetic shape generation
|
||||
2. Add confidence for classification - do not display a result if confidence is low
|
||||
3. Improve mobile UI to further prevent scroll while drawing
|
||||
4. Expand dataset to various alphanumerical characters
|
||||
29
app/app.py
Normal file
29
app/app.py
Normal file
@@ -0,0 +1,29 @@
|
||||
"""Flask entry point for the shapeAI web app.

Serves the drawing page and a classification endpoint that accepts the
canvas content as a base64 PNG data-URL in the ``img`` query parameter.
"""

from base64 import b64decode
from flask import Flask, render_template, request
import io
from keras.preprocessing.image import img_to_array
import model
import numpy as np
from PIL import Image

app = Flask(__name__)
HOST = "0.0.0.0"
PORT = 3000


@app.route("/")
def index():
    """Serve the drawing page."""
    return render_template("index.html")


@app.route("/shape_model")
def shape_model():
    """Decode the submitted canvas image and return its predicted label.

    The frontend polls this endpoint with ``?img=data:image/png;base64,...``;
    the data-URL prefix is stripped before base64 decoding.
    """
    data_url = request.args["img"]
    raw = b64decode(data_url.replace("data:image/png;base64,", "", 1))
    # Convert to single-channel grayscale, matching the model's input format.
    grayscale = Image.open(io.BytesIO(raw)).convert("L")
    return model.run_model(img_to_array(grayscale))


if __name__ == "__main__":
    app.run(HOST, port=PORT)
|
||||
12
app/model.py
Normal file
12
app/model.py
Normal file
@@ -0,0 +1,12 @@
|
||||
"""Model loading and inference helpers for shapeAI."""

from keras import models, layers
import numpy as np

# Classifier exported by training/train.py; path is relative to the app/ dir.
model = models.load_model("model/shape_model.keras")
# Label order must match the class order used at training time
# (image_dataset_from_directory infers classes alphabetically).
labels = ["circle ○", "rectangle ▭", "square □", "triangle △"]


def run_model(image):
    """Return the predicted label for one grayscale image array.

    `image` is a single (H, W, 1) array; a leading batch dimension is
    added because the model predicts on batches.
    """
    batch = np.expand_dims(image, axis=0)
    return labels[np.argmax(model.predict(batch))]


if __name__ == "__main__":
    # Bug fix: the CLI previously passed the raw path *string* straight to
    # run_model, which expects an image array and would crash. Load and
    # preprocess the file to the model's expected 64x64 grayscale format.
    from keras.utils import load_img, img_to_array

    path = input("Image path: ")
    img = img_to_array(load_img(path, color_mode="grayscale", target_size=(64, 64)))
    print(run_model(img))
|
||||
BIN
app/model/shape_model.keras
Normal file
BIN
app/model/shape_model.keras
Normal file
Binary file not shown.
43
app/requirements.txt
Normal file
43
app/requirements.txt
Normal file
@@ -0,0 +1,43 @@
|
||||
absl-py==2.3.1
|
||||
astunparse==1.6.3
|
||||
blinker==1.9.0
|
||||
certifi==2025.10.5
|
||||
charset-normalizer==3.4.4
|
||||
click==8.3.0
|
||||
Flask==3.1.2
|
||||
flatbuffers==25.9.23
|
||||
gast==0.6.0
|
||||
google-pasta==0.2.0
|
||||
grpcio==1.76.0
|
||||
gunicorn==23.0.0
|
||||
h5py==3.15.1
|
||||
idna==3.11
|
||||
itsdangerous==2.2.0
|
||||
Jinja2==3.1.6
|
||||
keras==3.11.3
|
||||
libclang==18.1.1
|
||||
Markdown==3.9
|
||||
markdown-it-py==4.0.0
|
||||
MarkupSafe==3.0.3
|
||||
mdurl==0.1.2
|
||||
ml_dtypes==0.5.3
|
||||
namex==0.1.0
|
||||
numpy==2.2.6
|
||||
opencv-python==4.12.0.88
|
||||
opt_einsum==3.4.0
|
||||
optree==0.17.0
|
||||
packaging==25.0
|
||||
pillow==12.0.0
|
||||
protobuf==6.33.0
|
||||
Pygments==2.19.2
|
||||
requests==2.32.5
|
||||
rich==14.2.0
|
||||
six==1.17.0
|
||||
tensorboard==2.20.0
|
||||
tensorboard-data-server==0.7.2
|
||||
tensorflow==2.20.0
|
||||
termcolor==3.1.0
|
||||
typing_extensions==4.15.0
|
||||
urllib3==2.5.0
|
||||
Werkzeug==3.1.3
|
||||
wrapt==2.0.0
|
||||
BIN
app/static/quentin.jpg
Normal file
BIN
app/static/quentin.jpg
Normal file
Binary file not shown.
|
After Width: | Height: | Size: 14 KiB |
57
app/static/script.js
Normal file
57
app/static/script.js
Normal file
@@ -0,0 +1,57 @@
|
||||
// Canvas drawing + periodic classification polling for shapeAI.
var c = document.getElementById("canvas");
var ctx = c.getContext("2d");

var aiBox = document.getElementById("shapeBox");

var isDragging = false;

// Map a mouse/touch event to the 64x64 canvas backing store and plot a dot.
function draw(e){
    // Use the canvas's actual rendered size rather than re-deriving it from
    // the viewport width; this stays correct if the CSS sizing changes.
    var rect = c.getBoundingClientRect();
    var scale = 64 / rect.width;

    var posx, posy;
    if (e.type.includes("touch")) {
        const { touches, changedTouches } = e.originalEvent ?? e;
        const touch = touches[0] ?? changedTouches[0];
        // clientX/Y are viewport-relative, matching getBoundingClientRect();
        // the previous pageX/Y were document-relative and drew in the wrong
        // spot whenever the page was scrolled.
        posx = (touch.clientX - rect.left) * scale;
        posy = (touch.clientY - rect.top) * scale;
    } else if (e.type.includes("mouse")) {
        posx = (e.clientX - rect.left) * scale;
        posy = (e.clientY - rect.top) * scale;
    }
    if (isDragging){
        ctx.fillStyle = "#000000";
        ctx.beginPath();
        ctx.arc(posx, posy, 1, 0, 2 * Math.PI);
        ctx.fill();
    }
}

// Fill the whole canvas with white.
function clear_canvas(){
    ctx.fillStyle = "#FFFFFF";
    ctx.beginPath();
    ctx.fillRect(0, 0, 64, 64);
    ctx.fill();
}

// Send the current canvas as a data-URL to the classifier endpoint and
// display the returned label.
function send_image(){
    var img = c.toDataURL();
    const params = new URLSearchParams();
    params.append("img", img);
    fetch(`/shape_model?${params}`).then(
        function (r) {return r.text();}
    ).then(
        function (r) {aiBox.innerHTML = r;}
    );
}

clear_canvas();
setInterval(send_image, 1000);
c.addEventListener("mousemove", draw);
c.addEventListener("touchmove", draw);
c.addEventListener("mousedown", function(e){isDragging = true;});
c.addEventListener("touchstart", function(e){isDragging = true;});
c.addEventListener("mouseup", function(e){isDragging = false;});
c.addEventListener("touchend", function(e){isDragging = false;});
|
||||
60
app/static/style.css
Normal file
60
app/static/style.css
Normal file
@@ -0,0 +1,60 @@
|
||||
/* Base page: Lexend font, light weight, no sideways scroll, and
   overscroll containment so touch-drawing can't trigger pull-to-refresh. */
html, body{
    margin: 0px;
    font-family: "Lexend", sans-serif;
    font-weight: 300;
    overscroll-behavior-y: contain;
    overflow-x: hidden;
}

/* Left panel (desktop): 40% of the viewport, content centered via flexbox. */
#textArea{
    background: #f8f8ff;
    width: 40vw;
    height: 100vh;
    float: left;
    display: flex;
    justify-content: center;
    align-items: center;
}

/* Right panel holding the drawing canvas. */
#drawingArea{
    width: 60vw;
    float: right;
}

/* The 64x64 canvas is scaled up to a 40vw square and vertically centered
   (50vh minus half its own height). */
#canvas{
    border-style: solid;
    border-width: 4px;
    margin-left: 10vw;
    margin-right: 10vw;
    margin-top: calc(50vh - 20vw);
    width:40vw;
    height:40vw;
}

/* Small round avatar shown inline with the credit line. */
#quentinImg{
    display: inline-block;
    height: 1em;
    width: auto;
    border-radius: 30%;
}

h1{
    font-size: 64px;
}

h2{
    font-size: 48px;
}

p{
    font-size: 24px;
}

/* Narrow screens: stack the two panels vertically and enlarge the canvas. */
@media only screen and (max-width:1000px) {
    #textArea{
        width: 100vw;
        height: 20vh;
    }

    #drawingArea{
        width: 100vw;
        height: 80vh;
    }

    #canvas{
        width: 80vw;
        height: 80vw;
        margin-top: calc(40vh - 40vw);
    }
}
|
||||
24
app/templates/index.html
Normal file
24
app/templates/index.html
Normal file
@@ -0,0 +1,24 @@
|
||||
<!DOCTYPE html>
<html>
<head>
    <title>hello @quentinbkk i have found ur github :D</title>
    <link href="/static/style.css" rel="stylesheet">
    <link rel="preconnect" href="https://fonts.googleapis.com">
    <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
    <link href="https://fonts.googleapis.com/css2?family=Lexend:wght@100..900&display=swap" rel="stylesheet">
</head>
<body>
    <div id="textArea">
        <div>
            <h1>Shape AI</h1>
            <h2>I see a <span id="shapeBox">...</span></h2>
            <p>Based on <a href="https://github.com/quentinbkk/shapeAI">ShapeAI</a> by <a href="https://github.com/quentinbkk">@quentinbkk</a> <img id="quentinImg" src="/static/quentin.jpg"></p>
        </div>
    </div>
    <div id="drawingArea">
        <!-- Fixed 64x64 backing store, scaled up via CSS. Fixed: the tag had
             a duplicate id attribute, stray commas between attributes, and
             px-suffixed values (width/height attributes take bare integers). -->
        <canvas id="canvas" width="64" height="64"></canvas><br>
        <center><h3 onclick="clear_canvas()">Reset</h3></center>
    </div>
    <!-- Loaded last, inside <body>: the script queries the canvas immediately. -->
    <script src="/static/script.js"></script>
</body>
</html>
|
||||
65
training/generate_shapes.py
Normal file
65
training/generate_shapes.py
Normal file
@@ -0,0 +1,65 @@
|
||||
"""Synthetic training-data generator: draws shape outlines with OpenCV.

Writes NUM_IMAGES 64x64 grayscale PNGs per class into data/<class>/.
"""

import os
import cv2
import numpy as np
import random

IMG_SIZE = 64
NUM_IMAGES = 250  # Number of images per class
OUTPUT_DIR = 'data'

# Ensure one output folder exists per class.
shapes = ['circle', 'square', 'rectangle', 'triangle']
for shape in shapes:
    os.makedirs(os.path.join(OUTPUT_DIR, shape), exist_ok=True)


def _blank_canvas():
    """Return a fresh all-white 64x64 grayscale image."""
    return np.ones((IMG_SIZE, IMG_SIZE), dtype=np.uint8) * 255


def draw_circle():
    """Random circle outline; radius is capped so it stays inside the frame."""
    canvas = _blank_canvas()
    center = (random.randint(8, 56), random.randint(8, 56))
    max_radius = min(60 - max(center), min(center))
    radius = random.randint(4, max_radius)
    cv2.circle(canvas, center, radius, (0,), 2)
    return canvas


def draw_square():
    """Random near-square: each side may be stretched by up to 3px."""
    canvas = _blank_canvas()
    corner = (random.randint(4, 56), random.randint(4, 56))
    side = random.randint(4, 60 - max(corner))
    opposite = (corner[0] + side + random.randint(0, 3),
                corner[1] + side + random.randint(0, 3))
    cv2.rectangle(canvas, corner, opposite, (0,), 2)
    return canvas


def draw_rectangle():
    """Random axis-aligned rectangle in a random orientation.

    NOTE(review): the original names (`long`, `short`) were swapped relative
    to their ranges (4-28 vs 33-56); neutral names are used here, with the
    exact same sampling behavior.
    """
    canvas = _blank_canvas()
    vertical = random.randint(0, 1)
    side_a, side_b = (random.randint(4, 28), random.randint(33, 56))
    if vertical:
        corner = (random.randint(4, 60 - side_b), random.randint(4, 60 - side_a))
        width, height = side_b, side_a
    else:
        corner = (random.randint(4, 60 - side_a), random.randint(4, 60 - side_b))
        width, height = side_a, side_b
    cv2.rectangle(canvas, corner, (corner[0] + width, corner[1] + height), (0,), 2)
    return canvas


def draw_triangle():
    """Random triangle from three uniformly sampled vertices.

    NOTE(review): vertices may occasionally be (near-)collinear, yielding a
    degenerate triangle — preserved as-is from the original.
    """
    canvas = _blank_canvas()
    vertices = np.array([(random.randint(4, 60), random.randint(4, 60))
                         for _ in range(3)])
    cv2.drawContours(canvas, [vertices], 0, (0,), 2)
    return canvas


draw_functions = {
    'circle': draw_circle,
    'square': draw_square,
    'rectangle': draw_rectangle,
    'triangle': draw_triangle
}

# ----- Generate images -----
for shape in shapes:
    for i in range(NUM_IMAGES):
        out_path = os.path.join(OUTPUT_DIR, shape, f"{shape}_{i}.png")
        cv2.imwrite(out_path, draw_functions[shape]())

print("Images generated successfully!")
|
||||
BIN
training/shape_model.keras
Normal file
BIN
training/shape_model.keras
Normal file
Binary file not shown.
68
training/train.py
Normal file
68
training/train.py
Normal file
@@ -0,0 +1,68 @@
|
||||
"""Train the shape classifier on the synthetic images in ./data.

Exports the trained model to shape_model.keras. Fixed: removed unused
imports (keras.preprocessing.image, numpy) and replaced the deprecated
`input_shape=` kwarg on the first layer with an explicit Input layer.
"""

import tensorflow as tf
from keras import layers, models
import pathlib

IMG_SIZE = 64
BATCH_SIZE = 8
NUM_CLASSES = 4
EPOCHS = 10

data_dir = pathlib.Path("data")

# 80/20 train/validation split; the shared seed keeps the subsets disjoint.
train_ds = tf.keras.utils.image_dataset_from_directory(
    data_dir,
    labels='inferred',
    label_mode='categorical',
    color_mode='grayscale',
    batch_size=BATCH_SIZE,
    image_size=(IMG_SIZE, IMG_SIZE),
    validation_split=0.2,
    subset="training",
    seed=123
)

val_ds = tf.keras.utils.image_dataset_from_directory(
    data_dir,
    labels='inferred',
    label_mode='categorical',
    color_mode='grayscale',
    batch_size=BATCH_SIZE,
    image_size=(IMG_SIZE, IMG_SIZE),
    validation_split=0.2,
    subset="validation",
    seed=123
)

AUTOTUNE = tf.data.AUTOTUNE
train_ds = train_ds.cache().shuffle(100).prefetch(buffer_size=AUTOTUNE)
val_ds = val_ds.cache().prefetch(buffer_size=AUTOTUNE)

# Small CNN: two conv/pool stages, then a dense head with a softmax over
# the four shape classes.
model = models.Sequential([
    layers.Input(shape=(IMG_SIZE, IMG_SIZE, 1)),
    layers.Rescaling(1/255),  # normalize 0-255 grayscale to [0, 1]
    layers.Conv2D(32, (3,3), activation='relu'),
    layers.MaxPooling2D(2,2),

    layers.Conv2D(64, (3,3), activation='relu'),
    layers.MaxPooling2D(2,2),

    layers.Flatten(),
    layers.Dense(64, activation='relu'),
    layers.Dense(NUM_CLASSES, activation='softmax')
])

model.compile(
    optimizer='adam',
    loss='categorical_crossentropy',
    metrics=['accuracy']
)

model.fit(
    train_ds,
    validation_data=val_ds,
    epochs=EPOCHS
)

model.save("shape_model.keras")
print("Saved model")
|
||||
Reference in New Issue
Block a user