Spaces:

immartian
/

betterdigits

Sleeping

App Files Community

im2 committed on Sep 12

Commit

d1d4583

•

1 Parent(s): cbb8b31

remove transformer

Browse files

Files changed (2) hide show

app.py +46 -28
requirements.txt +1 -2

app.py CHANGED Viewed

@@ -2,44 +2,62 @@ import gradio as gr
 import torch
 from torchvision import transforms
 from PIL import Image
-from transformers import AutoModelForImageClassification, AutoFeatureExtractor
-# Load the model and feature extractor from Hugging Face
-model_name = "immartian/improved_digits_recognition"
-model = AutoModelForImageClassification.from_pretrained(model_name)
-feature_extractor = AutoFeatureExtractor.from_pretrained(model_name)
-# Preprocessing function to transform the drawn image into a format the model can recognize
-def preprocess_image(image):
-    # Convert the image into a format suitable for the model
-    image = Image.fromarray(image).convert('L')  # Convert to grayscale
-    image = image.resize((28, 28))  # Resize to 28x28 pixels
-    image = image.convert('RGB')  # Model expects 3-channel images, so convert to RGB
-    inputs = feature_extractor(images=image, return_tensors="pt")
-    return inputs['pixel_values']
-# Prediction function to classify the drawn digit
 def predict_digit(image):
-    # Preprocess the input image
-    inputs = preprocess_image(image)
-    # Make the prediction
-    with torch.no_grad():
-        outputs = model(inputs)
-        predicted_label = outputs.logits.argmax(-1).item()
-    return f"Predicted Digit: {predicted_label}"
-# Gradio interface for drawing the digit and displaying the prediction
-demo = gr.Interface(
     fn=predict_digit,
-    inputs="sketchpad",  # Allow users to draw a digit
     outputs="text",
-    title="MNIST Digit Recognition",
-    description="Draw a digit (0-9) and let the model recognize it!",
-    live=True  # The prediction updates while the user draws
 )
 # Launch the app
 if __name__ == "__main__":
-    demo.launch()

 import torch
 from torchvision import transforms
 from PIL import Image
+# Load the model using PyTorch
+model_path = "https://huggingface.co/immartian/improved_digits_recognition/resolve/main/pytorch_model.bin"
+# Define your ImageClassifier model architecture (same as used during training)
+class ImageClassifier(torch.nn.Module):
+    def __init__(self):
+        super().__init__()
+        self.model = torch.nn.Sequential(
+            torch.nn.Conv2d(1, 32, (3, 3)),
+            torch.nn.ReLU(),
+            torch.nn.Conv2d(32, 64, (3, 3)),
+            torch.nn.ReLU(),
+            torch.nn.Conv2d(64, 64, (3, 3)),
+            torch.nn.ReLU(),
+            torch.nn.AdaptiveAvgPool2d((1, 1)),
+            torch.nn.Flatten(),
+            torch.nn.Linear(64, 10)
+        )
+    def forward(self, x):
+        return self.model(x)
+# Instantiate the model and load weights
+model = ImageClassifier()
+model.load_state_dict(torch.hub.load_state_dict_from_url(model_path))
+model.eval()
+# Gradio preprocessing and prediction pipeline
 def predict_digit(image):
+    # Preprocess the image: resize to 28x28, convert to grayscale, and normalize
+    image = image.convert('L')  # Convert to grayscale
+    transform = transforms.Compose([
+        transforms.Resize((28, 28)),
+        transforms.ToTensor(),
+        transforms.Normalize((0.5,), (0.5,))
+    ])
+    img_tensor = transform(image).unsqueeze(0)  # Add batch dimension
+    # Pass through the model
+    with torch.no_grad():
+        output = model(img_tensor)
+        predicted_label = torch.argmax(output, dim=1).item()
+    return f"Predicted Label: {predicted_label}"
+# Create Gradio Interface
+interface = gr.Interface(
     fn=predict_digit,
+    inputs=gr.Image(source="canvas", tool="editor", type="pil"),  # User can draw on a canvas
     outputs="text",
+    title="Digit Recognizer",
+    description="Draw a digit (0-9) and the model will predict the number!"
 )
 # Launch the app
 if __name__ == "__main__":
+    interface.launch()

requirements.txt CHANGED Viewed

@@ -1,5 +1,4 @@
 torch
 torchvision
 gradio
-transformers
-Pillow  # Required for image processing

 torch
 torchvision
 gradio
+Pillow