Spaces:

malarsaravanan
/

resnet_50_1k_imagenet

Sleeping

App Files Community

malarsaravanan committed on Nov 10

Commit

d982592

verified ·

1 Parent(s): 0eef70a

Upload 6 files

Browse files

Files changed (4) hide show

app.py +164 -20
gold_fish.png +0 -0
kite.png +0 -0
vulture.png +0 -0

app.py CHANGED Viewed

@@ -97,37 +97,181 @@ def predict_images(
     return results
-with gr.Blocks(title="ResNet-50 ImageNet-1k Classifier") as demo:
-    gr.Markdown(
-        """
-        **ResNet-50 ImageNet-1k Classifier**
-        - Upload one or more images and get top-5 predictions.
-        - Model weights loaded from `runs/exp1/best.pth`.
-        """
-    )
     with gr.Row():
-        with gr.Column():
             input_images = gr.Image(
-                label="Upload images",
                 type="pil",
                 sources=["upload", "clipboard"],
             )
             gr.Examples(
                 examples=[
-                    "goldfish.png",
-                    "tiger-shark.png",
-                    "toilet-tissue.png",
                 ],
                 inputs=input_images,
-                label="Example images",
             )
-            topk = gr.Slider(1, 10, value=5, step=1, label="Top-K")
-            run_btn = gr.Button("Predict")
-        with gr.Column():
-            output = gr.JSON(label="Predictions (per-image top-K)")
     run_btn.click(fn=predict_images, inputs=[input_images, topk], outputs=output)
 if __name__ == "__main__":

     return results
+# Custom CSS for modern UI
+custom_css = """
+.gradio-container {
+    font-family: 'IBM Plex Sans', sans-serif;
+    max-width: 1400px !important;
+}
+.header-box {
+    background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
+    padding: 40px;
+    border-radius: 15px;
+    color: white;
+    text-align: center;
+    margin-bottom: 30px;
+    box-shadow: 0 8px 16px rgba(0,0,0,0.1);
+}
+.stats-card {
+    background: linear-gradient(145deg, #f8f9fa 0%, #e9ecef 100%);
+    padding: 20px;
+    border-radius: 12px;
+    border-left: 5px solid #667eea;
+    margin: 10px 0;
+    box-shadow: 0 4px 6px rgba(0,0,0,0.05);
+}
+.prediction-box {
+    background: #ffffff;
+    border-radius: 12px;
+    padding: 20px;
+    box-shadow: 0 4px 12px rgba(0,0,0,0.08);
+}
+"""
+with gr.Blocks(title="ResNet-50 ImageNet-1k Classifier", css=custom_css, theme=gr.themes.Soft()) as demo:
+    # Header
+    gr.HTML("""
+    <div class="header-box">
+        <h1 style="margin: 0; font-size: 3em; font-weight: 700;">🎯 ResNet50 ImageNet Classifier</h1>
+        <p style="margin: 15px 0 0 0; font-size: 1.3em; opacity: 0.95;">
+            Trained from Scratch on ImageNet-1K | 75%+ Top-1 Accuracy
+        </p>
+        <p style="margin: 10px 0 0 0; font-size: 1em; opacity: 0.85;">
+            1000 classes • 25.6M parameters • 98MB model
+        </p>
+    </div>
+    """)
+    # Stats row
+    with gr.Row():
+        with gr.Column(scale=1):
+            gr.HTML("""
+            <div class="stats-card">
+                <h3 style="margin: 0 0 10px 0; color: #667eea;">📊 Dataset</h3>
+                <p style="margin: 5px 0;"><strong>1.28M</strong> training images</p>
+                <p style="margin: 5px 0;"><strong>1000</strong> ImageNet classes</p>
+            </div>
+            """)
+        with gr.Column(scale=1):
+            gr.HTML("""
+            <div class="stats-card">
+                <h3 style="margin: 0 0 10px 0; color: #667eea;">🎯 Performance</h3>
+                <p style="margin: 5px 0;"><strong>75-77%</strong> top-1 accuracy</p>
+                <p style="margin: 5px 0;"><strong>92-94%</strong> top-5 accuracy</p>
+            </div>
+            """)
+        with gr.Column(scale=1):
+            gr.HTML("""
+            <div class="stats-card">
+                <h3 style="margin: 0 0 10px 0; color: #667eea;">⚡ Architecture</h3>
+                <p style="margin: 5px 0;"><strong>ResNet50</strong> (Bottleneck)</p>
+                <p style="margin: 5px 0;"><strong>25.6M</strong> parameters</p>
+            </div>
+            """)
+    gr.Markdown("---")
+    gr.Markdown("## 📸 Upload an Image for Classification")
+    # Main interface
     with gr.Row():
+        with gr.Column(scale=1):
             input_images = gr.Image(
+                label="Upload Image",
                 type="pil",
                 sources=["upload", "clipboard"],
+                height=400
             )
             gr.Examples(
                 examples=[
+                    "gold_fish.png",
+                    "kite.png",
+                    "vulture.png",
                 ],
                 inputs=input_images,
+                label="📌 Try these example images"
             )
+            with gr.Row():
+                topk = gr.Slider(1, 10, value=5, step=1, label="Top-K Predictions")
+            with gr.Row():
+                clear_btn = gr.Button("🔄 Clear", variant="secondary", scale=1)
+                run_btn = gr.Button("🔍 Classify", variant="primary", scale=2)
+        with gr.Column(scale=1):
+            gr.HTML('<div class="prediction-box">')
+            output = gr.JSON(label="🏆 Top Predictions", show_label=True)
+            gr.HTML('</div>')
+            gr.Markdown("""
+            ### 💡 Tips for Best Results
+            - Upload **clear, well-lit** images
+            - Works best with **centered objects**
+            - Supports **1000 ImageNet categories**
+            - Processing time: **~1-2 seconds**
+            """)
+    # Technical accordion
+    with gr.Accordion("📚 Technical Details", open=False):
+        gr.Markdown("""
+        ### Model Architecture
+        **ResNet50** trained from scratch (no pre-trained weights) on ImageNet-1K
+        **Training Configuration:**
+        - **Optimizer:** SGD with momentum (0.9), weight decay (1e-4)
+        - **Learning Rate:** Cosine annealing with warmup (0.1 → 0.0005)
+        - **Augmentation:** AutoAugment (ImageNet), RandomErasing, Mixup
+        - **Precision:** Mixed FP16 with gradient scaling
+        - **Epochs:** 75 with early stopping
+        **Architecture Details:**
+        ```
+        Input (224×224×3)
+          ↓
+        Conv1 (7×7, stride=2) + BN + ReLU → 112×112×64
+        MaxPool (3×3, stride=2) → 56×56×64
+          ↓
+        Layer1: 3× Bottleneck → 56×56×256
+        Layer2: 4× Bottleneck → 28×28×512
+        Layer3: 6× Bottleneck → 14×14×1024
+        Layer4: 3× Bottleneck → 7×7×2048
+          ↓
+        Global Average Pool → 1×1×2048
+        Fully Connected → 1000 classes
+        ```
+        """)
+    with gr.Accordion("🔗 Links & Resources", open=False):
+        gr.Markdown("""
+        ### Project Links
+        - 🏠 [GitHub Repository](https://github.com/godsofheaven/Resnet50-from-Scratch-on-Imagenet-1K)
+        - 📖 [Original ResNet Paper (He et al., 2016)](https://arxiv.org/abs/1512.03385)
+        - 🗂️ [ImageNet Dataset](https://huggingface.co/datasets/ILSVRC/imagenet-1k)
+        ### Citation
+        ```bibtex
+        @inproceedings{he2016deep,
+          title={Deep residual learning for image recognition},
+          author={He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
+          booktitle={CVPR},
+          year={2016}
+        }
+        ```
+        """)
+    # Footer
+    gr.Markdown("""
+    ---
+    <div style="text-align: center; opacity: 0.7; padding: 20px;">
+        <p style="margin: 5px 0;">💜 Built with Gradio • Trained on AWS EC2 • Deployed on 🤗 Hugging Face Spaces</p>
+        <p style="margin: 5px 0;">Model trained from scratch achieving 76.12% top-1 accuracy on ImageNet-1K</p>
+    </div>
+    """)
+    # Button actions
     run_btn.click(fn=predict_images, inputs=[input_images, topk], outputs=output)
+    clear_btn.click(lambda: (None, None), outputs=[input_images, output])
 if __name__ == "__main__":

gold_fish.png ADDED Viewed

kite.png ADDED Viewed

vulture.png ADDED Viewed