gradio-app · abidlabs · Sep 19, 2024 · Sep 12, 2024 · Sep 12, 2024 · Sep 12, 2024
diff --git a/demo/yolov10_webcam_stream/run.ipynb b/demo/yolov10_webcam_stream/run.ipynb
@@ -0,0 +1 @@
+{"cells": [{"cell_type": "markdown", "id": "302934307671667531413257853548643485645", "metadata": {}, "source": ["# Gradio Demo: yolov10_webcam_stream"]}, {"cell_type": "code", "execution_count": null, "id": "272996653310673477252411125948039410165", "metadata": {}, "outputs": [], "source": ["!pip install -q gradio "]}, {"cell_type": "code", "execution_count": null, "id": "288918539441861185822528903084949547379", "metadata": {}, "outputs": [], "source": ["import gradio as gr\n", "\n", "from ultralytics import YOLOv10\n", "\n", "model = YOLOv10.from_pretrained(\"jameslahm/yolov10n\")\n", "\n", "\n", "def yolov10_inference(image, conf_threshold):\n", "    width, _ = image.size\n", "    import time\n", "\n", "    start = time.time()\n", "    results = model.predict(source=image, imgsz=width, conf=conf_threshold)\n", "    end = time.time()\n", "    annotated_image = results[0].plot()\n", "    print(\"time\", end - start)\n", "    return annotated_image[:, :, ::-1]\n", "\n", "\n", "css = \"\"\".my-group {max-width: 600px !important; max-height: 600 !important;}\n", "                      .my-column {display: flex !important; justify-content: center !important; align-items: center !important};\"\"\"\n", "\n", "\n", "with gr.Blocks(css=css) as app:\n", "    gr.HTML(\n", "        \"\"\"\n", "    <h1 style='text-align: center'>\n", "    YOLOv10 Webcam Stream\n", "    </h1>\n", "    \"\"\"\n", "    )\n", "    gr.HTML(\n", "        \"\"\"\n", "        <h3 style='text-align: center'>\n", "        <a href='https://arxiv.org/abs/2405.14458' target='_blank'>arXiv</a> | <a href='https://github.com/THU-MIG/yolov10' target='_blank'>github</a>\n", "        </h3>\n", "        \"\"\"\n", "    )\n", "    with gr.Column(elem_classes=[\"my-column\"]):\n", "        with gr.Group(elem_classes=[\"my-group\"]):\n", "            image = gr.Image(type=\"pil\", label=\"Image\", sources=\"webcam\")\n", "            conf_threshold = gr.Slider(\n", "                label=\"Confidence 
Threshold\",\n", "                minimum=0.0,\n", "                maximum=1.0,\n", "                step=0.05,\n", "                value=0.30,\n", "            )\n", "        image.stream(\n", "            fn=yolov10_inference,\n", "            inputs=[image, conf_threshold],\n", "            outputs=[image],\n", "            stream_every=0.1,\n", "            time_limit=30,\n", "        )\n", "\n", "if __name__ == \"__main__\":\n", "    app.launch()\n"]}], "metadata": {}, "nbformat": 4, "nbformat_minor": 5}
diff --git a/demo/yolov10_webcam_stream/run.py b/demo/yolov10_webcam_stream/run.py
@@ -0,0 +1,58 @@
+import gradio as gr
+
+from ultralytics import YOLOv10
+
+model = YOLOv10.from_pretrained("jameslahm/yolov10n")  # loaded once at module import; yolov10_inference reuses it on every call
+
+
+def yolov10_inference(image, conf_threshold):
+    width, _ = image.size
+    import time
+
+    start = time.time()
+    results = model.predict(source=image, imgsz=width, conf=conf_threshold)
+    end = time.time()
+    annotated_image = results[0].plot()
+    print("time", end - start)
+    return annotated_image[:, :, ::-1]
+
+
+css = """.my-group {max-width: 600px !important; max-height: 600 !important;}
+                      .my-column {display: flex !important; justify-content: center !important; align-items: center !important};"""
+
+
+with gr.Blocks(css=css) as app:
+    gr.HTML(
+        """
+    <h1 style='text-align: center'>
+    YOLOv10 Webcam Stream
+    </h1>
+    """
+    )
+    gr.HTML(
+        """
+        <h3 style='text-align: center'>
+        <a href='https://arxiv.org/abs/2405.14458' target='_blank'>arXiv</a> | <a href='https://github.com/THU-MIG/yolov10' target='_blank'>github</a>
+        </h3>
+        """
+    )
+    with gr.Column(elem_classes=["my-column"]):
+        with gr.Group(elem_classes=["my-group"]):
+            image = gr.Image(type="pil", label="Image", sources="webcam")
+            conf_threshold = gr.Slider(
+                label="Confidence Threshold",
+                minimum=0.0,
+                maximum=1.0,
+                step=0.05,
+                value=0.30,
+            )
+        image.stream(
+            fn=yolov10_inference,
+            inputs=[image, conf_threshold],
+            outputs=[image],
+            stream_every=0.1,
+            time_limit=30,
+        )
+
+if __name__ == "__main__":
+    app.launch()
diff --git a/...tutorials/streaming-ai-generated-audio.md → ...eaming/01_streaming-ai-generated-audio.md b/...tutorials/streaming-ai-generated-audio.md → ...eaming/01_streaming-ai-generated-audio.md
diff --git a/guides/07_streaming/02_object-detection-from-webcam.md b/guides/07_streaming/02_object-detection-from-webcam.md
@@ -0,0 +1,93 @@
+# Object Detection from a Webcam Stream
+
+Tags: VISION, STREAMING, WEBCAM
+
+In this guide we'll use YOLOv10 to do near-real-time object detection in Gradio from a user's webcam.
+Along the way, we'll be using the latest streaming features introduced in Gradio 5.0.
+
+## Setting up the Model
+
+First, we'll follow the installation instructions for [Yolov10n](https://huggingface.co/jameslahm/yolov10n) on the Hugging Face hub. 
+
+Run `pip install git+https://github.com/THU-MIG/yolov10.git` in your virtual environment.
+
+Then, we'll download the model from the Hub (`ultralytics` is the library we've just installed).
+
+```python
+from ultralytics import YOLOv10
+
+model = YOLOv10.from_pretrained('jameslahm/yolov10n')
+```
+
+We are using the `yolov10-n` variant because it has the lowest latency. See the [Performance](https://github.com/THU-MIG/yolov10?tab=readme-ov-file#performance) section of the README in the GitHub repository.
+
+
+## The Inference Function
+
+Our inference function will accept a PIL image from the webcam as well as a desired confidence threshold.
+Object detection models like YOLO identify many objects and assign a confidence score to each object. The lower the confidence, the higher the chance of a false positive. So we will let our users play with the confidence threshold.
+
+```python
+def yolov10_inference(image, conf_threshold):
+    width, _ = image.size
+    results = model.predict(source=image, imgsz=width, conf=conf_threshold)
+    annotated_image = results[0].plot()
+    return annotated_image[:, :, ::-1]
+```
+
+We will use the `plot` method to draw a bounding box around each detected object. YOLOv10 assumes images are in the BGR color format, so we will reverse the channel order of the annotated image to get the RGB format that web browsers expect.
+
+## The Gradio Demo
+
+The Gradio demo will be pretty straightforward but we'll do a couple of things that are specific to streaming:
+
+* The user's webcam will be both an input and an output. That way, the user will only see their stream with the detected objects.
+* We'll use the `time_limit` and `stream_every` parameters of the `stream` event. The `time_limit` parameter will mean that we'll process each user's stream for that amount of time. The `stream_every` parameter will control how frequently the webcam stream is sent to the server.
+
+In addition, we'll apply some custom css so that the webcam and slider are centered on the page.
+
+```python
+css=""".my-group {max-width: 600px !important; max-height: 600 !important;}
+                      .my-column {display: flex !important; justify-content: center !important; align-items: center !important};"""
+
+
+with gr.Blocks(css=css) as app:
+    gr.HTML(
+        """
+    <h1 style='text-align: center'>
+    YOLOv10 Webcam Stream
+    </h1>
+    """)
+    gr.HTML(
+        """
+        <h3 style='text-align: center'>
+        <a href='https://arxiv.org/abs/2405.14458' target='_blank'>arXiv</a> | <a href='https://github.com/THU-MIG/yolov10' target='_blank'>github</a>
+        </h3>
+        """)
+    with gr.Column(elem_classes=["my-column"]):
+        with gr.Group(elem_classes=["my-group"]):
+            image = gr.Image(type="pil", label="Image", sources="webcam")
+            conf_threshold = gr.Slider(
+                label="Confidence Threshold",
+                minimum=0.0,
+                maximum=1.0,
+                step=0.05,
+                value=0.30,
+            )
+        image.stream(
+            fn=yolov10_inference,
+            inputs=[image, conf_threshold],
+            outputs=[image],
+            stream_every=0.1,
+            time_limit=30
+        )
+```
+
+
+## Conclusion
+
+You can check out our demo hosted on Hugging Face Spaces [here](https://huggingface.co/spaces/gradio/YOLOv10-webcam-stream). 
+
+It is also embedded on this page below:
+
+$demo_YOLOv10-webcam-stream
diff --git a/...tutorials/real-time-speech-recognition.md → ...eaming/03_real-time-speech-recognition.md b/...tutorials/real-time-speech-recognition.md → ...eaming/03_real-time-speech-recognition.md
diff --git a/...s/01_custom-components-in-five-minutes.md → ...s/01_custom-components-in-five-minutes.md b/...s/01_custom-components-in-five-minutes.md → ...s/01_custom-components-in-five-minutes.md
diff --git a/...m-components/02_key-component-concepts.md → ...m-components/02_key-component-concepts.md b/...m-components/02_key-component-concepts.md → ...m-components/02_key-component-concepts.md
diff --git a/.../07_custom-components/03_configuration.md → .../08_custom-components/03_configuration.md b/.../07_custom-components/03_configuration.md → .../08_custom-components/03_configuration.md
diff --git a/guides/07_custom-components/04_backend.md → guides/08_custom-components/04_backend.md b/guides/07_custom-components/04_backend.md → guides/08_custom-components/04_backend.md
diff --git a/guides/07_custom-components/05_frontend.md → guides/08_custom-components/05_frontend.md b/guides/07_custom-components/05_frontend.md → guides/08_custom-components/05_frontend.md
diff --git a/...mponents/06_frequently-asked-questions.md → ...mponents/06_frequently-asked-questions.md b/...mponents/06_frequently-asked-questions.md → ...mponents/06_frequently-asked-questions.md
diff --git a/...om-components/07_pdf-component-example.md → ...om-components/07_pdf-component-example.md b/...om-components/07_pdf-component-example.md → ...om-components/07_pdf-component-example.md
diff --git a/...components/08_multimodal-chatbot-part1.md → ...components/08_multimodal-chatbot-part1.md b/...components/08_multimodal-chatbot-part1.md → ...components/08_multimodal-chatbot-part1.md
diff --git a/...nents/09_documenting-custom-components.md → ...nents/09_documenting-custom-components.md b/...nents/09_documenting-custom-components.md → ...nents/09_documenting-custom-components.md
diff --git a/...getting-started-with-the-python-client.md → ...getting-started-with-the-python-client.md b/...getting-started-with-the-python-client.md → ...getting-started-with-the-python-client.md
diff --git a/.../02_getting-started-with-the-js-client.md → .../02_getting-started-with-the-js-client.md b/.../02_getting-started-with-the-js-client.md → .../02_getting-started-with-the-js-client.md
diff --git a/...lite/03_querying-gradio-apps-with-curl.md → ...lite/03_querying-gradio-apps-with-curl.md b/...lite/03_querying-gradio-apps-with-curl.md → ...lite/03_querying-gradio-apps-with-curl.md
diff --git a/...ents-and-lite/04_gradio-and-llm-agents.md → ...ents-and-lite/04_gradio-and-llm-agents.md b/...ents-and-lite/04_gradio-and-llm-agents.md → ...ents-and-lite/04_gradio-and-llm-agents.md
diff --git a/...gradio-clients-and-lite/05_gradio-lite.md → ...gradio-clients-and-lite/05_gradio-lite.md b/...gradio-clients-and-lite/05_gradio-lite.md → ...gradio-clients-and-lite/05_gradio-lite.md
diff --git a/...ite/06_gradio-lite-and-transformers-js.md → ...ite/06_gradio-lite-and-transformers-js.md b/...ite/06_gradio-lite-and-transformers-js.md → ...ite/06_gradio-lite-and-transformers-js.md
diff --git a/.../07_fastapi-app-with-the-gradio-client.md → .../07_fastapi-app-with-the-gradio-client.md b/.../07_fastapi-app-with-the-gradio-client.md → .../07_fastapi-app-with-the-gradio-client.md
diff --git a/...als/01_using-hugging-face-integrations.md → ...als/01_using-hugging-face-integrations.md b/...als/01_using-hugging-face-integrations.md → ...als/01_using-hugging-face-integrations.md
diff --git a/...es/09_other-tutorials/Gradio-and-Comet.md → ...es/10_other-tutorials/Gradio-and-Comet.md b/...es/09_other-tutorials/Gradio-and-Comet.md → ...es/10_other-tutorials/Gradio-and-Comet.md
diff --git a/...orials/Gradio-and-ONNX-on-Hugging-Face.md → ...orials/Gradio-and-ONNX-on-Hugging-Face.md b/...orials/Gradio-and-ONNX-on-Hugging-Face.md → ...orials/Gradio-and-ONNX-on-Hugging-Face.md
diff --git a/...tutorials/Gradio-and-Wandb-Integration.md → ...tutorials/Gradio-and-Wandb-Integration.md b/...tutorials/Gradio-and-Wandb-Integration.md → ...tutorials/Gradio-and-Wandb-Integration.md
diff --git a/...als/create-your-own-friends-with-a-gan.md → ...als/create-your-own-friends-with-a-gan.md b/...als/create-your-own-friends-with-a-gan.md → ...als/create-your-own-friends-with-a-gan.md
diff --git a/...reating-a-dashboard-from-bigquery-data.md → ...reating-a-dashboard-from-bigquery-data.md b/...reating-a-dashboard-from-bigquery-data.md → ...reating-a-dashboard-from-bigquery-data.md
diff --git a/...reating-a-dashboard-from-supabase-data.md → ...reating-a-dashboard-from-supabase-data.md b/...reating-a-dashboard-from-supabase-data.md → ...reating-a-dashboard-from-supabase-data.md
diff --git a/...-realtime-dashboard-from-google-sheets.md → ...-realtime-dashboard-from-google-sheets.md b/...-realtime-dashboard-from-google-sheets.md → ...-realtime-dashboard-from-google-sheets.md
diff --git a/...tutorials/deploying-gradio-with-docker.md → ...tutorials/deploying-gradio-with-docker.md b/...tutorials/deploying-gradio-with-docker.md → ...tutorials/deploying-gradio-with-docker.md
diff --git a/...als/developing-faster-with-reload-mode.md → ...als/developing-faster-with-reload-mode.md b/...als/developing-faster-with-reload-mode.md → ...als/developing-faster-with-reload-mode.md
diff --git a/...utorials/how-to-use-3D-model-component.md → ...utorials/how-to-use-3D-model-component.md b/...utorials/how-to-use-3D-model-component.md → ...utorials/how-to-use-3D-model-component.md
diff --git a/...orials/image-classification-in-pytorch.md → ...orials/image-classification-in-pytorch.md b/...orials/image-classification-in-pytorch.md → ...orials/image-classification-in-pytorch.md
diff --git a/...als/image-classification-in-tensorflow.md → ...als/image-classification-in-tensorflow.md b/...als/image-classification-in-tensorflow.md → ...als/image-classification-in-tensorflow.md
diff --git a/...lassification-with-vision-transformers.md → ...lassification-with-vision-transformers.md b/...lassification-with-vision-transformers.md → ...lassification-with-vision-transformers.md
diff --git a/...alling-gradio-in-a-virtual-environment.md → ...alling-gradio-in-a-virtual-environment.md b/...alling-gradio-in-a-virtual-environment.md → ...alling-gradio-in-a-virtual-environment.md
diff --git a/...her-tutorials/named-entity-recognition.md → ...her-tutorials/named-entity-recognition.md b/...her-tutorials/named-entity-recognition.md → ...her-tutorials/named-entity-recognition.md
diff --git a/...ther-tutorials/plot-component-for-maps.md → ...ther-tutorials/plot-component-for-maps.md b/...ther-tutorials/plot-component-for-maps.md → ...ther-tutorials/plot-component-for-maps.md
diff --git a/...her-tutorials/running-background-tasks.md → ...her-tutorials/running-background-tasks.md b/...her-tutorials/running-background-tasks.md → ...her-tutorials/running-background-tasks.md
diff --git a/...g-gradio-on-your-web-server-with-nginx.md → ...g-gradio-on-your-web-server-with-nginx.md b/...g-gradio-on-your-web-server-with-nginx.md → ...g-gradio-on-your-web-server-with-nginx.md
diff --git a/...ting-up-a-demo-for-maximum-performance.md → ...ting-up-a-demo-for-maximum-performance.md b/...ting-up-a-demo-for-maximum-performance.md → ...ting-up-a-demo-for-maximum-performance.md
diff --git a/...tutorials/styling-the-gradio-dataframe.md → ...tutorials/styling-the-gradio-dataframe.md b/...tutorials/styling-the-gradio-dataframe.md → ...tutorials/styling-the-gradio-dataframe.md
diff --git a/guides/09_other-tutorials/theming-guide.md → guides/10_other-tutorials/theming-guide.md b/guides/09_other-tutorials/theming-guide.md → guides/10_other-tutorials/theming-guide.md
diff --git a/guides/09_other-tutorials/using-flagging.md → guides/10_other-tutorials/using-flagging.md b/guides/09_other-tutorials/using-flagging.md → guides/10_other-tutorials/using-flagging.md
diff --git a/...als/using-gradio-for-tabular-workflows.md → ...als/using-gradio-for-tabular-workflows.md b/...als/using-gradio-for-tabular-workflows.md → ...als/using-gradio-for-tabular-workflows.md
diff --git a/...-gradio-in-other-programming-languages.md → ...-gradio-in-other-programming-languages.md b/...-gradio-in-other-programming-languages.md → ...-gradio-in-other-programming-languages.md
diff --git a/...es/09_other-tutorials/wrapping-layouts.md → ...es/10_other-tutorials/wrapping-layouts.md b/...es/09_other-tutorials/wrapping-layouts.md → ...es/10_other-tutorials/wrapping-layouts.md