28 | 28 | },
29 | 29 | {
30 | 30 | "cell_type": "code",
31 | | - "execution_count": 1,
| 31 | + "execution_count": null,
32 | 32 | "metadata": {},
33 | | - "outputs": [
34 | | - {
35 | | - "name": "stdout",
36 | | - "output_type": "stream",
37 | | - "text": [
38 | | - "Name: degirum_tools\n",
39 | | - "Version: 0.10.1\n",
40 | | - "Summary: Tools for PySDK\n",
41 | | - "Home-page: \n",
42 | | - "Author: DeGirum\n",
43 | | - "Author-email: \n",
44 | | - "License: \n",
45 | | - "Location: c:\\users\\shashichilappagari\\anaconda3\\envs\\supervision\\lib\\site-packages\n",
46 | | - "Requires: degirum, ipython, numpy, opencv-python, pafy, pillow, psutil, pycocotools, python-dotenv, pyyaml, requests, scipy, youtube-dl\n",
47 | | - "Required-by: \n"
48 | | - ]
49 | | - }
50 | | - ],
| 33 | + "outputs": [],
51 | 34 | "source": [
52 | 35 | "# make sure degirum-tools package is installed\n",
53 | 36 | "!pip show degirum-tools || pip install degirum-tools"

63 | 46 | },
64 | 47 | {
65 | 48 | "cell_type": "code",
66 | | - "execution_count": 2,
| 49 | + "execution_count": 1,
67 | 50 | "metadata": {},
68 | 51 | "outputs": [],
69 | 52 | "source": [

81 | 64 | "# '': ai server serving models from local folder\n",
82 | 65 | "# path to json file: single model zoo in case of @local inference\n",
83 | 66 | "# model_names: list of AI models to use for inferences (NOTE: they should have the same input size)\n",
84 | | - "# allow_frame_drop:\n",
85 | | - "#    when True, we drop video frames in case when AI performance is not enough to work in real time\n",
86 | | - "#    when False, we buffer video frames to keep up with AI performance\n",
87 | 67 | "hw_location = \"@cloud\"\n",
88 | 68 | "video_sources = [\n",
| 69 | + "    \"https://raw.githubusercontent.com/DeGirum/PySDKExamples/main/images/WalkingPeople.mp4\",\n",
89 | 70 | "    \"https://raw.githubusercontent.com/DeGirum/PySDKExamples/main/images/Traffic.mp4\",\n",
90 | | - "    \"https://raw.githubusercontent.com/DeGirum/PySDKExamples/main/images/TrafficHD.mp4\",\n",
91 | 71 | "]\n",
92 | 72 | "model_zoo_url = \"degirum/public\"\n",
93 | 73 | "model_names = [\n",
94 | 74 | "    \"yolo_v5s_hand_det--512x512_quant_n2x_orca1_1\",\n",
95 | 75 | "    \"yolo_v5s_face_det--512x512_quant_n2x_orca1_1\",\n",
96 | 76 | "    \"yolo_v5n_car_det--512x512_quant_n2x_orca1_1\",\n",
97 | 77 | "    \"yolo_v5s_person_det--512x512_quant_n2x_orca1_1\",\n",
98 | | - "]\n",
99 | | - "allow_frame_drop = False"
| 78 | + "]"
100 | 79 | ]
101 | 80 | },
102 | 81 | {
103 | 82 | "cell_type": "markdown",
104 | 83 | "metadata": {},
105 | 84 | "source": [
106 | | - "#### Specify where do you want to run your inferences"
| 85 | + "#### The rest of the cells below should run without any modifications"
107 | 86 | ]
108 | 87 | },
109 | 88 | {
110 | 89 | "cell_type": "code",
111 | | - "execution_count": 3,
| 90 | + "execution_count": null,
112 | 91 | "metadata": {},
113 | | - "outputs": [
114 | | - {
115 | | - "ename": "",
116 | | - "evalue": "",
117 | | - "output_type": "error",
118 | | - "traceback": [
119 | | - "\u001b[1;31mThe Kernel crashed while executing code in the current cell or a previous cell. \n",
120 | | - "\u001b[1;31mPlease review the code in the cell(s) to identify a possible cause of the failure. \n",
121 | | - "\u001b[1;31mClick <a href='https://aka.ms/vscodeJupyterKernelCrash'>here</a> for more info. \n",
122 | | - "\u001b[1;31mView Jupyter <a href='command:jupyter.viewOutput'>log</a> for further details."
123 | | - ]
124 | | - }
125 | | - ],
126 | | - "source": [
127 | | - "import degirum as dg, degirum_tools"
128 | | - ]
129 | | - },
130 | | - {
131 | | - "cell_type": "code",
132 | | - "execution_count": 4,
133 | | - "metadata": {},
134 | | - "outputs": [
135 | | - {
136 | | - "name": "stdout",
137 | | - "output_type": "stream",
138 | | - "text": [
139 | | - "Successfully opened video stream 'https://raw.githubusercontent.com/DeGirum/PySDKExamples/main/images/Traffic.mp4'Successfully opened video stream 'https://raw.githubusercontent.com/DeGirum/PySDKExamples/main/images/TrafficHD.mp4'\n",
140 | | - "\n"
141 | | - ]
142 | | - },
143 | | - {
144 | | - "name": "stderr",
145 | | - "output_type": "stream",
146 | | - "text": [
147 | | - "packet queue is empty, aborting\n",
148 | | - "packet queue is empty, aborting\n",
149 | | - "packet queue is empty, aborting\n",
150 | | - "packet queue is empty, aborting\n"
151 | | - ]
152 | | - }
153 | | - ],
| 92 | + "outputs": [],
154 | 93 | "source": [
| 94 | + "import degirum as dg, degirum_tools\n",
155 | 95 | "from degirum_tools import streams as dgstreams\n",
156 | 96 | "\n",
157 | | - "c = dgstreams.Composition()\n",
158 | | - "\n",
159 | | - "batch_size = len(\n",
160 | | - "    video_sources\n",
161 | | - ")  # set AI server batch size equal to the # of video sources for lowest latency\n",
162 | | - "\n",
163 | 97 | "# create PySDK AI model objects\n",
164 | | - "models = []\n",
165 | | - "for mi, model_name in enumerate(model_names):\n",
166 | | - "    model = dg.load_model(\n",
| 98 | + "models = [\n",
| 99 | + "    dg.load_model(\n",
167 | 100 | "        model_name=model_name,\n",
168 | 101 | "        inference_host_address=hw_location,\n",
169 | 102 | "        zoo_url=model_zoo_url,\n",
170 | 103 | "        token=degirum_tools.get_token(),\n",
| 104 | + "        overlay_line_width=2,\n",
171 | 105 | "    )\n",
172 | | - "    model.measure_time = True\n",
173 | | - "    model.eager_batch_size = batch_size\n",
174 | | - "    model.frame_queue_depth = batch_size\n",
175 | | - "    models.append(model)\n",
| 106 | + "    for model_name in model_names\n",
| 107 | + "]\n",
176 | 108 | "\n",
177 | 109 | "# check that all models have the same input configuration\n",
178 | | - "models_have_same_input = True\n",
179 | | - "for model in models[1:]:\n",
180 | | - "    if (\n",
181 | | - "        type(model._preprocessor) != type(models[0]._preprocessor)\n",
182 | | - "        or model.model_info.InputH != models[0].model_info.InputH\n",
183 | | - "        or model.model_info.InputW != models[0].model_info.InputW\n",
184 | | - "    ):\n",
185 | | - "        models_have_same_input = False\n",
186 | | - "\n",
187 | | - "resizers = []\n",
188 | | - "\n",
189 | | - "# create video sources and image resizers\n",
190 | | - "# (we use separate resizers to do resize only once per source when possible, to improve performance),\n",
191 | | - "# connect each resizer to corresponding video source\n",
192 | | - "for src in video_sources:\n",
193 | | - "    source = c.add(dgstreams.VideoSourceGizmo(src))\n",
194 | | - "    if models_have_same_input:\n",
195 | | - "        resizer = c.add(\n",
196 | | - "            dgstreams.AiPreprocessGizmo(\n",
197 | | - "                models[0], stream_depth=2, allow_drop=allow_frame_drop\n",
198 | | - "            )\n",
199 | | - "        )\n",
200 | | - "    else:\n",
201 | | - "        resizer = c.add(dgstreams.FanoutGizmo(allow_drop=allow_frame_drop))\n",
| 110 | + "assert all(\n",
| 111 | + "    type(model._preprocessor) == type(models[0]._preprocessor)\n",
| 112 | + "    and model.model_info.InputH == models[0].model_info.InputH\n",
| 113 | + "    and model.model_info.InputW == models[0].model_info.InputW\n",
| 114 | + "    for model in models[1:]\n",
| 115 | + ")\n",
202 | 116 | "\n",
203 | | - "    resizer.connect_to(source)  # connect resizer to video source\n",
204 | | - "    resizers.append(resizer)\n",
| 117 | + "# create video source gizmos;\n",
| 118 | + "# stop_composition_on_end=True to stop whole composition when one (shorter) video source ends\n",
| 119 | + "sources = [\n",
| 120 | + "    dgstreams.VideoSourceGizmo(src, stop_composition_on_end=True)\n",
| 121 | + "    for src in video_sources\n",
| 122 | + "]\n",
205 | 123 | "\n",
206 | | - "# create result combiner\n",
207 | | - "combiner = c.add(dgstreams.AiResultCombiningGizmo(len(models)))\n",
| 124 | + "# create image resizer gizmos, one per video source\n",
| 125 | + "# (we use separate resizers to do resize only once per source to improve performance)\n",
| 126 | + "resizers = [dgstreams.AiPreprocessGizmo(models[0]) for _ in video_sources]\n",
208 | 127 | "\n",
209 | | - "# create multi-input detector gizmos,\n",
210 | | - "# connect each detector gizmo to every resizer gizmo,\n",
211 | | - "# connect result combiner gizmo to each detector gizmo\n",
212 | | - "for mi, model in enumerate(models):\n",
213 | | - "    # create AI gizmo (aka detector) from the model\n",
214 | | - "    detector = c.add(\n",
215 | | - "        dgstreams.AiSimpleGizmo(model, stream_depth=2, inp_cnt=len(video_sources))\n",
216 | | - "    )\n",
217 | | - "\n",
218 | | - "    # connect detector gizmo to each resizer gizmo\n",
219 | | - "    for fi, resizer in enumerate(resizers):\n",
220 | | - "        detector.connect_to(resizer, fi)\n",
| 128 | + "# create multi-input detector gizmos, one per model\n",
| 129 | + "detectors = [\n",
| 130 | + "    dgstreams.AiSimpleGizmo(model, inp_cnt=len(video_sources)) for model in models\n",
| 131 | + "]\n",
221 | 132 | "\n",
222 | | - "    # connect result combiner gizmo to detector gizmo\n",
223 | | - "    combiner.connect_to(detector, mi)\n",
| 133 | + "# create result combiner gizmo to combine results from all detectors into single result\n",
| 134 | + "combiner = dgstreams.AiResultCombiningGizmo(len(models))\n",
224 | 135 | "\n",
225 | 136 | "# create multi-window video multiplexing display gizmo\n",
226 | | - "# and connect it to combiner gizmo\n",
227 | 137 | "win_captions = [f\"Stream #{i}: {str(src)}\" for i, src in enumerate(video_sources)]\n",
228 | | - "display = c.add(\n",
229 | | - "    dgstreams.VideoDisplayGizmo(\n",
230 | | - "        win_captions, show_ai_overlay=True, show_fps=True, multiplex=True\n",
231 | | - "    )\n",
| 138 | + "display = dgstreams.VideoDisplayGizmo(\n",
| 139 | + "    win_captions, show_ai_overlay=True, show_fps=True, multiplex=True\n",
232 | 140 | ")\n",
233 | | - "display.connect_to(combiner)\n",
234 | 141 | "\n",
235 | | - "# start composition\n",
236 | | - "c.start()"
| 142 | + "# connect all gizmos in the pipeline\n",
| 143 | + "# source[i] -> resizer[i] -> detector[j] -> combiner -> display\n",
| 144 | + "pipeline = (\n",
| 145 | + "    # each source is connected to corresponding resizer\n",
| 146 | + "    (source >> resizer for source, resizer in zip(sources, resizers)),\n",
| 147 | + "    # each resizer is connected to every detector\n",
| 148 | + "    (\n",
| 149 | + "        resizer >> detector[ri]\n",
| 150 | + "        for detector in detectors\n",
| 151 | + "        for ri, resizer in enumerate(resizers)\n",
| 152 | + "    ),\n",
| 153 | + "    # each detector is connected to result combiner\n",
| 154 | + "    (detector >> combiner[di] for di, detector in enumerate(detectors)),\n",
| 155 | + "    # result combiner is connected to display\n",
| 156 | + "    combiner >> display,\n",
| 157 | + ")\n",
| 158 | + "\n",
| 159 | + "# create and start composition with given pipeline\n",
| 160 | + "dgstreams.Composition(*pipeline).start()"
237 | 161 | ]
| 162 | + },
| 163 | + {
| 164 | + "cell_type": "code",
| 165 | + "execution_count": null,
| 166 | + "metadata": {},
| 167 | + "outputs": [],
| 168 | + "source": []
238 | 169 | }
239 | 170 | ],
240 | 171 | "metadata": {
241 | 172 | "kernelspec": {
242 | | - "display_name": "Python (supervision)",
| 173 | + "display_name": "base",
243 | 174 | "language": "python",
244 | | - "name": "supervision"
| 175 | + "name": "python3"
245 | 176 | },
246 | 177 | "language_info": {
247 | 178 | "codemirror_mode": {
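
The refactor above replaces the old imperative wiring (`Composition.add()` plus `connect_to()`) with declarative `>>` connections handed to the `Composition` constructor. Reduced to one stream and one model, the same idiom looks roughly like this (a minimal sketch reusing the model name, zoo, and video URL from the cells above; the single-caption `VideoDisplayGizmo` call is an assumption, the rest mirrors the diff):

```python
# Minimal single-stream sketch of the ">>" pipeline idiom from this commit.
import degirum as dg, degirum_tools
from degirum_tools import streams as dgstreams

model = dg.load_model(
    model_name="yolo_v5s_person_det--512x512_quant_n2x_orca1_1",
    inference_host_address="@cloud",
    zoo_url="degirum/public",
    token=degirum_tools.get_token(),
)

# stop_composition_on_end=True stops the whole composition when the video ends
source = dgstreams.VideoSourceGizmo(
    "https://raw.githubusercontent.com/DeGirum/PySDKExamples/main/images/Traffic.mp4",
    stop_composition_on_end=True,
)
detector = dgstreams.AiSimpleGizmo(model)  # single input, so no inp_cnt needed
display = dgstreams.VideoDisplayGizmo("Traffic", show_ai_overlay=True, show_fps=True)

# each "a >> b" wires one output-to-input connection, exactly as in the cell above;
# Composition(...) collects the connected gizmos and start() runs them
dgstreams.Composition(source >> detector, detector >> display).start()
```

Indexing is the multi-input counterpart of this: `resizer >> detector[ri]` and `detector >> combiner[di]` in the cell above route each connection into input slot `ri`/`di` of a gizmo created with several inputs.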

253 | 184 | "name": "python",
254 | 185 | "nbconvert_exporter": "python",
255 | 186 | "pygments_lexer": "ipython3",
256 | | - "version": "3.9.18"
| 187 | + "version": "3.9.16"
257 | 188 | },
258 | 189 | "orig_nbformat": 4
259 | 190 | },
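
One more note on the main cell: the shared-resizer optimization is only valid when all models agree on input geometry, which the new `assert all(...)` enforces inline. The same check could be packaged as a small helper (a sketch; the `_preprocessor` and `model_info.InputH`/`InputW` attribute names are taken from this diff, not from separate API docs, and `_preprocessor` is a private attribute):

```python
def have_same_input(models) -> bool:
    """True if every model matches models[0] in preprocessor type and input H/W."""
    first = models[0]
    return all(
        type(m._preprocessor) == type(first._preprocessor)  # private attr, per the diff
        and m.model_info.InputH == first.model_info.InputH
        and m.model_info.InputW == first.model_info.InputW
        for m in models[1:]
    )

# usage, equivalent to the inline assert in the cell above:
# assert have_same_input(models)
```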