8181 "base_uri": "https://localhost:8080/"
8282 },
8383 "id": "ILPFDHXR8Cfh",
84- "outputId": "b521ae11-7ada-4858-9fb6-b7978c157695 "
84+ "outputId": "de1d8bb0-5268-40c2-e233-c416cccd7c1b "
85 85 },
86 86 "outputs": [
87 87 {
88- "name": "stdout",
8988 "output_type": "stream",
89+ "name": "stdout",
9090 "text": [
91- "Thu Nov 20 12:06:00 2025 \n",
91+ "Tue Feb 3 16:05:05 2026 \n",
9292 "+-----------------------------------------------------------------------------------------+\n",
9393 "| NVIDIA-SMI 550.54.15 Driver Version: 550.54.15 CUDA Version: 12.4 |\n",
9494 "|-----------------------------------------+------------------------+----------------------+\n",
9595 "| GPU Name Persistence-M | Bus-Id Disp.A | Volatile Uncorr. ECC |\n",
9696 "| Fan Temp Perf Pwr:Usage/Cap | Memory-Usage | GPU-Util Compute M. |\n",
9797 "| | | MIG M. |\n",
9898 "|=========================================+========================+======================|\n",
99- "| 0 NVIDIA A100-SXM4-80GB Off | 00000000:00:05 .0 Off | 0 |\n",
100- "| N/A 35C P0 57W / 400W | 0MiB / 81920MiB | 0% Default |\n",
99+ "| 0 NVIDIA A100-SXM4-40GB Off | 00000000:00:04 .0 Off | 0 |\n",
100+ "| N/A 29C P0 43W / 400W | 0MiB / 40960MiB | 0% Default |\n",
101101 "| | | Disabled |\n",
102102 "+-----------------------------------------+------------------------+----------------------+\n",
103103 " \n",
124124 "base_uri": "https://localhost:8080/"
125125 },
126126 "id": "Vw3admXIqMlC",
127- "outputId": "61d7c09c-6f72-41ce-edb8-9d7de99e208d "
127+ "outputId": "5420cfd5-332f-4ea4-8c31-c454940efe0e "
128 128 },
129 129 "outputs": [
130 130 {
131- "name": "stdout",
132131 "output_type": "stream",
132+ "name": "stdout",
133133 "text": [
134- "PyTorch version: 2.8 .0+cu126\n",
135- "Torchvision version: 0.23 .0+cu126\n",
134+ "PyTorch version: 2.9 .0+cu126\n",
135+ "Torchvision version: 0.24 .0+cu126\n",
136136 "CUDA is available: True\n"
137137 ]
138138 }
176176 "execution_count": null,
177177 "id": "eM_DGtMk_gFM",
178178 "metadata": {
179- "id": "eM_DGtMk_gFM"
179+ "id": "eM_DGtMk_gFM",
180+ "outputId": "8a3874c0-be38-4440-8052-c78885641d3b",
181+ "colab": {
182+ "base_uri": "https://localhost:8080/"
183+ }
180 184 },
181- "outputs": [],
185+ "outputs": [
186+ {
187+ "output_type": "stream",
188+ "name": "stdout",
189+ "text": [
190+ "\u001b[?25l \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m0.0/212.4 kB\u001b[0m \u001b[31m?\u001b[0m eta \u001b[36m-:--:--\u001b[0m\r\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m212.4/212.4 kB\u001b[0m \u001b[31m6.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
191+ "\u001b[?25h"
192+ ]
193+ }
194+ ],
182195 "source": [
183196 "!pip install -q supervision jupyter_bbox_widget"
184197 ]
275288 "base_uri": "https://localhost:8080/"
276289 },
277290 "id": "QynbB5AgFhML",
278- "outputId": "a59946c8-0c2a-4f4d-bf47-61a96e6f21ed "
291+ "outputId": "e139269c-6149-45e5-8bbd-f324fdbf9a11 "
279 292 },
280 293 "outputs": [
281 294 {
282- "name": "stdout",
283295 "output_type": "stream",
296+ "name": "stdout",
284297 "text": [
285298 "HOME: /content\n"
286299 ]
332345 "execution_count": null,
333346 "id": "y51dHwSKO2CX",
334347 "metadata": {
335- "colab": {
336- "base_uri": "https://localhost:8080/"
337- },
338- "id": "y51dHwSKO2CX",
339- "outputId": "fd7ae78f-a881-41de-d193-3bab847f2cb8"
348+ "id": "y51dHwSKO2CX"
340 349 },
341- "outputs": [
342- {
343- "name": "stderr",
344- "output_type": "stream",
345- "text": [
346- "\u001b[0m\u001b[32mINFO 2025-11-20 14:02:37,450 35343 sam3_video_predictor.py: 299:\u001b[0m using the following GPU IDs: [0]\n",
347- "\u001b[0m\u001b[32mINFO 2025-11-20 14:02:37,564 35343 sam3_video_predictor.py: 315:\u001b[0m \n",
348- "\n",
349- "\n",
350- "\t*** START loading model on all ranks ***\n",
351- "\n",
352- "\n",
353- "\u001b[0m\u001b[32mINFO 2025-11-20 14:02:37,564 35343 sam3_video_predictor.py: 317:\u001b[0m loading model on rank=0 with world_size=1 -- this could take a while ...\n",
354- "\u001b[0m\u001b[32mINFO 2025-11-20 14:02:46,745 35343 sam3_video_base.py: 124:\u001b[0m setting max_num_objects=10000 and num_obj_for_compile=16\n",
355- "\u001b[0m\u001b[32mINFO 2025-11-20 14:02:51,644 35343 sam3_video_predictor.py: 319:\u001b[0m loading model on rank=0 with world_size=1 -- DONE locally\n",
356- "\u001b[0m\u001b[32mINFO 2025-11-20 14:02:51,645 35343 sam3_video_predictor.py: 330:\u001b[0m \n",
357- "\n",
358- "\n",
359- "\t*** DONE loading model on all ranks ***\n",
360- "\n",
361- "\n"
362- ]
363- }
364- ],
350+ "outputs": [],
365351 "source": [
366- "predictor = build_sam3_video_predictor(gpus_to_use=DEVICES)"
352+ "predictor = build_sam3_video_predictor(bpe_path=\"/content/sam3/sam3/assets/bpe_simple_vocab_16e6.txt.gz\", gpus_to_use=DEVICES)"
367 353 ]
368 354 },
369 355 {
1631 1617 },
1632 1618 "nbformat": 4,
1633 1619 "nbformat_minor": 5
1634- }
1620+ }