Fix loader_evaluator package exports, notebook outputs, and test placement

JanuszL · JanuszL · commit c4149116bbfe · 2025-12-05T13:39:01.000+01:00
Signed-off-by: Janusz Lisiecki <jlisiecki@nvidia.com>
diff --git a/dali/python/nvidia/dali/plugin/pytorch/loader_evaluator/__init__.py b/dali/python/nvidia/dali/plugin/pytorch/loader_evaluator/__init__.py
@@ -13,6 +13,5 @@
 # limitations under the License.
 
 from .loader import LoaderEvaluator
-from .metrics import PerformanceMetrics
 
-__all__ = ["LoaderEvaluator", "PerformanceMetrics"]
+__all__ = ["LoaderEvaluator"]
diff --git a/docs/examples/frameworks/pytorch/loader_evaluator/pytorch_data_loader_evaluator.ipynb b/docs/examples/frameworks/pytorch/loader_evaluator/pytorch_data_loader_evaluator.ipynb
@@ -26,9 +26,17 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 1,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Using device: cuda\n"
+     ]
+    }
+   ],
    "source": [
     "import os\n",
     "import time\n",
@@ -60,9 +68,17 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 2,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Dataset size: 1000\n"
+     ]
+    }
+   ],
    "source": [
     "# Our model\n",
     "class UltraLightModel(nn.Module):\n",
@@ -136,7 +152,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 3,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -176,9 +192,53 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 4,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Baseline Training (Real Data Loading)\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Epoch 0: 100%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 63/63 [00:03<00:00, 17.77it/s, Time=3.5s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Epoch 0 - Time: 3.55s\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Epoch 1: 100%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 63/63 [00:03<00:00, 17.90it/s, Time=3.5s]"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Epoch 1 - Time: 3.52s\n",
+      "Baseline average epoch time: 3.53s\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "\n"
+     ]
+    }
+   ],
    "source": [
     "# Your existing training setup\n",
     "model = UltraLightModel(num_classes=1000).to(device)\n",
@@ -209,7 +269,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 5,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -228,9 +288,53 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 6,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "No-Overhead Training (Cached Data Loading)\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Epoch 0: 100%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 63/63 [00:00<00:00, 65.49it/s, Time=1.0s]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Epoch 0 - Time: 0.96s\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Epoch 1: 100%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 63/63 [00:00<00:00, 64.57it/s, Time=1.0s]"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Epoch 1 - Time: 0.98s\n",
+      "No-Overhead average epoch time: 0.97s\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "\n"
+     ]
+    }
+   ],
    "source": [
     "# Train with the same setup, just different dataloader\n",
     "print(\"No-Overhead Training (Cached Data Loading)\")\n",
@@ -256,9 +360,25 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 7,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\n",
+      "Performance Comparison:\n",
+      "Baseline:     3.53s per epoch\n",
+      "No-Overhead:  0.97s per epoch\n",
+      "Speedup:      3.64x\n",
+      "Time saved:   2.56s per epoch (72.6%)\n",
+      "\n",
+      "*** DATA LOADING BOTTLENECK DETECTED ***\n",
+      "You could speed up training by 72.6% by optimizing data loading.\n"
+     ]
+    }
+   ],
    "source": [
     "# Compare performance\n",
     "speedup = baseline_avg_time / sol_avg_time\n",
@@ -322,7 +442,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.12.3"
+   "version": "3.10.19"
   }
  },
  "nbformat": 4,
diff --git a/qa/TL0_python-self-test-core/test_body.sh b/qa/TL0_python-self-test-core/test_body.sh
@@ -22,7 +22,6 @@ test_py_with_framework() {
     done
 
     ${python_new_invoke_test} -A '!slow,!pytorch,!mxnet,!cupy' test_backend_impl
-    ${python_new_invoke_test} -A '!slow,!pytorch,!mxnet,!cupy' test_pytorch_loader_evaluator
 
     if [ -z "$DALI_ENABLE_SANITIZERS" ]; then
         ${python_new_invoke_test} -A 'numba' -s type_annotations
@@ -39,6 +38,7 @@ test_py() {
     python test_coco_tfrecord.py -i 64
     python test_data_containers.py -s -b 20
     python test_data_containers.py -s -b 20 -n
+    ${python_new_invoke_test} test_pytorch_loader_evaluator
 }
 
 test_autograph() {