From e10358fec096e31556aac154bfdfc3be2f22de8d Mon Sep 17 00:00:00 2001 From: Yosshi999 Date: Sun, 26 Jan 2025 07:43:52 +0900 Subject: [PATCH 1/4] Fix broken codeblock --- recipes_source/recipes/profiler_recipe.py | 33 +++++++++++------------ 1 file changed, 16 insertions(+), 17 deletions(-) diff --git a/recipes_source/recipes/profiler_recipe.py b/recipes_source/recipes/profiler_recipe.py index 4d43726e71f..82f262f6c55 100644 --- a/recipes_source/recipes/profiler_recipe.py +++ b/recipes_source/recipes/profiler_recipe.py @@ -220,23 +220,22 @@ # # .. code-block:: sh # -#------------------------------------------------------- ------------ ------------ ------------ ------------ ------------ -# Name Self XPU Self XPU % XPU total XPU time avg # of Calls -# ------------------------------------------------------- ------------ ------------ ------------ ------------ ------------ -# model_inference 0.000us 0.00% 2.567ms 2.567ms 1 -# aten::conv2d 0.000us 0.00% 1.871ms 93.560us 20 -# aten::convolution 0.000us 0.00% 1.871ms 93.560us 20 -# aten::_convolution 0.000us 0.00% 1.871ms 93.560us 20 -# aten::convolution_overrideable 1.871ms 72.89% 1.871ms 93.560us 20 -# gen_conv 1.484ms 57.82% 1.484ms 74.216us 20 -# aten::batch_norm 0.000us 0.00% 432.640us 21.632us 20 -# aten::_batch_norm_impl_index 0.000us 0.00% 432.640us 21.632us 20 -# aten::native_batch_norm 432.640us 16.85% 432.640us 21.632us 20 -# conv_reorder 386.880us 15.07% 386.880us 6.448us 60 -# ------------------------------------------------------- ------------ ------------ ------------ ------------ ------------ -# Self CPU time total: 712.486ms -# Self XPU time total: 2.567ms - +# ------------------------------------------------------- ------------ ------------ ------------ ------------ ------------ +# Name Self XPU Self XPU % XPU total XPU time avg # of Calls +# ------------------------------------------------------- ------------ ------------ ------------ ------------ ------------ +# model_inference 0.000us 0.00% 2.567ms 2.567ms 1 +# aten::conv2d 0.000us 0.00% 1.871ms 93.560us 20 +# aten::convolution 0.000us 0.00% 1.871ms 93.560us 20 +# aten::_convolution 0.000us 0.00% 1.871ms 93.560us 20 +# aten::convolution_overrideable 1.871ms 72.89% 1.871ms 93.560us 20 +# gen_conv 1.484ms 57.82% 1.484ms 74.216us 20 +# aten::batch_norm 0.000us 0.00% 432.640us 21.632us 20 +# aten::_batch_norm_impl_index 0.000us 0.00% 432.640us 21.632us 20 +# aten::native_batch_norm 432.640us 16.85% 432.640us 21.632us 20 +# conv_reorder 386.880us 15.07% 386.880us 6.448us 60 +# ------------------------------------------------------- ------------ ------------ ------------ ------------ ------------ +# Self CPU time total: 712.486ms +# Self XPU time total: 2.567ms # From d866112fa1a620b645c71ca532a35d42af9e4c50 Mon Sep 17 00:00:00 2001 From: Svetlana Karslioglu Date: Tue, 28 Jan 2025 10:56:32 -0800 Subject: [PATCH 2/4] trying a different table format --- recipes_source/recipes/profiler_recipe.py | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/recipes_source/recipes/profiler_recipe.py b/recipes_source/recipes/profiler_recipe.py index 82f262f6c55..86c7057a58b 100644 --- a/recipes_source/recipes/profiler_recipe.py +++ b/recipes_source/recipes/profiler_recipe.py @@ -218,9 +218,8 @@ ###################################################################### # The resulting table output (omitting some columns): # -# .. code-block:: sh # -# ------------------------------------------------------- ------------ ------------ ------------ ------------ ------------ +# ========================================================= ============ ============ ============ ============ ============ # Name Self XPU Self XPU % XPU total XPU time avg # of Calls # ------------------------------------------------------- ------------ ------------ ------------ ------------ ------------ # model_inference 0.000us 0.00% 2.567ms 2.567ms 1 @@ -233,7 +232,7 @@ # aten::_batch_norm_impl_index 0.000us 0.00% 432.640us 21.632us 20 # aten::native_batch_norm 432.640us 16.85% 432.640us 21.632us 20 # conv_reorder 386.880us 15.07% 386.880us 6.448us 60 -# ------------------------------------------------------- ------------ ------------ ------------ ------------ ------------ +# ========================================================= ============ ============ ============ ============ ============ # Self CPU time total: 712.486ms # Self XPU time total: 2.567ms # From 0df487272f516f44229c63a2a308aa206cad063e Mon Sep 17 00:00:00 2001 From: Svetlana Karslioglu Date: Tue, 28 Jan 2025 15:26:17 -0800 Subject: [PATCH 3/4] Update profiler_recipe.py --- recipes_source/recipes/profiler_recipe.py | 34 +++++++++++------------ 1 file changed, 17 insertions(+), 17 deletions(-) diff --git a/recipes_source/recipes/profiler_recipe.py b/recipes_source/recipes/profiler_recipe.py index 86c7057a58b..138c8358504 100644 --- a/recipes_source/recipes/profiler_recipe.py +++ b/recipes_source/recipes/profiler_recipe.py @@ -218,23 +218,23 @@ ###################################################################### # The resulting table output (omitting some columns): # -# -# ========================================================= ============ ============ ============ ============ ============ -# Name Self XPU Self XPU % XPU total XPU time avg # of Calls -# ------------------------------------------------------- ------------ ------------ ------------ ------------ ------------ -# model_inference 0.000us 0.00% 2.567ms 2.567ms 1 -# aten::conv2d 0.000us 0.00% 1.871ms 93.560us 20 -# aten::convolution 0.000us 0.00% 1.871ms 93.560us 20 -# aten::_convolution 0.000us 0.00% 1.871ms 93.560us 20 -# aten::convolution_overrideable 1.871ms 72.89% 1.871ms 93.560us 20 -# gen_conv 1.484ms 57.82% 1.484ms 74.216us 20 -# aten::batch_norm 0.000us 0.00% 432.640us 21.632us 20 -# aten::_batch_norm_impl_index 0.000us 0.00% 432.640us 21.632us 20 -# aten::native_batch_norm 432.640us 16.85% 432.640us 21.632us 20 -# conv_reorder 386.880us 15.07% 386.880us 6.448us 60 -# ========================================================= ============ ============ ============ ============ ============ -# Self CPU time total: 712.486ms -# Self XPU time total: 2.567ms +# =========================================================== ============ ============ ============ ============ ============ +# Name Self XPU Self XPU % XPU total XPU time avg # of Calls +# =========================================================== ============ ============ ============ ============ ============ +# model_inference 0.000us 0.00% 2.567ms 2.567ms 1 +# aten::conv2d 0.000us 0.00% 1.871ms 93.560us 20 +# aten::convolution 0.000us 0.00% 1.871ms 93.560us 20 +# aten::_convolution 0.000us 0.00% 1.871ms 93.560us 20 +# aten::convolution_overrideable 1.871ms 72.89% 1.871ms 93.560us 20 +# gen_conv 1.484ms 57.82% 1.484ms 74.216us 20 +# aten::batch_norm 0.000us 0.00% 432.640us 21.632us 20 +# aten::_batch_norm_impl_index 0.000us 0.00% 432.640us 21.632us 20 +# aten::native_batch_norm 432.640us 16.85% 432.640us 21.632us 20 +# conv_reorder 386.880us 15.07% 386.880us 6.448us 60 +# ----------------------------------------------------------- ------------------------------------------------------ ------------ +# Self CPU time total: 712.486ms +# Self XPU time total: 2.567ms +# =========================================================== ============ ============ ============ ============ ============ # From f8f4511be31585bc9a2146e178630bc7e5fe3b51 Mon Sep 17 00:00:00 2001 From: Svetlana Karslioglu Date: Fri, 21 Mar 2025 10:09:41 -0700 Subject: [PATCH 4/4] Update profiler_recipe.py --- recipes_source/recipes/profiler_recipe.py | 33 +++++++++++------------ 1 file changed, 16 insertions(+), 17 deletions(-) diff --git a/recipes_source/recipes/profiler_recipe.py b/recipes_source/recipes/profiler_recipe.py index 138c8358504..acfc274a689 100644 --- a/recipes_source/recipes/profiler_recipe.py +++ b/recipes_source/recipes/profiler_recipe.py @@ -218,25 +218,24 @@ ###################################################################### # The resulting table output (omitting some columns): # -# =========================================================== ============ ============ ============ ============ ============ -# Name Self XPU Self XPU % XPU total XPU time avg # of Calls -# =========================================================== ============ ============ ============ ============ ============ -# model_inference 0.000us 0.00% 2.567ms 2.567ms 1 -# aten::conv2d 0.000us 0.00% 1.871ms 93.560us 20 -# aten::convolution 0.000us 0.00% 1.871ms 93.560us 20 -# aten::_convolution 0.000us 0.00% 1.871ms 93.560us 20 -# aten::convolution_overrideable 1.871ms 72.89% 1.871ms 93.560us 20 -# gen_conv 1.484ms 57.82% 1.484ms 74.216us 20 -# aten::batch_norm 0.000us 0.00% 432.640us 21.632us 20 -# aten::_batch_norm_impl_index 0.000us 0.00% 432.640us 21.632us 20 -# aten::native_batch_norm 432.640us 16.85% 432.640us 21.632us 20 -# conv_reorder 386.880us 15.07% 386.880us 6.448us 60 -# ----------------------------------------------------------- ------------------------------------------------------ ------------ + +###################################################################### +# --------------------------------- ------------ ------------ ------------ ------------ ------------ +# Name Self XPU Self XPU % XPU total XPU time avg # of Calls +# --------------------------------- ------------ ------------ ------------ ------------ ------------ +# model_inference 0.000us 0.00% 2.567ms 2.567ms 1 +# aten::conv2d 0.000us 0.00% 1.871ms 93.560us 20 +# aten::convolution 0.000us 0.00% 1.871ms 93.560us 20 +# aten::_convolution 0.000us 0.00% 1.871ms 93.560us 20 +# aten::convolution_overrideable 1.871ms 72.89% 1.871ms 93.560us 20 +# gen_conv 1.484ms 57.82% 1.484ms 74.216us 20 +# aten::batch_norm 0.000us 0.00% 432.640us 21.632us 20 +# aten::_batch_norm_impl_index 0.000us 0.00% 432.640us 21.632us 20 +# aten::native_batch_norm 432.640us 16.85% 432.640us 21.632us 20 +# conv_reorder 386.880us 15.07% 386.880us 6.448us 60 +# --------------------------------- ------------ ------------ ------------ ------------ ------------ # Self CPU time total: 712.486ms # Self XPU time total: 2.567ms -# =========================================================== ============ ============ ============ ============ ============ -# - ###################################################################### # Note the occurrence of on-device kernels in the output (e.g. ``sgemm_32x32x32_NN``).