@@ -406,7 +406,7 @@ struct AicpuExecutor {
406406 );
407407 cur_thread_completed++;
408408 if (mixed_complete) {
409- #if PTO2_DUMP_TENSOR
409+ #if PTO2_PROFILING
410410 if (get_enable_dump_tensor ()) {
411411 dump_tensors_for_task<PTO2_SUBTASK_SLOT_COUNT>(
412412 thread_idx, slot_state, TensorDumpStage::AFTER_COMPLETION,
@@ -515,7 +515,7 @@ struct AicpuExecutor {
515515 ,
516516 bool profiling_enabled
517517#endif
518- #if PTO2_PROFILING || PTO2_DUMP_TENSOR
518+ #if PTO2_PROFILING
519519 ,
520520 int32_t thread_idx
521521#endif
@@ -944,7 +944,7 @@ int32_t AicpuExecutor::resolve_and_dispatch_pto2(Runtime *runtime, int32_t threa
944944 perf_aicpu_set_orch_thread_idx (sched_thread_num_);
945945 }
946946#endif
947- #if PTO2_DUMP_TENSOR
947+ #if PTO2_PROFILING
948948 if (get_enable_dump_tensor ()) {
949949 dump_tensor_init (orch_to_sched_ ? thread_num_ : sched_thread_num_);
950950 }
@@ -1163,7 +1163,7 @@ int32_t AicpuExecutor::resolve_and_dispatch_pto2(Runtime *runtime, int32_t threa
11631163 uint64_t t_setup_start = get_sys_cnt_aicpu ();
11641164#endif
11651165 ResourceCount rc = shape_resource_count (shape);
1166- #if PTO2_DUMP_TENSOR
1166+ #if PTO2_PROFILING
11671167 if (get_enable_dump_tensor ()) {
11681168 dump_tensors_for_task<PTO2_SUBTASK_SLOT_COUNT>(
11691169 thread_idx, *slot_state, TensorDumpStage::BEFORE_DISPATCH,
@@ -1183,7 +1183,7 @@ int32_t AicpuExecutor::resolve_and_dispatch_pto2(Runtime *runtime, int32_t threa
11831183 ,
11841184 profiling_enabled
11851185#endif
1186- #if PTO2_PROFILING || PTO2_DUMP_TENSOR
1186+ #if PTO2_PROFILING
11871187 ,
11881188 thread_idx
11891189#endif
@@ -1197,7 +1197,7 @@ int32_t AicpuExecutor::resolve_and_dispatch_pto2(Runtime *runtime, int32_t threa
11971197 ,
11981198 profiling_enabled
11991199#endif
1200- #if PTO2_PROFILING || PTO2_DUMP_TENSOR
1200+ #if PTO2_PROFILING
12011201 ,
12021202 thread_idx
12031203#endif
@@ -1210,7 +1210,7 @@ int32_t AicpuExecutor::resolve_and_dispatch_pto2(Runtime *runtime, int32_t threa
12101210 ,
12111211 profiling_enabled
12121212#endif
1213- #if PTO2_PROFILING || PTO2_DUMP_TENSOR
1213+ #if PTO2_PROFILING
12141214 ,
12151215 thread_idx
12161216#endif
@@ -1272,7 +1272,7 @@ int32_t AicpuExecutor::resolve_and_dispatch_pto2(Runtime *runtime, int32_t threa
12721272#endif
12731273 Cluster &c = tracker.clusters [ci];
12741274 ResourceCount rc = shape_resource_count (shape);
1275- #if PTO2_DUMP_TENSOR
1275+ #if PTO2_PROFILING
12761276 if (get_enable_dump_tensor ()) {
12771277 dump_tensors_for_task<PTO2_SUBTASK_SLOT_COUNT>(
12781278 thread_idx, *slot_state, TensorDumpStage::BEFORE_DISPATCH,
@@ -1292,7 +1292,7 @@ int32_t AicpuExecutor::resolve_and_dispatch_pto2(Runtime *runtime, int32_t threa
12921292 ,
12931293 profiling_enabled
12941294#endif
1295- #if PTO2_PROFILING || PTO2_DUMP_TENSOR
1295+ #if PTO2_PROFILING
12961296 ,
12971297 thread_idx
12981298#endif
@@ -1306,7 +1306,7 @@ int32_t AicpuExecutor::resolve_and_dispatch_pto2(Runtime *runtime, int32_t threa
13061306 ,
13071307 profiling_enabled
13081308#endif
1309- #if PTO2_PROFILING || PTO2_DUMP_TENSOR
1309+ #if PTO2_PROFILING
13101310 ,
13111311 thread_idx
13121312#endif
@@ -1319,7 +1319,7 @@ int32_t AicpuExecutor::resolve_and_dispatch_pto2(Runtime *runtime, int32_t threa
13191319 ,
13201320 profiling_enabled
13211321#endif
1322- #if PTO2_PROFILING || PTO2_DUMP_TENSOR
1322+ #if PTO2_PROFILING
13231323 ,
13241324 thread_idx
13251325#endif
@@ -1650,7 +1650,7 @@ int32_t AicpuExecutor::resolve_and_dispatch_pto2(Runtime *runtime, int32_t threa
16501650 perf_aicpu_flush_phase_buffers (thread_idx);
16511651 }
16521652#endif
1653- #if PTO2_DUMP_TENSOR
1653+ #if PTO2_PROFILING
16541654 if (get_enable_dump_tensor ()) {
16551655 dump_tensor_flush (thread_idx);
16561656 }
0 commit comments