diff --git a/qdp_project/evaluation-results/perf.new.svg b/qdp_project/evaluation-results/perf.new.svg index a877d29..35d398c 100644 --- a/qdp_project/evaluation-results/perf.new.svg +++ b/qdp_project/evaluation-results/perf.new.svg @@ -1,6 +1,6 @@ - + @@ -421,2141 +421,2985 @@ } ]]> - + Flame Graph - + Reset Zoom Search ic - + -qi_submit_sync (5,274,943 samples, 0.05%) - +__rcu_read_unlock (1,731,123 samples, 0.01%) + -std::thread::_M_start_thread (2,576,245 samples, 0.02%) - +__this_cpu_preempt_check (25,764,878 samples, 0.16%) + -entry_SYSCALL_64_after_hwframe (4,816,807 samples, 0.04%) - +qi_flush_piotlb (25,914,646 samples, 0.16%) + -do_syscall_64 (7,832,406 samples, 0.07%) - +check_preemption_disabled (401,410,663 samples, 2.48%) +ch.. -advise_stack_range (3,340,721 samples, 0.03%) - +set_nlink (1,728,057 samples, 0.01%) + -task_work_run (3,977,278 samples, 0.04%) - +perf_adjust_freq_unthr_context (2,063,358 samples, 0.01%) + -perf_iterate_sb.constprop.0 (1,544,977 samples, 0.01%) - +__alloc_file (1,521,361 samples, 0.01%) + -asm_sysvec_apic_timer_interrupt (2,180,552 samples, 0.02%) - +__irqentry_text_end (5,277,538 samples, 0.03%) + -perf_adjust_freq_unthr_context (8,995,452 samples, 0.08%) - +tick_sched_handle (8,465,801 samples, 0.05%) + -down_write (2,575,917 samples, 0.02%) - +__sysvec_apic_timer_interrupt (2,063,358 samples, 0.01%) + -__libc_start_call_main (6,715,787,788 samples, 61.85%) -__libc_start_call_main +page_counter_try_charge (11,449,245 samples, 0.07%) + -lru_gen_del_folio.constprop.0 (1,727,547 samples, 0.02%) - +exit_to_user_mode_prepare (2,039,626 samples, 0.01%) + -__mod_lruvec_page_state (3,747,166 samples, 0.03%) - +__count_memcg_events (230,601,478 samples, 1.42%) + -do_syscall_64 (1,418,159 samples, 0.01%) - +handle_mm_fault (10,328,096 samples, 0.06%) + -exit_to_user_mode_prepare (1,005,518 samples, 0.01%) - +release_pages (371,292,083 samples, 2.29%) +r.. -__libc_openat64 (2,539,730 samples, 0.02%) - +tlb_finish_mmu (1,724,696 samples, 0.01%) + -charge_memcg (1,731,219 samples, 0.02%) - +___slab_alloc (1,728,614 samples, 0.01%) + -qi_submit_sync (14,767,685 samples, 0.14%) - +__this_cpu_preempt_check (3,457,940 samples, 0.02%) + -__mem_cgroup_charge (1,731,219 samples, 0.02%) - +qi_flush_dev_iotlb_pasid (18,132,952 samples, 0.11%) + -syscall (3,456,757 samples, 0.03%) - +__list_add_valid (7,429,220 samples, 0.05%) + -entry_SYSCALL_64_after_hwframe (29,370,212 samples, 0.27%) - +debug_smp_processor_id (1,728,934 samples, 0.01%) + -perf_iterate_sb.constprop.0 (11,662,927 samples, 0.11%) - +__rcu_read_unlock (1,385,792 samples, 0.01%) + -__mem_cgroup_uncharge (1,727,729 samples, 0.02%) - +percpu_counter_add_batch (26,305,263 samples, 0.16%) + -do_anonymous_page (1,731,219 samples, 0.02%) - +__rcu_read_unlock (1,384,840 samples, 0.01%) + -dev_attr_show (6,597,170 samples, 0.06%) - +__list_del_entry_valid (1,728,946 samples, 0.01%) + -vm_area_alloc (2,149,175 samples, 0.02%) - +qi_submit_sync (23,329,066 samples, 0.14%) + -folio_batch_move_lru (1,728,947 samples, 0.02%) - +__GI_munmap (2,526,127 samples, 0.02%) + -dml::handler<dml::mem_copy_operation, dml::execution_interface<dml::hardware, std::allocator<unsigned char> >::allocator_type> dml::submit<dml::hardware, dml::execution_interface<dml::hardware, std::allocator<unsigned char> > > (44,280,626 samples, 0.41%) - +__mod_lruvec_page_state (47,483,010 samples, 0.29%) + -release_pages (12,951,918 samples, 0.12%) - +check_preemption_disabled (7,602,620 samples, 0.05%) + -exit_mmap (1,418,159 samples, 0.01%) - +exc_page_fault (2,637,120,970 samples, 16.27%) +exc_page_fault -numa_alloc_onnode (27,306,291 samples, 0.25%) - +path_openat (6,619,563 samples, 0.04%) + -mod_memcg_state (2,519,582 samples, 0.02%) - +mod_memcg_state (2,592,882 samples, 0.02%) + -vfs_fstatat (1,412,403 samples, 0.01%) - +[anon] (6,570,847 samples, 0.04%) + -kernfs_fop_release (2,475,815 samples, 0.02%) - +perf_adjust_freq_unthr_context (2,283,316 samples, 0.01%) + -__mod_memcg_state (2,519,582 samples, 0.02%) - +__irq_exit_rcu (1,441,994 samples, 0.01%) + -do_user_addr_fault (7,222,744 samples, 0.07%) - +qi_submit_sync (19,100,039 samples, 0.12%) + -sum_check (1,624,148,506 samples, 14.96%) -sum_check +__this_cpu_preempt_check (26,809,929 samples, 0.17%) + -qi_flush_dev_iotlb_pasid (6,025,194 samples, 0.06%) - +__mmu_notifier_invalidate_range_end (39,887,334 samples, 0.25%) + -Sum<unsigned long>::simd_agg (407,977,039 samples, 3.76%) -Sum<.. +do_syscall_64 (26,333,316 samples, 0.16%) + -_start (6,715,901,033 samples, 61.85%) -_start +do_user_addr_fault (11,869,290 samples, 0.07%) + -vma_alloc_folio (867,846,598 samples, 7.99%) -vma_alloc_f.. +qi_submit_sync (18,114,625 samples, 0.11%) + -syscall_exit_to_user_mode (1,005,518 samples, 0.01%) - +exit_to_user_mode_prepare (58,618,006 samples, 0.36%) + -_IO_new_file_close_it (4,816,807 samples, 0.04%) - +tick_sched_timer (2,063,358 samples, 0.01%) + -do_huge_pmd_anonymous_page (1,850,694,882 samples, 17.05%) -do_huge_pmd_anonymous_page +__rcu_read_unlock (2,592,182 samples, 0.02%) + -std::__new_allocator<dml::detail::ml::utils::structure_from<dml::detail::descriptor, dml::detail::completion_record> >::allocate (30,229,702 samples, 0.28%) - +free_pgd_range (1,728,837 samples, 0.01%) + -dml::submit<dml::hardware, dml::execution_interface<dml::hardware, std::allocator<unsigned char> > > (30,983,963 samples, 0.29%) - +__GI_munmap (631,219,928 samples, 3.89%) +__GI.. -__fput (2,475,815 samples, 0.02%) - +scheduler_tick (7,602,506 samples, 0.05%) + -unmap_vmas (2,592,830 samples, 0.02%) - +check_preemption_disabled (21,640,909 samples, 0.13%) + -do_dentry_open (1,013,775 samples, 0.01%) - +pmd_page_vaddr (1,381,985 samples, 0.01%) + -asm_exc_page_fault (1,717,471 samples, 0.02%) - +_raw_spin_lock_irqsave (1,728,173 samples, 0.01%) + -perf_iterate_ctx (11,662,927 samples, 0.11%) - +perf_event_task_tick (5,355,090 samples, 0.03%) + -free_unref_page (9,497,058 samples, 0.09%) - +entry_SYSCALL_64_after_hwframe (6,619,563 samples, 0.04%) + -mod_lruvec_page_state.constprop.0 (1,728,266 samples, 0.02%) - +__sysvec_apic_timer_interrupt (2,245,481 samples, 0.01%) + -__list_del_entry_valid (2,986,041 samples, 0.03%) - +exc_page_fault (3,976,510 samples, 0.02%) + -exc_page_fault (1,717,471 samples, 0.02%) - +__rcu_read_unlock (2,983,890 samples, 0.02%) + -sysvec_apic_timer_interrupt (2,180,552 samples, 0.02%) - +__irqentry_text_end (8,888,592 samples, 0.05%) + -__libc_open64 (1,013,775 samples, 0.01%) - +get_page_from_freelist (364,537,587 samples, 2.25%) +g.. -entry_SYSCALL_64_after_hwframe (1,412,403 samples, 0.01%) - +__x64_sys_openat (6,619,563 samples, 0.04%) + -do_mprotect_pkey (12,999,915 samples, 0.12%) - +__rcu_read_unlock (6,528,679 samples, 0.04%) + -free_unref_page_prepare (22,481,129 samples, 0.21%) - +perf_adjust_freq_unthr_context (2,245,481 samples, 0.01%) + -chrdev_open (1,013,775 samples, 0.01%) - +should_fail_alloc_page (1,906,805 samples, 0.01%) + -asm_exc_page_fault (1,852,943,584 samples, 17.07%) -asm_exc_page_fault +perf_event_mmap (5,865,007 samples, 0.04%) + -do_syscall_64 (124,499,915 samples, 1.15%) - +charge_memcg (760,371,765 samples, 4.69%) +charg.. -exc_page_fault (1,316,699,581 samples, 12.13%) -exc_page_fault +folio_mapping (8,465,905 samples, 0.05%) + -memcg_check_events (1,812,415 samples, 0.02%) - +__x64_sys_openat (10,343,181 samples, 0.06%) + -intel_invalidate_range (37,178,741 samples, 0.34%) - +check_preemption_disabled (1,728,842 samples, 0.01%) + -do_syscall_64 (3,456,757 samples, 0.03%) - +try_charge_memcg (114,897,606 samples, 0.71%) + -qi_flush_piotlb (14,767,685 samples, 0.14%) - +[unknown] (12,117,966 samples, 0.07%) + -dml::detail::ml::task<std::allocator<unsigned char> >::task (30,229,702 samples, 0.28%) - +alloc_empty_file (1,521,361 samples, 0.01%) + -check_preemption_disabled (1,474,772 samples, 0.01%) - +__this_cpu_preempt_check (1,731,498 samples, 0.01%) + -asm_sysvec_apic_timer_interrupt (2,241,589 samples, 0.02%) - +scheduler_tick (2,278,320 samples, 0.01%) + -ksys_read (10,850,783 samples, 0.10%) - +__list_del_entry_valid (4,309,390 samples, 0.03%) + -folio_add_lru (1,728,947 samples, 0.02%) - +perf_adjust_freq_unthr_context (1,574,246 samples, 0.01%) + -accfg_get_param_long (5,596,223 samples, 0.05%) - +asm_sysvec_apic_timer_interrupt (3,109,788 samples, 0.02%) + -__mod_lruvec_state (1,728,947 samples, 0.02%) - +kernel_clone (12,965,505 samples, 0.08%) + -[libstdc++.so.6.0.32] (3,527,419,633 samples, 32.49%) -[libstdc++.so.6.0.32] +irqentry_exit_to_user_mode (62,939,871 samples, 0.39%) + -_mm512_stream_load_si512 (174,354,821 samples, 1.61%) - +sync_regs (413,796,021 samples, 2.55%) +sy.. -do_user_addr_fault (1,316,699,581 samples, 12.13%) -do_user_addr_fault +__vm_munmap (223,811,903 samples, 1.38%) + -__rmqueue_pcplist (1,232,673 samples, 0.01%) - +do_syscall_64 (7,285,314 samples, 0.04%) + -entry_SYSCALL_64_after_hwframe (3,382,035 samples, 0.03%) - +vscnprintf (3,234,164 samples, 0.02%) + -__GI___getdelim (30,878,762 samples, 0.28%) - +QDPBench (16,206,959,562 samples, 99.99%) +QDPBench -tick_sched_timer (1,365,948 samples, 0.01%) - +syscall (4,322,528 samples, 0.03%) + -entry_SYSCALL_64_after_hwframe (3,340,721 samples, 0.03%) - +mas_wr_modify (1,611,669 samples, 0.01%) + -__x64_sys_futex (1,709,662 samples, 0.02%) - +lru_gen_add_folio (57,788,644 samples, 0.36%) + -__folio_alloc (2,215,907 samples, 0.02%) - +_raw_spin_unlock (9,345,492 samples, 0.06%) + -std::thread& std::vector<std::thread, std::allocator<std::thread> >::emplace_back<void (2,576,245 samples, 0.02%) - +__sysvec_apic_timer_interrupt (8,465,801 samples, 0.05%) + -link_path_walk.part.0.constprop.0 (4,734,613 samples, 0.04%) - +do_anonymous_page (2,190,520,220 samples, 13.52%) +do_anonymous_page -vma_merge (2,577,034 samples, 0.02%) - +preempt_count_sub (1,727,550 samples, 0.01%) + -qi_flush_piotlb (5,274,943 samples, 0.05%) - +__alloc_pages (3,459,598 samples, 0.02%) + -do_syscall_64 (1,665,609 samples, 0.02%) - +__list_del_entry_valid (7,949,489 samples, 0.05%) + -down_read_trylock (1,616,803 samples, 0.01%) - +asm_sysvec_apic_timer_interrupt (5,887,488 samples, 0.04%) + -std::thread::thread<void (2,576,245 samples, 0.02%) - +entry_SYSCALL_64_after_hwframe (3,042,426 samples, 0.02%) + -_raw_spin_lock (1,729,481 samples, 0.02%) - +check_preemption_disabled (6,052,507 samples, 0.04%) + -clear_page_erms (3,102,402 samples, 0.03%) - +__this_cpu_preempt_check (5,760,224 samples, 0.04%) + -__hrtimer_run_queues (1,300,420 samples, 0.01%) - +Aggregation<unsigned long, Sum, (1,313,451,843 samples, 8.10%) +Aggregation.. -node_read_meminfo (6,597,170 samples, 0.06%) - +update_process_times (10,360,017 samples, 0.06%) + -kmem_cache_alloc_node (2,596,627 samples, 0.02%) - +__hrtimer_run_queues (5,355,090 samples, 0.03%) + -device_add (1,013,775 samples, 0.01%) - +__rcu_read_unlock (5,184,321 samples, 0.03%) + -numa_node_size64 (49,206,680 samples, 0.45%) - +__GI_munmap (223,811,903 samples, 1.38%) + -mmap_region (20,376,546 samples, 0.19%) - +check_preemption_disabled (1,386,303 samples, 0.01%) + -__GI___libc_malloc (18,102,965 samples, 0.17%) - +__list_del_entry_valid (11,336,378 samples, 0.07%) + -syscall_exit_to_user_mode (4,089,240 samples, 0.04%) - +sysfs_emit_at (3,234,164 samples, 0.02%) + -__hrtimer_run_queues (1,365,948 samples, 0.01%) - +vm_normal_page (4,316,877 samples, 0.03%) + -clear_page_erms (1,701,012 samples, 0.02%) - +__list_add_valid (3,449,886 samples, 0.02%) + -inherit_event.isra.0 (6,922,986 samples, 0.06%) - +__bitmap_intersects (24,387,328 samples, 0.15%) + -do_user_addr_fault (1,717,471 samples, 0.02%) - +__sysvec_apic_timer_interrupt (2,246,370 samples, 0.01%) + -__alloc_pages (1,508,595,053 samples, 13.89%) -__alloc_pages +sysfs_kf_seq_show (6,809,146 samples, 0.04%) + -__vm_munmap (16,406,617 samples, 0.15%) - +unmap_vmas (201,189,251 samples, 1.24%) + -dsacache::CacheData::Deallocate (124,499,915 samples, 1.15%) - +__alloc_pages (183,731,242 samples, 1.13%) + -__mod_node_page_state (1,728,266 samples, 0.02%) - +__libc_open64 (10,343,181 samples, 0.06%) + -get_page_from_freelist (2,898,882 samples, 0.03%) - +rcu_core (1,379,377 samples, 0.01%) + -__mmu_notifier_invalidate_range_end (10,596,312 samples, 0.10%) - +preempt_count_add (4,794,004 samples, 0.03%) + -memcg_slab_post_alloc_hook (2,149,175 samples, 0.02%) - +up_read (16,620,144 samples, 0.10%) + -page_remove_rmap (1,729,439 samples, 0.02%) - +do_filp_open (6,619,563 samples, 0.04%) + -__pthread_clockjoin_ex (1,709,662 samples, 0.02%) - +qi_flush_dev_iotlb_pasid (4,322,030 samples, 0.03%) + -path_openat (1,014,603 samples, 0.01%) - +qi_flush_piotlb (20,054,794 samples, 0.12%) + -do_syscall_64 (1,412,403 samples, 0.01%) - +irqentry_enter (3,604,921 samples, 0.02%) + -kernel_clone (6,922,986 samples, 0.06%) - +entry_SYSCALL_64_after_hwframe (7,285,314 samples, 0.04%) + -__kmem_cache_alloc_node (1,664,645 samples, 0.02%) - +asm_sysvec_apic_timer_interrupt (2,991,599 samples, 0.02%) + -QDPBench (10,857,675,450 samples, 100.00%) -QDPBench +access_error (4,323,828 samples, 0.03%) + -sysfs_emit_at (4,018,619 samples, 0.04%) - +do_vmi_align_munmap (223,811,903 samples, 1.38%) + -__x64_sys_munmap (16,406,617 samples, 0.15%) - +sysvec_apic_timer_interrupt (9,329,419 samples, 0.06%) + -mbind_range (2,522,606 samples, 0.02%) - +__GI___libc_read (10,554,047 samples, 0.07%) + -unmap_page_range (2,592,830 samples, 0.02%) - +pud_val (5,676,206 samples, 0.04%) + -dsacache::CacheData::~CacheData (124,499,915 samples, 1.15%) - +__list_add_valid (4,309,404 samples, 0.03%) + -scan_b (1,479,617,976 samples, 13.63%) -scan_b +preempt_count_add (6,397,320 samples, 0.04%) + -__folio_alloc (2,898,882 samples, 0.03%) - +free_swap_cache (3,456,165 samples, 0.02%) + -do_sys_openat2 (7,832,406 samples, 0.07%) - +debug_smp_processor_id (2,591,959 samples, 0.02%) + -qi_submit_sync (25,935,644 samples, 0.24%) - +sysvec_apic_timer_interrupt (1,727,237 samples, 0.01%) + -_raw_spin_lock (1,728,713 samples, 0.02%) - +irqentry_exit (4,836,719 samples, 0.03%) + -__alloc_pages (867,087,699 samples, 7.99%) -__alloc_pages +seq_read_iter (9,400,040 samples, 0.06%) + -hrtimer_interrupt (8,995,452 samples, 0.08%) - +__mod_zone_page_state (23,323,934 samples, 0.14%) + -__GI_mprotect (29,370,212 samples, 0.27%) - +check_preemption_disabled (12,963,237 samples, 0.08%) + -sysvec_apic_timer_interrupt (2,241,589 samples, 0.02%) - +perf_event_task_tick (9,675,240 samples, 0.06%) + -__GI__IO_file_doallocate (19,515,368 samples, 0.18%) - +Sum<unsigned long>::simd_agg (354,247,613 samples, 2.19%) +S.. -inode_permission (2,233,658 samples, 0.02%) - +__rcu_read_lock (1,904,837 samples, 0.01%) + -copy_process (6,922,986 samples, 0.06%) - +mtree_range_walk (34,877,092 samples, 0.22%) + -vscnprintf (4,018,619 samples, 0.04%) - +aggr_j (1,314,752,767 samples, 8.11%) +aggr_j -__GI___close (1,005,518 samples, 0.01%) - +free_swap_cache (1,729,335 samples, 0.01%) + -__GI___libc_read (11,363,394 samples, 0.10%) - +idxd_cdev_release (1,664,053 samples, 0.01%) + -__GI_madvise (3,340,721 samples, 0.03%) - +update_process_times (5,355,090 samples, 0.03%) + -__libc_open64 (7,832,406 samples, 0.07%) - +__this_cpu_preempt_check (4,683,300 samples, 0.03%) + -handle_mm_fault (7,222,744 samples, 0.07%) - +mmap_region (25,499,134 samples, 0.16%) + -__kmalloc_node (1,664,645 samples, 0.02%) - +__mod_memcg_lruvec_state (10,718,577 samples, 0.07%) + -__vm_munmap (124,499,915 samples, 1.15%) - +inherit_task_group.isra.0 (11,236,456 samples, 0.07%) + -sysmalloc (29,370,212 samples, 0.27%) - +update_process_times (2,246,370 samples, 0.01%) + -__rmqueue_pcplist (6,972,673 samples, 0.06%) - +do_user_addr_fault (3,976,510 samples, 0.02%) + -unmap_region (121,905,385 samples, 1.12%) - +free_pages_and_swap_cache (1,729,335 samples, 0.01%) + -grow_heap (29,370,212 samples, 0.27%) - +tick_sched_handle (2,246,370 samples, 0.01%) + -allocate_stack (2,576,245 samples, 0.02%) - +sysvec_apic_timer_interrupt (12,664,791 samples, 0.08%) + -__GI_munmap (124,499,915 samples, 1.15%) - +__get_free_pages (1,710,021 samples, 0.01%) + -qi_submit_sync (2,478,462 samples, 0.02%) - +debug_smp_processor_id (1,729,538 samples, 0.01%) + -__futex_abstimed_wait_common (1,709,662 samples, 0.02%) - +charge_memcg (1,653,189,141 samples, 10.20%) +charge_memcg -exc_page_fault (7,222,744 samples, 0.07%) - +__hrtimer_run_queues (2,893,175 samples, 0.02%) + -_mm512_mask_add_epi64 (407,977,039 samples, 3.76%) -_mm5.. +do_anonymous_page (9,297,301 samples, 0.06%) + -do_mmap (21,476,337 samples, 0.20%) - +__handle_mm_fault (3,976,510 samples, 0.02%) + -dsacache::Cache::Access (1,478,760,036 samples, 13.62%) -dsacache::Cache::Acc.. +tlb_batch_pages_flush (144,307,316 samples, 0.89%) + -__mem_cgroup_charge (8,853,813 samples, 0.08%) - +do_syscall_64 (4,322,528 samples, 0.03%) + -do_syscall_64 (1,013,775 samples, 0.01%) - +perf_event_task_tick (2,246,370 samples, 0.01%) + -do_vmi_align_munmap (16,406,617 samples, 0.15%) - +scheduler_tick (2,893,175 samples, 0.02%) + -accfg_device_get_first (1,369,844 samples, 0.01%) - +tick_sched_handle (2,063,358 samples, 0.01%) + -perf_event_task_tick (1,365,948 samples, 0.01%) - +intel_invalidate_range (39,887,334 samples, 0.25%) + -__GI__IO_file_open (7,832,406 samples, 0.07%) - +scheduler_tick (2,245,481 samples, 0.01%) + -internal_get_user_pages_fast (2,235,330 samples, 0.02%) - +__list_add_valid (1,385,651 samples, 0.01%) + -dsacache::Cache::Clear (124,499,915 samples, 1.15%) - +qi_submit_sync (20,054,794 samples, 0.12%) + -lru_add_fn (3,945,551 samples, 0.04%) - +get_page_from_freelist (1,710,021 samples, 0.01%) + -do_syscall_64 (957,900 samples, 0.01%) - +memcg_account_kmem (1,383,928 samples, 0.01%) + -entry_SYSCALL_64_after_hwframe (1,014,603 samples, 0.01%) - +__rcu_read_lock (2,593,786 samples, 0.02%) + -inherit_task_group.isra.0 (6,922,986 samples, 0.06%) - +copy_process (12,965,505 samples, 0.08%) + -release_pages (29,397,390 samples, 0.27%) - +__mod_memcg_state (1,729,751 samples, 0.01%) + -void std::destroy_at<std::pair<unsigned char* const, dsacache::CacheData> > (124,499,915 samples, 1.15%) - +task_work_run (1,526,525 samples, 0.01%) + -hrtimer_interrupt (1,365,948 samples, 0.01%) - +scheduler_tick (10,360,017 samples, 0.06%) + -do_syscall_64 (23,194,745 samples, 0.21%) - +check_preemption_disabled (9,484,188 samples, 0.06%) + -vma_merge (2,522,606 samples, 0.02%) - +do_syscall_64 (47,131,812 samples, 0.29%) + -unsigned int std::uniform_int_distribution<unsigned long>::_S_nd<unsigned long, std::mersenne_twister_engine<unsigned long, 32ul, 624ul, 397ul, 31ul, 2567483615ul, 11ul, 4294967295ul, 7ul, 2636928640ul, 15ul, 4022730752ul, 18ul, 1812433253ul>, unsigned int> (1,707,102,197 samples, 15.72%) -unsigned int std::unifor.. +folio_add_new_anon_rmap (155,498,365 samples, 0.96%) + -do_vmi_align_munmap (124,499,915 samples, 1.15%) - +__do_sys_clone3 (12,965,505 samples, 0.08%) + -kernfs_iop_permission (1,719,405 samples, 0.02%) - +__kmem_cache_alloc_node (1,726,629 samples, 0.01%) + -unmap_page_range (5,187,701 samples, 0.05%) - +lru_add_fn (239,656,735 samples, 1.48%) + -devices_init (1,369,844 samples, 0.01%) - +__get_vma_policy (2,956,261 samples, 0.02%) + -tick_sched_handle (1,365,948 samples, 0.01%) - +__mod_zone_page_state (6,900,606 samples, 0.04%) + -unsigned long std::uniform_int_distribution<unsigned long>::operator (2,651,695,239 samples, 24.42%) -unsigned long std::uniform_int_distrib.. +do_mmap (25,499,134 samples, 0.16%) + -dsacache::Cache::SubmitTask (1,474,554,916 samples, 13.58%) -dsacache::Cache::Sub.. +check_preemption_disabled (6,047,369 samples, 0.04%) + -__mmu_notifier_invalidate_range (37,178,741 samples, 0.34%) - +link_path_walk.part.0.constprop.0 (4,837,854 samples, 0.03%) + -do_syscall_64 (4,816,807 samples, 0.04%) - +_raw_spin_lock_irqsave (1,374,549 samples, 0.01%) + -number (1,718,765 samples, 0.02%) - +__hrtimer_run_queues (10,360,017 samples, 0.06%) + -__GI___close_nocancel (4,816,807 samples, 0.04%) - +preempt_count_sub (3,617,185 samples, 0.02%) + -__x64_sys_openat (7,832,406 samples, 0.07%) - +dsacache::Cache::AllocOnNode (4,643,768,628 samples, 28.65%) +dsacache::Cache::AllocOnNode -__alloc_pages (2,215,907 samples, 0.02%) - +_raw_spin_lock_irqsave (7,950,760 samples, 0.05%) + -do_filp_open (7,021,877 samples, 0.06%) - +all (16,207,832,029 samples, 100%) + -aggr_j (1,283,482,019 samples, 11.82%) -aggr_j +__memcg_kmem_charge_page (1,902,465 samples, 0.01%) + -format_decode (1,657,716 samples, 0.02%) - +__count_memcg_events (24,740,787 samples, 0.15%) + -std::mersenne_twister_engine<unsigned long, 32ul, 624ul, 397ul, 31ul, 2567483615ul, 11ul, 4294967295ul, 7ul, 2636928640ul, 15ul, 4022730752ul, 18ul, 1812433253ul>::operator (990,880,606 samples, 9.13%) -std::mersenne.. +clear_page_erms (44,854,476 samples, 0.28%) + -update_process_times (1,300,420 samples, 0.01%) - +__mod_zone_page_state (2,246,759 samples, 0.01%) + -hrtimer_interrupt (2,020,732 samples, 0.02%) - +_raw_spin_lock (1,471,343 samples, 0.01%) + -futex_wait (1,709,662 samples, 0.02%) - +__GI_mprotect (48,514,489 samples, 0.30%) + -uncharge_batch (1,727,729 samples, 0.02%) - +inc_mm_counter (28,550,483 samples, 0.18%) + -dml::core::dispatcher::hw_device::initialize_new_device (10,649,925 samples, 0.10%) - +__count_memcg_events (576,028,915 samples, 3.55%) +__c.. -intel_invalidate_range (49,276,701 samples, 0.45%) - +lru_gen_add_folio (174,186,514 samples, 1.07%) + -exit_to_user_mode_prepare (1,526,259 samples, 0.01%) - +check_preemption_disabled (3,458,836 samples, 0.02%) + -std::thread::join (1,709,662 samples, 0.02%) - +preempt_count_sub (5,398,063 samples, 0.03%) + -lru_gen_add_folio (3,945,551 samples, 0.04%) - +sync_regs (177,790,295 samples, 1.10%) + -dml::core::dispatcher::hw_dispatcher::initialize_hw (12,436,625 samples, 0.11%) - +error_entry (21,589,852 samples, 0.13%) + -try_grab_folio (1,464,761 samples, 0.01%) - +mbind_range (2,699,413 samples, 0.02%) + -check_preemption_disabled (974,903 samples, 0.01%) - +unmap_region (223,811,903 samples, 1.38%) + -accfg_get_param_str (2,020,121 samples, 0.02%) - +do_anonymous_page (3,976,510 samples, 0.02%) + -main (6,713,260,491 samples, 61.83%) -main +[[heap]] (1,729,927 samples, 0.01%) + -change_protection (21,306,971 samples, 0.20%) - +asm_sysvec_apic_timer_interrupt (2,620,554 samples, 0.02%) + -qi_submit_sync (18,156,520 samples, 0.17%) - +asm_exc_page_fault (3,976,510 samples, 0.02%) + -preempt_count_add (1,729,481 samples, 0.02%) - +hrtimer_interrupt (2,063,358 samples, 0.01%) + -tlb_batch_pages_flush (13,813,787 samples, 0.13%) - +entry_SYSCALL_64_after_hwframe (47,131,812 samples, 0.29%) + -numa_node_of_cpu (1,719,530 samples, 0.02%) - +folio_add_lru (158,132,049 samples, 0.98%) + -__hrtimer_run_queues (8,995,452 samples, 0.08%) - +asm_exc_page_fault (4,023,289,231 samples, 24.82%) +asm_exc_page_fault -free_tail_page_prepare (5,179,307 samples, 0.05%) - +__this_cpu_preempt_check (1,726,873 samples, 0.01%) + -__fput (1,005,518 samples, 0.01%) - +sysvec_apic_timer_interrupt (2,246,370 samples, 0.01%) + -__x64_sys_madvise (3,340,721 samples, 0.03%) - +alloc_empty_file (1,548,099 samples, 0.01%) + -lock_vma_under_rcu (2,662,357 samples, 0.02%) - +__x64_sys_munmap (631,219,928 samples, 3.89%) +__x6.. -std::_Hashtable<unsigned char*, std::pair<unsigned char* const, dsacache::CacheData>, std::allocator<std::pair<unsigned char* const, dsacache::CacheData> >, std::__detail::_Select1st, std::equal_to<unsigned char*>, std::hash<unsigned char*>, std::__detail::_Mod_range_hashing, std::__detail::_Default_ranged_hash, std::__detail::_Prime_rehash_policy, std::__detail::_Hashtable_traits<false, false, true> >::clear (124,499,915 samples, 1.15%) - +_raw_spin_trylock (18,163,797 samples, 0.11%) + -path_openat (2,028,052 samples, 0.02%) - +exit_to_user_mode_prepare (1,664,053 samples, 0.01%) + -dsacache::Cache::ExecuteCopy (44,280,626 samples, 0.41%) - +sysvec_apic_timer_interrupt (5,887,488 samples, 0.04%) + -std::mersenne_twister_engine<unsigned long, 32ul, 624ul, 397ul, 31ul, 2567483615ul, 11ul, 4294967295ul, 7ul, 2636928640ul, 15ul, 4022730752ul, 18ul, 1812433253ul>::operator (596,422,567 samples, 5.49%) -std::me.. +intel_invalidate_range (41,443,691 samples, 0.26%) + -do_syscall_64 (10,850,783 samples, 0.10%) - +getname_flags.part.0 (1,895,237 samples, 0.01%) + -sysfs_kf_seq_show (6,597,170 samples, 0.06%) - +asm_exc_page_fault (2,936,586,182 samples, 18.12%) +asm_exc_page_fault -entry_SYSCALL_64_after_hwframe (1,665,609 samples, 0.02%) - +check_preemption_disabled (77,177,405 samples, 0.48%) + -__pthread_create_2_1 (2,576,245 samples, 0.02%) - +tick_sched_handle (10,360,017 samples, 0.06%) + -asm_exc_page_fault (7,813,295 samples, 0.07%) - +try_charge_memcg (2,593,139 samples, 0.02%) + -accfg_get_param_long (1,927,699 samples, 0.02%) - +perf_adjust_freq_unthr_context (2,278,320 samples, 0.01%) + -get_page_from_freelist (1,232,673 samples, 0.01%) - +cgroup_rstat_updated (1,903,621 samples, 0.01%) + -change_protection (10,596,312 samples, 0.10%) - +preempt_count_add (2,425,287 samples, 0.01%) + -__fput (1,014,019 samples, 0.01%) - +scheduler_tick (5,355,090 samples, 0.03%) + -mprotect_fixup (12,141,289 samples, 0.11%) - +do_syscall_64 (2,526,127 samples, 0.02%) + -qi_submit_sync (23,341,057 samples, 0.21%) - +__list_add_valid (1,730,109 samples, 0.01%) + -free_tail_page_prepare (17,289,659 samples, 0.16%) - +x86_pmu_event_init (2,593,062 samples, 0.02%) + -vfs_read (10,850,783 samples, 0.10%) - +__hrtimer_run_queues (2,162,393 samples, 0.01%) + -std::pair<unsigned char* const, dsacache::CacheData>::~pair (124,499,915 samples, 1.15%) - +__bitmap_intersects (14,543,038 samples, 0.09%) + -mem_cgroup_charge_statistics (1,608,803 samples, 0.01%) - +memcg_check_events (642,670,660 samples, 3.97%) +memc.. -do_vmi_munmap (124,499,915 samples, 1.15%) - +free_unref_page_commit (19,858,618 samples, 0.12%) + -__count_memcg_events (1,834,351 samples, 0.02%) - +check_preemption_disabled (4,836,501 samples, 0.03%) + -all (10,857,675,452 samples, 100%) - +free_pcppages_bulk (94,989,678 samples, 0.59%) + -scan_a (764,319,638 samples, 7.04%) -scan_a +access_error (7,347,830 samples, 0.05%) + -entry_SYSCALL_64_after_hwframe (3,456,757 samples, 0.03%) - +[libstdc++.so.6.0.32] (6,716,810,165 samples, 41.44%) +[libstdc++.so.6.0.32] -update_process_times (8,995,452 samples, 0.08%) - +__this_cpu_preempt_check (4,321,815 samples, 0.03%) + -__sysvec_apic_timer_interrupt (2,020,732 samples, 0.02%) - +__rcu_read_lock (2,756,901 samples, 0.02%) + -__mmu_notifier_invalidate_range_end (49,276,701 samples, 0.45%) - +__mod_lruvec_state (30,240,095 samples, 0.19%) + -__mod_lruvec_state (1,246,575 samples, 0.01%) - +sysfs_emit_at (1,728,036 samples, 0.01%) + -clear_page_erms (312,006,524 samples, 2.87%) -cl.. +p4d_offset (3,678,345 samples, 0.02%) + -clear_page_erms (683,869,034 samples, 6.30%) -clear_pa.. +mas_wr_node_store (1,611,669 samples, 0.01%) + -entry_SYSCALL_64_after_hwframe (12,999,915 samples, 0.12%) - +perf_event_alloc (9,508,489 samples, 0.06%) + -clear_page_erms (370,773,520 samples, 3.41%) -cle.. +__x64_sys_munmap (223,811,903 samples, 1.38%) + -entry_SYSCALL_64_after_hwframe (1,013,775 samples, 0.01%) - +__count_memcg_events (55,586,950 samples, 0.34%) + -_raw_spin_lock_irqsave (1,728,447 samples, 0.02%) - +perf_event_task_tick (2,063,358 samples, 0.01%) + -__cond_resched (5,709,094 samples, 0.05%) - +__vm_munmap (631,219,928 samples, 3.89%) +__vm.. -_IO_new_file_underflow (30,878,762 samples, 0.28%) - +preempt_count_add (3,288,567 samples, 0.02%) + -do_user_addr_fault (1,852,943,584 samples, 17.07%) -do_user_addr_fault +__folio_alloc (184,596,394 samples, 1.14%) + -[unknown] (4,194,714 samples, 0.04%) - +__this_cpu_preempt_check (12,272,089 samples, 0.08%) + -vma_alloc_folio (1,509,460,438 samples, 13.90%) -vma_alloc_folio +sysmalloc (3,976,510 samples, 0.02%) + -task_work_run (1,005,518 samples, 0.01%) - +perf_event_init_task (11,236,456 samples, 0.07%) + -vsnprintf (4,018,619 samples, 0.04%) - +free_unref_page_list (52,679,292 samples, 0.33%) + -do_filp_open (2,028,052 samples, 0.02%) - +__x64_sys_madvise (2,414,556 samples, 0.01%) + -task_mm_cid_work (1,726,993 samples, 0.02%) - +_raw_spin_lock (15,235,294 samples, 0.09%) + -__sysvec_apic_timer_interrupt (1,365,948 samples, 0.01%) - +__this_cpu_preempt_check (5,176,773 samples, 0.03%) + -do_syscall_64 (29,370,212 samples, 0.27%) - +unmap_page_range (222,087,207 samples, 1.37%) + -exit_to_user_mode_prepare (1,726,993 samples, 0.02%) - +pfn_pte (3,458,350 samples, 0.02%) + -do_filp_open (1,014,603 samples, 0.01%) - +vm_normal_page (4,324,302 samples, 0.03%) + -numa_node_of_cpu (1,530,542 samples, 0.01%) - +__mod_lruvec_state (4,158,167 samples, 0.03%) + -entry_SYSCALL_64_after_hwframe (10,850,783 samples, 0.10%) - +__rcu_read_unlock (2,940,300 samples, 0.02%) + -__x64_sys_openat (1,014,603 samples, 0.01%) - +get_mem_cgroup_from_mm (58,724,220 samples, 0.36%) + -tick_sched_handle (8,995,452 samples, 0.08%) - +down_write (1,729,175 samples, 0.01%) + -qi_flush_dev_iotlb_pasid (23,341,057 samples, 0.21%) - +mas_walk (46,004,269 samples, 0.28%) + -free_unref_page (22,481,129 samples, 0.21%) - +handle_mm_fault (3,976,510 samples, 0.02%) + -__cond_resched (6,573,644 samples, 0.06%) - +preempt_count_sub (2,753,956 samples, 0.02%) + -std::allocator<dml::detail::ml::utils::structure_from<dml::detail::descriptor, dml::detail::completion_record> >::allocate (30,229,702 samples, 0.28%) - +check_preemption_disabled (3,112,802 samples, 0.02%) + -call_init (1,196,824 samples, 0.01%) - +do_syscall_64 (6,619,563 samples, 0.04%) + -__mod_lruvec_page_state (1,728,266 samples, 0.02%) - +kernel_mbind (7,285,314 samples, 0.04%) + -charge_memcg (4,949,036 samples, 0.05%) - +std::mersenne_twister_engine<unsigned long, 32ul, 624ul, 397ul, 31ul, 2567483615ul, 11ul, 4294967295ul, 7ul, 2636928640ul, 15ul, 4022730752ul, 18ul, 1812433253ul>::operator (577,343,172 samples, 3.56%) +std.. -wqs_init (8,620,835 samples, 0.08%) - +std::mersenne_twister_engine<unsigned long, 32ul, 624ul, 397ul, 31ul, 2567483615ul, 11ul, 4294967295ul, 7ul, 2636928640ul, 15ul, 4022730752ul, 18ul, 1812433253ul>::_M_gen_rand (452,955,873 samples, 2.79%) +st.. -__rmqueue_pcplist (26,751,206 samples, 0.25%) - +perf_event_task_tick (2,283,316 samples, 0.01%) + -zap_huge_pmd (3,457,292 samples, 0.03%) - +__rcu_read_lock (3,194,875 samples, 0.02%) + -scheduler_tick (1,365,948 samples, 0.01%) - +charge_memcg (3,112,277 samples, 0.02%) + -folio_add_lru (2,701,975 samples, 0.02%) - +preempt_count_add (11,074,593 samples, 0.07%) + -__handle_mm_fault (7,222,744 samples, 0.07%) - +__list_add_valid (2,423,562 samples, 0.01%) + -perf_iterate_ctx (5,486,207 samples, 0.05%) - +__tlb_remove_page_size (1,728,884 samples, 0.01%) + -perf_event_mmap (1,544,977 samples, 0.01%) - +lru_add_fn (85,654,057 samples, 0.53%) + -sync_regs (4,312,756 samples, 0.04%) - +page_counter_try_charge (21,586,297 samples, 0.13%) + -void fill_mt<unsigned long> (4,943,244,832 samples, 45.53%) -void fill_mt<unsigned long> +__mod_zone_page_state (11,241,303 samples, 0.07%) + -path_openat (7,021,877 samples, 0.06%) - +irqentry_enter (6,704,632 samples, 0.04%) + -__GI__IO_doallocbuf (19,515,368 samples, 0.18%) - +_raw_spin_unlock_irqrestore (3,973,456 samples, 0.02%) + -unsigned int std::uniform_int_distribution<unsigned long>::_S_nd<unsigned long, std::mersenne_twister_engine<unsigned long, 32ul, 624ul, 397ul, 31ul, 2567483615ul, 11ul, 4294967295ul, 7ul, 2636928640ul, 15ul, 4022730752ul, 18ul, 1812433253ul>, unsigned int> (596,422,567 samples, 5.49%) -unsigne.. +entry_SYSCALL_64_after_hwframe (10,264,737 samples, 0.06%) + -entry_SYSCALL_64_after_hwframe (2,038,073 samples, 0.02%) - +free_pcppages_bulk (33,679,763 samples, 0.21%) + -free_compound_page (1,727,729 samples, 0.02%) - +_raw_spin_lock_irqsave (1,904,959 samples, 0.01%) + -sysvec_apic_timer_interrupt (8,995,452 samples, 0.08%) - +debug_smp_processor_id (1,729,254 samples, 0.01%) + -security_vm_enough_memory_mm (1,591,769 samples, 0.01%) - +handle_mm_fault (2,421,988,931 samples, 14.94%) +handle_mm_fault -__GI_exit (2,527,297 samples, 0.02%) - +__libc_openat64 (7,131,806 samples, 0.04%) + -do_mprotect_pkey (29,370,212 samples, 0.27%) - +asm_sysvec_apic_timer_interrupt (2,728,444 samples, 0.02%) + -_IO_new_fclose (4,816,807 samples, 0.04%) - +check_preemption_disabled (3,632,125 samples, 0.02%) + -__GI___mmap64 (23,194,745 samples, 0.21%) - +sysvec_apic_timer_interrupt (2,278,320 samples, 0.01%) + -handle_mm_fault (1,852,943,584 samples, 17.07%) -handle_mm_fault +tick_sched_handle (5,355,090 samples, 0.03%) + -std::mersenne_twister_engine<unsigned long, 32ul, 624ul, 397ul, 31ul, 2567483615ul, 11ul, 4294967295ul, 7ul, 2636928640ul, 15ul, 4022730752ul, 18ul, 1812433253ul>::_M_gen_rand (426,886,794 samples, 3.93%) -std:.. +up_read (42,836,892 samples, 0.26%) + -do_sys_openat2 (1,014,603 samples, 0.01%) - +syscall_exit_to_user_mode (2,039,626 samples, 0.01%) + -__GI___fstatat64 (1,412,403 samples, 0.01%) - +__bitmap_intersects (1,384,048 samples, 0.01%) + -idxd_cdev_open (1,013,775 samples, 0.01%) - +vma_alloc_folio (570,274,722 samples, 3.52%) +vma.. -vm_mmap_pgoff (23,194,745 samples, 0.21%) - +mod_lruvec_page_state.constprop.0 (2,756,901 samples, 0.02%) + -mod_lruvec_page_state.constprop.0 (3,747,166 samples, 0.03%) - +free_unref_page_list (155,397,189 samples, 0.96%) + -__alloc_pages (2,898,882 samples, 0.03%) - +__mod_node_page_state (22,459,612 samples, 0.14%) + -groups_init (2,409,723 samples, 0.02%) - +__rcu_read_lock (1,727,825 samples, 0.01%) + -std::__detail::_Hashtable_alloc<std::allocator<std::__detail::_Hash_node<std::pair<unsigned char* const, dsacache::CacheData>, false> > >::_M_deallocate_node (124,499,915 samples, 1.15%) - +mpol_new (1,729,408 samples, 0.01%) + -_IO_new_file_fopen (8,432,767 samples, 0.08%) - +__mod_zone_page_state (11,928,541 samples, 0.07%) + -__mod_lruvec_page_state (1,710,376 samples, 0.02%) - +folio_add_new_anon_rmap (50,707,542 samples, 0.31%) + -vma_alloc_folio (2,215,907 samples, 0.02%) - +intel_invalidate_range (9,503,744 samples, 0.06%) + -clear_huge_page (396,622,667 samples, 3.65%) -clea.. +qi_flush_piotlb (5,181,714 samples, 0.03%) + -__GI_munmap (1,665,609 samples, 0.02%) - +unsigned int std::uniform_int_distribution<unsigned long>::_S_nd<unsigned long, std::mersenne_twister_engine<unsigned long, 32ul, 624ul, 397ul, 31ul, 2567483615ul, 11ul, 4294967295ul, 7ul, 2636928640ul, 15ul, 4022730752ul, 18ul, 1812433253ul>, unsigned int> (1,677,046,261 samples, 10.35%) +unsigned int st.. -_mid_memalign (30,229,702 samples, 0.28%) - +scheduler_tick (2,246,370 samples, 0.01%) + -vfs_read (957,900 samples, 0.01%) - +do_madvise (2,414,556 samples, 0.01%) + -__list_del_entry_valid (1,232,673 samples, 0.01%) - +perf_iterate_ctx (16,121,901 samples, 0.10%) + -read (1,018,420 samples, 0.01%) - +tick_sched_timer (2,245,481 samples, 0.01%) + -entry_SYSCALL_64_after_hwframe (1,005,518 samples, 0.01%) - +__split_vma (5,183,584 samples, 0.03%) + -mas_store_prealloc (1,537,267 samples, 0.01%) - +fpregs_assert_state_consistent (28,171,663 samples, 0.17%) + -void std::allocator_traits<std::allocator<std::__detail::_Hash_node<std::pair<unsigned char* const, dsacache::CacheData>, false> > >::destroy<std::pair<unsigned char* const, dsacache::CacheData> > (124,499,915 samples, 1.15%) - +__sysvec_apic_timer_interrupt (2,893,175 samples, 0.02%) + -__x64_sys_mprotect (29,370,212 samples, 0.27%) - +__sysvec_apic_timer_interrupt (2,162,393 samples, 0.01%) + -do_syscall_64 (1,005,518 samples, 0.01%) - +check_preemption_disabled (6,043,809 samples, 0.04%) + -handle_mm_fault (1,312,938,533 samples, 12.09%) -handle_mm_fault +vm_mmap_pgoff (25,499,134 samples, 0.16%) + -do_sys_openat2 (1,013,775 samples, 0.01%) - +memcg_slab_post_alloc_hook (1,548,099 samples, 0.01%) + -kmem_cache_alloc (2,149,175 samples, 0.02%) - +change_protection (39,887,334 samples, 0.25%) + -unmap_vmas (54,464,402 samples, 0.50%) - +hrtimer_interrupt (5,355,090 samples, 0.03%) + -dsacache::Cache::GetCacheNode (2,577,577 samples, 0.02%) - +__mod_node_page_state (8,645,452 samples, 0.05%) + -dsacache::Cache::Access (4,987,299 samples, 0.05%) - +folio_lruvec_lock_irqsave (1,729,327 samples, 0.01%) + -__mod_lruvec_state (1,728,266 samples, 0.02%) - +__sysvec_apic_timer_interrupt (5,355,090 samples, 0.03%) + -vfs_statx (1,412,403 samples, 0.01%) - +_raw_spin_lock (51,474,392 samples, 0.32%) + -update_process_times (1,365,948 samples, 0.01%) - +check_preemption_disabled (3,977,351 samples, 0.02%) + -folio_batch_move_lru (2,701,975 samples, 0.02%) - +__this_cpu_preempt_check (4,321,339 samples, 0.03%) + -do_syscall_64 (3,382,035 samples, 0.03%) - +do_user_addr_fault (2,373,989,107 samples, 14.65%) +do_user_addr_fault -pte_alloc_one (10,782,226 samples, 0.10%) - +__mem_cgroup_uncharge_list (6,915,224 samples, 0.04%) + -dml::detail::ml::buffer<std::allocator<unsigned char>, dml::detail::descriptor, dml::detail::completion_record>::buffer (30,229,702 samples, 0.28%) - +vfs_read (9,400,040 samples, 0.06%) + -entry_SYSCALL_64_after_hwframe (957,900 samples, 0.01%) - +__rcu_read_lock (8,296,345 samples, 0.05%) + -tlb_batch_pages_flush (29,397,390 samples, 0.27%) - +_mm512_mask_add_epi64 (354,247,613 samples, 2.19%) +_.. -__next_zones_zonelist (1,695,609 samples, 0.02%) - +lru_gen_del_folio.constprop.0 (156,312,784 samples, 0.96%) + -free_unref_page_prepare (9,497,058 samples, 0.09%) - +format_decode (2,370,200 samples, 0.01%) + -__run_exit_handlers (2,527,297 samples, 0.02%) - +vma_alloc_folio (3,120,052 samples, 0.02%) + -__x64_sys_openat (1,013,775 samples, 0.01%) - +__mod_lruvec_state (3,458,121 samples, 0.02%) + -do_mbind (3,382,035 samples, 0.03%) - +_raw_spin_trylock (1,576,484 samples, 0.01%) + -kernel_mbind (3,382,035 samples, 0.03%) - +check_preemption_disabled (6,848,033 samples, 0.04%) + -get_page_from_freelist (2,215,907 samples, 0.02%) - +qi_flush_dev_iotlb_pasid (19,100,039 samples, 0.12%) + -_IO_new_file_init_internal (1,489,012 samples, 0.01%) - +__mod_node_page_state (25,518,507 samples, 0.16%) + -__folio_alloc (1,508,595,053 samples, 13.89%) -__folio_alloc +perf_adjust_freq_unthr_context (7,602,506 samples, 0.05%) + -mbind (3,382,035 samples, 0.03%) - +void fill_mt<unsigned long> (6,081,590,595 samples, 37.52%) +void fill_mt<unsigned long> -qi_submit_sync (19,022,221 samples, 0.18%) - +get_page_from_freelist (1,557,133 samples, 0.01%) + -auto dml::detail::submit<dml::hardware, dml::mem_copy_operation, dml::execution_interface<dml::hardware, std::allocator<unsigned char> >, dml::submit<dml::hardware, dml::execution_interface<dml::hardware, std::allocator<unsigned char> > > (44,280,626 samples, 0.41%) - +preempt_count_add (8,205,165 samples, 0.05%) + -qi_flush_piotlb (25,935,644 samples, 0.24%) - +page_remove_rmap (38,029,000 samples, 0.23%) + -device_parse (8,620,835 samples, 0.08%) - +do_syscall_64 (3,042,426 samples, 0.02%) + -vma_alloc_folio (3,551,167 samples, 0.03%) - +__next_zones_zonelist (10,036,556 samples, 0.06%) + -dsacache::Cache::GetCacheNode (4,987,299 samples, 0.05%) - +cgroup_rstat_updated (4,777,645 samples, 0.03%) + -decltype (2,576,245 samples, 0.02%) - +__mod_lruvec_state (11,239,478 samples, 0.07%) + -exit_to_user_mode_prepare (4,089,240 samples, 0.04%) - +vma_merge (2,699,413 samples, 0.02%) + -qi_flush_dev_iotlb_pasid (5,321,369 samples, 0.05%) - +_mm512_stream_load_si512 (195,062,083 samples, 1.20%) + -clear_huge_page (333,454,013 samples, 3.07%) -cle.. +_raw_spin_unlock (8,129,458 samples, 0.05%) + -__count_memcg_events (1,102,429 samples, 0.01%) - +free_pages_and_swap_cache (3,456,165 samples, 0.02%) + -__sysvec_apic_timer_interrupt (8,995,452 samples, 0.08%) - +__x64_sys_get_mempolicy (4,322,528 samples, 0.03%) + -__alloc_pages (1,729,251 samples, 0.02%) - +mem_cgroup_charge_statistics (282,944,823 samples, 1.75%) + -do_syscall_64 (16,406,617 samples, 0.15%) - +__mod_lruvec_state (30,405,460 samples, 0.19%) + -do_sys_openat2 (2,028,052 samples, 0.02%) - +__GI___getdelim (1,729,911 samples, 0.01%) + -add_wq (8,112,387 samples, 0.07%) - +std::mersenne_twister_engine<unsigned long, 32ul, 624ul, 397ul, 31ul, 2567483615ul, 11ul, 4294967295ul, 7ul, 2636928640ul, 15ul, 4022730752ul, 18ul, 1812433253ul>::operator (1,001,161,895 samples, 6.18%) +std::mer.. -Filter<unsigned long, LT, (764,319,624 samples, 7.04%) -Filter<un.. +intel_invalidate_range (44,047,598 samples, 0.27%) + -lru_gen_del_folio.constprop.0 (1,729,406 samples, 0.02%) - +__mmu_notifier_invalidate_range (44,912,926 samples, 0.28%) + -__x64_sys_munmap (124,499,915 samples, 1.15%) - +policy_node (11,566,513 samples, 0.07%) + -perf_event_task_tick (8,995,452 samples, 0.08%) - +__rcu_read_unlock (1,899,272 samples, 0.01%) + -unsigned long std::uniform_int_distribution<unsigned long>::operator (596,422,567 samples, 5.49%) -unsigne.. +__this_cpu_preempt_check (3,630,476 samples, 0.02%) + -__x64_sys_exit_group (1,418,159 samples, 0.01%) - +__rmqueue_pcplist (2,557,377 samples, 0.02%) + -folio_batch_move_lru (3,945,551 samples, 0.04%) - +hrtimer_interrupt (2,246,370 samples, 0.01%) + -dsacache::Cache::SubmitTask (13,296,663 samples, 0.12%) - +blk_cgroup_congested (7,785,255 samples, 0.05%) + -tick_sched_timer (1,300,420 samples, 0.01%) - +lru_gen_del_folio.constprop.0 (68,287,267 samples, 0.42%) + -std::__detail::_Hashtable_alloc<std::allocator<std::__detail::_Hash_node<std::pair<unsigned char* const, dsacache::CacheData>, false> > >::_M_deallocate_nodes (124,499,915 samples, 1.15%) - +std::unordered_map<unsigned char*, dsacache::CacheData, std::hash<unsigned char*>, std::equal_to<unsigned char*>, std::allocator<std::pair<unsigned char* const, dsacache::CacheData> > >::clear (631,219,928 samples, 3.89%) +std:.. -kernfs_seq_start (1,981,537 samples, 0.02%) - +qi_flush_dev_iotlb_pasid (23,329,066 samples, 0.14%) + -memcg_account_kmem (2,519,582 samples, 0.02%) - +entry_SYSCALL_64_after_hwframe (631,219,928 samples, 3.89%) +entr.. -folio_add_new_anon_rmap (1,710,376 samples, 0.02%) - +folio_mapping (3,117,433 samples, 0.02%) + -_int_malloc (17,243,479 samples, 0.16%) - +tick_sched_handle (2,245,481 samples, 0.01%) + -__mmu_notifier_invalidate_range_end (21,306,971 samples, 0.20%) - +clear_page_erms (88,446,554 samples, 0.55%) + -__GI___libc_read (957,900 samples, 0.01%) - +perf_adjust_freq_unthr_context (5,355,090 samples, 0.03%) + -dml::core::dispatcher::hw_queue::initialize_new_queue (2,029,090 samples, 0.02%) - +exc_page_fault (2,385,002,551 samples, 14.72%) +exc_page_fault -start_thread (3,530,760,354 samples, 32.52%) -start_thread +syscall (8,148,987 samples, 0.05%) + -__this_cpu_preempt_check (1,035,514 samples, 0.01%) - +do_syscall_64 (10,264,737 samples, 0.06%) + -perf_event_alloc (6,057,194 samples, 0.06%) - +dsacache::Cache::SubmitTask (4,644,633,394 samples, 28.66%) +dsacache::Cache::SubmitTask -unsigned long std::uniform_int_distribution<unsigned long>::operator (2,659,479,023 samples, 24.49%) -unsigned long std::uniform_int_distrib.. +hrtimer_interrupt (2,162,393 samples, 0.01%) + -__do_sys_newfstatat (1,412,403 samples, 0.01%) - +__GI_madvise (2,414,556 samples, 0.01%) + -read (957,900 samples, 0.01%) - +__fput (1,664,053 samples, 0.01%) + -do_vmi_munmap (16,406,617 samples, 0.15%) - +entry_SYSCALL_64_after_hwframe (10,343,181 samples, 0.06%) + -Vector_Loader<unsigned long, (174,354,821 samples, 1.61%) - +__mmu_notifier_invalidate_range_end (41,443,691 samples, 0.26%) + -__GI__IO_link_in (1,489,012 samples, 0.01%) - +__mem_cgroup_uncharge_list (13,828,510 samples, 0.09%) + -call_init (1,196,824 samples, 0.01%) - +__this_cpu_preempt_check (2,594,993 samples, 0.02%) + -vm_unmapped_area (1,099,791 samples, 0.01%) - +check_preemption_disabled (6,327,743 samples, 0.04%) + -devices_init (2,865,392 samples, 0.03%) - +free_pgtables (1,728,837 samples, 0.01%) + -do_syscall_64 (2,539,730 samples, 0.02%) - +__mod_memcg_lruvec_state (24,524,493 samples, 0.15%) + -asm_sysvec_apic_timer_interrupt (1,285,604 samples, 0.01%) - +__handle_mm_fault (9,811,818 samples, 0.06%) + -intel_invalidate_range (10,596,312 samples, 0.10%) - +fpregs_assert_state_consistent (6,327,743 samples, 0.04%) + -syscall_exit_to_user_mode (1,526,259 samples, 0.01%) - +vsnprintf (1,728,036 samples, 0.01%) + -tlb_finish_mmu (67,440,983 samples, 0.62%) - +release_pages (7,617,475 samples, 0.05%) + -do_syscall_64 (3,340,721 samples, 0.03%) - +entry_SYSCALL_64_after_hwframe (2,526,127 samples, 0.02%) + -_dl_init (1,196,824 samples, 0.01%) - +preempt_count_sub (1,899,511 samples, 0.01%) + -mas_wr_store_entry.isra.0 (1,730,304 samples, 0.02%) - +__alloc_pages (1,710,021 samples, 0.01%) + -qi_flush_piotlb (19,022,221 samples, 0.18%) - +mas_store_prealloc (2,476,464 samples, 0.02%) + -openat (1,014,603 samples, 0.01%) - +main (8,522,536,197 samples, 52.58%) +main -__mmu_notifier_invalidate_range_end (2,478,462 samples, 0.02%) - +pmd_val (3,328,679 samples, 0.02%) + -kernel_get_mempolicy (3,456,757 samples, 0.03%) - +pmd_install (1,728,616 samples, 0.01%) + -do_huge_pmd_anonymous_page (6,842,888 samples, 0.06%) - +numa_node_size64 (5,705,774 samples, 0.04%) + -_raw_spin_lock (2,066,301 samples, 0.02%) - +scheduler_tick (1,574,246 samples, 0.01%) + -scheduler_tick (1,256,830 samples, 0.01%) - +debug_smp_processor_id (221,057,514 samples, 1.36%) + -qi_submit_sync (5,321,369 samples, 0.05%) - +sum_check (1,809,416,252 samples, 11.16%) +sum_check -get_mem_cgroup_from_mm (3,904,777 samples, 0.04%) - +preempt_count_sub (3,048,074 samples, 0.02%) + -get_page_from_freelist (864,889,410 samples, 7.97%) -get_page_fr.. +uncharge_folio (6,915,224 samples, 0.04%) + -intel_invalidate_range (21,306,971 samples, 0.20%) - +__alloc_pages (485,198,496 samples, 2.99%) +__.. -do_syscall_64 (2,038,073 samples, 0.02%) - +__mod_node_page_state (17,247,278 samples, 0.11%) + -entry_SYSCALL_64_after_hwframe (124,499,915 samples, 1.15%) - +__mem_cgroup_charge (1,699,033,875 samples, 10.48%) +__mem_cgroup_ch.. -__alloc_pages (7,035,060 samples, 0.06%) - +__rcu_read_lock (2,245,039 samples, 0.01%) + -__page_cache_release (1,727,547 samples, 0.02%) - +entry_SYSCALL_64_after_hwframe (4,322,528 samples, 0.03%) + -__libc_openat64 (1,014,603 samples, 0.01%) - +intel_invalidate_range (2,414,556 samples, 0.01%) + -__libc_start_main_impl (6,715,787,788 samples, 61.85%) -__libc_start_main_impl +__mod_node_page_state (41,576,218 samples, 0.26%) + -do_anonymous_page (13,645,186 samples, 0.13%) - +__mod_lruvec_page_state (107,097,574 samples, 0.66%) + -path_openat (1,013,775 samples, 0.01%) - +__alloc_file (1,548,099 samples, 0.01%) + -dsacache::Cache::AllocOnNode (1,427,696,755 samples, 13.15%) -dsacache::Cache::Al.. +kernel_get_mempolicy (4,322,528 samples, 0.03%) + -accfg_wq_get_first (8,620,835 samples, 0.08%) - +__GI___close (3,042,426 samples, 0.02%) + -dml::core::hardware_device::submit (13,296,663 samples, 0.12%) - +__this_cpu_preempt_check (6,056,290 samples, 0.04%) + -do_filp_open (1,013,775 samples, 0.01%) - +asm_sysvec_apic_timer_interrupt (1,727,237 samples, 0.01%) + -up_read (1,064,042 samples, 0.01%) - +mod_memcg_state (1,383,928 samples, 0.01%) + -irqentry_exit_to_user_mode (1,726,993 samples, 0.02%) - +check_preemption_disabled (73,048,716 samples, 0.45%) + -asm_exc_page_fault (1,330,852,392 samples, 12.26%) -asm_exc_page_fault +folio_add_lru_vma (1,731,736 samples, 0.01%) + -folio_add_lru (3,945,551 samples, 0.04%) - +check_preemption_disabled (1,728,587 samples, 0.01%) + -count_memcg_events.constprop.0 (1,834,351 samples, 0.02%) - +__mod_lruvec_state (9,871,985 samples, 0.06%) + -__GI___libc_read (957,900 samples, 0.01%) +__mem_cgroup_charge (3,112,277 samples, 0.02%) + + + +check_preemption_disabled (3,440,581 samples, 0.02%) + + + +__hrtimer_run_queues (2,063,358 samples, 0.01%) + + + +tick_sched_timer (2,162,393 samples, 0.01%) + + + +__GI___libc_read (10,264,737 samples, 0.06%) + + + +__rcu_read_unlock (2,991,213 samples, 0.02%) + + + +sysvec_apic_timer_interrupt (2,186,103 samples, 0.01%) + + + +do_syscall_64 (2,414,556 samples, 0.01%) + + + +__free_one_page (82,061,399 samples, 0.51%) + + + +lock_vma_under_rcu (39,381,654 samples, 0.24%) + + + +entry_SYSCALL_64_after_hwframe (26,333,316 samples, 0.16%) + + + +__mod_lruvec_page_state (2,756,901 samples, 0.02%) + + + +try_charge_memcg (332,641,086 samples, 2.05%) +t.. + + +preempt_count_add (2,593,410 samples, 0.02%) + + + +do_vmi_align_munmap (629,492,317 samples, 3.88%) +do_v.. + + +pte_alloc_one (11,365,173 samples, 0.07%) + + + +entry_SYSCALL_64_after_hwframe (2,414,556 samples, 0.01%) + + + +cgroup_rstat_updated (1,728,929 samples, 0.01%) + + + +free_unref_page_commit (6,908,677 samples, 0.04%) + + + +__hrtimer_run_queues (2,278,320 samples, 0.01%) + + + +unsigned int std::uniform_int_distribution<unsigned long>::_S_nd<unsigned long, std::mersenne_twister_engine<unsigned long, 32ul, 624ul, 397ul, 31ul, 2567483615ul, 11ul, 4294967295ul, 7ul, 2636928640ul, 15ul, 4022730752ul, 18ul, 1812433253ul>, unsigned int> (577,343,172 samples, 3.56%) +uns.. + + +__handle_mm_fault (2,258,462,859 samples, 13.93%) +__handle_mm_fault + + +__this_cpu_preempt_check (4,313,782 samples, 0.03%) + + + +check_preemption_disabled (6,049,007 samples, 0.04%) + + + +__get_vma_policy (4,653,204 samples, 0.03%) + + + +entry_SYSCALL_64_after_hwframe (223,811,903 samples, 1.38%) + + + +qi_submit_sync (18,132,952 samples, 0.11%) + + + +exc_page_fault (12,385,269 samples, 0.08%) + + + +asm_sysvec_apic_timer_interrupt (2,245,175 samples, 0.01%) + + + +tlb_batch_pages_flush (374,748,248 samples, 2.31%) +t.. + + +error_entry (14,065,002 samples, 0.09%) + + + +tick_sched_timer (2,278,320 samples, 0.01%) + + + +__rcu_read_unlock (2,592,426 samples, 0.02%) + + + +__this_cpu_preempt_check (3,458,279 samples, 0.02%) + + + +qi_flush_piotlb (1,548,669 samples, 0.01%) + + + +preempt_count_sub (1,381,854 samples, 0.01%) + + + +do_syscall_64 (12,965,505 samples, 0.08%) + + + +hrtimer_interrupt (2,278,320 samples, 0.01%) + + + +folio_lruvec_lock_irqsave (1,904,959 samples, 0.01%) + + + +pmd_val (3,288,956 samples, 0.02%) + + + +preempt_count_add (3,627,638 samples, 0.02%) + + + +kmem_cache_alloc_node (1,728,614 samples, 0.01%) + + + +debug_smp_processor_id (10,372,104 samples, 0.06%) + + + +check_preemption_disabled (8,708,595 samples, 0.05%) + + + +get_page_from_freelist (3,422,251 samples, 0.02%) + + + +__this_cpu_preempt_check (3,425,436 samples, 0.02%) + + + +pmd_val (3,918,355 samples, 0.02%) + + + +__mod_lruvec_page_state (22,469,918 samples, 0.14%) + + + +__rcu_read_lock (1,732,716 samples, 0.01%) + + + +qi_flush_piotlb (18,114,625 samples, 0.11%) + + + +do_sys_openat2 (10,343,181 samples, 0.06%) + + + +__memcg_kmem_charge_page (5,186,021 samples, 0.03%) + + + +scan_a (751,624,882 samples, 4.64%) +scan_a + + +pte_alloc_one (5,184,340 samples, 0.03%) + + + +dev_attr_show (6,809,146 samples, 0.04%) + + + +policy_nodemask (56,949,042 samples, 0.35%) + + + +mas_store_prealloc (2,592,295 samples, 0.02%) + + + +do_mbind (7,285,314 samples, 0.04%) + + + +debug_smp_processor_id (3,973,430 samples, 0.02%) + + + +percpu_counter_add_batch (1,730,526 samples, 0.01%) + + + +__rcu_read_unlock (1,728,004 samples, 0.01%) + + + +__hrtimer_run_queues (2,245,481 samples, 0.01%) + + + +check_preemption_disabled (2,418,520 samples, 0.01%) + + + +percpu_counter_add_batch (58,295,338 samples, 0.36%) + + + +hrtimer_interrupt (11,222,797 samples, 0.07%) + + + +__rcu_read_lock (1,464,514 samples, 0.01%) + + + +memcg_check_events (324,055,059 samples, 2.00%) +m.. + + +release_pages (31,089,671 samples, 0.19%) + + + +kmem_cache_alloc (2,581,815 samples, 0.02%) + + + +perf_event_task_tick (2,278,320 samples, 0.01%) + + + +release_pages (142,577,981 samples, 0.88%) + + + +irqentry_exit (2,251,736 samples, 0.01%) + + + +pmd_page_vaddr (1,728,374 samples, 0.01%) + + + +__GI___mmap64 (26,333,316 samples, 0.16%) + + + +syscall_exit_to_user_mode (1,664,053 samples, 0.01%) + + + +check_preemption_disabled (32,527,454 samples, 0.20%) + + + +__rcu_read_unlock (1,731,608 samples, 0.01%) + + + +mas_destroy (1,727,716 samples, 0.01%) + + + +check_preemption_disabled (10,889,743 samples, 0.07%) + + + +cpuset_nodemask_valid_mems_allowed (19,900,595 samples, 0.12%) + + + +perf_try_init_event (2,593,062 samples, 0.02%) + + + +preempt_count_sub (1,729,334 samples, 0.01%) + + + +do_vmi_munmap (630,356,301 samples, 3.89%) +do_v.. + + +sysvec_apic_timer_interrupt (2,991,599 samples, 0.02%) + + + +do_mprotect_pkey (47,131,812 samples, 0.29%) + + + +start_thread (6,716,810,165 samples, 41.44%) +start_thread + + +error_entry (7,613,455 samples, 0.05%) + + + +_raw_spin_unlock (4,277,367 samples, 0.03%) + + + +unsigned long std::uniform_int_distribution<unsigned long>::operator (2,520,803,377 samples, 15.55%) +unsigned long std::unif.. + + +cgroup_rstat_updated (61,926,692 samples, 0.38%) + + + +tick_sched_handle (2,278,320 samples, 0.01%) + + + +tick_sched_timer (5,355,090 samples, 0.03%) + + + +debug_smp_processor_id (2,246,138 samples, 0.01%) + + + +kmem_cache_alloc (1,548,099 samples, 0.01%) + + + +perf_iterate_ctx (5,865,007 samples, 0.04%) + + + +irqentry_exit_to_user_mode (19,484,681 samples, 0.12%) + + + +mas_walk (14,117,731 samples, 0.09%) + + + +__mod_lruvec_state (20,706,100 samples, 0.13%) + + + +__hrtimer_run_queues (8,465,801 samples, 0.05%) + + + +perf_iterate_sb.constprop.0 (16,121,901 samples, 0.10%) + + + +do_vmi_munmap (223,811,903 samples, 1.38%) + + + +update_process_times (2,245,481 samples, 0.01%) + + + +__x64_sys_mprotect (47,131,812 samples, 0.29%) + + + +kernfs_iop_permission (1,728,057 samples, 0.01%) + + + +__mem_cgroup_charge (2,049,112 samples, 0.01%) + + + +hrtimer_interrupt (8,465,801 samples, 0.05%) + + + +__strstr_avx512 (4,322,214 samples, 0.03%) -check_preemption_disabled (1,564,788 samples, 0.01%) - +cgroup_rstat_updated (4,839,302 samples, 0.03%) + + + +do_sys_openat2 (6,619,563 samples, 0.04%) + + + +__alloc_pages (3,120,052 samples, 0.02%) + + + +__handle_mm_fault (2,305,694,402 samples, 14.23%) +__handle_mm_fault + + +qi_submit_sync (25,914,646 samples, 0.16%) + + + +check_preemption_disabled (31,051,499 samples, 0.19%) + + + +count_memcg_events.constprop.0 (65,432,651 samples, 0.40%) + + + +__rmqueue_pcplist (47,501,338 samples, 0.29%) + + + +__folio_alloc (489,765,877 samples, 3.02%) +__f.. + + +folio_batch_move_lru (312,730,145 samples, 1.93%) +f.. + + +check_preemption_disabled (111,881,835 samples, 0.69%) + + + +Filter<unsigned long, LT, (751,624,882 samples, 4.64%) +Filte.. + + +check_preemption_disabled (1,726,700 samples, 0.01%) + + + +__rmqueue_pcplist (146,774,456 samples, 0.91%) + + + +blk_cgroup_congested (23,031,269 samples, 0.14%) + + + +check_preemption_disabled (196,786,129 samples, 1.21%) + + + +asm_exc_page_fault (15,936,351 samples, 0.10%) + + + +unsigned long std::uniform_int_distribution<unsigned long>::operator (577,343,172 samples, 3.56%) +uns.. + + +asm_exc_page_fault (1,382,677 samples, 0.01%) + + + +__mod_memcg_lruvec_state (7,440,535 samples, 0.05%) + + + +unsigned long std::uniform_int_distribution<unsigned long>::operator (2,537,063,843 samples, 15.65%) +unsigned long std::unifo.. + + +do_syscall_64 (223,811,903 samples, 1.38%) + + + +clear_page_erms (1,710,021 samples, 0.01%) + + + +__rcu_read_lock (3,381,251 samples, 0.02%) + + + +vscnprintf (1,728,036 samples, 0.01%) + + + +kthread_blkcg (2,246,198 samples, 0.01%) + + + +perf_event_task_tick (7,602,506 samples, 0.05%) + + + +cgroup_rstat_updated (1,728,374 samples, 0.01%) + + + +inc_mm_counter (61,807,041 samples, 0.38%) + + + +page_remove_rmap (93,239,356 samples, 0.58%) + + + +_raw_spin_unlock (1,730,821 samples, 0.01%) + + + +tick_sched_handle (2,893,175 samples, 0.02%) + + + +__this_cpu_preempt_check (4,145,333 samples, 0.03%) + + + +qi_submit_sync (4,322,030 samples, 0.03%) + + + +__mod_node_page_state (4,158,167 samples, 0.03%) + + + +qi_submit_sync (5,181,714 samples, 0.03%) + + + +free_unref_page_prepare (22,438,221 samples, 0.14%) + + + +__tlb_remove_page_size (6,899,955 samples, 0.04%) + + + +__alloc_pages (8,608,272 samples, 0.05%) + + + +exit_to_user_mode_prepare (18,964,450 samples, 0.12%) + + + +__list_add_valid (8,611,190 samples, 0.05%) + + + +__kmalloc_node (1,726,629 samples, 0.01%) + + + +check_preemption_disabled (3,459,535 samples, 0.02%) + + + +vma_complete (2,592,295 samples, 0.02%) + + + +__this_cpu_preempt_check (32,095,349 samples, 0.20%) + + + +__list_del_entry_valid (3,459,006 samples, 0.02%) + + + +preempt_count_add (5,366,477 samples, 0.03%) + + + +unmap_region (624,308,733 samples, 3.85%) +unma.. + + +__pte_alloc (6,049,416 samples, 0.04%) + + + +__this_cpu_preempt_check (4,323,636 samples, 0.03%) + + + +debug_smp_processor_id (1,386,577 samples, 0.01%) + + + +Vector_Loader<unsigned long, (195,062,083 samples, 1.20%) + + + +__this_cpu_preempt_check (2,591,919 samples, 0.02%) + + + +preempt_count_add (8,040,132 samples, 0.05%) + + + +preempt_count_sub (1,380,697 samples, 0.01%) + + + +dsacache::Cache::Access (4,645,243,908 samples, 28.66%) +dsacache::Cache::Access + + +__mod_zone_page_state (18,795,883 samples, 0.12%) + + + +vsnprintf (3,234,164 samples, 0.02%) + + + +cgroup_rstat_updated (34,145,553 samples, 0.21%) + + + +update_process_times (2,063,358 samples, 0.01%) + + + +policy_nodemask (4,672,639 samples, 0.03%) + + + +__rcu_read_lock (5,021,773 samples, 0.03%) + + + +__libc_start_call_main (8,746,348,100 samples, 53.96%) +__libc_start_call_main + + +check_preemption_disabled (4,139,630 samples, 0.03%) + + + +perf_event_task_tick (1,574,246 samples, 0.01%) + + + +dsacache::Cache::Clear (631,219,928 samples, 3.89%) +dsac.. + + +uncharge_folio (12,963,246 samples, 0.08%) + + + +_raw_spin_lock (1,725,924 samples, 0.01%) + + + +cgroup_rstat_updated (4,485,426 samples, 0.03%) + + + +tick_sched_timer (2,893,175 samples, 0.02%) + + + +kernfs_fop_release (1,526,525 samples, 0.01%) + + + +unmap_page_range (159,745,560 samples, 0.99%) + + + +down_read_trylock (15,230,357 samples, 0.09%) + + + +mprotect_fixup (46,614,236 samples, 0.29%) + + + +pmd_pfn (5,184,907 samples, 0.03%) + + + +__mmu_notifier_invalidate_range (10,369,502 samples, 0.06%) + + + +vma_alloc_folio (204,481,337 samples, 1.26%) + + + +kmem_cache_alloc (1,729,408 samples, 0.01%) + + + +preempt_count_sub (1,731,876 samples, 0.01%) + + + +__d_lookup (2,050,788 samples, 0.01%) + + + +in_lock_functions (2,412,515 samples, 0.01%) + + + +irqentry_enter_from_user_mode (1,877,779 samples, 0.01%) + + + +__mod_memcg_lruvec_state (9,511,849 samples, 0.06%) + + + +hrtimer_interrupt (2,893,175 samples, 0.02%) + + + +__mod_memcg_lruvec_state (19,862,062 samples, 0.12%) + + + +__do_softirq (1,441,994 samples, 0.01%) + + + +get_page_from_freelist (3,120,052 samples, 0.02%) + + + +perf_adjust_freq_unthr_context (9,675,240 samples, 0.06%) + + + +scan_b (4,650,432,516 samples, 28.69%) +scan_b + + +asm_sysvec_apic_timer_interrupt (9,329,419 samples, 0.06%) + + + +__folio_throttle_swaprate (9,169,536 samples, 0.06%) + + + +get_page_from_freelist (157,592,549 samples, 0.97%) + + + +__mod_zone_page_state (14,694,578 samples, 0.09%) + + + +__sysvec_apic_timer_interrupt (2,278,320 samples, 0.01%) + + + +check_preemption_disabled (58,966,339 samples, 0.36%) + + + +check_preemption_disabled (7,777,020 samples, 0.05%) + + + +hugetlb_report_node_meminfo (1,728,036 samples, 0.01%) + + + +inherit_event.isra.0 (11,236,456 samples, 0.07%) + + + +folio_add_lru_vma (3,974,835 samples, 0.02%) + + + +_raw_spin_trylock (1,698,365 samples, 0.01%) + + + +__mod_node_page_state (9,006,170 samples, 0.06%) + + + +lookup_fast (2,050,788 samples, 0.01%) + + + +__this_cpu_preempt_check (2,771,309 samples, 0.02%) + + + +unmap_vmas (222,087,207 samples, 1.37%) + + + +tick_sched_handle (1,574,246 samples, 0.01%) + + + +sysvec_apic_timer_interrupt (2,620,554 samples, 0.02%) + -lru_gen_add_folio (2,271,523 samples, 0.02%) - +_int_malloc (2,059,139 samples, 0.01%) + -std::allocator_traits<std::allocator<dml::detail::ml::utils::structure_from<dml::detail::descriptor, dml::detail::completion_record> > >::allocate (30,229,702 samples, 0.28%) - +error_entry (11,074,932 samples, 0.07%) + -auto dml::detail::ml::make_mem_move_task<std::allocator<unsigned char> > (30,229,702 samples, 0.28%) - +internal_get_user_pages_fast (4,322,528 samples, 0.03%) + -entry_SYSCALL_64_after_hwframe (7,832,406 samples, 0.07%) - +alloc_fd (1,471,343 samples, 0.01%) + -__sysfs_device_parse (8,620,835 samples, 0.08%) - +hrtimer_interrupt (2,245,481 samples, 0.01%) + -clone3 (3,537,683,340 samples, 32.58%) -clone3 +do_anonymous_page (2,153,169,542 samples, 13.28%) +do_anonymous_page -__sysfs_device_parse (2,409,723 samples, 0.02%) - +path_openat (6,976,601 samples, 0.04%) + -mprotect_fixup (29,370,212 samples, 0.27%) - +update_process_times (8,465,801 samples, 0.05%) + -mutex_lock (1,981,537 samples, 0.02%) - +sysvec_apic_timer_interrupt (3,109,788 samples, 0.02%) + -sysmalloc (15,576,431 samples, 0.14%) - +debug_smp_processor_id (2,956,695 samples, 0.02%) + -__GI__IO_doallocbuf (19,515,368 samples, 0.18%) - +folio_batch_move_lru (109,200,750 samples, 0.67%) + -tick_sched_timer (8,995,452 samples, 0.08%) - +__rcu_read_lock (1,489,894 samples, 0.01%) + -__x64_sys_mprotect (12,999,915 samples, 0.12%) - +ksys_read (10,264,737 samples, 0.06%) + -__fopen_internal (10,781,028 samples, 0.10%) - +policy_node (2,252,700 samples, 0.01%) + -__memset (1,731,249 samples, 0.02%) - +tick_sched_timer (8,465,801 samples, 0.05%) + -dml::core::dispatcher::hw_dispatcher::~hw_dispatcher (1,665,609 samples, 0.02%) - +check_preemption_disabled (2,424,276 samples, 0.01%) + -_int_memalign (30,229,702 samples, 0.28%) - +mtree_range_walk (10,031,196 samples, 0.06%) + -__memcg_kmem_charge_page (5,802,387 samples, 0.05%) - +update_process_times (2,893,175 samples, 0.02%) + -do_futex (1,709,662 samples, 0.02%) - +_raw_spin_trylock (43,514,592 samples, 0.27%) + -grow_heap (13,858,960 samples, 0.13%) - +__hrtimer_run_queues (2,246,370 samples, 0.01%) + -lru_add_fn (1,728,947 samples, 0.02%) - +rcu_do_batch (1,379,377 samples, 0.01%) + -pte_alloc_one (1,729,251 samples, 0.02%) - +_raw_spin_lock_irqsave (1,729,327 samples, 0.01%) + -try_charge_memcg (3,358,641 samples, 0.03%) - +__this_cpu_preempt_check (24,241,462 samples, 0.15%) + -__mod_node_page_state (1,246,575 samples, 0.01%) - +do_filp_open (6,976,601 samples, 0.04%) + -intel_invalidate_range (2,478,462 samples, 0.02%) - +__mod_memcg_lruvec_state (19,842,648 samples, 0.12%) + -perf_event_mmap (11,662,927 samples, 0.11%) - +handle_mm_fault (2,303,102,379 samples, 14.21%) +handle_mm_fault -operator new (30,229,702 samples, 0.28%) - +__mod_memcg_lruvec_state (25,147,826 samples, 0.16%) + -do_exit (1,418,159 samples, 0.01%) - +__slab_alloc.isra.0 (1,728,614 samples, 0.01%) + -__mod_memcg_lruvec_state (1,134,175 samples, 0.01%) - +perf_event_mmap (16,121,901 samples, 0.10%) + -__GI___libc_read (11,363,394 samples, 0.10%) - +__list_del_entry_valid (6,043,320 samples, 0.04%) + -_dl_start_user (1,196,824 samples, 0.01%) - +folio_add_lru (394,763,299 samples, 2.44%) +fo.. -__futex_abstimed_wait_common64 (1,709,662 samples, 0.02%) - +perf_iterate_sb.constprop.0 (5,865,007 samples, 0.04%) + -entry_SYSCALL_64_after_hwframe (23,194,745 samples, 0.21%) - +do_syscall_64 (10,343,181 samples, 0.06%) + -exc_page_fault (1,852,943,584 samples, 17.07%) -exc_page_fault +memcg_account_kmem (2,592,882 samples, 0.02%) + -__x64_sys_get_mempolicy (3,456,757 samples, 0.03%) - +__rcu_read_lock (2,592,868 samples, 0.02%) + -dml::core::dispatcher::hw_dispatcher::hw_dispatcher (12,436,625 samples, 0.11%) - +debug_smp_processor_id (1,727,400 samples, 0.01%) + -arch_get_unmapped_area_topdown (1,099,791 samples, 0.01%) - +folio_lruvec_lock_irqsave (7,950,760 samples, 0.05%) + -__mem_cgroup_charge (4,164,584 samples, 0.04%) - +refill_stock (1,729,560 samples, 0.01%) + -perf_event_mmap (5,486,207 samples, 0.05%) - +__rcu_read_lock (1,384,957 samples, 0.01%) + -__GI___close (2,038,073 samples, 0.02%) - +__list_add_valid (2,587,208 samples, 0.02%) + -charge_memcg (3,957,434 samples, 0.04%) - +__mod_lruvec_state (44,622,164 samples, 0.28%) + -sysvec_apic_timer_interrupt (1,285,604 samples, 0.01%) - +perf_event_task_tick (2,245,481 samples, 0.01%) + -qi_flush_piotlb (2,478,462 samples, 0.02%) - +check_preemption_disabled (16,992,550 samples, 0.10%) + -qi_flush_dev_iotlb_pasid (18,156,520 samples, 0.17%) - +__pte_alloc (13,093,789 samples, 0.08%) + -do_madvise (3,340,721 samples, 0.03%) - +mem_cgroup_charge_statistics (608,500,805 samples, 3.75%) +mem_.. -ksys_read (957,900 samples, 0.01%) - +__list_del_entry_valid (1,728,945 samples, 0.01%) + -dml::detail::ml::impl::hardware::submit (13,296,663 samples, 0.12%) - +do_syscall_64 (631,219,928 samples, 3.89%) +do_s.. -clear_page_erms (1,266,328 samples, 0.01%) - +__rcu_read_lock (5,186,156 samples, 0.03%) + -__GI_munmap (16,406,617 samples, 0.15%) - +zap_page_range_single (2,414,556 samples, 0.01%) + -do_group_exit (1,418,159 samples, 0.01%) - +preempt_count_add (4,155,736 samples, 0.03%) + -entry_SYSCALL_64_after_hwframe (16,406,617 samples, 0.15%) - +__this_cpu_preempt_check (1,385,854 samples, 0.01%) + -void std::vector<std::thread, std::allocator<std::thread> >::_M_realloc_insert<void (2,576,245 samples, 0.02%) - +task_work_run (1,664,053 samples, 0.01%) + -device_parse (2,409,723 samples, 0.02%) - +memcg_check_events (1,728,888 samples, 0.01%) + -void std::allocator_traits<std::allocator<std::thread> >::construct<std::thread, void (2,576,245 samples, 0.02%) - +tlb_finish_mmu (421,390,645 samples, 2.60%) +tl.. -task_work_run (1,526,259 samples, 0.01%) - +charge_memcg (1,548,168 samples, 0.01%) + -lru_gen_add_folio (1,728,947 samples, 0.02%) - +cgroup_rstat_updated (1,721,075 samples, 0.01%) + -mas_store_gfp (1,730,304 samples, 0.02%) - +kmem_cache_free_bulk.part.0 (1,727,716 samples, 0.01%) + -do_syscall_64 (12,999,915 samples, 0.12%) - +__free_one_page (30,221,167 samples, 0.19%) + -dml::core::dispatcher::hw_dispatcher::get_instance (12,436,625 samples, 0.11%) - +lock_vma_under_rcu (106,404,566 samples, 0.66%) + -get_unmapped_area (1,099,791 samples, 0.01%) - +__next_zones_zonelist (87,664,406 samples, 0.54%) + -zap_page_range_single (2,478,462 samples, 0.02%) - +debug_smp_processor_id (22,758,393 samples, 0.14%) + -do_syscall_64 (1,709,662 samples, 0.02%) - +__cond_resched (1,727,496 samples, 0.01%) + -do_huge_pmd_anonymous_page (1,293,979,138 samples, 11.92%) -do_huge_pmd_anony.. +asm_sysvec_apic_timer_interrupt (12,664,791 samples, 0.08%) + -task_work_run (1,726,993 samples, 0.02%) - +asm_sysvec_apic_timer_interrupt (2,246,370 samples, 0.01%) + -perf_iterate_sb.constprop.0 (5,486,207 samples, 0.05%) - +qi_submit_sync (1,548,669 samples, 0.01%) + -try_charge_memcg (3,282,805 samples, 0.03%) - +debug_smp_processor_id (1,385,515 samples, 0.01%) + -__folio_alloc (867,087,699 samples, 7.99%) -__folio_alloc +pgd_none (2,590,952 samples, 0.02%) + -openat (2,539,730 samples, 0.02%) - +_raw_spin_unlock (4,139,803 samples, 0.03%) + -__mmput (1,418,159 samples, 0.01%) - +__this_cpu_preempt_check (4,607,217 samples, 0.03%) + -__handle_mm_fault (1,852,426,101 samples, 17.06%) -__handle_mm_fault +tick_sched_timer (2,246,370 samples, 0.01%) + -asm_sysvec_apic_timer_interrupt (10,722,445 samples, 0.10%) - +__mem_cgroup_charge (833,673,002 samples, 5.14%) +__mem_.. -__GI___mmap64 (23,194,745 samples, 0.21%) - +clone3 (12,965,505 samples, 0.08%) + -do_syscall_64 (6,922,986 samples, 0.06%) - +__mmu_notifier_invalidate_range_end (2,414,556 samples, 0.01%) + -qi_submit_sync (6,025,194 samples, 0.06%) - +__this_cpu_preempt_check (4,330,273 samples, 0.03%) + -tlb_finish_mmu (13,813,787 samples, 0.13%) - +__this_cpu_preempt_check (4,322,897 samples, 0.03%) + -entry_SYSCALL_64_after_hwframe (2,539,730 samples, 0.02%) - +get_mem_cgroup_from_mm (40,302,192 samples, 0.25%) + -clear_huge_page (3,619,034 samples, 0.03%) - +entry_SYSCALL_64_after_hwframe (12,965,505 samples, 0.08%) + -entry_SYSCALL_64_after_hwframe (1,709,662 samples, 0.02%) - +__GI___mmap64 (26,333,316 samples, 0.16%) + -page_counter_try_charge (1,715,991 samples, 0.02%) - +vm_area_alloc (2,581,815 samples, 0.02%) + -entry_SYSCALL_64_after_hwframe (1,418,159 samples, 0.01%) - +__list_add_valid (3,338,406 samples, 0.02%) + -clear_page_erms (1,291,549,968 samples, 11.90%) -clear_page_erms +inode_permission (3,456,198 samples, 0.02%) + -do_syscall_64 (1,014,603 samples, 0.01%) - +__fput (1,526,525 samples, 0.01%) + -malloc_consolidate (963,610 samples, 0.01%) - +folio_add_lru (2,064,658 samples, 0.01%) + -tick_sched_handle (1,300,420 samples, 0.01%) - +down_read_trylock (41,606,229 samples, 0.26%) + -scheduler_tick (8,995,452 samples, 0.08%) - +folio_batch_move_lru (1,548,407 samples, 0.01%) + -lru_add_fn (2,271,523 samples, 0.02%) - +free_unref_page_prepare (6,049,849 samples, 0.04%) + -entry_SYSCALL_64_after_hwframe (6,922,986 samples, 0.06%) - +update_process_times (2,278,320 samples, 0.01%) + -syscall (3,382,035 samples, 0.03%) - +__list_del_entry_valid (9,469,892 samples, 0.06%) + -perf_adjust_freq_unthr_context (1,365,948 samples, 0.01%) - +check_preemption_disabled (14,665,213 samples, 0.09%) + -__mod_node_page_state (1,728,947 samples, 0.02%) - +scheduler_tick (2,063,358 samples, 0.01%) + -seq_read_iter (10,243,352 samples, 0.09%) - +check_preemption_disabled (3,458,859 samples, 0.02%) + -seq_read_iter (957,900 samples, 0.01%) - +__mod_memcg_lruvec_state (13,825,662 samples, 0.09%) + -std::unordered_map<unsigned char*, dsacache::CacheData, std::hash<unsigned char*>, std::equal_to<unsigned char*>, std::allocator<std::pair<unsigned char* const, dsacache::CacheData> > >::clear (124,499,915 samples, 1.15%) - +do_user_addr_fault (2,617,163,464 samples, 16.15%) +do_user_addr_fault -add_group (2,409,723 samples, 0.02%) - +check_preemption_disabled (15,909,322 samples, 0.10%) + -__handle_mm_fault (1,309,922,715 samples, 12.06%) -__handle_mm_fault +update_process_times (1,574,246 samples, 0.01%) + -get_page_from_freelist (1,507,729,794 samples, 13.89%) -get_page_from_freelist +count_memcg_events.constprop.0 (27,509,915 samples, 0.17%) + -memcg_check_events (1,590,395 samples, 0.01%) - +tick_sched_timer (10,360,017 samples, 0.06%) + -perf_iterate_ctx (1,544,977 samples, 0.01%) - +__sysvec_apic_timer_interrupt (11,222,797 samples, 0.07%) + -_int_malloc (30,229,702 samples, 0.28%) - +__mod_lruvec_page_state (33,576,507 samples, 0.21%) + -__do_sys_clone3 (6,922,986 samples, 0.06%) - +perf_adjust_freq_unthr_context (2,246,370 samples, 0.01%) + -__GI_mprotect (13,858,960 samples, 0.13%) - +__folio_alloc (3,120,052 samples, 0.02%) + -Aggregation<unsigned long, Sum, (1,278,494,713 samples, 11.78%) -Aggregation<unsig.. +node_read_meminfo (5,827,344 samples, 0.04%) + -unmap_region (16,406,617 samples, 0.15%) - +__folio_throttle_swaprate (23,640,355 samples, 0.15%) + -perf_event_init_task (6,922,986 samples, 0.06%) - +asm_sysvec_apic_timer_interrupt (2,278,320 samples, 0.01%) + -__x64_sys_openat (2,028,052 samples, 0.02%) - +__mod_node_page_state (3,458,121 samples, 0.02%) +