162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * mm/percpu-debug.c 462306a36Sopenharmony_ci * 562306a36Sopenharmony_ci * Copyright (C) 2017 Facebook Inc. 662306a36Sopenharmony_ci * Copyright (C) 2017 Dennis Zhou <dennis@kernel.org> 762306a36Sopenharmony_ci * 862306a36Sopenharmony_ci * Prints statistics about the percpu allocator and backing chunks. 962306a36Sopenharmony_ci */ 1062306a36Sopenharmony_ci#include <linux/debugfs.h> 1162306a36Sopenharmony_ci#include <linux/list.h> 1262306a36Sopenharmony_ci#include <linux/percpu.h> 1362306a36Sopenharmony_ci#include <linux/seq_file.h> 1462306a36Sopenharmony_ci#include <linux/sort.h> 1562306a36Sopenharmony_ci#include <linux/vmalloc.h> 1662306a36Sopenharmony_ci 1762306a36Sopenharmony_ci#include "percpu-internal.h" 1862306a36Sopenharmony_ci 1962306a36Sopenharmony_ci#define P(X, Y) \ 2062306a36Sopenharmony_ci seq_printf(m, " %-20s: %12lld\n", X, (long long int)Y) 2162306a36Sopenharmony_ci 2262306a36Sopenharmony_cistruct percpu_stats pcpu_stats; 2362306a36Sopenharmony_cistruct pcpu_alloc_info pcpu_stats_ai; 2462306a36Sopenharmony_ci 2562306a36Sopenharmony_cistatic int cmpint(const void *a, const void *b) 2662306a36Sopenharmony_ci{ 2762306a36Sopenharmony_ci return *(int *)a - *(int *)b; 2862306a36Sopenharmony_ci} 2962306a36Sopenharmony_ci 3062306a36Sopenharmony_ci/* 3162306a36Sopenharmony_ci * Iterates over all chunks to find the max nr_alloc entries. 3262306a36Sopenharmony_ci */ 3362306a36Sopenharmony_cistatic int find_max_nr_alloc(void) 3462306a36Sopenharmony_ci{ 3562306a36Sopenharmony_ci struct pcpu_chunk *chunk; 3662306a36Sopenharmony_ci int slot, max_nr_alloc; 3762306a36Sopenharmony_ci 3862306a36Sopenharmony_ci max_nr_alloc = 0; 3962306a36Sopenharmony_ci for (slot = 0; slot < pcpu_nr_slots; slot++) 4062306a36Sopenharmony_ci list_for_each_entry(chunk, &pcpu_chunk_lists[slot], list) 4162306a36Sopenharmony_ci max_nr_alloc = max(max_nr_alloc, chunk->nr_alloc); 4262306a36Sopenharmony_ci 4362306a36Sopenharmony_ci return max_nr_alloc; 4462306a36Sopenharmony_ci} 4562306a36Sopenharmony_ci 4662306a36Sopenharmony_ci/* 4762306a36Sopenharmony_ci * Prints out chunk state. Fragmentation is considered between 4862306a36Sopenharmony_ci * the beginning of the chunk to the last allocation. 4962306a36Sopenharmony_ci * 5062306a36Sopenharmony_ci * All statistics are in bytes unless stated otherwise. 5162306a36Sopenharmony_ci */ 5262306a36Sopenharmony_cistatic void chunk_map_stats(struct seq_file *m, struct pcpu_chunk *chunk, 5362306a36Sopenharmony_ci int *buffer) 5462306a36Sopenharmony_ci{ 5562306a36Sopenharmony_ci struct pcpu_block_md *chunk_md = &chunk->chunk_md; 5662306a36Sopenharmony_ci int i, last_alloc, as_len, start, end; 5762306a36Sopenharmony_ci int *alloc_sizes, *p; 5862306a36Sopenharmony_ci /* statistics */ 5962306a36Sopenharmony_ci int sum_frag = 0, max_frag = 0; 6062306a36Sopenharmony_ci int cur_min_alloc = 0, cur_med_alloc = 0, cur_max_alloc = 0; 6162306a36Sopenharmony_ci 6262306a36Sopenharmony_ci alloc_sizes = buffer; 6362306a36Sopenharmony_ci 6462306a36Sopenharmony_ci /* 6562306a36Sopenharmony_ci * find_last_bit returns the start value if nothing found. 6662306a36Sopenharmony_ci * Therefore, we must determine if it is a failure of find_last_bit 6762306a36Sopenharmony_ci * and set the appropriate value. 6862306a36Sopenharmony_ci */ 6962306a36Sopenharmony_ci last_alloc = find_last_bit(chunk->alloc_map, 7062306a36Sopenharmony_ci pcpu_chunk_map_bits(chunk) - 7162306a36Sopenharmony_ci chunk->end_offset / PCPU_MIN_ALLOC_SIZE - 1); 7262306a36Sopenharmony_ci last_alloc = test_bit(last_alloc, chunk->alloc_map) ? 7362306a36Sopenharmony_ci last_alloc + 1 : 0; 7462306a36Sopenharmony_ci 7562306a36Sopenharmony_ci as_len = 0; 7662306a36Sopenharmony_ci start = chunk->start_offset / PCPU_MIN_ALLOC_SIZE; 7762306a36Sopenharmony_ci 7862306a36Sopenharmony_ci /* 7962306a36Sopenharmony_ci * If a bit is set in the allocation map, the bound_map identifies 8062306a36Sopenharmony_ci * where the allocation ends. If the allocation is not set, the 8162306a36Sopenharmony_ci * bound_map does not identify free areas as it is only kept accurate 8262306a36Sopenharmony_ci * on allocation, not free. 8362306a36Sopenharmony_ci * 8462306a36Sopenharmony_ci * Positive values are allocations and negative values are free 8562306a36Sopenharmony_ci * fragments. 8662306a36Sopenharmony_ci */ 8762306a36Sopenharmony_ci while (start < last_alloc) { 8862306a36Sopenharmony_ci if (test_bit(start, chunk->alloc_map)) { 8962306a36Sopenharmony_ci end = find_next_bit(chunk->bound_map, last_alloc, 9062306a36Sopenharmony_ci start + 1); 9162306a36Sopenharmony_ci alloc_sizes[as_len] = 1; 9262306a36Sopenharmony_ci } else { 9362306a36Sopenharmony_ci end = find_next_bit(chunk->alloc_map, last_alloc, 9462306a36Sopenharmony_ci start + 1); 9562306a36Sopenharmony_ci alloc_sizes[as_len] = -1; 9662306a36Sopenharmony_ci } 9762306a36Sopenharmony_ci 9862306a36Sopenharmony_ci alloc_sizes[as_len++] *= (end - start) * PCPU_MIN_ALLOC_SIZE; 9962306a36Sopenharmony_ci 10062306a36Sopenharmony_ci start = end; 10162306a36Sopenharmony_ci } 10262306a36Sopenharmony_ci 10362306a36Sopenharmony_ci /* 10462306a36Sopenharmony_ci * The negative values are free fragments and thus sorting gives the 10562306a36Sopenharmony_ci * free fragments at the beginning in largest first order. 10662306a36Sopenharmony_ci */ 10762306a36Sopenharmony_ci if (as_len > 0) { 10862306a36Sopenharmony_ci sort(alloc_sizes, as_len, sizeof(int), cmpint, NULL); 10962306a36Sopenharmony_ci 11062306a36Sopenharmony_ci /* iterate through the unallocated fragments */ 11162306a36Sopenharmony_ci for (i = 0, p = alloc_sizes; *p < 0 && i < as_len; i++, p++) { 11262306a36Sopenharmony_ci sum_frag -= *p; 11362306a36Sopenharmony_ci max_frag = max(max_frag, -1 * (*p)); 11462306a36Sopenharmony_ci } 11562306a36Sopenharmony_ci 11662306a36Sopenharmony_ci cur_min_alloc = alloc_sizes[i]; 11762306a36Sopenharmony_ci cur_med_alloc = alloc_sizes[(i + as_len - 1) / 2]; 11862306a36Sopenharmony_ci cur_max_alloc = alloc_sizes[as_len - 1]; 11962306a36Sopenharmony_ci } 12062306a36Sopenharmony_ci 12162306a36Sopenharmony_ci P("nr_alloc", chunk->nr_alloc); 12262306a36Sopenharmony_ci P("max_alloc_size", chunk->max_alloc_size); 12362306a36Sopenharmony_ci P("empty_pop_pages", chunk->nr_empty_pop_pages); 12462306a36Sopenharmony_ci P("first_bit", chunk_md->first_free); 12562306a36Sopenharmony_ci P("free_bytes", chunk->free_bytes); 12662306a36Sopenharmony_ci P("contig_bytes", chunk_md->contig_hint * PCPU_MIN_ALLOC_SIZE); 12762306a36Sopenharmony_ci P("sum_frag", sum_frag); 12862306a36Sopenharmony_ci P("max_frag", max_frag); 12962306a36Sopenharmony_ci P("cur_min_alloc", cur_min_alloc); 13062306a36Sopenharmony_ci P("cur_med_alloc", cur_med_alloc); 13162306a36Sopenharmony_ci P("cur_max_alloc", cur_max_alloc); 13262306a36Sopenharmony_ci seq_putc(m, '\n'); 13362306a36Sopenharmony_ci} 13462306a36Sopenharmony_ci 13562306a36Sopenharmony_cistatic int percpu_stats_show(struct seq_file *m, void *v) 13662306a36Sopenharmony_ci{ 13762306a36Sopenharmony_ci struct pcpu_chunk *chunk; 13862306a36Sopenharmony_ci int slot, max_nr_alloc; 13962306a36Sopenharmony_ci int *buffer; 14062306a36Sopenharmony_ci 14162306a36Sopenharmony_cialloc_buffer: 14262306a36Sopenharmony_ci spin_lock_irq(&pcpu_lock); 14362306a36Sopenharmony_ci max_nr_alloc = find_max_nr_alloc(); 14462306a36Sopenharmony_ci spin_unlock_irq(&pcpu_lock); 14562306a36Sopenharmony_ci 14662306a36Sopenharmony_ci /* there can be at most this many free and allocated fragments */ 14762306a36Sopenharmony_ci buffer = vmalloc_array(2 * max_nr_alloc + 1, sizeof(int)); 14862306a36Sopenharmony_ci if (!buffer) 14962306a36Sopenharmony_ci return -ENOMEM; 15062306a36Sopenharmony_ci 15162306a36Sopenharmony_ci spin_lock_irq(&pcpu_lock); 15262306a36Sopenharmony_ci 15362306a36Sopenharmony_ci /* if the buffer allocated earlier is too small */ 15462306a36Sopenharmony_ci if (max_nr_alloc < find_max_nr_alloc()) { 15562306a36Sopenharmony_ci spin_unlock_irq(&pcpu_lock); 15662306a36Sopenharmony_ci vfree(buffer); 15762306a36Sopenharmony_ci goto alloc_buffer; 15862306a36Sopenharmony_ci } 15962306a36Sopenharmony_ci 16062306a36Sopenharmony_ci#define PL(X) \ 16162306a36Sopenharmony_ci seq_printf(m, " %-20s: %12lld\n", #X, (long long int)pcpu_stats_ai.X) 16262306a36Sopenharmony_ci 16362306a36Sopenharmony_ci seq_printf(m, 16462306a36Sopenharmony_ci "Percpu Memory Statistics\n" 16562306a36Sopenharmony_ci "Allocation Info:\n" 16662306a36Sopenharmony_ci "----------------------------------------\n"); 16762306a36Sopenharmony_ci PL(unit_size); 16862306a36Sopenharmony_ci PL(static_size); 16962306a36Sopenharmony_ci PL(reserved_size); 17062306a36Sopenharmony_ci PL(dyn_size); 17162306a36Sopenharmony_ci PL(atom_size); 17262306a36Sopenharmony_ci PL(alloc_size); 17362306a36Sopenharmony_ci seq_putc(m, '\n'); 17462306a36Sopenharmony_ci 17562306a36Sopenharmony_ci#undef PL 17662306a36Sopenharmony_ci 17762306a36Sopenharmony_ci#define PU(X) \ 17862306a36Sopenharmony_ci seq_printf(m, " %-20s: %12llu\n", #X, (unsigned long long)pcpu_stats.X) 17962306a36Sopenharmony_ci 18062306a36Sopenharmony_ci seq_printf(m, 18162306a36Sopenharmony_ci "Global Stats:\n" 18262306a36Sopenharmony_ci "----------------------------------------\n"); 18362306a36Sopenharmony_ci PU(nr_alloc); 18462306a36Sopenharmony_ci PU(nr_dealloc); 18562306a36Sopenharmony_ci PU(nr_cur_alloc); 18662306a36Sopenharmony_ci PU(nr_max_alloc); 18762306a36Sopenharmony_ci PU(nr_chunks); 18862306a36Sopenharmony_ci PU(nr_max_chunks); 18962306a36Sopenharmony_ci PU(min_alloc_size); 19062306a36Sopenharmony_ci PU(max_alloc_size); 19162306a36Sopenharmony_ci P("empty_pop_pages", pcpu_nr_empty_pop_pages); 19262306a36Sopenharmony_ci seq_putc(m, '\n'); 19362306a36Sopenharmony_ci 19462306a36Sopenharmony_ci#undef PU 19562306a36Sopenharmony_ci 19662306a36Sopenharmony_ci seq_printf(m, 19762306a36Sopenharmony_ci "Per Chunk Stats:\n" 19862306a36Sopenharmony_ci "----------------------------------------\n"); 19962306a36Sopenharmony_ci 20062306a36Sopenharmony_ci if (pcpu_reserved_chunk) { 20162306a36Sopenharmony_ci seq_puts(m, "Chunk: <- Reserved Chunk\n"); 20262306a36Sopenharmony_ci chunk_map_stats(m, pcpu_reserved_chunk, buffer); 20362306a36Sopenharmony_ci } 20462306a36Sopenharmony_ci 20562306a36Sopenharmony_ci for (slot = 0; slot < pcpu_nr_slots; slot++) { 20662306a36Sopenharmony_ci list_for_each_entry(chunk, &pcpu_chunk_lists[slot], list) { 20762306a36Sopenharmony_ci if (chunk == pcpu_first_chunk) 20862306a36Sopenharmony_ci seq_puts(m, "Chunk: <- First Chunk\n"); 20962306a36Sopenharmony_ci else if (slot == pcpu_to_depopulate_slot) 21062306a36Sopenharmony_ci seq_puts(m, "Chunk (to_depopulate)\n"); 21162306a36Sopenharmony_ci else if (slot == pcpu_sidelined_slot) 21262306a36Sopenharmony_ci seq_puts(m, "Chunk (sidelined):\n"); 21362306a36Sopenharmony_ci else 21462306a36Sopenharmony_ci seq_puts(m, "Chunk:\n"); 21562306a36Sopenharmony_ci chunk_map_stats(m, chunk, buffer); 21662306a36Sopenharmony_ci } 21762306a36Sopenharmony_ci } 21862306a36Sopenharmony_ci 21962306a36Sopenharmony_ci spin_unlock_irq(&pcpu_lock); 22062306a36Sopenharmony_ci 22162306a36Sopenharmony_ci vfree(buffer); 22262306a36Sopenharmony_ci 22362306a36Sopenharmony_ci return 0; 22462306a36Sopenharmony_ci} 22562306a36Sopenharmony_ciDEFINE_SHOW_ATTRIBUTE(percpu_stats); 22662306a36Sopenharmony_ci 22762306a36Sopenharmony_cistatic int __init init_percpu_stats_debugfs(void) 22862306a36Sopenharmony_ci{ 22962306a36Sopenharmony_ci debugfs_create_file("percpu_stats", 0444, NULL, NULL, 23062306a36Sopenharmony_ci &percpu_stats_fops); 23162306a36Sopenharmony_ci 23262306a36Sopenharmony_ci return 0; 23362306a36Sopenharmony_ci} 23462306a36Sopenharmony_ci 23562306a36Sopenharmony_cilate_initcall(init_percpu_stats_debugfs); 236