1ebccf1e3SJoseph Koshy /*- 24d846d26SWarner Losh * SPDX-License-Identifier: BSD-2-Clause 3718cf2ccSPedro F. Giffuni * 4122ccdc1SJoseph Koshy * Copyright (c) 2003-2008 Joseph Koshy 5d07f36b0SJoseph Koshy * Copyright (c) 2007 The FreeBSD Foundation 6e6b475e0SMatt Macy * Copyright (c) 2018 Matthew Macy 7ebccf1e3SJoseph Koshy * All rights reserved. 8ebccf1e3SJoseph Koshy * 9d07f36b0SJoseph Koshy * Portions of this software were developed by A. Joseph Koshy under 10d07f36b0SJoseph Koshy * sponsorship from the FreeBSD Foundation and Google, Inc. 11d07f36b0SJoseph Koshy * 12ebccf1e3SJoseph Koshy * Redistribution and use in source and binary forms, with or without 13ebccf1e3SJoseph Koshy * modification, are permitted provided that the following conditions 14ebccf1e3SJoseph Koshy * are met: 15ebccf1e3SJoseph Koshy * 1. Redistributions of source code must retain the above copyright 16ebccf1e3SJoseph Koshy * notice, this list of conditions and the following disclaimer. 17ebccf1e3SJoseph Koshy * 2. Redistributions in binary form must reproduce the above copyright 18ebccf1e3SJoseph Koshy * notice, this list of conditions and the following disclaimer in the 19ebccf1e3SJoseph Koshy * documentation and/or other materials provided with the distribution. 20ebccf1e3SJoseph Koshy * 21ebccf1e3SJoseph Koshy * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 22ebccf1e3SJoseph Koshy * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 23ebccf1e3SJoseph Koshy * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 24ebccf1e3SJoseph Koshy * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 25ebccf1e3SJoseph Koshy * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 26ebccf1e3SJoseph Koshy * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 27ebccf1e3SJoseph Koshy * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 28ebccf1e3SJoseph Koshy * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 29ebccf1e3SJoseph Koshy * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 30ebccf1e3SJoseph Koshy * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 31ebccf1e3SJoseph Koshy * SUCH DAMAGE. 32ebccf1e3SJoseph Koshy */ 33ebccf1e3SJoseph Koshy 34ebccf1e3SJoseph Koshy #include <sys/cdefs.h> 35ebccf1e3SJoseph Koshy __FBSDID("$FreeBSD$"); 36ebccf1e3SJoseph Koshy 37ebccf1e3SJoseph Koshy #include <sys/param.h> 389b1d850bSMark Johnston #include <sys/systm.h> 399978bd99SMark Johnston #include <sys/domainset.h> 40ebccf1e3SJoseph Koshy #include <sys/eventhandler.h> 41ebccf1e3SJoseph Koshy #include <sys/jail.h> 42ebccf1e3SJoseph Koshy #include <sys/kernel.h> 43f263522aSJoseph Koshy #include <sys/kthread.h> 44ebccf1e3SJoseph Koshy #include <sys/limits.h> 45ebccf1e3SJoseph Koshy #include <sys/lock.h> 46ebccf1e3SJoseph Koshy #include <sys/malloc.h> 47ebccf1e3SJoseph Koshy #include <sys/module.h> 48e9b5dc16SJoseph Koshy #include <sys/mount.h> 49ebccf1e3SJoseph Koshy #include <sys/mutex.h> 50ebccf1e3SJoseph Koshy #include <sys/pmc.h> 51ebccf1e3SJoseph Koshy #include <sys/pmckern.h> 52f263522aSJoseph Koshy #include <sys/pmclog.h> 53acd3428bSRobert Watson #include <sys/priv.h> 54ebccf1e3SJoseph Koshy #include <sys/proc.h> 55ebccf1e3SJoseph Koshy #include <sys/queue.h> 56f263522aSJoseph Koshy #include <sys/resourcevar.h> 5789f6b863SAttilio Rao #include <sys/rwlock.h> 58ebccf1e3SJoseph Koshy #include <sys/sched.h> 59ebccf1e3SJoseph Koshy #include <sys/signalvar.h> 60ebccf1e3SJoseph Koshy #include <sys/smp.h> 61ebccf1e3SJoseph Koshy #include <sys/sx.h> 62ebccf1e3SJoseph Koshy #include <sys/sysctl.h> 63ebccf1e3SJoseph Koshy #include <sys/sysent.h> 640204d85aSMatt Macy #include <sys/syslog.h> 659b1d850bSMark Johnston #include <sys/taskqueue.h> 66f263522aSJoseph Koshy #include <sys/vnode.h> 67ebccf1e3SJoseph Koshy 6849874f6eSJoseph Koshy #include <sys/linker.h> /* needs to be after <sys/malloc.h> */ 6949874f6eSJoseph Koshy 70f263522aSJoseph Koshy #include <machine/atomic.h> 71ebccf1e3SJoseph Koshy #include <machine/md_var.h> 72ebccf1e3SJoseph Koshy 73bf792d68SJoseph Koshy #include <vm/vm.h> 74bf792d68SJoseph Koshy #include <vm/vm_extern.h> 75bf792d68SJoseph Koshy #include <vm/pmap.h> 76bf792d68SJoseph Koshy #include <vm/vm_map.h> 77bf792d68SJoseph Koshy #include <vm/vm_object.h> 78bf792d68SJoseph Koshy 79f5f9340bSFabien Thomas #include "hwpmc_soft.h" 80f5f9340bSFabien Thomas 81693cd307SMitchell Horne #define PMC_EPOCH_ENTER() \ 82693cd307SMitchell Horne struct epoch_tracker pmc_et; \ 83693cd307SMitchell Horne epoch_enter_preempt(global_epoch_preempt, &pmc_et) 84693cd307SMitchell Horne 85693cd307SMitchell Horne #define PMC_EPOCH_EXIT() \ 86693cd307SMitchell Horne epoch_exit_preempt(global_epoch_preempt, &pmc_et) 876573d758SMatt Macy 88ebccf1e3SJoseph Koshy /* 89ebccf1e3SJoseph Koshy * Types 90ebccf1e3SJoseph Koshy */ 91ebccf1e3SJoseph Koshy 92ebccf1e3SJoseph Koshy enum pmc_flags { 93ebccf1e3SJoseph Koshy PMC_FLAG_NONE = 0x00, /* do nothing */ 94ebccf1e3SJoseph Koshy PMC_FLAG_REMOVE = 0x01, /* atomically remove entry from hash */ 95ebccf1e3SJoseph Koshy PMC_FLAG_ALLOCATE = 0x02, /* add entry to hash if not found */ 966161b98cSMatt Macy PMC_FLAG_NOWAIT = 0x04, /* do not wait for mallocs */ 97ebccf1e3SJoseph Koshy }; 98ebccf1e3SJoseph Koshy 99ebccf1e3SJoseph Koshy /* 100ebccf1e3SJoseph Koshy * The offset in sysent where the syscall is allocated. 101ebccf1e3SJoseph Koshy */ 102ebccf1e3SJoseph Koshy static int pmc_syscall_num = NO_SYSCALL; 103693cd307SMitchell Horne 104ebccf1e3SJoseph Koshy struct pmc_cpu **pmc_pcpu; /* per-cpu state */ 105ebccf1e3SJoseph Koshy pmc_value_t *pmc_pcpu_saved; /* saved PMC values: CSW handling */ 106ebccf1e3SJoseph Koshy 107ebccf1e3SJoseph Koshy #define PMC_PCPU_SAVED(C, R) pmc_pcpu_saved[(R) + md->pmd_npmc * (C)] 108ebccf1e3SJoseph Koshy 109ebccf1e3SJoseph Koshy struct mtx_pool *pmc_mtxpool; 110ebccf1e3SJoseph Koshy static int *pmc_pmcdisp; /* PMC row dispositions */ 111ebccf1e3SJoseph Koshy 112ebccf1e3SJoseph Koshy #define PMC_ROW_DISP_IS_FREE(R) (pmc_pmcdisp[(R)] == 0) 113ebccf1e3SJoseph Koshy #define PMC_ROW_DISP_IS_THREAD(R) (pmc_pmcdisp[(R)] > 0) 114ebccf1e3SJoseph Koshy #define PMC_ROW_DISP_IS_STANDALONE(R) (pmc_pmcdisp[(R)] < 0) 115ebccf1e3SJoseph Koshy 116ebccf1e3SJoseph Koshy #define PMC_MARK_ROW_FREE(R) do { \ 117ebccf1e3SJoseph Koshy pmc_pmcdisp[(R)] = 0; \ 118ebccf1e3SJoseph Koshy } while (0) 119ebccf1e3SJoseph Koshy 120ebccf1e3SJoseph Koshy #define PMC_MARK_ROW_STANDALONE(R) do { \ 121ebccf1e3SJoseph Koshy KASSERT(pmc_pmcdisp[(R)] <= 0, ("[pmc,%d] row disposition error", \ 122ebccf1e3SJoseph Koshy __LINE__)); \ 123ebccf1e3SJoseph Koshy atomic_add_int(&pmc_pmcdisp[(R)], -1); \ 124122ccdc1SJoseph Koshy KASSERT(pmc_pmcdisp[(R)] >= (-pmc_cpu_max_active()), \ 125122ccdc1SJoseph Koshy ("[pmc,%d] row disposition error", __LINE__)); \ 126ebccf1e3SJoseph Koshy } while (0) 127ebccf1e3SJoseph Koshy 128ebccf1e3SJoseph Koshy #define PMC_UNMARK_ROW_STANDALONE(R) do { \ 129ebccf1e3SJoseph Koshy atomic_add_int(&pmc_pmcdisp[(R)], 1); \ 130ebccf1e3SJoseph Koshy KASSERT(pmc_pmcdisp[(R)] <= 0, ("[pmc,%d] row disposition error", \ 131ebccf1e3SJoseph Koshy __LINE__)); \ 132ebccf1e3SJoseph Koshy } while (0) 133ebccf1e3SJoseph Koshy 134ebccf1e3SJoseph Koshy #define PMC_MARK_ROW_THREAD(R) do { \ 135ebccf1e3SJoseph Koshy KASSERT(pmc_pmcdisp[(R)] >= 0, ("[pmc,%d] row disposition error", \ 136ebccf1e3SJoseph Koshy __LINE__)); \ 137ebccf1e3SJoseph Koshy atomic_add_int(&pmc_pmcdisp[(R)], 1); \ 138ebccf1e3SJoseph Koshy } while (0) 139ebccf1e3SJoseph Koshy 140ebccf1e3SJoseph Koshy #define PMC_UNMARK_ROW_THREAD(R) do { \ 141ebccf1e3SJoseph Koshy atomic_add_int(&pmc_pmcdisp[(R)], -1); \ 142ebccf1e3SJoseph Koshy KASSERT(pmc_pmcdisp[(R)] >= 0, ("[pmc,%d] row disposition error", \ 143ebccf1e3SJoseph Koshy __LINE__)); \ 144ebccf1e3SJoseph Koshy } while (0) 145ebccf1e3SJoseph Koshy 146ebccf1e3SJoseph Koshy /* various event handlers */ 14729f4e216SMark Johnston static eventhandler_tag pmc_exit_tag, pmc_fork_tag, pmc_kld_load_tag, 14829f4e216SMark Johnston pmc_kld_unload_tag; 149ebccf1e3SJoseph Koshy 150ebccf1e3SJoseph Koshy /* Module statistics */ 151e6b475e0SMatt Macy struct pmc_driverstats pmc_stats; 152e6b475e0SMatt Macy 153ebccf1e3SJoseph Koshy /* Machine/processor dependent operations */ 1540cfab8ddSJoseph Koshy static struct pmc_mdep *md; 155ebccf1e3SJoseph Koshy 156ebccf1e3SJoseph Koshy /* 157ebccf1e3SJoseph Koshy * Hash tables mapping owner processes and target threads to PMCs. 158ebccf1e3SJoseph Koshy */ 159ebccf1e3SJoseph Koshy struct mtx pmc_processhash_mtx; /* spin mutex */ 160ebccf1e3SJoseph Koshy static u_long pmc_processhashmask; 161ebccf1e3SJoseph Koshy static LIST_HEAD(pmc_processhash, pmc_process) *pmc_processhash; 162ebccf1e3SJoseph Koshy 163ebccf1e3SJoseph Koshy /* 164ebccf1e3SJoseph Koshy * Hash table of PMC owner descriptors. This table is protected by 165ebccf1e3SJoseph Koshy * the shared PMC "sx" lock. 166ebccf1e3SJoseph Koshy */ 167ebccf1e3SJoseph Koshy static u_long pmc_ownerhashmask; 168ebccf1e3SJoseph Koshy static LIST_HEAD(pmc_ownerhash, pmc_owner) *pmc_ownerhash; 169ebccf1e3SJoseph Koshy 170ebccf1e3SJoseph Koshy /* 171f263522aSJoseph Koshy * List of PMC owners with system-wide sampling PMCs. 172f263522aSJoseph Koshy */ 1730f8d79d9SMatt Macy static CK_LIST_HEAD(, pmc_owner) pmc_ss_owners; 174f263522aSJoseph Koshy 1756161b98cSMatt Macy /* 1766161b98cSMatt Macy * List of free thread entries. This is protected by the spin 1776161b98cSMatt Macy * mutex. 1786161b98cSMatt Macy */ 1796161b98cSMatt Macy static struct mtx pmc_threadfreelist_mtx; /* spin mutex */ 1806161b98cSMatt Macy static LIST_HEAD(, pmc_thread) pmc_threadfreelist; 1816161b98cSMatt Macy static int pmc_threadfreelist_entries = 0; 182693cd307SMitchell Horne #define THREADENTRY_SIZE (sizeof(struct pmc_thread) + \ 183693cd307SMitchell Horne (md->pmd_npmc * sizeof(struct pmc_threadpmcstate))) 1846161b98cSMatt Macy 1856161b98cSMatt Macy /* 1866161b98cSMatt Macy * Task to free thread descriptors 1876161b98cSMatt Macy */ 1889b1d850bSMark Johnston static struct task free_task; 189f263522aSJoseph Koshy 190f263522aSJoseph Koshy /* 191e829eb6dSJoseph Koshy * A map of row indices to classdep structures. 192e829eb6dSJoseph Koshy */ 193e829eb6dSJoseph Koshy static struct pmc_classdep **pmc_rowindex_to_classdep; 194e829eb6dSJoseph Koshy 195e829eb6dSJoseph Koshy /* 196ebccf1e3SJoseph Koshy * Prototypes 197ebccf1e3SJoseph Koshy */ 198ebccf1e3SJoseph Koshy 199680f1afdSJohn Baldwin #ifdef HWPMC_DEBUG 200ebccf1e3SJoseph Koshy static int pmc_debugflags_sysctl_handler(SYSCTL_HANDLER_ARGS); 201ebccf1e3SJoseph Koshy static int pmc_debugflags_parse(char *newstr, char *fence); 202ebccf1e3SJoseph Koshy #endif 203ebccf1e3SJoseph Koshy 204ebccf1e3SJoseph Koshy static int load(struct module *module, int cmd, void *arg); 205693cd307SMitchell Horne static int pmc_add_sample(ring_type_t ring, struct pmc *pm, 206693cd307SMitchell Horne struct trapframe *tf); 2076161b98cSMatt Macy static void pmc_add_thread_descriptors_from_proc(struct proc *p, 2086161b98cSMatt Macy struct pmc_process *pp); 209f263522aSJoseph Koshy static int pmc_attach_process(struct proc *p, struct pmc *pm); 210ebccf1e3SJoseph Koshy static struct pmc *pmc_allocate_pmc_descriptor(void); 211f263522aSJoseph Koshy static struct pmc_owner *pmc_allocate_owner_descriptor(struct proc *p); 212f263522aSJoseph Koshy static int pmc_attach_one_process(struct proc *p, struct pmc *pm); 213c514a571SMitchell Horne static bool pmc_can_allocate_row(int ri, enum pmc_mode mode); 214c514a571SMitchell Horne static bool pmc_can_allocate_rowindex(struct proc *p, unsigned int ri, 215c5153e19SJoseph Koshy int cpu); 216f263522aSJoseph Koshy static int pmc_can_attach(struct pmc *pm, struct proc *p); 217693cd307SMitchell Horne static void pmc_capture_user_callchain(int cpu, int soft, 218693cd307SMitchell Horne struct trapframe *tf); 219f263522aSJoseph Koshy static void pmc_cleanup(void); 220f263522aSJoseph Koshy static int pmc_detach_process(struct proc *p, struct pmc *pm); 221f263522aSJoseph Koshy static int pmc_detach_one_process(struct proc *p, struct pmc *pm, 222f263522aSJoseph Koshy int flags); 223f263522aSJoseph Koshy static void pmc_destroy_owner_descriptor(struct pmc_owner *po); 22406796b67SMark Johnston static void pmc_destroy_pmc_descriptor(struct pmc *pm); 2256161b98cSMatt Macy static void pmc_destroy_process_descriptor(struct pmc_process *pp); 226ebccf1e3SJoseph Koshy static struct pmc_owner *pmc_find_owner_descriptor(struct proc *p); 227ebccf1e3SJoseph Koshy static int pmc_find_pmc(pmc_id_t pmcid, struct pmc **pm); 228f263522aSJoseph Koshy static struct pmc *pmc_find_pmc_descriptor_in_process(struct pmc_owner *po, 229f263522aSJoseph Koshy pmc_id_t pmc); 230f263522aSJoseph Koshy static struct pmc_process *pmc_find_process_descriptor(struct proc *p, 231f263522aSJoseph Koshy uint32_t mode); 2326161b98cSMatt Macy static struct pmc_thread *pmc_find_thread_descriptor(struct pmc_process *pp, 2336161b98cSMatt Macy struct thread *td, uint32_t mode); 234c5153e19SJoseph Koshy static void pmc_force_context_switch(void); 235ebccf1e3SJoseph Koshy static void pmc_link_target_process(struct pmc *pm, 236ebccf1e3SJoseph Koshy struct pmc_process *pp); 237d07f36b0SJoseph Koshy static void pmc_log_all_process_mappings(struct pmc_owner *po); 238d07f36b0SJoseph Koshy static void pmc_log_kernel_mappings(struct pmc *pm); 239d07f36b0SJoseph Koshy static void pmc_log_process_mappings(struct pmc_owner *po, struct proc *p); 240f263522aSJoseph Koshy static void pmc_maybe_remove_owner(struct pmc_owner *po); 241e4fbd039SMitchell Horne static void pmc_post_callchain_callback(void); 242e4fbd039SMitchell Horne static void pmc_process_allproc(struct pmc *pm); 243f263522aSJoseph Koshy static void pmc_process_csw_in(struct thread *td); 244f263522aSJoseph Koshy static void pmc_process_csw_out(struct thread *td); 245c4981694SMitchell Horne static void pmc_process_exec(struct thread *td, 246c4981694SMitchell Horne struct pmckern_procexec *pk); 247ebccf1e3SJoseph Koshy static void pmc_process_exit(void *arg, struct proc *p); 248ebccf1e3SJoseph Koshy static void pmc_process_fork(void *arg, struct proc *p1, 249ebccf1e3SJoseph Koshy struct proc *p2, int n); 250e4fbd039SMitchell Horne static void pmc_process_proccreate(struct proc *p); 251d9f1b8dbSMatt Macy static void pmc_process_samples(int cpu, ring_type_t soft); 252e4fbd039SMitchell Horne static void pmc_process_threadcreate(struct thread *td); 253e4fbd039SMitchell Horne static void pmc_process_threadexit(struct thread *td); 2546161b98cSMatt Macy static void pmc_process_thread_add(struct thread *td); 2556161b98cSMatt Macy static void pmc_process_thread_delete(struct thread *td); 2565de96e33SMatt Macy static void pmc_process_thread_userret(struct thread *td); 257e4fbd039SMitchell Horne static void pmc_release_pmc_descriptor(struct pmc *pmc); 258f263522aSJoseph Koshy static void pmc_remove_owner(struct pmc_owner *po); 259f263522aSJoseph Koshy static void pmc_remove_process_descriptor(struct pmc_process *pp); 260ebccf1e3SJoseph Koshy static int pmc_start(struct pmc *pm); 261ebccf1e3SJoseph Koshy static int pmc_stop(struct pmc *pm); 262f263522aSJoseph Koshy static int pmc_syscall_handler(struct thread *td, void *syscall_args); 2636161b98cSMatt Macy static struct pmc_thread *pmc_thread_descriptor_pool_alloc(void); 2646161b98cSMatt Macy static void pmc_thread_descriptor_pool_drain(void); 2656161b98cSMatt Macy static void pmc_thread_descriptor_pool_free(struct pmc_thread *pt); 266f263522aSJoseph Koshy static void pmc_unlink_target_process(struct pmc *pmc, 267f263522aSJoseph Koshy struct pmc_process *pp); 268e4fbd039SMitchell Horne 269f5f9340bSFabien Thomas static int generic_switch_in(struct pmc_cpu *pc, struct pmc_process *pp); 270f5f9340bSFabien Thomas static int generic_switch_out(struct pmc_cpu *pc, struct pmc_process *pp); 271f5f9340bSFabien Thomas static struct pmc_mdep *pmc_generic_cpu_initialize(void); 272f5f9340bSFabien Thomas static void pmc_generic_cpu_finalize(struct pmc_mdep *md); 273ebfaf69cSMatt Macy 274ebccf1e3SJoseph Koshy /* 275ebccf1e3SJoseph Koshy * Kernel tunables and sysctl(8) interface. 276ebccf1e3SJoseph Koshy */ 277ebccf1e3SJoseph Koshy 278f5f9340bSFabien Thomas SYSCTL_DECL(_kern_hwpmc); 2797029da5cSPawel Biernacki SYSCTL_NODE(_kern_hwpmc, OID_AUTO, stats, CTLFLAG_RW | CTLFLAG_MPSAFE, 0, 2807029da5cSPawel Biernacki "HWPMC stats"); 281e6b475e0SMatt Macy 282e6b475e0SMatt Macy /* Stats. */ 283e6b475e0SMatt Macy SYSCTL_COUNTER_U64(_kern_hwpmc_stats, OID_AUTO, intr_ignored, CTLFLAG_RW, 284693cd307SMitchell Horne &pmc_stats.pm_intr_ignored, 285693cd307SMitchell Horne "# of interrupts ignored"); 286e6b475e0SMatt Macy SYSCTL_COUNTER_U64(_kern_hwpmc_stats, OID_AUTO, intr_processed, CTLFLAG_RW, 287693cd307SMitchell Horne &pmc_stats.pm_intr_processed, 288693cd307SMitchell Horne "# of interrupts processed"); 289e6b475e0SMatt Macy SYSCTL_COUNTER_U64(_kern_hwpmc_stats, OID_AUTO, intr_bufferfull, CTLFLAG_RW, 290693cd307SMitchell Horne &pmc_stats.pm_intr_bufferfull, 291693cd307SMitchell Horne "# of interrupts where buffer was full"); 292e6b475e0SMatt Macy SYSCTL_COUNTER_U64(_kern_hwpmc_stats, OID_AUTO, syscalls, CTLFLAG_RW, 293693cd307SMitchell Horne &pmc_stats.pm_syscalls, 294693cd307SMitchell Horne "# of syscalls"); 295e6b475e0SMatt Macy SYSCTL_COUNTER_U64(_kern_hwpmc_stats, OID_AUTO, syscall_errors, CTLFLAG_RW, 296693cd307SMitchell Horne &pmc_stats.pm_syscall_errors, 297693cd307SMitchell Horne "# of syscall_errors"); 298e6b475e0SMatt Macy SYSCTL_COUNTER_U64(_kern_hwpmc_stats, OID_AUTO, buffer_requests, CTLFLAG_RW, 299693cd307SMitchell Horne &pmc_stats.pm_buffer_requests, 300693cd307SMitchell Horne "# of buffer requests"); 301693cd307SMitchell Horne SYSCTL_COUNTER_U64(_kern_hwpmc_stats, OID_AUTO, buffer_requests_failed, 302693cd307SMitchell Horne CTLFLAG_RW, &pmc_stats.pm_buffer_requests_failed, 303693cd307SMitchell Horne "# of buffer requests which failed"); 304e6b475e0SMatt Macy SYSCTL_COUNTER_U64(_kern_hwpmc_stats, OID_AUTO, log_sweeps, CTLFLAG_RW, 305693cd307SMitchell Horne &pmc_stats.pm_log_sweeps, 306693cd307SMitchell Horne "# of times samples were processed"); 3075de96e33SMatt Macy SYSCTL_COUNTER_U64(_kern_hwpmc_stats, OID_AUTO, merges, CTLFLAG_RW, 308693cd307SMitchell Horne &pmc_stats.pm_merges, 309693cd307SMitchell Horne "# of times kernel stack was found for user trace"); 3105de96e33SMatt Macy SYSCTL_COUNTER_U64(_kern_hwpmc_stats, OID_AUTO, overwrites, CTLFLAG_RW, 311693cd307SMitchell Horne &pmc_stats.pm_overwrites, 312693cd307SMitchell Horne "# of times a sample was overwritten before being logged"); 313ebccf1e3SJoseph Koshy 314d07f36b0SJoseph Koshy static int pmc_callchaindepth = PMC_CALLCHAIN_DEPTH; 315af3b2549SHans Petter Selasky SYSCTL_INT(_kern_hwpmc, OID_AUTO, callchaindepth, CTLFLAG_RDTUN, 316693cd307SMitchell Horne &pmc_callchaindepth, 0, 317693cd307SMitchell Horne "depth of call chain records"); 318d07f36b0SJoseph Koshy 31924e337beSRyan Moeller char pmc_cpuid[PMC_CPUID_LEN]; 320e6b475e0SMatt Macy SYSCTL_STRING(_kern_hwpmc, OID_AUTO, cpuid, CTLFLAG_RD, 321693cd307SMitchell Horne pmc_cpuid, 0, 322693cd307SMitchell Horne "cpu version string"); 323693cd307SMitchell Horne 324680f1afdSJohn Baldwin #ifdef HWPMC_DEBUG 325f263522aSJoseph Koshy struct pmc_debugflags pmc_debugflags = PMC_DEBUG_DEFAULT_FLAGS; 326ebccf1e3SJoseph Koshy char pmc_debugstr[PMC_DEBUG_STRSIZE]; 327ebccf1e3SJoseph Koshy TUNABLE_STR(PMC_SYSCTL_NAME_PREFIX "debugflags", pmc_debugstr, 328ebccf1e3SJoseph Koshy sizeof(pmc_debugstr)); 329ebccf1e3SJoseph Koshy SYSCTL_PROC(_kern_hwpmc, OID_AUTO, debugflags, 3301886cef6SAlexander Motin CTLTYPE_STRING | CTLFLAG_RWTUN | CTLFLAG_NOFETCH | CTLFLAG_MPSAFE, 3317029da5cSPawel Biernacki 0, 0, pmc_debugflags_sysctl_handler, "A", 3327029da5cSPawel Biernacki "debug flags"); 333ebccf1e3SJoseph Koshy #endif 334ebccf1e3SJoseph Koshy 335ebccf1e3SJoseph Koshy /* 33601c35b67SMitchell Horne * kern.hwpmc.hashsize -- determines the number of rows in the 337ebccf1e3SJoseph Koshy * of the hash table used to look up threads 338ebccf1e3SJoseph Koshy */ 339ebccf1e3SJoseph Koshy static int pmc_hashsize = PMC_HASH_SIZE; 340af3b2549SHans Petter Selasky SYSCTL_INT(_kern_hwpmc, OID_AUTO, hashsize, CTLFLAG_RDTUN, 341693cd307SMitchell Horne &pmc_hashsize, 0, 342693cd307SMitchell Horne "rows in hash tables"); 343ebccf1e3SJoseph Koshy 344ebccf1e3SJoseph Koshy /* 345d07f36b0SJoseph Koshy * kern.hwpmc.nsamples --- number of PC samples/callchain stacks per CPU 346ebccf1e3SJoseph Koshy */ 347f263522aSJoseph Koshy static int pmc_nsamples = PMC_NSAMPLES; 348af3b2549SHans Petter Selasky SYSCTL_INT(_kern_hwpmc, OID_AUTO, nsamples, CTLFLAG_RDTUN, 349693cd307SMitchell Horne &pmc_nsamples, 0, 350693cd307SMitchell Horne "number of PC samples per CPU"); 351ebccf1e3SJoseph Koshy 352d9f1b8dbSMatt Macy static uint64_t pmc_sample_mask = PMC_NSAMPLES - 1; 353d07f36b0SJoseph Koshy 354ebccf1e3SJoseph Koshy /* 355f263522aSJoseph Koshy * kern.hwpmc.mtxpoolsize -- number of mutexes in the mutex pool. 356ebccf1e3SJoseph Koshy */ 357ebccf1e3SJoseph Koshy static int pmc_mtxpool_size = PMC_MTXPOOL_SIZE; 358af3b2549SHans Petter Selasky SYSCTL_INT(_kern_hwpmc, OID_AUTO, mtxpoolsize, CTLFLAG_RDTUN, 359693cd307SMitchell Horne &pmc_mtxpool_size, 0, 360693cd307SMitchell Horne "size of spin mutex pool"); 361ebccf1e3SJoseph Koshy 362ebccf1e3SJoseph Koshy /* 3636161b98cSMatt Macy * kern.hwpmc.threadfreelist_entries -- number of free entries 3646161b98cSMatt Macy */ 3656161b98cSMatt Macy SYSCTL_INT(_kern_hwpmc, OID_AUTO, threadfreelist_entries, CTLFLAG_RD, 366693cd307SMitchell Horne &pmc_threadfreelist_entries, 0, 367693cd307SMitchell Horne "number of available thread entries"); 3686161b98cSMatt Macy 3696161b98cSMatt Macy /* 3706161b98cSMatt Macy * kern.hwpmc.threadfreelist_max -- maximum number of free entries 3716161b98cSMatt Macy */ 3726161b98cSMatt Macy static int pmc_threadfreelist_max = PMC_THREADLIST_MAX; 3736161b98cSMatt Macy SYSCTL_INT(_kern_hwpmc, OID_AUTO, threadfreelist_max, CTLFLAG_RW, 3746161b98cSMatt Macy &pmc_threadfreelist_max, 0, 3756161b98cSMatt Macy "maximum number of available thread entries before freeing some"); 3766161b98cSMatt Macy 3776161b98cSMatt Macy /* 378ca341f3cSJohn Baldwin * kern.hwpmc.mincount -- minimum sample count 379ca341f3cSJohn Baldwin */ 380ca341f3cSJohn Baldwin static u_int pmc_mincount = 1000; 381ca341f3cSJohn Baldwin SYSCTL_INT(_kern_hwpmc, OID_AUTO, mincount, CTLFLAG_RWTUN, 382ca341f3cSJohn Baldwin &pmc_mincount, 0, 383ca341f3cSJohn Baldwin "minimum count for sampling counters"); 384ca341f3cSJohn Baldwin 385ca341f3cSJohn Baldwin /* 386ebccf1e3SJoseph Koshy * security.bsd.unprivileged_syspmcs -- allow non-root processes to 387ebccf1e3SJoseph Koshy * allocate system-wide PMCs. 388ebccf1e3SJoseph Koshy * 389ebccf1e3SJoseph Koshy * Allowing unprivileged processes to allocate system PMCs is convenient 390ebccf1e3SJoseph Koshy * if system-wide measurements need to be taken concurrently with other 391ebccf1e3SJoseph Koshy * per-process measurements. This feature is turned off by default. 392ebccf1e3SJoseph Koshy */ 393ebccf1e3SJoseph Koshy static int pmc_unprivileged_syspmcs = 0; 394af3b2549SHans Petter Selasky SYSCTL_INT(_security_bsd, OID_AUTO, unprivileged_syspmcs, CTLFLAG_RWTUN, 395ebccf1e3SJoseph Koshy &pmc_unprivileged_syspmcs, 0, 396ebccf1e3SJoseph Koshy "allow unprivileged process to allocate system PMCs"); 397ebccf1e3SJoseph Koshy 398f263522aSJoseph Koshy /* 399f263522aSJoseph Koshy * Hash function. Discard the lower 2 bits of the pointer since 400f263522aSJoseph Koshy * these are always zero for our uses. The hash multiplier is 401f263522aSJoseph Koshy * round((2^LONG_BIT) * ((sqrt(5)-1)/2)). 402f263522aSJoseph Koshy */ 403ebccf1e3SJoseph Koshy #if LONG_BIT == 64 404ebccf1e3SJoseph Koshy #define _PMC_HM 11400714819323198486u 405ebccf1e3SJoseph Koshy #elif LONG_BIT == 32 406ebccf1e3SJoseph Koshy #define _PMC_HM 2654435769u 407ebccf1e3SJoseph Koshy #else 408ebccf1e3SJoseph Koshy #error Must know the size of 'long' to compile 409ebccf1e3SJoseph Koshy #endif 410ebccf1e3SJoseph Koshy 411ebccf1e3SJoseph Koshy #define PMC_HASH_PTR(P,M) ((((unsigned long) (P) >> 2) * _PMC_HM) & (M)) 412ebccf1e3SJoseph Koshy 413ebccf1e3SJoseph Koshy /* 414ebccf1e3SJoseph Koshy * Syscall structures 415ebccf1e3SJoseph Koshy */ 416ebccf1e3SJoseph Koshy 417ebccf1e3SJoseph Koshy /* The `sysent' for the new syscall */ 418ebccf1e3SJoseph Koshy static struct sysent pmc_sysent = { 4191cfbc451SKonstantin Belousov .sy_narg = 2, 4201cfbc451SKonstantin Belousov .sy_call = pmc_syscall_handler, 421ebccf1e3SJoseph Koshy }; 422ebccf1e3SJoseph Koshy 423ebccf1e3SJoseph Koshy static struct syscall_module_data pmc_syscall_mod = { 4241cfbc451SKonstantin Belousov .chainevh = load, 4251cfbc451SKonstantin Belousov .chainarg = NULL, 4261cfbc451SKonstantin Belousov .offset = &pmc_syscall_num, 4271cfbc451SKonstantin Belousov .new_sysent = &pmc_sysent, 4281cfbc451SKonstantin Belousov .old_sysent = { .sy_narg = 0, .sy_call = NULL }, 4291cfbc451SKonstantin Belousov .flags = SY_THR_STATIC_KLD, 430ebccf1e3SJoseph Koshy }; 431ebccf1e3SJoseph Koshy 432ebccf1e3SJoseph Koshy static moduledata_t pmc_mod = { 4331cfbc451SKonstantin Belousov .name = PMC_MODULE_NAME, 4341cfbc451SKonstantin Belousov .evhand = syscall_module_handler, 4351cfbc451SKonstantin Belousov .priv = &pmc_syscall_mod, 436ebccf1e3SJoseph Koshy }; 437ebccf1e3SJoseph Koshy 438fdce57a0SJohn Baldwin #ifdef EARLY_AP_STARTUP 439fdce57a0SJohn Baldwin DECLARE_MODULE(pmc, pmc_mod, SI_SUB_SYSCALLS, SI_ORDER_ANY); 440fdce57a0SJohn Baldwin #else 441ebccf1e3SJoseph Koshy DECLARE_MODULE(pmc, pmc_mod, SI_SUB_SMP, SI_ORDER_ANY); 442fdce57a0SJohn Baldwin #endif 443ebccf1e3SJoseph Koshy MODULE_VERSION(pmc, PMC_VERSION); 444ebccf1e3SJoseph Koshy 445680f1afdSJohn Baldwin #ifdef HWPMC_DEBUG 446f263522aSJoseph Koshy enum pmc_dbgparse_state { 447f263522aSJoseph Koshy PMCDS_WS, /* in whitespace */ 448f263522aSJoseph Koshy PMCDS_MAJOR, /* seen a major keyword */ 449f263522aSJoseph Koshy PMCDS_MINOR 450f263522aSJoseph Koshy }; 451f263522aSJoseph Koshy 452ebccf1e3SJoseph Koshy static int 453ebccf1e3SJoseph Koshy pmc_debugflags_parse(char *newstr, char *fence) 454ebccf1e3SJoseph Koshy { 455f263522aSJoseph Koshy struct pmc_debugflags *tmpflags; 456f263522aSJoseph Koshy size_t kwlen; 45701c35b67SMitchell Horne char c, *p, *q; 45801c35b67SMitchell Horne int error, *newbits, tmp; 45901c35b67SMitchell Horne int found; 460ebccf1e3SJoseph Koshy 461e11e3f18SDag-Erling Smørgrav tmpflags = malloc(sizeof(*tmpflags), M_PMC, M_WAITOK | M_ZERO); 462ebccf1e3SJoseph Koshy 463f263522aSJoseph Koshy error = 0; 464d5ee4074SMitchell Horne for (p = newstr; p < fence && (c = *p); p++) { 465f263522aSJoseph Koshy /* skip white space */ 466f263522aSJoseph Koshy if (c == ' ' || c == '\t') 467f263522aSJoseph Koshy continue; 468f263522aSJoseph Koshy 469f263522aSJoseph Koshy /* look for a keyword followed by "=" */ 470f263522aSJoseph Koshy for (q = p; p < fence && (c = *p) && c != '='; p++) 471f263522aSJoseph Koshy ; 472f263522aSJoseph Koshy if (c != '=') { 473f263522aSJoseph Koshy error = EINVAL; 474f263522aSJoseph Koshy goto done; 475ebccf1e3SJoseph Koshy } 476ebccf1e3SJoseph Koshy 477f263522aSJoseph Koshy kwlen = p - q; 478f263522aSJoseph Koshy newbits = NULL; 479ebccf1e3SJoseph Koshy 480f263522aSJoseph Koshy /* lookup flag group name */ 481f263522aSJoseph Koshy #define DBG_SET_FLAG_MAJ(S,F) \ 482f263522aSJoseph Koshy if (kwlen == sizeof(S)-1 && strncmp(q, S, kwlen) == 0) \ 483f263522aSJoseph Koshy newbits = &tmpflags->pdb_ ## F; 484ebccf1e3SJoseph Koshy 485f263522aSJoseph Koshy DBG_SET_FLAG_MAJ("cpu", CPU); 486f263522aSJoseph Koshy DBG_SET_FLAG_MAJ("csw", CSW); 487f263522aSJoseph Koshy DBG_SET_FLAG_MAJ("logging", LOG); 488f263522aSJoseph Koshy DBG_SET_FLAG_MAJ("module", MOD); 489f263522aSJoseph Koshy DBG_SET_FLAG_MAJ("md", MDP); 490f263522aSJoseph Koshy DBG_SET_FLAG_MAJ("owner", OWN); 491f263522aSJoseph Koshy DBG_SET_FLAG_MAJ("pmc", PMC); 492f263522aSJoseph Koshy DBG_SET_FLAG_MAJ("process", PRC); 493f263522aSJoseph Koshy DBG_SET_FLAG_MAJ("sampling", SAM); 49401c35b67SMitchell Horne #undef DBG_SET_FLAG_MAJ 495ebccf1e3SJoseph Koshy 496f263522aSJoseph Koshy if (newbits == NULL) { 497f263522aSJoseph Koshy error = EINVAL; 498f263522aSJoseph Koshy goto done; 499ebccf1e3SJoseph Koshy } 500ebccf1e3SJoseph Koshy 501f263522aSJoseph Koshy p++; /* skip the '=' */ 502ebccf1e3SJoseph Koshy 503f263522aSJoseph Koshy /* Now parse the individual flags */ 504f263522aSJoseph Koshy tmp = 0; 505f263522aSJoseph Koshy newflag: 506f263522aSJoseph Koshy for (q = p; p < fence && (c = *p); p++) 507f263522aSJoseph Koshy if (c == ' ' || c == '\t' || c == ',') 508f263522aSJoseph Koshy break; 509f263522aSJoseph Koshy 510f263522aSJoseph Koshy /* p == fence or c == ws or c == "," or c == 0 */ 511f263522aSJoseph Koshy 512f263522aSJoseph Koshy if ((kwlen = p - q) == 0) { 513f263522aSJoseph Koshy *newbits = tmp; 514f263522aSJoseph Koshy continue; 515f263522aSJoseph Koshy } 516f263522aSJoseph Koshy 517f263522aSJoseph Koshy found = 0; 518f263522aSJoseph Koshy #define DBG_SET_FLAG_MIN(S,F) \ 519f263522aSJoseph Koshy if (kwlen == sizeof(S)-1 && strncmp(q, S, kwlen) == 0) \ 520f263522aSJoseph Koshy tmp |= found = (1 << PMC_DEBUG_MIN_ ## F) 521f263522aSJoseph Koshy 522f263522aSJoseph Koshy /* a '*' denotes all possible flags in the group */ 523f263522aSJoseph Koshy if (kwlen == 1 && *q == '*') 524f263522aSJoseph Koshy tmp = found = ~0; 525f263522aSJoseph Koshy /* look for individual flag names */ 526f263522aSJoseph Koshy DBG_SET_FLAG_MIN("allocaterow", ALR); 527f263522aSJoseph Koshy DBG_SET_FLAG_MIN("allocate", ALL); 528f263522aSJoseph Koshy DBG_SET_FLAG_MIN("attach", ATT); 529f263522aSJoseph Koshy DBG_SET_FLAG_MIN("bind", BND); 530f263522aSJoseph Koshy DBG_SET_FLAG_MIN("config", CFG); 531f263522aSJoseph Koshy DBG_SET_FLAG_MIN("exec", EXC); 532f263522aSJoseph Koshy DBG_SET_FLAG_MIN("exit", EXT); 533f263522aSJoseph Koshy DBG_SET_FLAG_MIN("find", FND); 534f263522aSJoseph Koshy DBG_SET_FLAG_MIN("flush", FLS); 535f263522aSJoseph Koshy DBG_SET_FLAG_MIN("fork", FRK); 536f263522aSJoseph Koshy DBG_SET_FLAG_MIN("getbuf", GTB); 537f263522aSJoseph Koshy DBG_SET_FLAG_MIN("hook", PMH); 538f263522aSJoseph Koshy DBG_SET_FLAG_MIN("init", INI); 539f263522aSJoseph Koshy DBG_SET_FLAG_MIN("intr", INT); 540f263522aSJoseph Koshy DBG_SET_FLAG_MIN("linktarget", TLK); 541f263522aSJoseph Koshy DBG_SET_FLAG_MIN("mayberemove", OMR); 542f263522aSJoseph Koshy DBG_SET_FLAG_MIN("ops", OPS); 543f263522aSJoseph Koshy DBG_SET_FLAG_MIN("read", REA); 544f263522aSJoseph Koshy DBG_SET_FLAG_MIN("register", REG); 545f263522aSJoseph Koshy DBG_SET_FLAG_MIN("release", REL); 546f263522aSJoseph Koshy DBG_SET_FLAG_MIN("remove", ORM); 547f263522aSJoseph Koshy DBG_SET_FLAG_MIN("sample", SAM); 548f263522aSJoseph Koshy DBG_SET_FLAG_MIN("scheduleio", SIO); 549f263522aSJoseph Koshy DBG_SET_FLAG_MIN("select", SEL); 550f263522aSJoseph Koshy DBG_SET_FLAG_MIN("signal", SIG); 551f263522aSJoseph Koshy DBG_SET_FLAG_MIN("swi", SWI); 552f263522aSJoseph Koshy DBG_SET_FLAG_MIN("swo", SWO); 553f263522aSJoseph Koshy DBG_SET_FLAG_MIN("start", STA); 554f263522aSJoseph Koshy DBG_SET_FLAG_MIN("stop", STO); 555f263522aSJoseph Koshy DBG_SET_FLAG_MIN("syscall", PMS); 556f263522aSJoseph Koshy DBG_SET_FLAG_MIN("unlinktarget", TUL); 557f263522aSJoseph Koshy DBG_SET_FLAG_MIN("write", WRI); 55801c35b67SMitchell Horne #undef DBG_SET_FLAG_MIN 559f263522aSJoseph Koshy if (found == 0) { 560f263522aSJoseph Koshy /* unrecognized flag name */ 561f263522aSJoseph Koshy error = EINVAL; 562f263522aSJoseph Koshy goto done; 563f263522aSJoseph Koshy } 564f263522aSJoseph Koshy 565f263522aSJoseph Koshy if (c == 0 || c == ' ' || c == '\t') { /* end of flag group */ 566f263522aSJoseph Koshy *newbits = tmp; 567f263522aSJoseph Koshy continue; 568f263522aSJoseph Koshy } 569f263522aSJoseph Koshy 570f263522aSJoseph Koshy p++; 571f263522aSJoseph Koshy goto newflag; 572f263522aSJoseph Koshy } 573f263522aSJoseph Koshy 574f263522aSJoseph Koshy /* save the new flag set */ 575f263522aSJoseph Koshy bcopy(tmpflags, &pmc_debugflags, sizeof(pmc_debugflags)); 576f263522aSJoseph Koshy done: 5771ede983cSDag-Erling Smørgrav free(tmpflags, M_PMC); 57852ebac7fSMitchell Horne return (error); 579ebccf1e3SJoseph Koshy } 580ebccf1e3SJoseph Koshy 581ebccf1e3SJoseph Koshy static int 582ebccf1e3SJoseph Koshy pmc_debugflags_sysctl_handler(SYSCTL_HANDLER_ARGS) 583ebccf1e3SJoseph Koshy { 584ebccf1e3SJoseph Koshy char *fence, *newstr; 585ebccf1e3SJoseph Koshy int error; 58601c35b67SMitchell Horne u_int n; 587ebccf1e3SJoseph Koshy 588ebccf1e3SJoseph Koshy n = sizeof(pmc_debugstr); 589e829eb6dSJoseph Koshy newstr = malloc(n, M_PMC, M_WAITOK | M_ZERO); 59001c35b67SMitchell Horne strlcpy(newstr, pmc_debugstr, n); 591ebccf1e3SJoseph Koshy 592ebccf1e3SJoseph Koshy error = sysctl_handle_string(oidp, newstr, n, req); 593ebccf1e3SJoseph Koshy 594ebccf1e3SJoseph Koshy /* if there is a new string, parse and copy it */ 595ebccf1e3SJoseph Koshy if (error == 0 && req->newptr != NULL) { 596f263522aSJoseph Koshy fence = newstr + (n < req->newlen ? n : req->newlen + 1); 597d5ee4074SMitchell Horne error = pmc_debugflags_parse(newstr, fence); 598d5ee4074SMitchell Horne if (error == 0) 599d5ee4074SMitchell Horne strlcpy(pmc_debugstr, newstr, sizeof(pmc_debugstr)); 600ebccf1e3SJoseph Koshy } 6011ede983cSDag-Erling Smørgrav free(newstr, M_PMC); 602ebccf1e3SJoseph Koshy 60352ebac7fSMitchell Horne return (error); 604ebccf1e3SJoseph Koshy } 605ebccf1e3SJoseph Koshy #endif 606ebccf1e3SJoseph Koshy 607ebccf1e3SJoseph Koshy /* 608e829eb6dSJoseph Koshy * Map a row index to a classdep structure and return the adjusted row 609e829eb6dSJoseph Koshy * index for the PMC class index. 610e829eb6dSJoseph Koshy */ 611e829eb6dSJoseph Koshy static struct pmc_classdep * 61201c35b67SMitchell Horne pmc_ri_to_classdep(struct pmc_mdep *md __unused, int ri, int *adjri) 613e829eb6dSJoseph Koshy { 614e829eb6dSJoseph Koshy struct pmc_classdep *pcd; 615e829eb6dSJoseph Koshy 616e829eb6dSJoseph Koshy KASSERT(ri >= 0 && ri < md->pmd_npmc, 617e829eb6dSJoseph Koshy ("[pmc,%d] illegal row-index %d", __LINE__, ri)); 618e829eb6dSJoseph Koshy 619e829eb6dSJoseph Koshy pcd = pmc_rowindex_to_classdep[ri]; 620e829eb6dSJoseph Koshy KASSERT(pcd != NULL, 621e5087dd8SRui Paulo ("[pmc,%d] ri %d null pcd", __LINE__, ri)); 622e829eb6dSJoseph Koshy 623e829eb6dSJoseph Koshy *adjri = ri - pcd->pcd_ri; 624e829eb6dSJoseph Koshy KASSERT(*adjri >= 0 && *adjri < pcd->pcd_num, 625e829eb6dSJoseph Koshy ("[pmc,%d] adjusted row-index %d", __LINE__, *adjri)); 626e829eb6dSJoseph Koshy 627e829eb6dSJoseph Koshy return (pcd); 628e829eb6dSJoseph Koshy } 629e829eb6dSJoseph Koshy 630e829eb6dSJoseph Koshy /* 631ebccf1e3SJoseph Koshy * Concurrency Control 632ebccf1e3SJoseph Koshy * 633ebccf1e3SJoseph Koshy * The driver manages the following data structures: 634ebccf1e3SJoseph Koshy * 635ebccf1e3SJoseph Koshy * - target process descriptors, one per target process 636ebccf1e3SJoseph Koshy * - owner process descriptors (and attached lists), one per owner process 637ebccf1e3SJoseph Koshy * - lookup hash tables for owner and target processes 638ebccf1e3SJoseph Koshy * - PMC descriptors (and attached lists) 639ebccf1e3SJoseph Koshy * - per-cpu hardware state 640ebccf1e3SJoseph Koshy * - the 'hook' variable through which the kernel calls into 641ebccf1e3SJoseph Koshy * this module 642ebccf1e3SJoseph Koshy * - the machine hardware state (managed by the MD layer) 643ebccf1e3SJoseph Koshy * 644ebccf1e3SJoseph Koshy * These data structures are accessed from: 645ebccf1e3SJoseph Koshy * 646ebccf1e3SJoseph Koshy * - thread context-switch code 647ebccf1e3SJoseph Koshy * - interrupt handlers (possibly on multiple cpus) 648ebccf1e3SJoseph Koshy * - kernel threads on multiple cpus running on behalf of user 649ebccf1e3SJoseph Koshy * processes doing system calls 650ebccf1e3SJoseph Koshy * - this driver's private kernel threads 651ebccf1e3SJoseph Koshy * 652ebccf1e3SJoseph Koshy * = Locks and Locking strategy = 653ebccf1e3SJoseph Koshy * 654ebccf1e3SJoseph Koshy * The driver uses four locking strategies for its operation: 655ebccf1e3SJoseph Koshy * 656382d30cdSJoseph Koshy * - The global SX lock "pmc_sx" is used to protect internal 657382d30cdSJoseph Koshy * data structures. 658ebccf1e3SJoseph Koshy * 659382d30cdSJoseph Koshy * Calls into the module by syscall() start with this lock being 660382d30cdSJoseph Koshy * held in exclusive mode. Depending on the requested operation, 661382d30cdSJoseph Koshy * the lock may be downgraded to 'shared' mode to allow more 662382d30cdSJoseph Koshy * concurrent readers into the module. Calls into the module from 663382d30cdSJoseph Koshy * other parts of the kernel acquire the lock in shared mode. 664ebccf1e3SJoseph Koshy * 665ebccf1e3SJoseph Koshy * This SX lock is held in exclusive mode for any operations that 666ebccf1e3SJoseph Koshy * modify the linkages between the driver's internal data structures. 667ebccf1e3SJoseph Koshy * 668ebccf1e3SJoseph Koshy * The 'pmc_hook' function pointer is also protected by this lock. 669ebccf1e3SJoseph Koshy * It is only examined with the sx lock held in exclusive mode. The 670382d30cdSJoseph Koshy * kernel module is allowed to be unloaded only with the sx lock held 671382d30cdSJoseph Koshy * in exclusive mode. In normal syscall handling, after acquiring the 672382d30cdSJoseph Koshy * pmc_sx lock we first check that 'pmc_hook' is non-null before 673382d30cdSJoseph Koshy * proceeding. This prevents races between the thread unloading the module 674382d30cdSJoseph Koshy * and other threads seeking to use the module. 675ebccf1e3SJoseph Koshy * 676ebccf1e3SJoseph Koshy * - Lookups of target process structures and owner process structures 677ebccf1e3SJoseph Koshy * cannot use the global "pmc_sx" SX lock because these lookups need 678ebccf1e3SJoseph Koshy * to happen during context switches and in other critical sections 679ebccf1e3SJoseph Koshy * where sleeping is not allowed. We protect these lookup tables 680ebccf1e3SJoseph Koshy * with their own private spin-mutexes, "pmc_processhash_mtx" and 681382d30cdSJoseph Koshy * "pmc_ownerhash_mtx". 682ebccf1e3SJoseph Koshy * 683ebccf1e3SJoseph Koshy * - Interrupt handlers work in a lock free manner. At interrupt 684ebccf1e3SJoseph Koshy * time, handlers look at the PMC pointer (phw->phw_pmc) configured 685ebccf1e3SJoseph Koshy * when the PMC was started. If this pointer is NULL, the interrupt 686ebccf1e3SJoseph Koshy * is ignored after updating driver statistics. We ensure that this 687ebccf1e3SJoseph Koshy * pointer is set (using an atomic operation if necessary) before the 688ebccf1e3SJoseph Koshy * PMC hardware is started. Conversely, this pointer is unset atomically 689ebccf1e3SJoseph Koshy * only after the PMC hardware is stopped. 690ebccf1e3SJoseph Koshy * 691ebccf1e3SJoseph Koshy * We ensure that everything needed for the operation of an 692ebccf1e3SJoseph Koshy * interrupt handler is available without it needing to acquire any 693ebccf1e3SJoseph Koshy * locks. We also ensure that a PMC's software state is destroyed only 694ebccf1e3SJoseph Koshy * after the PMC is taken off hardware (on all CPUs). 695ebccf1e3SJoseph Koshy * 696ebccf1e3SJoseph Koshy * - Context-switch handling with process-private PMCs needs more 697ebccf1e3SJoseph Koshy * care. 698ebccf1e3SJoseph Koshy * 699ebccf1e3SJoseph Koshy * A given process may be the target of multiple PMCs. For example, 700ebccf1e3SJoseph Koshy * PMCATTACH and PMCDETACH may be requested by a process on one CPU 701ebccf1e3SJoseph Koshy * while the target process is running on another. A PMC could also 702ebccf1e3SJoseph Koshy * be getting released because its owner is exiting. We tackle 703ebccf1e3SJoseph Koshy * these situations in the following manner: 704ebccf1e3SJoseph Koshy * 705ebccf1e3SJoseph Koshy * - each target process structure 'pmc_process' has an array 706ebccf1e3SJoseph Koshy * of 'struct pmc *' pointers, one for each hardware PMC. 707ebccf1e3SJoseph Koshy * 708ebccf1e3SJoseph Koshy * - At context switch IN time, each "target" PMC in RUNNING state 709ebccf1e3SJoseph Koshy * gets started on hardware and a pointer to each PMC is copied into 710ebccf1e3SJoseph Koshy * the per-cpu phw array. The 'runcount' for the PMC is 711ebccf1e3SJoseph Koshy * incremented. 712ebccf1e3SJoseph Koshy * 713ebccf1e3SJoseph Koshy * - At context switch OUT time, all process-virtual PMCs are stopped 714ebccf1e3SJoseph Koshy * on hardware. The saved value is added to the PMCs value field 715ebccf1e3SJoseph Koshy * only if the PMC is in a non-deleted state (the PMCs state could 716ebccf1e3SJoseph Koshy * have changed during the current time slice). 717ebccf1e3SJoseph Koshy * 718ebccf1e3SJoseph Koshy * Note that since in-between a switch IN on a processor and a switch 719ebccf1e3SJoseph Koshy * OUT, the PMC could have been released on another CPU. Therefore 720ebccf1e3SJoseph Koshy * context switch OUT always looks at the hardware state to turn 721ebccf1e3SJoseph Koshy * OFF PMCs and will update a PMC's saved value only if reachable 722ebccf1e3SJoseph Koshy * from the target process record. 723ebccf1e3SJoseph Koshy * 724ebccf1e3SJoseph Koshy * - OP PMCRELEASE could be called on a PMC at any time (the PMC could 725ebccf1e3SJoseph Koshy * be attached to many processes at the time of the call and could 726ebccf1e3SJoseph Koshy * be active on multiple CPUs). 727ebccf1e3SJoseph Koshy * 728ebccf1e3SJoseph Koshy * We prevent further scheduling of the PMC by marking it as in 729ebccf1e3SJoseph Koshy * state 'DELETED'. If the runcount of the PMC is non-zero then 730ebccf1e3SJoseph Koshy * this PMC is currently running on a CPU somewhere. The thread 7314d70511aSJohn Baldwin * doing the PMCRELEASE operation waits by repeatedly doing a 7324d70511aSJohn Baldwin * pause() till the runcount comes to zero. 733ebccf1e3SJoseph Koshy * 734382d30cdSJoseph Koshy * The contents of a PMC descriptor (struct pmc) are protected using 735382d30cdSJoseph Koshy * a spin-mutex. In order to save space, we use a mutex pool. 736382d30cdSJoseph Koshy * 737382d30cdSJoseph Koshy * In terms of lock types used by witness(4), we use: 738382d30cdSJoseph Koshy * - Type "pmc-sx", used by the global SX lock. 739382d30cdSJoseph Koshy * - Type "pmc-sleep", for sleep mutexes used by logger threads. 740382d30cdSJoseph Koshy * - Type "pmc-per-proc", for protecting PMC owner descriptors. 741382d30cdSJoseph Koshy * - Type "pmc-leaf", used for all other spin mutexes. 742ebccf1e3SJoseph Koshy */ 743ebccf1e3SJoseph Koshy 744ebccf1e3SJoseph Koshy /* 74501c35b67SMitchell Horne * Save the CPU binding of the current kthread. 746ebccf1e3SJoseph Koshy */ 747eff9ee7cSAlexander Motin void 748ebccf1e3SJoseph Koshy pmc_save_cpu_binding(struct pmc_binding *pb) 749ebccf1e3SJoseph Koshy { 7504a3690dfSJohn Baldwin PMCDBG0(CPU,BND,2, "save-cpu"); 751982d11f8SJeff Roberson thread_lock(curthread); 752ebccf1e3SJoseph Koshy pb->pb_bound = sched_is_bound(curthread); 753ebccf1e3SJoseph Koshy pb->pb_cpu = curthread->td_oncpu; 754eff9ee7cSAlexander Motin pb->pb_priority = curthread->td_priority; 755982d11f8SJeff Roberson thread_unlock(curthread); 7564a3690dfSJohn Baldwin PMCDBG1(CPU,BND,2, "save-cpu cpu=%d", pb->pb_cpu); 757ebccf1e3SJoseph Koshy } 758ebccf1e3SJoseph Koshy 759ebccf1e3SJoseph Koshy /* 76001c35b67SMitchell Horne * Restore the CPU binding of the current thread. 761ebccf1e3SJoseph Koshy */ 762eff9ee7cSAlexander Motin void 763ebccf1e3SJoseph Koshy pmc_restore_cpu_binding(struct pmc_binding *pb) 764ebccf1e3SJoseph Koshy { 7654a3690dfSJohn Baldwin PMCDBG2(CPU,BND,2, "restore-cpu curcpu=%d restore=%d", 766ebccf1e3SJoseph Koshy curthread->td_oncpu, pb->pb_cpu); 767982d11f8SJeff Roberson thread_lock(curthread); 768ebccf1e3SJoseph Koshy sched_bind(curthread, pb->pb_cpu); 769eff9ee7cSAlexander Motin if (!pb->pb_bound) 770ebccf1e3SJoseph Koshy sched_unbind(curthread); 771eff9ee7cSAlexander Motin sched_prio(curthread, pb->pb_priority); 772982d11f8SJeff Roberson thread_unlock(curthread); 7734a3690dfSJohn Baldwin PMCDBG0(CPU,BND,2, "restore-cpu done"); 774ebccf1e3SJoseph Koshy } 775ebccf1e3SJoseph Koshy 776ebccf1e3SJoseph Koshy /* 77701c35b67SMitchell Horne * Move execution over to the specified CPU and bind it there. 778ebccf1e3SJoseph Koshy */ 779eff9ee7cSAlexander Motin void 780ebccf1e3SJoseph Koshy pmc_select_cpu(int cpu) 781ebccf1e3SJoseph Koshy { 782122ccdc1SJoseph Koshy KASSERT(cpu >= 0 && cpu < pmc_cpu_max(), 783ebccf1e3SJoseph Koshy ("[pmc,%d] bad cpu number %d", __LINE__, cpu)); 784ebccf1e3SJoseph Koshy 785122ccdc1SJoseph Koshy /* Never move to an inactive CPU. */ 786122ccdc1SJoseph Koshy KASSERT(pmc_cpu_is_active(cpu), ("[pmc,%d] selecting inactive " 787122ccdc1SJoseph Koshy "CPU %d", __LINE__, cpu)); 788ebccf1e3SJoseph Koshy 7894a3690dfSJohn Baldwin PMCDBG1(CPU,SEL,2, "select-cpu cpu=%d", cpu); 790982d11f8SJeff Roberson thread_lock(curthread); 791eff9ee7cSAlexander Motin sched_prio(curthread, PRI_MIN); 792ebccf1e3SJoseph Koshy sched_bind(curthread, cpu); 793982d11f8SJeff Roberson thread_unlock(curthread); 794ebccf1e3SJoseph Koshy 795ebccf1e3SJoseph Koshy KASSERT(curthread->td_oncpu == cpu, 796ebccf1e3SJoseph Koshy ("[pmc,%d] CPU not bound [cpu=%d, curr=%d]", __LINE__, 797ebccf1e3SJoseph Koshy cpu, curthread->td_oncpu)); 798ebccf1e3SJoseph Koshy 7994a3690dfSJohn Baldwin PMCDBG1(CPU,SEL,2, "select-cpu cpu=%d ok", cpu); 800ebccf1e3SJoseph Koshy } 801ebccf1e3SJoseph Koshy 802ebccf1e3SJoseph Koshy /* 803c5153e19SJoseph Koshy * Force a context switch. 804c5153e19SJoseph Koshy * 8054d70511aSJohn Baldwin * We do this by pause'ing for 1 tick -- invoking mi_switch() is not 806c5153e19SJoseph Koshy * guaranteed to force a context switch. 807c5153e19SJoseph Koshy */ 808c5153e19SJoseph Koshy static void 809c5153e19SJoseph Koshy pmc_force_context_switch(void) 810c5153e19SJoseph Koshy { 811c5153e19SJoseph Koshy 8124d70511aSJohn Baldwin pause("pmcctx", 1); 813c5153e19SJoseph Koshy } 814c5153e19SJoseph Koshy 815f992dd4bSMatt Macy uint64_t 816f992dd4bSMatt Macy pmc_rdtsc(void) 817f992dd4bSMatt Macy { 818f992dd4bSMatt Macy #if defined(__i386__) || defined(__amd64__) 819f992dd4bSMatt Macy if (__predict_true(amd_feature & AMDID_RDTSCP)) 82052ebac7fSMitchell Horne return (rdtscp()); 821f992dd4bSMatt Macy else 82252ebac7fSMitchell Horne return (rdtsc()); 823f992dd4bSMatt Macy #else 82452ebac7fSMitchell Horne return (get_cyclecount()); 825f992dd4bSMatt Macy #endif 826f992dd4bSMatt Macy } 827f992dd4bSMatt Macy 828c5153e19SJoseph Koshy /* 829f263522aSJoseph Koshy * Get the file name for an executable. This is a simple wrapper 830f263522aSJoseph Koshy * around vn_fullpath(9). 831ebccf1e3SJoseph Koshy */ 832f263522aSJoseph Koshy static void 83315139246SJoseph Koshy pmc_getfilename(struct vnode *v, char **fullpath, char **freepath) 834ebccf1e3SJoseph Koshy { 835ebccf1e3SJoseph Koshy 836f263522aSJoseph Koshy *fullpath = "unknown"; 837f263522aSJoseph Koshy *freepath = NULL; 838feabaaf9SMateusz Guzik vn_fullpath(v, fullpath, freepath); 839ebccf1e3SJoseph Koshy } 840ebccf1e3SJoseph Koshy 841ebccf1e3SJoseph Koshy /* 84201c35b67SMitchell Horne * Remove a process owning PMCs. 843ebccf1e3SJoseph Koshy */ 844ebccf1e3SJoseph Koshy void 845ebccf1e3SJoseph Koshy pmc_remove_owner(struct pmc_owner *po) 846ebccf1e3SJoseph Koshy { 847f263522aSJoseph Koshy struct pmc *pm, *tmp; 848ebccf1e3SJoseph Koshy 849ebccf1e3SJoseph Koshy sx_assert(&pmc_sx, SX_XLOCKED); 850ebccf1e3SJoseph Koshy 8514a3690dfSJohn Baldwin PMCDBG1(OWN,ORM,1, "remove-owner po=%p", po); 852ebccf1e3SJoseph Koshy 853ebccf1e3SJoseph Koshy /* Remove descriptor from the owner hash table */ 854ebccf1e3SJoseph Koshy LIST_REMOVE(po, po_next); 855ebccf1e3SJoseph Koshy 856f263522aSJoseph Koshy /* release all owned PMC descriptors */ 857f263522aSJoseph Koshy LIST_FOREACH_SAFE(pm, &po->po_pmcs, pm_next, tmp) { 8584a3690dfSJohn Baldwin PMCDBG1(OWN,ORM,2, "pmc=%p", pm); 859f263522aSJoseph Koshy KASSERT(pm->pm_owner == po, 860f263522aSJoseph Koshy ("[pmc,%d] owner %p != po %p", __LINE__, pm->pm_owner, po)); 861ebccf1e3SJoseph Koshy 862f263522aSJoseph Koshy pmc_release_pmc_descriptor(pm); /* will unlink from the list */ 86306796b67SMark Johnston pmc_destroy_pmc_descriptor(pm); 864ebccf1e3SJoseph Koshy } 865ebccf1e3SJoseph Koshy 866f263522aSJoseph Koshy KASSERT(po->po_sscount == 0, 867f263522aSJoseph Koshy ("[pmc,%d] SS count not zero", __LINE__)); 868ebccf1e3SJoseph Koshy KASSERT(LIST_EMPTY(&po->po_pmcs), 869ebccf1e3SJoseph Koshy ("[pmc,%d] PMC list not empty", __LINE__)); 870ebccf1e3SJoseph Koshy 871f263522aSJoseph Koshy /* de-configure the log file if present */ 872c5153e19SJoseph Koshy if (po->po_flags & PMC_PO_OWNS_LOGFILE) 873f263522aSJoseph Koshy pmclog_deconfigure_log(po); 874ebccf1e3SJoseph Koshy } 875ebccf1e3SJoseph Koshy 876ebccf1e3SJoseph Koshy /* 87701c35b67SMitchell Horne * Remove an owner process record if all conditions are met. 878ebccf1e3SJoseph Koshy */ 879ebccf1e3SJoseph Koshy static void 880ebccf1e3SJoseph Koshy pmc_maybe_remove_owner(struct pmc_owner *po) 881ebccf1e3SJoseph Koshy { 882ebccf1e3SJoseph Koshy 8834a3690dfSJohn Baldwin PMCDBG1(OWN,OMR,1, "maybe-remove-owner po=%p", po); 884ebccf1e3SJoseph Koshy 885ebccf1e3SJoseph Koshy /* 886ebccf1e3SJoseph Koshy * Remove owner record if 887ebccf1e3SJoseph Koshy * - this process does not own any PMCs 888ebccf1e3SJoseph Koshy * - this process has not allocated a system-wide sampling buffer 889ebccf1e3SJoseph Koshy */ 890ebccf1e3SJoseph Koshy if (LIST_EMPTY(&po->po_pmcs) && 891c5153e19SJoseph Koshy ((po->po_flags & PMC_PO_OWNS_LOGFILE) == 0)) { 892ebccf1e3SJoseph Koshy pmc_remove_owner(po); 893f263522aSJoseph Koshy pmc_destroy_owner_descriptor(po); 894ebccf1e3SJoseph Koshy } 895ebccf1e3SJoseph Koshy } 896ebccf1e3SJoseph Koshy 897ebccf1e3SJoseph Koshy /* 898ebccf1e3SJoseph Koshy * Add an association between a target process and a PMC. 899ebccf1e3SJoseph Koshy */ 900ebccf1e3SJoseph Koshy static void 901ebccf1e3SJoseph Koshy pmc_link_target_process(struct pmc *pm, struct pmc_process *pp) 902ebccf1e3SJoseph Koshy { 903ebccf1e3SJoseph Koshy struct pmc_target *pt; 90401c35b67SMitchell Horne struct pmc_thread *pt_td __diagused; 90501c35b67SMitchell Horne int ri; 906ebccf1e3SJoseph Koshy 907ebccf1e3SJoseph Koshy sx_assert(&pmc_sx, SX_XLOCKED); 908ebccf1e3SJoseph Koshy KASSERT(pm != NULL && pp != NULL, 909ebccf1e3SJoseph Koshy ("[pmc,%d] Null pm %p or pp %p", __LINE__, pm, pp)); 910f263522aSJoseph Koshy KASSERT(PMC_IS_VIRTUAL_MODE(PMC_TO_MODE(pm)), 911f263522aSJoseph Koshy ("[pmc,%d] Attaching a non-process-virtual pmc=%p to pid=%d", 912f263522aSJoseph Koshy __LINE__, pm, pp->pp_proc->p_pid)); 913fa630f35SFabien Thomas KASSERT(pp->pp_refcnt >= 0 && pp->pp_refcnt <= ((int) md->pmd_npmc - 1), 914ebccf1e3SJoseph Koshy ("[pmc,%d] Illegal reference count %d for process record %p", 915ebccf1e3SJoseph Koshy __LINE__, pp->pp_refcnt, (void *) pp)); 916ebccf1e3SJoseph Koshy 917c5153e19SJoseph Koshy ri = PMC_TO_ROWINDEX(pm); 918ebccf1e3SJoseph Koshy 9194a3690dfSJohn Baldwin PMCDBG3(PRC,TLK,1, "link-target pmc=%p ri=%d pmc-process=%p", 920ebccf1e3SJoseph Koshy pm, ri, pp); 921ebccf1e3SJoseph Koshy 922680f1afdSJohn Baldwin #ifdef HWPMC_DEBUG 923d5ee4074SMitchell Horne LIST_FOREACH(pt, &pm->pm_targets, pt_next) { 924ebccf1e3SJoseph Koshy if (pt->pt_process == pp) 925ebccf1e3SJoseph Koshy KASSERT(0, ("[pmc,%d] pp %p already in pmc %p targets", 926ebccf1e3SJoseph Koshy __LINE__, pp, pm)); 927d5ee4074SMitchell Horne } 928ebccf1e3SJoseph Koshy #endif 929e829eb6dSJoseph Koshy pt = malloc(sizeof(struct pmc_target), M_PMC, M_WAITOK | M_ZERO); 930ebccf1e3SJoseph Koshy pt->pt_process = pp; 931ebccf1e3SJoseph Koshy 932ebccf1e3SJoseph Koshy LIST_INSERT_HEAD(&pm->pm_targets, pt, pt_next); 933ebccf1e3SJoseph Koshy 934122eceefSJohn Baldwin atomic_store_rel_ptr((uintptr_t *)&pp->pp_pmcs[ri].pp_pmc, 935122eceefSJohn Baldwin (uintptr_t)pm); 936ebccf1e3SJoseph Koshy 9376b8c8cd8SJoseph Koshy if (pm->pm_owner->po_owner == pp->pp_proc) 938c5153e19SJoseph Koshy pm->pm_flags |= PMC_F_ATTACHED_TO_OWNER; 9396b8c8cd8SJoseph Koshy 940f263522aSJoseph Koshy /* 941f263522aSJoseph Koshy * Initialize the per-process values at this row index. 942f263522aSJoseph Koshy */ 943f263522aSJoseph Koshy pp->pp_pmcs[ri].pp_pmcval = PMC_TO_MODE(pm) == PMC_MODE_TS ? 944f263522aSJoseph Koshy pm->pm_sc.pm_reloadcount : 0; 945ebccf1e3SJoseph Koshy pp->pp_refcnt++; 946ebccf1e3SJoseph Koshy 9476161b98cSMatt Macy #ifdef INVARIANTS 9486161b98cSMatt Macy /* Confirm that the per-thread values at this row index are cleared. */ 9496161b98cSMatt Macy if (PMC_TO_MODE(pm) == PMC_MODE_TS) { 9506161b98cSMatt Macy mtx_lock_spin(pp->pp_tdslock); 9516161b98cSMatt Macy LIST_FOREACH(pt_td, &pp->pp_tds, pt_next) { 9526161b98cSMatt Macy KASSERT(pt_td->pt_pmcs[ri].pt_pmcval == (pmc_value_t) 0, 9536161b98cSMatt Macy ("[pmc,%d] pt_pmcval not cleared for pid=%d at " 9546161b98cSMatt Macy "ri=%d", __LINE__, pp->pp_proc->p_pid, ri)); 9556161b98cSMatt Macy } 9566161b98cSMatt Macy mtx_unlock_spin(pp->pp_tdslock); 9576161b98cSMatt Macy } 9586161b98cSMatt Macy #endif 959ebccf1e3SJoseph Koshy } 960ebccf1e3SJoseph Koshy 961ebccf1e3SJoseph Koshy /* 962ebccf1e3SJoseph Koshy * Removes the association between a target process and a PMC. 963ebccf1e3SJoseph Koshy */ 964ebccf1e3SJoseph Koshy static void 965ebccf1e3SJoseph Koshy pmc_unlink_target_process(struct pmc *pm, struct pmc_process *pp) 966ebccf1e3SJoseph Koshy { 967ebccf1e3SJoseph Koshy int ri; 968f263522aSJoseph Koshy struct proc *p; 969ebccf1e3SJoseph Koshy struct pmc_target *ptgt; 9706161b98cSMatt Macy struct pmc_thread *pt; 971ebccf1e3SJoseph Koshy 972ebccf1e3SJoseph Koshy sx_assert(&pmc_sx, SX_XLOCKED); 973ebccf1e3SJoseph Koshy 974ebccf1e3SJoseph Koshy KASSERT(pm != NULL && pp != NULL, 975ebccf1e3SJoseph Koshy ("[pmc,%d] Null pm %p or pp %p", __LINE__, pm, pp)); 976ebccf1e3SJoseph Koshy 977fa630f35SFabien Thomas KASSERT(pp->pp_refcnt >= 1 && pp->pp_refcnt <= (int) md->pmd_npmc, 978ebccf1e3SJoseph Koshy ("[pmc,%d] Illegal ref count %d on process record %p", 979ebccf1e3SJoseph Koshy __LINE__, pp->pp_refcnt, (void *) pp)); 980ebccf1e3SJoseph Koshy 981c5153e19SJoseph Koshy ri = PMC_TO_ROWINDEX(pm); 982ebccf1e3SJoseph Koshy 9834a3690dfSJohn Baldwin PMCDBG3(PRC,TUL,1, "unlink-target pmc=%p ri=%d pmc-process=%p", 984ebccf1e3SJoseph Koshy pm, ri, pp); 985ebccf1e3SJoseph Koshy 986ebccf1e3SJoseph Koshy KASSERT(pp->pp_pmcs[ri].pp_pmc == pm, 987ebccf1e3SJoseph Koshy ("[pmc,%d] PMC ri %d mismatch pmc %p pp->[ri] %p", __LINE__, 988ebccf1e3SJoseph Koshy ri, pm, pp->pp_pmcs[ri].pp_pmc)); 989ebccf1e3SJoseph Koshy 990ebccf1e3SJoseph Koshy pp->pp_pmcs[ri].pp_pmc = NULL; 991ebccf1e3SJoseph Koshy pp->pp_pmcs[ri].pp_pmcval = (pmc_value_t)0; 992ebccf1e3SJoseph Koshy 9936161b98cSMatt Macy /* Clear the per-thread values at this row index. */ 9946161b98cSMatt Macy if (PMC_TO_MODE(pm) == PMC_MODE_TS) { 9956161b98cSMatt Macy mtx_lock_spin(pp->pp_tdslock); 9966161b98cSMatt Macy LIST_FOREACH(pt, &pp->pp_tds, pt_next) 9976161b98cSMatt Macy pt->pt_pmcs[ri].pt_pmcval = (pmc_value_t)0; 9986161b98cSMatt Macy mtx_unlock_spin(pp->pp_tdslock); 9996161b98cSMatt Macy } 10006161b98cSMatt Macy 1001c5153e19SJoseph Koshy /* Remove owner-specific flags */ 1002c5153e19SJoseph Koshy if (pm->pm_owner->po_owner == pp->pp_proc) { 1003c5153e19SJoseph Koshy pp->pp_flags &= ~PMC_PP_ENABLE_MSR_ACCESS; 1004c5153e19SJoseph Koshy pm->pm_flags &= ~PMC_F_ATTACHED_TO_OWNER; 1005c5153e19SJoseph Koshy } 10066b8c8cd8SJoseph Koshy 1007ebccf1e3SJoseph Koshy pp->pp_refcnt--; 1008ebccf1e3SJoseph Koshy 1009ebccf1e3SJoseph Koshy /* Remove the target process from the PMC structure */ 1010ebccf1e3SJoseph Koshy LIST_FOREACH(ptgt, &pm->pm_targets, pt_next) 1011ebccf1e3SJoseph Koshy if (ptgt->pt_process == pp) 1012ebccf1e3SJoseph Koshy break; 1013ebccf1e3SJoseph Koshy 1014ebccf1e3SJoseph Koshy KASSERT(ptgt != NULL, ("[pmc,%d] process %p (pp: %p) not found " 1015ebccf1e3SJoseph Koshy "in pmc %p", __LINE__, pp->pp_proc, pp, pm)); 1016ebccf1e3SJoseph Koshy 1017ebccf1e3SJoseph Koshy LIST_REMOVE(ptgt, pt_next); 10181ede983cSDag-Erling Smørgrav free(ptgt, M_PMC); 1019f263522aSJoseph Koshy 1020f263522aSJoseph Koshy /* if the PMC now lacks targets, send the owner a SIGIO */ 1021f263522aSJoseph Koshy if (LIST_EMPTY(&pm->pm_targets)) { 1022f263522aSJoseph Koshy p = pm->pm_owner->po_owner; 1023f263522aSJoseph Koshy PROC_LOCK(p); 10248451d0ddSKip Macy kern_psignal(p, SIGIO); 1025f263522aSJoseph Koshy PROC_UNLOCK(p); 1026f263522aSJoseph Koshy 1027693cd307SMitchell Horne PMCDBG2(PRC,SIG,2, "signalling proc=%p signal=%d", p, SIGIO); 1028ebccf1e3SJoseph Koshy } 1029ebccf1e3SJoseph Koshy } 1030ebccf1e3SJoseph Koshy 1031ebccf1e3SJoseph Koshy /* 1032ebccf1e3SJoseph Koshy * Check if PMC 'pm' may be attached to target process 't'. 1033ebccf1e3SJoseph Koshy */ 1034ebccf1e3SJoseph Koshy 1035ebccf1e3SJoseph Koshy static int 1036ebccf1e3SJoseph Koshy pmc_can_attach(struct pmc *pm, struct proc *t) 1037ebccf1e3SJoseph Koshy { 1038ebccf1e3SJoseph Koshy struct proc *o; /* pmc owner */ 1039ebccf1e3SJoseph Koshy struct ucred *oc, *tc; /* owner, target credentials */ 1040ebccf1e3SJoseph Koshy int decline_attach, i; 1041ebccf1e3SJoseph Koshy 1042ebccf1e3SJoseph Koshy /* 1043ebccf1e3SJoseph Koshy * A PMC's owner can always attach that PMC to itself. 1044ebccf1e3SJoseph Koshy */ 1045ebccf1e3SJoseph Koshy 1046ebccf1e3SJoseph Koshy if ((o = pm->pm_owner->po_owner) == t) 1047ebccf1e3SJoseph Koshy return 0; 1048ebccf1e3SJoseph Koshy 1049ebccf1e3SJoseph Koshy PROC_LOCK(o); 1050ebccf1e3SJoseph Koshy oc = o->p_ucred; 1051ebccf1e3SJoseph Koshy crhold(oc); 1052ebccf1e3SJoseph Koshy PROC_UNLOCK(o); 1053ebccf1e3SJoseph Koshy 1054ebccf1e3SJoseph Koshy PROC_LOCK(t); 1055ebccf1e3SJoseph Koshy tc = t->p_ucred; 1056ebccf1e3SJoseph Koshy crhold(tc); 1057ebccf1e3SJoseph Koshy PROC_UNLOCK(t); 1058ebccf1e3SJoseph Koshy 1059ebccf1e3SJoseph Koshy /* 1060ebccf1e3SJoseph Koshy * The effective uid of the PMC owner should match at least one 1061ebccf1e3SJoseph Koshy * of the {effective,real,saved} uids of the target process. 1062ebccf1e3SJoseph Koshy */ 1063ebccf1e3SJoseph Koshy 1064ebccf1e3SJoseph Koshy decline_attach = oc->cr_uid != tc->cr_uid && 1065ebccf1e3SJoseph Koshy oc->cr_uid != tc->cr_svuid && 1066ebccf1e3SJoseph Koshy oc->cr_uid != tc->cr_ruid; 1067ebccf1e3SJoseph Koshy 1068ebccf1e3SJoseph Koshy /* 1069ebccf1e3SJoseph Koshy * Every one of the target's group ids, must be in the owner's 1070ebccf1e3SJoseph Koshy * group list. 1071ebccf1e3SJoseph Koshy */ 1072ebccf1e3SJoseph Koshy for (i = 0; !decline_attach && i < tc->cr_ngroups; i++) 1073ebccf1e3SJoseph Koshy decline_attach = !groupmember(tc->cr_groups[i], oc); 1074ebccf1e3SJoseph Koshy 1075ebccf1e3SJoseph Koshy /* check the read and saved gids too */ 1076ebccf1e3SJoseph Koshy if (decline_attach == 0) 1077ebccf1e3SJoseph Koshy decline_attach = !groupmember(tc->cr_rgid, oc) || 1078ebccf1e3SJoseph Koshy !groupmember(tc->cr_svgid, oc); 1079ebccf1e3SJoseph Koshy 1080ebccf1e3SJoseph Koshy crfree(tc); 1081ebccf1e3SJoseph Koshy crfree(oc); 1082ebccf1e3SJoseph Koshy 1083ebccf1e3SJoseph Koshy return !decline_attach; 1084ebccf1e3SJoseph Koshy } 1085ebccf1e3SJoseph Koshy 1086ebccf1e3SJoseph Koshy /* 1087ebccf1e3SJoseph Koshy * Attach a process to a PMC. 1088ebccf1e3SJoseph Koshy */ 1089ebccf1e3SJoseph Koshy static int 1090ebccf1e3SJoseph Koshy pmc_attach_one_process(struct proc *p, struct pmc *pm) 1091ebccf1e3SJoseph Koshy { 10926161b98cSMatt Macy int ri, error; 1093f263522aSJoseph Koshy char *fullpath, *freepath; 1094ebccf1e3SJoseph Koshy struct pmc_process *pp; 1095ebccf1e3SJoseph Koshy 1096ebccf1e3SJoseph Koshy sx_assert(&pmc_sx, SX_XLOCKED); 1097ebccf1e3SJoseph Koshy 10984a3690dfSJohn Baldwin PMCDBG5(PRC,ATT,2, "attach-one pm=%p ri=%d proc=%p (%d, %s)", pm, 1099c5153e19SJoseph Koshy PMC_TO_ROWINDEX(pm), p, p->p_pid, p->p_comm); 1100ebccf1e3SJoseph Koshy 1101ebccf1e3SJoseph Koshy /* 1102ebccf1e3SJoseph Koshy * Locate the process descriptor corresponding to process 'p', 1103ebccf1e3SJoseph Koshy * allocating space as needed. 1104ebccf1e3SJoseph Koshy * 1105ebccf1e3SJoseph Koshy * Verify that rowindex 'pm_rowindex' is free in the process 1106ebccf1e3SJoseph Koshy * descriptor. 1107ebccf1e3SJoseph Koshy * 1108ebccf1e3SJoseph Koshy * If not, allocate space for a descriptor and link the 1109ebccf1e3SJoseph Koshy * process descriptor and PMC. 1110ebccf1e3SJoseph Koshy */ 1111c5153e19SJoseph Koshy ri = PMC_TO_ROWINDEX(pm); 1112ebccf1e3SJoseph Koshy 11136161b98cSMatt Macy /* mark process as using HWPMCs */ 11146161b98cSMatt Macy PROC_LOCK(p); 11156161b98cSMatt Macy p->p_flag |= P_HWPMC; 11166161b98cSMatt Macy PROC_UNLOCK(p); 1117ebccf1e3SJoseph Koshy 11186161b98cSMatt Macy if ((pp = pmc_find_process_descriptor(p, PMC_FLAG_ALLOCATE)) == NULL) { 11196161b98cSMatt Macy error = ENOMEM; 11206161b98cSMatt Macy goto fail; 11216161b98cSMatt Macy } 1122ebccf1e3SJoseph Koshy 11236161b98cSMatt Macy if (pp->pp_pmcs[ri].pp_pmc == pm) {/* already present at slot [ri] */ 11246161b98cSMatt Macy error = EEXIST; 11256161b98cSMatt Macy goto fail; 11266161b98cSMatt Macy } 11276161b98cSMatt Macy 11286161b98cSMatt Macy if (pp->pp_pmcs[ri].pp_pmc != NULL) { 11296161b98cSMatt Macy error = EBUSY; 11306161b98cSMatt Macy goto fail; 11316161b98cSMatt Macy } 1132ebccf1e3SJoseph Koshy 1133ebccf1e3SJoseph Koshy pmc_link_target_process(pm, pp); 1134ebccf1e3SJoseph Koshy 1135f263522aSJoseph Koshy if (PMC_IS_SAMPLING_MODE(PMC_TO_MODE(pm)) && 1136f263522aSJoseph Koshy (pm->pm_flags & PMC_F_ATTACHED_TO_OWNER) == 0) 1137f263522aSJoseph Koshy pm->pm_flags |= PMC_F_NEEDS_LOGFILE; 1138f263522aSJoseph Koshy 1139f263522aSJoseph Koshy pm->pm_flags |= PMC_F_ATTACH_DONE; /* mark as attached */ 1140f263522aSJoseph Koshy 1141f263522aSJoseph Koshy /* issue an attach event to a configured log file */ 1142f263522aSJoseph Koshy if (pm->pm_owner->po_flags & PMC_PO_OWNS_LOGFILE) { 1143db57c70aSKonstantin Belousov if (p->p_flag & P_KPROC) { 1144d67023a1SJeff Roberson fullpath = kernelname; 1145d67023a1SJeff Roberson freepath = NULL; 11460fb2c5d6SKonstantin Belousov } else { 11470fb2c5d6SKonstantin Belousov pmc_getfilename(p->p_textvp, &fullpath, &freepath); 1148f263522aSJoseph Koshy pmclog_process_pmcattach(pm, p->p_pid, fullpath); 11490fb2c5d6SKonstantin Belousov } 11501ede983cSDag-Erling Smørgrav free(freepath, M_TEMP); 1151d07f36b0SJoseph Koshy if (PMC_IS_SAMPLING_MODE(PMC_TO_MODE(pm))) 1152d07f36b0SJoseph Koshy pmc_log_process_mappings(pm->pm_owner, p); 1153f263522aSJoseph Koshy } 1154ebccf1e3SJoseph Koshy 11556161b98cSMatt Macy return (0); 11566161b98cSMatt Macy fail: 11576161b98cSMatt Macy PROC_LOCK(p); 11586161b98cSMatt Macy p->p_flag &= ~P_HWPMC; 11596161b98cSMatt Macy PROC_UNLOCK(p); 11606161b98cSMatt Macy return (error); 1161ebccf1e3SJoseph Koshy } 1162ebccf1e3SJoseph Koshy 1163ebccf1e3SJoseph Koshy /* 1164ebccf1e3SJoseph Koshy * Attach a process and optionally its children 1165ebccf1e3SJoseph Koshy */ 1166ebccf1e3SJoseph Koshy static int 1167ebccf1e3SJoseph Koshy pmc_attach_process(struct proc *p, struct pmc *pm) 1168ebccf1e3SJoseph Koshy { 1169ebccf1e3SJoseph Koshy int error; 1170ebccf1e3SJoseph Koshy struct proc *top; 1171ebccf1e3SJoseph Koshy 1172ebccf1e3SJoseph Koshy sx_assert(&pmc_sx, SX_XLOCKED); 1173ebccf1e3SJoseph Koshy 11744a3690dfSJohn Baldwin PMCDBG5(PRC,ATT,1, "attach pm=%p ri=%d proc=%p (%d, %s)", pm, 1175c5153e19SJoseph Koshy PMC_TO_ROWINDEX(pm), p, p->p_pid, p->p_comm); 1176c5153e19SJoseph Koshy 1177c5153e19SJoseph Koshy /* 1178c5153e19SJoseph Koshy * If this PMC successfully allowed a GETMSR operation 1179c5153e19SJoseph Koshy * in the past, disallow further ATTACHes. 1180c5153e19SJoseph Koshy */ 1181c5153e19SJoseph Koshy if ((pm->pm_flags & PMC_PP_ENABLE_MSR_ACCESS) != 0) 118252ebac7fSMitchell Horne return (EPERM); 1183ebccf1e3SJoseph Koshy 1184ebccf1e3SJoseph Koshy if ((pm->pm_flags & PMC_F_DESCENDANTS) == 0) 118552ebac7fSMitchell Horne return (pmc_attach_one_process(p, pm)); 1186ebccf1e3SJoseph Koshy 1187ebccf1e3SJoseph Koshy /* 1188ebccf1e3SJoseph Koshy * Traverse all child processes, attaching them to 1189ebccf1e3SJoseph Koshy * this PMC. 1190ebccf1e3SJoseph Koshy */ 1191ebccf1e3SJoseph Koshy sx_slock(&proctree_lock); 1192ebccf1e3SJoseph Koshy 1193ebccf1e3SJoseph Koshy top = p; 1194ebccf1e3SJoseph Koshy for (;;) { 1195ebccf1e3SJoseph Koshy if ((error = pmc_attach_one_process(p, pm)) != 0) 1196ebccf1e3SJoseph Koshy break; 1197ebccf1e3SJoseph Koshy if (!LIST_EMPTY(&p->p_children)) 1198ebccf1e3SJoseph Koshy p = LIST_FIRST(&p->p_children); 1199ebccf1e3SJoseph Koshy else for (;;) { 1200ebccf1e3SJoseph Koshy if (p == top) 1201ebccf1e3SJoseph Koshy goto done; 1202ebccf1e3SJoseph Koshy if (LIST_NEXT(p, p_sibling)) { 1203ebccf1e3SJoseph Koshy p = LIST_NEXT(p, p_sibling); 1204ebccf1e3SJoseph Koshy break; 1205ebccf1e3SJoseph Koshy } 1206ebccf1e3SJoseph Koshy p = p->p_pptr; 1207ebccf1e3SJoseph Koshy } 1208ebccf1e3SJoseph Koshy } 1209ebccf1e3SJoseph Koshy 1210d5ee4074SMitchell Horne if (error != 0) 1211ebccf1e3SJoseph Koshy (void)pmc_detach_process(top, pm); 1212ebccf1e3SJoseph Koshy 1213ebccf1e3SJoseph Koshy done: 1214ebccf1e3SJoseph Koshy sx_sunlock(&proctree_lock); 121552ebac7fSMitchell Horne return (error); 1216ebccf1e3SJoseph Koshy } 1217ebccf1e3SJoseph Koshy 1218ebccf1e3SJoseph Koshy /* 1219ebccf1e3SJoseph Koshy * Detach a process from a PMC. If there are no other PMCs tracking 1220ebccf1e3SJoseph Koshy * this process, remove the process structure from its hash table. If 1221ebccf1e3SJoseph Koshy * 'flags' contains PMC_FLAG_REMOVE, then free the process structure. 1222ebccf1e3SJoseph Koshy */ 1223ebccf1e3SJoseph Koshy static int 1224ebccf1e3SJoseph Koshy pmc_detach_one_process(struct proc *p, struct pmc *pm, int flags) 1225ebccf1e3SJoseph Koshy { 1226ebccf1e3SJoseph Koshy int ri; 1227ebccf1e3SJoseph Koshy struct pmc_process *pp; 1228ebccf1e3SJoseph Koshy 1229ebccf1e3SJoseph Koshy sx_assert(&pmc_sx, SX_XLOCKED); 1230ebccf1e3SJoseph Koshy 1231ebccf1e3SJoseph Koshy KASSERT(pm != NULL, 1232ebccf1e3SJoseph Koshy ("[pmc,%d] null pm pointer", __LINE__)); 1233ebccf1e3SJoseph Koshy 1234c5153e19SJoseph Koshy ri = PMC_TO_ROWINDEX(pm); 1235ebccf1e3SJoseph Koshy 12364a3690dfSJohn Baldwin PMCDBG6(PRC,ATT,2, "detach-one pm=%p ri=%d proc=%p (%d, %s) flags=0x%x", 1237c5153e19SJoseph Koshy pm, ri, p, p->p_pid, p->p_comm, flags); 1238ebccf1e3SJoseph Koshy 1239ebccf1e3SJoseph Koshy if ((pp = pmc_find_process_descriptor(p, 0)) == NULL) 124052ebac7fSMitchell Horne return (ESRCH); 1241ebccf1e3SJoseph Koshy 1242ebccf1e3SJoseph Koshy if (pp->pp_pmcs[ri].pp_pmc != pm) 124352ebac7fSMitchell Horne return (EINVAL); 1244ebccf1e3SJoseph Koshy 1245ebccf1e3SJoseph Koshy pmc_unlink_target_process(pm, pp); 1246ebccf1e3SJoseph Koshy 1247f263522aSJoseph Koshy /* Issue a detach entry if a log file is configured */ 1248f263522aSJoseph Koshy if (pm->pm_owner->po_flags & PMC_PO_OWNS_LOGFILE) 1249f263522aSJoseph Koshy pmclog_process_pmcdetach(pm, p->p_pid); 1250f263522aSJoseph Koshy 1251ebccf1e3SJoseph Koshy /* 1252b790c193SPedro F. Giffuni * If there are no PMCs targeting this process, we remove its 1253ebccf1e3SJoseph Koshy * descriptor from the target hash table and unset the P_HWPMC 1254ebccf1e3SJoseph Koshy * flag in the struct proc. 1255ebccf1e3SJoseph Koshy */ 1256fa630f35SFabien Thomas KASSERT(pp->pp_refcnt >= 0 && pp->pp_refcnt <= (int) md->pmd_npmc, 1257ebccf1e3SJoseph Koshy ("[pmc,%d] Illegal refcnt %d for process struct %p", 1258ebccf1e3SJoseph Koshy __LINE__, pp->pp_refcnt, pp)); 1259ebccf1e3SJoseph Koshy 1260ebccf1e3SJoseph Koshy if (pp->pp_refcnt != 0) /* still a target of some PMC */ 126152ebac7fSMitchell Horne return (0); 1262ebccf1e3SJoseph Koshy 1263ebccf1e3SJoseph Koshy pmc_remove_process_descriptor(pp); 1264ebccf1e3SJoseph Koshy 1265ebccf1e3SJoseph Koshy if (flags & PMC_FLAG_REMOVE) 12666161b98cSMatt Macy pmc_destroy_process_descriptor(pp); 1267ebccf1e3SJoseph Koshy 1268ebccf1e3SJoseph Koshy PROC_LOCK(p); 1269ebccf1e3SJoseph Koshy p->p_flag &= ~P_HWPMC; 1270ebccf1e3SJoseph Koshy PROC_UNLOCK(p); 1271ebccf1e3SJoseph Koshy 127252ebac7fSMitchell Horne return (0); 1273ebccf1e3SJoseph Koshy } 1274ebccf1e3SJoseph Koshy 1275ebccf1e3SJoseph Koshy /* 1276ebccf1e3SJoseph Koshy * Detach a process and optionally its descendants from a PMC. 1277ebccf1e3SJoseph Koshy */ 1278ebccf1e3SJoseph Koshy static int 1279ebccf1e3SJoseph Koshy pmc_detach_process(struct proc *p, struct pmc *pm) 1280ebccf1e3SJoseph Koshy { 1281ebccf1e3SJoseph Koshy struct proc *top; 1282ebccf1e3SJoseph Koshy 1283ebccf1e3SJoseph Koshy sx_assert(&pmc_sx, SX_XLOCKED); 1284ebccf1e3SJoseph Koshy 12854a3690dfSJohn Baldwin PMCDBG5(PRC,ATT,1, "detach pm=%p ri=%d proc=%p (%d, %s)", pm, 1286c5153e19SJoseph Koshy PMC_TO_ROWINDEX(pm), p, p->p_pid, p->p_comm); 1287ebccf1e3SJoseph Koshy 1288ebccf1e3SJoseph Koshy if ((pm->pm_flags & PMC_F_DESCENDANTS) == 0) 128952ebac7fSMitchell Horne return (pmc_detach_one_process(p, pm, PMC_FLAG_REMOVE)); 1290ebccf1e3SJoseph Koshy 1291ebccf1e3SJoseph Koshy /* 1292ebccf1e3SJoseph Koshy * Traverse all children, detaching them from this PMC. We 1293ebccf1e3SJoseph Koshy * ignore errors since we could be detaching a PMC from a 1294ebccf1e3SJoseph Koshy * partially attached proc tree. 1295ebccf1e3SJoseph Koshy */ 1296ebccf1e3SJoseph Koshy sx_slock(&proctree_lock); 1297ebccf1e3SJoseph Koshy 1298ebccf1e3SJoseph Koshy top = p; 1299ebccf1e3SJoseph Koshy for (;;) { 1300ebccf1e3SJoseph Koshy (void)pmc_detach_one_process(p, pm, PMC_FLAG_REMOVE); 1301ebccf1e3SJoseph Koshy 1302d5ee4074SMitchell Horne if (!LIST_EMPTY(&p->p_children)) { 1303ebccf1e3SJoseph Koshy p = LIST_FIRST(&p->p_children); 1304d5ee4074SMitchell Horne } else { 1305d5ee4074SMitchell Horne for (;;) { 1306ebccf1e3SJoseph Koshy if (p == top) 1307ebccf1e3SJoseph Koshy goto done; 1308ebccf1e3SJoseph Koshy if (LIST_NEXT(p, p_sibling)) { 1309ebccf1e3SJoseph Koshy p = LIST_NEXT(p, p_sibling); 1310ebccf1e3SJoseph Koshy break; 1311ebccf1e3SJoseph Koshy } 1312ebccf1e3SJoseph Koshy p = p->p_pptr; 1313ebccf1e3SJoseph Koshy } 1314ebccf1e3SJoseph Koshy } 1315d5ee4074SMitchell Horne } 1316ebccf1e3SJoseph Koshy done: 1317ebccf1e3SJoseph Koshy sx_sunlock(&proctree_lock); 1318f263522aSJoseph Koshy if (LIST_EMPTY(&pm->pm_targets)) 1319f263522aSJoseph Koshy pm->pm_flags &= ~PMC_F_ATTACH_DONE; 1320f263522aSJoseph Koshy 132152ebac7fSMitchell Horne return (0); 1322ebccf1e3SJoseph Koshy } 1323ebccf1e3SJoseph Koshy 1324ebccf1e3SJoseph Koshy /* 1325c4981694SMitchell Horne * Handle events after an exec() for a process: 1326c4981694SMitchell Horne * - Inform log owners of the new exec() event 1327c4981694SMitchell Horne * - Release any PMCs owned by the process before the exec() 1328c4981694SMitchell Horne * - Detach PMCs from the target if required 1329c4981694SMitchell Horne */ 1330c4981694SMitchell Horne static void 1331c4981694SMitchell Horne pmc_process_exec(struct thread *td, struct pmckern_procexec *pk) 1332c4981694SMitchell Horne { 1333c4981694SMitchell Horne struct pmc *pm; 1334c4981694SMitchell Horne struct pmc_owner *po; 1335c4981694SMitchell Horne struct pmc_process *pp; 1336c4981694SMitchell Horne struct proc *p; 1337c4981694SMitchell Horne char *fullpath, *freepath; 1338c4981694SMitchell Horne u_int ri; 1339c4981694SMitchell Horne bool is_using_hwpmcs; 1340c4981694SMitchell Horne 1341c4981694SMitchell Horne sx_assert(&pmc_sx, SX_XLOCKED); 1342c4981694SMitchell Horne 1343c4981694SMitchell Horne p = td->td_proc; 1344c4981694SMitchell Horne pmc_getfilename(p->p_textvp, &fullpath, &freepath); 1345c4981694SMitchell Horne 1346c4981694SMitchell Horne PMC_EPOCH_ENTER(); 1347c4981694SMitchell Horne /* Inform owners of SS mode PMCs of the exec event. */ 1348c4981694SMitchell Horne CK_LIST_FOREACH(po, &pmc_ss_owners, po_ssnext) { 1349c4981694SMitchell Horne if ((po->po_flags & PMC_PO_OWNS_LOGFILE) != 0) { 1350c4981694SMitchell Horne pmclog_process_procexec(po, PMC_ID_INVALID, p->p_pid, 1351c4981694SMitchell Horne pk->pm_baseaddr, pk->pm_dynaddr, fullpath); 1352c4981694SMitchell Horne } 1353c4981694SMitchell Horne } 1354c4981694SMitchell Horne PMC_EPOCH_EXIT(); 1355c4981694SMitchell Horne 1356c4981694SMitchell Horne PROC_LOCK(p); 1357c4981694SMitchell Horne is_using_hwpmcs = (p->p_flag & P_HWPMC) != 0; 1358c4981694SMitchell Horne PROC_UNLOCK(p); 1359c4981694SMitchell Horne 1360c4981694SMitchell Horne if (!is_using_hwpmcs) { 1361c4981694SMitchell Horne if (freepath != NULL) 1362c4981694SMitchell Horne free(freepath, M_TEMP); 1363c4981694SMitchell Horne return; 1364c4981694SMitchell Horne } 1365c4981694SMitchell Horne 1366c4981694SMitchell Horne /* 1367c4981694SMitchell Horne * PMCs are not inherited across an exec(): remove any PMCs that this 1368c4981694SMitchell Horne * process is the owner of. 1369c4981694SMitchell Horne */ 1370c4981694SMitchell Horne if ((po = pmc_find_owner_descriptor(p)) != NULL) { 1371c4981694SMitchell Horne pmc_remove_owner(po); 1372c4981694SMitchell Horne pmc_destroy_owner_descriptor(po); 1373c4981694SMitchell Horne } 1374c4981694SMitchell Horne 1375c4981694SMitchell Horne /* 1376c4981694SMitchell Horne * If the process being exec'ed is not the target of any PMC, we are 1377c4981694SMitchell Horne * done. 1378c4981694SMitchell Horne */ 1379c4981694SMitchell Horne if ((pp = pmc_find_process_descriptor(p, 0)) == NULL) { 1380c4981694SMitchell Horne if (freepath != NULL) 1381c4981694SMitchell Horne free(freepath, M_TEMP); 1382c4981694SMitchell Horne return; 1383c4981694SMitchell Horne } 1384c4981694SMitchell Horne 1385c4981694SMitchell Horne /* 1386c4981694SMitchell Horne * Log the exec event to all monitoring owners. Skip owners who have 1387c4981694SMitchell Horne * already received the event because they had system sampling PMCs 1388c4981694SMitchell Horne * active. 1389c4981694SMitchell Horne */ 1390c4981694SMitchell Horne for (ri = 0; ri < md->pmd_npmc; ri++) { 1391c4981694SMitchell Horne if ((pm = pp->pp_pmcs[ri].pp_pmc) == NULL) 1392c4981694SMitchell Horne continue; 1393c4981694SMitchell Horne 1394c4981694SMitchell Horne po = pm->pm_owner; 1395c4981694SMitchell Horne if (po->po_sscount == 0 && 1396c4981694SMitchell Horne (po->po_flags & PMC_PO_OWNS_LOGFILE) != 0) { 1397c4981694SMitchell Horne pmclog_process_procexec(po, pm->pm_id, p->p_pid, 1398c4981694SMitchell Horne pk->pm_baseaddr, pk->pm_dynaddr, fullpath); 1399c4981694SMitchell Horne } 1400c4981694SMitchell Horne } 1401c4981694SMitchell Horne 1402c4981694SMitchell Horne if (freepath != NULL) 1403c4981694SMitchell Horne free(freepath, M_TEMP); 1404c4981694SMitchell Horne 1405c4981694SMitchell Horne PMCDBG4(PRC,EXC,1, "exec proc=%p (%d, %s) cred-changed=%d", 1406c4981694SMitchell Horne p, p->p_pid, p->p_comm, pk->pm_credentialschanged); 1407c4981694SMitchell Horne 1408c4981694SMitchell Horne if (pk->pm_credentialschanged == 0) /* no change */ 1409c4981694SMitchell Horne return; 1410c4981694SMitchell Horne 1411c4981694SMitchell Horne /* 1412c4981694SMitchell Horne * If the newly exec()'ed process has a different credential 1413c4981694SMitchell Horne * than before, allow it to be the target of a PMC only if 1414c4981694SMitchell Horne * the PMC's owner has sufficient privilege. 1415c4981694SMitchell Horne */ 1416c4981694SMitchell Horne for (ri = 0; ri < md->pmd_npmc; ri++) { 1417c4981694SMitchell Horne if ((pm = pp->pp_pmcs[ri].pp_pmc) != NULL) { 1418c4981694SMitchell Horne if (pmc_can_attach(pm, td->td_proc) != 0) { 1419c4981694SMitchell Horne pmc_detach_one_process(td->td_proc, pm, 1420c4981694SMitchell Horne PMC_FLAG_NONE); 1421c4981694SMitchell Horne } 1422c4981694SMitchell Horne } 1423c4981694SMitchell Horne } 1424c4981694SMitchell Horne 1425c4981694SMitchell Horne KASSERT(pp->pp_refcnt >= 0 && pp->pp_refcnt <= md->pmd_npmc, 1426c4981694SMitchell Horne ("[pmc,%d] Illegal ref count %u on pp %p", __LINE__, 1427c4981694SMitchell Horne pp->pp_refcnt, pp)); 1428c4981694SMitchell Horne 1429c4981694SMitchell Horne /* 1430c4981694SMitchell Horne * If this process is no longer the target of any 1431c4981694SMitchell Horne * PMCs, we can remove the process entry and free 1432c4981694SMitchell Horne * up space. 1433c4981694SMitchell Horne */ 1434c4981694SMitchell Horne if (pp->pp_refcnt == 0) { 1435c4981694SMitchell Horne pmc_remove_process_descriptor(pp); 1436c4981694SMitchell Horne pmc_destroy_process_descriptor(pp); 1437c4981694SMitchell Horne } 1438c4981694SMitchell Horne } 1439c4981694SMitchell Horne 1440c4981694SMitchell Horne /* 144101c35b67SMitchell Horne * Thread context switch IN. 1442ebccf1e3SJoseph Koshy */ 1443f263522aSJoseph Koshy static void 1444f263522aSJoseph Koshy pmc_process_csw_in(struct thread *td) 1445ebccf1e3SJoseph Koshy { 1446ebccf1e3SJoseph Koshy struct pmc *pm; 144701c35b67SMitchell Horne struct pmc_classdep *pcd; 1448ebccf1e3SJoseph Koshy struct pmc_cpu *pc; 1449aee6e7dcSMateusz Guzik struct pmc_hw *phw __diagused; 1450e829eb6dSJoseph Koshy struct pmc_process *pp; 14516161b98cSMatt Macy struct pmc_thread *pt; 145201c35b67SMitchell Horne struct proc *p; 145301c35b67SMitchell Horne pmc_value_t newvalue; 145401c35b67SMitchell Horne int cpu; 145501c35b67SMitchell Horne u_int adjri, ri; 1456ebccf1e3SJoseph Koshy 1457ebccf1e3SJoseph Koshy p = td->td_proc; 14586161b98cSMatt Macy pt = NULL; 1459ebccf1e3SJoseph Koshy if ((pp = pmc_find_process_descriptor(p, PMC_FLAG_NONE)) == NULL) 1460f263522aSJoseph Koshy return; 1461ebccf1e3SJoseph Koshy 1462ebccf1e3SJoseph Koshy KASSERT(pp->pp_proc == td->td_proc, 1463ebccf1e3SJoseph Koshy ("[pmc,%d] not my thread state", __LINE__)); 1464ebccf1e3SJoseph Koshy 1465f263522aSJoseph Koshy critical_enter(); /* no preemption from this point */ 1466ebccf1e3SJoseph Koshy 1467ebccf1e3SJoseph Koshy cpu = PCPU_GET(cpuid); /* td->td_oncpu is invalid */ 1468ebccf1e3SJoseph Koshy 14694a3690dfSJohn Baldwin PMCDBG5(CSW,SWI,1, "cpu=%d proc=%p (%d, %s) pp=%p", cpu, p, 1470ebccf1e3SJoseph Koshy p->p_pid, p->p_comm, pp); 1471ebccf1e3SJoseph Koshy 1472122ccdc1SJoseph Koshy KASSERT(cpu >= 0 && cpu < pmc_cpu_max(), 1473b790c193SPedro F. Giffuni ("[pmc,%d] weird CPU id %d", __LINE__, cpu)); 1474ebccf1e3SJoseph Koshy 1475ebccf1e3SJoseph Koshy pc = pmc_pcpu[cpu]; 1476ebccf1e3SJoseph Koshy for (ri = 0; ri < md->pmd_npmc; ri++) { 1477ebccf1e3SJoseph Koshy if ((pm = pp->pp_pmcs[ri].pp_pmc) == NULL) 1478ebccf1e3SJoseph Koshy continue; 1479ebccf1e3SJoseph Koshy 1480c5153e19SJoseph Koshy KASSERT(PMC_IS_VIRTUAL_MODE(PMC_TO_MODE(pm)), 1481ebccf1e3SJoseph Koshy ("[pmc,%d] Target PMC in non-virtual mode (%d)", 1482c5153e19SJoseph Koshy __LINE__, PMC_TO_MODE(pm))); 1483c5153e19SJoseph Koshy KASSERT(PMC_TO_ROWINDEX(pm) == ri, 1484ebccf1e3SJoseph Koshy ("[pmc,%d] Row index mismatch pmc %d != ri %d", 1485c5153e19SJoseph Koshy __LINE__, PMC_TO_ROWINDEX(pm), ri)); 1486ebccf1e3SJoseph Koshy 1487ebccf1e3SJoseph Koshy /* 1488ebccf1e3SJoseph Koshy * Only PMCs that are marked as 'RUNNING' need 1489ebccf1e3SJoseph Koshy * be placed on hardware. 1490ebccf1e3SJoseph Koshy */ 1491ebccf1e3SJoseph Koshy if (pm->pm_state != PMC_STATE_RUNNING) 1492ebccf1e3SJoseph Koshy continue; 1493ebccf1e3SJoseph Koshy 1494d9f1b8dbSMatt Macy KASSERT(counter_u64_fetch(pm->pm_runcount) >= 0, 149501c35b67SMitchell Horne ("[pmc,%d] pm=%p runcount %ju", __LINE__, pm, 149601c35b67SMitchell Horne (uintmax_t)counter_u64_fetch(pm->pm_runcount))); 1497d9f1b8dbSMatt Macy 1498ebccf1e3SJoseph Koshy /* increment PMC runcount */ 1499e6b475e0SMatt Macy counter_u64_add(pm->pm_runcount, 1); 1500ebccf1e3SJoseph Koshy 1501ebccf1e3SJoseph Koshy /* configure the HWPMC we are going to use. */ 1502e829eb6dSJoseph Koshy pcd = pmc_ri_to_classdep(md, ri, &adjri); 150301c35b67SMitchell Horne (void)pcd->pcd_config_pmc(cpu, adjri, pm); 1504ebccf1e3SJoseph Koshy 1505ebccf1e3SJoseph Koshy phw = pc->pc_hwpmcs[ri]; 1506ebccf1e3SJoseph Koshy 1507ebccf1e3SJoseph Koshy KASSERT(phw != NULL, 1508ebccf1e3SJoseph Koshy ("[pmc,%d] null hw pointer", __LINE__)); 1509ebccf1e3SJoseph Koshy 1510ebccf1e3SJoseph Koshy KASSERT(phw->phw_pmc == pm, 1511ebccf1e3SJoseph Koshy ("[pmc,%d] hw->pmc %p != pmc %p", __LINE__, 1512ebccf1e3SJoseph Koshy phw->phw_pmc, pm)); 1513ebccf1e3SJoseph Koshy 1514f263522aSJoseph Koshy /* 1515f263522aSJoseph Koshy * Write out saved value and start the PMC. 1516f263522aSJoseph Koshy * 15176161b98cSMatt Macy * Sampling PMCs use a per-thread value, while 1518f263522aSJoseph Koshy * counting mode PMCs use a per-pmc value that is 1519f263522aSJoseph Koshy * inherited across descendants. 1520f263522aSJoseph Koshy */ 1521f263522aSJoseph Koshy if (PMC_TO_MODE(pm) == PMC_MODE_TS) { 15226161b98cSMatt Macy if (pt == NULL) 15236161b98cSMatt Macy pt = pmc_find_thread_descriptor(pp, td, 15246161b98cSMatt Macy PMC_FLAG_NONE); 15256161b98cSMatt Macy 15266161b98cSMatt Macy KASSERT(pt != NULL, 15276161b98cSMatt Macy ("[pmc,%d] No thread found for td=%p", __LINE__, 15286161b98cSMatt Macy td)); 15296161b98cSMatt Macy 1530f263522aSJoseph Koshy mtx_pool_lock_spin(pmc_mtxpool, pm); 15315eaa6f01SJonathan T. Looney 15325eaa6f01SJonathan T. Looney /* 15336161b98cSMatt Macy * If we have a thread descriptor, use the per-thread 15346161b98cSMatt Macy * counter in the descriptor. If not, we will use 15356161b98cSMatt Macy * a per-process counter. 15366161b98cSMatt Macy * 15376161b98cSMatt Macy * TODO: Remove the per-process "safety net" once 15386161b98cSMatt Macy * we have thoroughly tested that we don't hit the 15396161b98cSMatt Macy * above assert. 15405eaa6f01SJonathan T. Looney */ 15416161b98cSMatt Macy if (pt != NULL) { 15426161b98cSMatt Macy if (pt->pt_pmcs[ri].pt_pmcval > 0) 15436161b98cSMatt Macy newvalue = pt->pt_pmcs[ri].pt_pmcval; 15446161b98cSMatt Macy else 15456161b98cSMatt Macy newvalue = pm->pm_sc.pm_reloadcount; 15466161b98cSMatt Macy } else { 15476161b98cSMatt Macy /* 15486161b98cSMatt Macy * Use the saved value calculated after the most 15496161b98cSMatt Macy * recent time a thread using the shared counter 15506161b98cSMatt Macy * switched out. Reset the saved count in case 15516161b98cSMatt Macy * another thread from this process switches in 15526161b98cSMatt Macy * before any threads switch out. 15536161b98cSMatt Macy */ 15546161b98cSMatt Macy newvalue = pp->pp_pmcs[ri].pp_pmcval; 15556161b98cSMatt Macy pp->pp_pmcs[ri].pp_pmcval = 15566161b98cSMatt Macy pm->pm_sc.pm_reloadcount; 15576161b98cSMatt Macy } 1558f263522aSJoseph Koshy mtx_pool_unlock_spin(pmc_mtxpool, pm); 15596161b98cSMatt Macy KASSERT(newvalue > 0 && newvalue <= 15606161b98cSMatt Macy pm->pm_sc.pm_reloadcount, 15616161b98cSMatt Macy ("[pmc,%d] pmcval outside of expected range cpu=%d " 15626161b98cSMatt Macy "ri=%d pmcval=%jx pm_reloadcount=%jx", __LINE__, 15636161b98cSMatt Macy cpu, ri, newvalue, pm->pm_sc.pm_reloadcount)); 1564f263522aSJoseph Koshy } else { 1565f263522aSJoseph Koshy KASSERT(PMC_TO_MODE(pm) == PMC_MODE_TC, 1566f263522aSJoseph Koshy ("[pmc,%d] illegal mode=%d", __LINE__, 1567f263522aSJoseph Koshy PMC_TO_MODE(pm))); 1568ebccf1e3SJoseph Koshy mtx_pool_lock_spin(pmc_mtxpool, pm); 1569ebccf1e3SJoseph Koshy newvalue = PMC_PCPU_SAVED(cpu, ri) = 1570ebccf1e3SJoseph Koshy pm->pm_gv.pm_savedvalue; 1571ebccf1e3SJoseph Koshy mtx_pool_unlock_spin(pmc_mtxpool, pm); 1572f263522aSJoseph Koshy } 1573f263522aSJoseph Koshy 15744a3690dfSJohn Baldwin PMCDBG3(CSW,SWI,1,"cpu=%d ri=%d new=%jd", cpu, ri, newvalue); 1575ebccf1e3SJoseph Koshy 157601c35b67SMitchell Horne (void)pcd->pcd_write_pmc(cpu, adjri, pm, newvalue); 1577a3924968SJonathan T. Looney 1578a3924968SJonathan T. Looney /* If a sampling mode PMC, reset stalled state. */ 1579a3924968SJonathan T. Looney if (PMC_TO_MODE(pm) == PMC_MODE_TS) 1580e6b475e0SMatt Macy pm->pm_pcpu_state[cpu].pps_stalled = 0; 1581a3924968SJonathan T. Looney 1582a3924968SJonathan T. Looney /* Indicate that we desire this to run. */ 1583e6b475e0SMatt Macy pm->pm_pcpu_state[cpu].pps_cpustate = 1; 1584a3924968SJonathan T. Looney 1585a3924968SJonathan T. Looney /* Start the PMC. */ 158601c35b67SMitchell Horne (void)pcd->pcd_start_pmc(cpu, adjri, pm); 1587ebccf1e3SJoseph Koshy } 1588ebccf1e3SJoseph Koshy 1589ebccf1e3SJoseph Koshy /* 159001c35b67SMitchell Horne * Perform any other architecture/cpu dependent thread 1591ebccf1e3SJoseph Koshy * switch-in actions. 1592ebccf1e3SJoseph Koshy */ 15936b8c8cd8SJoseph Koshy (void)(*md->pmd_switch_in)(pc, pp); 1594ebccf1e3SJoseph Koshy 1595ebccf1e3SJoseph Koshy critical_exit(); 1596ebccf1e3SJoseph Koshy } 1597ebccf1e3SJoseph Koshy 1598ebccf1e3SJoseph Koshy /* 1599ebccf1e3SJoseph Koshy * Thread context switch OUT. 1600ebccf1e3SJoseph Koshy */ 1601f263522aSJoseph Koshy static void 1602f263522aSJoseph Koshy pmc_process_csw_out(struct thread *td) 1603ebccf1e3SJoseph Koshy { 1604ebccf1e3SJoseph Koshy struct pmc *pm; 160501c35b67SMitchell Horne struct pmc_classdep *pcd; 1606ebccf1e3SJoseph Koshy struct pmc_cpu *pc; 1607e829eb6dSJoseph Koshy struct pmc_process *pp; 16086161b98cSMatt Macy struct pmc_thread *pt = NULL; 160901c35b67SMitchell Horne struct proc *p; 161001c35b67SMitchell Horne pmc_value_t newvalue; 161101c35b67SMitchell Horne int64_t tmp; 161201c35b67SMitchell Horne enum pmc_mode mode; 161301c35b67SMitchell Horne int cpu; 161401c35b67SMitchell Horne u_int adjri, ri; 1615ebccf1e3SJoseph Koshy 1616ebccf1e3SJoseph Koshy /* 1617ebccf1e3SJoseph Koshy * Locate our process descriptor; this may be NULL if 1618ebccf1e3SJoseph Koshy * this process is exiting and we have already removed 1619ebccf1e3SJoseph Koshy * the process from the target process table. 1620ebccf1e3SJoseph Koshy * 1621ebccf1e3SJoseph Koshy * Note that due to kernel preemption, multiple 1622ebccf1e3SJoseph Koshy * context switches may happen while the process is 1623ebccf1e3SJoseph Koshy * exiting. 1624ebccf1e3SJoseph Koshy * 1625ebccf1e3SJoseph Koshy * Note also that if the target process cannot be 1626ebccf1e3SJoseph Koshy * found we still need to deconfigure any PMCs that 1627ebccf1e3SJoseph Koshy * are currently running on hardware. 1628ebccf1e3SJoseph Koshy */ 1629ebccf1e3SJoseph Koshy p = td->td_proc; 1630ebccf1e3SJoseph Koshy pp = pmc_find_process_descriptor(p, PMC_FLAG_NONE); 1631ebccf1e3SJoseph Koshy 1632ebccf1e3SJoseph Koshy critical_enter(); 1633ebccf1e3SJoseph Koshy 1634ebccf1e3SJoseph Koshy cpu = PCPU_GET(cpuid); /* td->td_oncpu is invalid */ 1635ebccf1e3SJoseph Koshy 16364a3690dfSJohn Baldwin PMCDBG5(CSW,SWO,1, "cpu=%d proc=%p (%d, %s) pp=%p", cpu, p, 1637ebccf1e3SJoseph Koshy p->p_pid, p->p_comm, pp); 1638ebccf1e3SJoseph Koshy 1639122ccdc1SJoseph Koshy KASSERT(cpu >= 0 && cpu < pmc_cpu_max(), 1640b790c193SPedro F. Giffuni ("[pmc,%d weird CPU id %d", __LINE__, cpu)); 1641ebccf1e3SJoseph Koshy 1642ebccf1e3SJoseph Koshy pc = pmc_pcpu[cpu]; 1643ebccf1e3SJoseph Koshy 1644ebccf1e3SJoseph Koshy /* 1645ebccf1e3SJoseph Koshy * When a PMC gets unlinked from a target PMC, it will 1646ebccf1e3SJoseph Koshy * be removed from the target's pp_pmc[] array. 1647ebccf1e3SJoseph Koshy * 1648ebccf1e3SJoseph Koshy * However, on a MP system, the target could have been 1649ebccf1e3SJoseph Koshy * executing on another CPU at the time of the unlink. 1650ebccf1e3SJoseph Koshy * So, at context switch OUT time, we need to look at 1651ebccf1e3SJoseph Koshy * the hardware to determine if a PMC is scheduled on 1652ebccf1e3SJoseph Koshy * it. 1653ebccf1e3SJoseph Koshy */ 1654ebccf1e3SJoseph Koshy for (ri = 0; ri < md->pmd_npmc; ri++) { 1655e829eb6dSJoseph Koshy pcd = pmc_ri_to_classdep(md, ri, &adjri); 1656c5153e19SJoseph Koshy pm = NULL; 1657e829eb6dSJoseph Koshy (void)(*pcd->pcd_get_config)(cpu, adjri, &pm); 1658ebccf1e3SJoseph Koshy 1659ebccf1e3SJoseph Koshy if (pm == NULL) /* nothing at this row index */ 1660ebccf1e3SJoseph Koshy continue; 1661ebccf1e3SJoseph Koshy 1662f263522aSJoseph Koshy mode = PMC_TO_MODE(pm); 1663f263522aSJoseph Koshy if (!PMC_IS_VIRTUAL_MODE(mode)) 1664ebccf1e3SJoseph Koshy continue; /* not a process virtual PMC */ 1665ebccf1e3SJoseph Koshy 1666c5153e19SJoseph Koshy KASSERT(PMC_TO_ROWINDEX(pm) == ri, 1667ebccf1e3SJoseph Koshy ("[pmc,%d] ri mismatch pmc(%d) ri(%d)", 1668c5153e19SJoseph Koshy __LINE__, PMC_TO_ROWINDEX(pm), ri)); 1669ebccf1e3SJoseph Koshy 1670a3924968SJonathan T. Looney /* 1671a3924968SJonathan T. Looney * Change desired state, and then stop if not stalled. 1672a3924968SJonathan T. Looney * This two-step dance should avoid race conditions where 1673a3924968SJonathan T. Looney * an interrupt re-enables the PMC after this code has 1674a3924968SJonathan T. Looney * already checked the pm_stalled flag. 1675a3924968SJonathan T. Looney */ 1676e6b475e0SMatt Macy pm->pm_pcpu_state[cpu].pps_cpustate = 0; 1677e6b475e0SMatt Macy if (pm->pm_pcpu_state[cpu].pps_stalled == 0) 167801c35b67SMitchell Horne (void)pcd->pcd_stop_pmc(cpu, adjri, pm); 1679ebccf1e3SJoseph Koshy 1680d9f1b8dbSMatt Macy KASSERT(counter_u64_fetch(pm->pm_runcount) > 0, 168101c35b67SMitchell Horne ("[pmc,%d] pm=%p runcount %ju", __LINE__, pm, 168201c35b67SMitchell Horne (uintmax_t)counter_u64_fetch(pm->pm_runcount))); 1683d9f1b8dbSMatt Macy 1684ebccf1e3SJoseph Koshy /* reduce this PMC's runcount */ 1685e6b475e0SMatt Macy counter_u64_add(pm->pm_runcount, -1); 1686ebccf1e3SJoseph Koshy 1687ebccf1e3SJoseph Koshy /* 1688ebccf1e3SJoseph Koshy * If this PMC is associated with this process, 1689ebccf1e3SJoseph Koshy * save the reading. 1690ebccf1e3SJoseph Koshy */ 1691593077d6SAndriy Gapon if (pm->pm_state != PMC_STATE_DELETED && pp != NULL && 1692593077d6SAndriy Gapon pp->pp_pmcs[ri].pp_pmc != NULL) { 1693ebccf1e3SJoseph Koshy KASSERT(pm == pp->pp_pmcs[ri].pp_pmc, 1694f263522aSJoseph Koshy ("[pmc,%d] pm %p != pp_pmcs[%d] %p", __LINE__, 1695f263522aSJoseph Koshy pm, ri, pp->pp_pmcs[ri].pp_pmc)); 1696ebccf1e3SJoseph Koshy KASSERT(pp->pp_refcnt > 0, 1697ebccf1e3SJoseph Koshy ("[pmc,%d] pp refcnt = %d", __LINE__, 1698ebccf1e3SJoseph Koshy pp->pp_refcnt)); 1699ebccf1e3SJoseph Koshy 170001c35b67SMitchell Horne (void)pcd->pcd_read_pmc(cpu, adjri, pm, &newvalue); 1701ebccf1e3SJoseph Koshy 1702f263522aSJoseph Koshy if (mode == PMC_MODE_TS) { 17036161b98cSMatt Macy PMCDBG3(CSW,SWO,1,"cpu=%d ri=%d val=%jd (samp)", 17046161b98cSMatt Macy cpu, ri, newvalue); 1705f263522aSJoseph Koshy 17066161b98cSMatt Macy if (pt == NULL) 17076161b98cSMatt Macy pt = pmc_find_thread_descriptor(pp, td, 17086161b98cSMatt Macy PMC_FLAG_NONE); 17096161b98cSMatt Macy 17106161b98cSMatt Macy KASSERT(pt != NULL, 17116161b98cSMatt Macy ("[pmc,%d] No thread found for td=%p", 17126161b98cSMatt Macy __LINE__, td)); 17136161b98cSMatt Macy 1714f263522aSJoseph Koshy mtx_pool_lock_spin(pmc_mtxpool, pm); 17155eaa6f01SJonathan T. Looney 17166161b98cSMatt Macy /* 17176161b98cSMatt Macy * If we have a thread descriptor, save the 17186161b98cSMatt Macy * per-thread counter in the descriptor. If not, 17196161b98cSMatt Macy * we will update the per-process counter. 17206161b98cSMatt Macy * 17216161b98cSMatt Macy * TODO: Remove the per-process "safety net" 17226161b98cSMatt Macy * once we have thoroughly tested that we 17236161b98cSMatt Macy * don't hit the above assert. 17246161b98cSMatt Macy */ 1725d5ee4074SMitchell Horne if (pt != NULL) { 17266161b98cSMatt Macy pt->pt_pmcs[ri].pt_pmcval = newvalue; 1727d5ee4074SMitchell Horne } else { 17286161b98cSMatt Macy /* 17296161b98cSMatt Macy * For sampling process-virtual PMCs, 17306161b98cSMatt Macy * newvalue is the number of events to 17316161b98cSMatt Macy * be seen until the next sampling 17326161b98cSMatt Macy * interrupt. We can just add the events 17336161b98cSMatt Macy * left from this invocation to the 17346161b98cSMatt Macy * counter, then adjust in case we 17356161b98cSMatt Macy * overflow our range. 17366161b98cSMatt Macy * 17376161b98cSMatt Macy * (Recall that we reload the counter 17386161b98cSMatt Macy * every time we use it.) 17396161b98cSMatt Macy */ 17405eaa6f01SJonathan T. Looney pp->pp_pmcs[ri].pp_pmcval += newvalue; 17415eaa6f01SJonathan T. Looney if (pp->pp_pmcs[ri].pp_pmcval > 1742d5ee4074SMitchell Horne pm->pm_sc.pm_reloadcount) { 17435eaa6f01SJonathan T. Looney pp->pp_pmcs[ri].pp_pmcval -= 1744f263522aSJoseph Koshy pm->pm_sc.pm_reloadcount; 17456161b98cSMatt Macy } 1746d5ee4074SMitchell Horne } 1747f263522aSJoseph Koshy mtx_pool_unlock_spin(pmc_mtxpool, pm); 1748f263522aSJoseph Koshy } else { 17495eaa6f01SJonathan T. Looney tmp = newvalue - PMC_PCPU_SAVED(cpu, ri); 17505eaa6f01SJonathan T. Looney 17515eaa6f01SJonathan T. Looney PMCDBG3(CSW,SWO,1,"cpu=%d ri=%d tmp=%jd (count)", 17525eaa6f01SJonathan T. Looney cpu, ri, tmp); 1753f263522aSJoseph Koshy 1754f263522aSJoseph Koshy /* 1755f263522aSJoseph Koshy * For counting process-virtual PMCs, 1756f263522aSJoseph Koshy * we expect the count to be 1757f263522aSJoseph Koshy * increasing monotonically, modulo a 64 1758f263522aSJoseph Koshy * bit wraparound. 1759f263522aSJoseph Koshy */ 17600c8cc7b0SKonstantin Belousov KASSERT(tmp >= 0, 1761ebccf1e3SJoseph Koshy ("[pmc,%d] negative increment cpu=%d " 1762ebccf1e3SJoseph Koshy "ri=%d newvalue=%jx saved=%jx " 1763ebccf1e3SJoseph Koshy "incr=%jx", __LINE__, cpu, ri, 1764f263522aSJoseph Koshy newvalue, PMC_PCPU_SAVED(cpu, ri), tmp)); 1765ebccf1e3SJoseph Koshy 1766ebccf1e3SJoseph Koshy mtx_pool_lock_spin(pmc_mtxpool, pm); 1767ebccf1e3SJoseph Koshy pm->pm_gv.pm_savedvalue += tmp; 1768ebccf1e3SJoseph Koshy pp->pp_pmcs[ri].pp_pmcval += tmp; 1769ebccf1e3SJoseph Koshy mtx_pool_unlock_spin(pmc_mtxpool, pm); 1770ebccf1e3SJoseph Koshy 1771f263522aSJoseph Koshy if (pm->pm_flags & PMC_F_LOG_PROCCSW) 1772a85289cfSMatt Macy pmclog_process_proccsw(pm, pp, tmp, td); 1773f263522aSJoseph Koshy } 1774ebccf1e3SJoseph Koshy } 1775ebccf1e3SJoseph Koshy 177601c35b67SMitchell Horne /* Mark hardware as free. */ 177701c35b67SMitchell Horne (void)pcd->pcd_config_pmc(cpu, adjri, NULL); 1778ebccf1e3SJoseph Koshy } 1779ebccf1e3SJoseph Koshy 1780ebccf1e3SJoseph Koshy /* 178101c35b67SMitchell Horne * Perform any other architecture/cpu dependent thread 1782ebccf1e3SJoseph Koshy * switch out functions. 1783ebccf1e3SJoseph Koshy */ 17846b8c8cd8SJoseph Koshy (void)(*md->pmd_switch_out)(pc, pp); 1785ebccf1e3SJoseph Koshy 1786ebccf1e3SJoseph Koshy critical_exit(); 1787f263522aSJoseph Koshy } 1788f263522aSJoseph Koshy 1789f263522aSJoseph Koshy /* 17906161b98cSMatt Macy * A new thread for a process. 17916161b98cSMatt Macy */ 17926161b98cSMatt Macy static void 17936161b98cSMatt Macy pmc_process_thread_add(struct thread *td) 17946161b98cSMatt Macy { 17956161b98cSMatt Macy struct pmc_process *pmc; 17966161b98cSMatt Macy 17976161b98cSMatt Macy pmc = pmc_find_process_descriptor(td->td_proc, PMC_FLAG_NONE); 17986161b98cSMatt Macy if (pmc != NULL) 17996161b98cSMatt Macy pmc_find_thread_descriptor(pmc, td, PMC_FLAG_ALLOCATE); 18006161b98cSMatt Macy } 18016161b98cSMatt Macy 18026161b98cSMatt Macy /* 18036161b98cSMatt Macy * A thread delete for a process. 18046161b98cSMatt Macy */ 18056161b98cSMatt Macy static void 18066161b98cSMatt Macy pmc_process_thread_delete(struct thread *td) 18076161b98cSMatt Macy { 18086161b98cSMatt Macy struct pmc_process *pmc; 18096161b98cSMatt Macy 18106161b98cSMatt Macy pmc = pmc_find_process_descriptor(td->td_proc, PMC_FLAG_NONE); 18116161b98cSMatt Macy if (pmc != NULL) 18126161b98cSMatt Macy pmc_thread_descriptor_pool_free(pmc_find_thread_descriptor(pmc, 18136161b98cSMatt Macy td, PMC_FLAG_REMOVE)); 18146161b98cSMatt Macy } 18156161b98cSMatt Macy 18166161b98cSMatt Macy /* 18175de96e33SMatt Macy * A userret() call for a thread. 18185de96e33SMatt Macy */ 18195de96e33SMatt Macy static void 18205de96e33SMatt Macy pmc_process_thread_userret(struct thread *td) 18215de96e33SMatt Macy { 1822ac7012d2SMatt Macy sched_pin(); 1823ac7012d2SMatt Macy pmc_capture_user_callchain(curcpu, PMC_UR, td->td_frame); 1824ac7012d2SMatt Macy sched_unpin(); 18255de96e33SMatt Macy } 18265de96e33SMatt Macy 18275de96e33SMatt Macy /* 182849874f6eSJoseph Koshy * A mapping change for a process. 182949874f6eSJoseph Koshy */ 183049874f6eSJoseph Koshy static void 183149874f6eSJoseph Koshy pmc_process_mmap(struct thread *td, struct pmckern_map_in *pkm) 183249874f6eSJoseph Koshy { 183349874f6eSJoseph Koshy const struct pmc *pm; 183449874f6eSJoseph Koshy const struct pmc_process *pp; 183501c35b67SMitchell Horne struct pmc_owner *po; 183601c35b67SMitchell Horne char *fullpath, *freepath; 183701c35b67SMitchell Horne pid_t pid; 183801c35b67SMitchell Horne int ri; 183901c35b67SMitchell Horne 184001c35b67SMitchell Horne MPASS(!in_epoch(global_epoch_preempt)); 184149874f6eSJoseph Koshy 184249874f6eSJoseph Koshy freepath = fullpath = NULL; 184349874f6eSJoseph Koshy pmc_getfilename((struct vnode *)pkm->pm_file, &fullpath, &freepath); 184449874f6eSJoseph Koshy 184549874f6eSJoseph Koshy pid = td->td_proc->p_pid; 184649874f6eSJoseph Koshy 18476573d758SMatt Macy PMC_EPOCH_ENTER(); 184849874f6eSJoseph Koshy /* Inform owners of all system-wide sampling PMCs. */ 1849d5ee4074SMitchell Horne CK_LIST_FOREACH(po, &pmc_ss_owners, po_ssnext) { 185049874f6eSJoseph Koshy if (po->po_flags & PMC_PO_OWNS_LOGFILE) 1851d5ee4074SMitchell Horne pmclog_process_map_in(po, pid, pkm->pm_address, 1852d5ee4074SMitchell Horne fullpath); 1853d5ee4074SMitchell Horne } 185449874f6eSJoseph Koshy 185549874f6eSJoseph Koshy if ((pp = pmc_find_process_descriptor(td->td_proc, 0)) == NULL) 185649874f6eSJoseph Koshy goto done; 185749874f6eSJoseph Koshy 185849874f6eSJoseph Koshy /* 185949874f6eSJoseph Koshy * Inform sampling PMC owners tracking this process. 186049874f6eSJoseph Koshy */ 1861d5ee4074SMitchell Horne for (ri = 0; ri < md->pmd_npmc; ri++) { 186249874f6eSJoseph Koshy if ((pm = pp->pp_pmcs[ri].pp_pmc) != NULL && 1863d5ee4074SMitchell Horne PMC_IS_SAMPLING_MODE(PMC_TO_MODE(pm))) { 186449874f6eSJoseph Koshy pmclog_process_map_in(pm->pm_owner, 186549874f6eSJoseph Koshy pid, pkm->pm_address, fullpath); 1866d5ee4074SMitchell Horne } 1867d5ee4074SMitchell Horne } 186849874f6eSJoseph Koshy 186949874f6eSJoseph Koshy done: 1870d5ee4074SMitchell Horne if (freepath != NULL) 18711ede983cSDag-Erling Smørgrav free(freepath, M_TEMP); 18726573d758SMatt Macy PMC_EPOCH_EXIT(); 187349874f6eSJoseph Koshy } 187449874f6eSJoseph Koshy 187549874f6eSJoseph Koshy /* 187649874f6eSJoseph Koshy * Log an munmap request. 187749874f6eSJoseph Koshy */ 187849874f6eSJoseph Koshy static void 187949874f6eSJoseph Koshy pmc_process_munmap(struct thread *td, struct pmckern_map_out *pkm) 188049874f6eSJoseph Koshy { 188149874f6eSJoseph Koshy const struct pmc *pm; 188249874f6eSJoseph Koshy const struct pmc_process *pp; 188301c35b67SMitchell Horne struct pmc_owner *po; 188401c35b67SMitchell Horne pid_t pid; 188501c35b67SMitchell Horne int ri; 188649874f6eSJoseph Koshy 188749874f6eSJoseph Koshy pid = td->td_proc->p_pid; 188849874f6eSJoseph Koshy 18896573d758SMatt Macy PMC_EPOCH_ENTER(); 1890d5ee4074SMitchell Horne CK_LIST_FOREACH(po, &pmc_ss_owners, po_ssnext) { 189149874f6eSJoseph Koshy if (po->po_flags & PMC_PO_OWNS_LOGFILE) 189249874f6eSJoseph Koshy pmclog_process_map_out(po, pid, pkm->pm_address, 189349874f6eSJoseph Koshy pkm->pm_address + pkm->pm_size); 1894d5ee4074SMitchell Horne } 18956573d758SMatt Macy PMC_EPOCH_EXIT(); 189649874f6eSJoseph Koshy 189749874f6eSJoseph Koshy if ((pp = pmc_find_process_descriptor(td->td_proc, 0)) == NULL) 189849874f6eSJoseph Koshy return; 189949874f6eSJoseph Koshy 1900d5ee4074SMitchell Horne for (ri = 0; ri < md->pmd_npmc; ri++) { 1901d5ee4074SMitchell Horne pm = pp->pp_pmcs[ri].pp_pmc; 1902d5ee4074SMitchell Horne if (pm != NULL && PMC_IS_SAMPLING_MODE(PMC_TO_MODE(pm))) { 19037c9f60e3SJoseph Koshy pmclog_process_map_out(pm->pm_owner, pid, 19047c9f60e3SJoseph Koshy pkm->pm_address, pkm->pm_address + pkm->pm_size); 190549874f6eSJoseph Koshy } 1906d5ee4074SMitchell Horne } 1907d5ee4074SMitchell Horne } 190849874f6eSJoseph Koshy 190949874f6eSJoseph Koshy /* 1910d07f36b0SJoseph Koshy * Log mapping information about the kernel. 1911d07f36b0SJoseph Koshy */ 1912d07f36b0SJoseph Koshy static void 1913d07f36b0SJoseph Koshy pmc_log_kernel_mappings(struct pmc *pm) 1914d07f36b0SJoseph Koshy { 1915d07f36b0SJoseph Koshy struct pmc_owner *po; 1916d07f36b0SJoseph Koshy struct pmckern_map_in *km, *kmbase; 1917d07f36b0SJoseph Koshy 19186573d758SMatt Macy MPASS(in_epoch(global_epoch_preempt) || sx_xlocked(&pmc_sx)); 1919d07f36b0SJoseph Koshy KASSERT(PMC_IS_SAMPLING_MODE(PMC_TO_MODE(pm)), 1920d07f36b0SJoseph Koshy ("[pmc,%d] non-sampling PMC (%p) desires mapping information", 1921d07f36b0SJoseph Koshy __LINE__, (void *) pm)); 1922d07f36b0SJoseph Koshy 1923d07f36b0SJoseph Koshy po = pm->pm_owner; 1924d5ee4074SMitchell Horne if ((po->po_flags & PMC_PO_INITIAL_MAPPINGS_DONE) != 0) 1925d07f36b0SJoseph Koshy return; 1926693cd307SMitchell Horne 192741abd7afSMatt Macy if (PMC_TO_MODE(pm) == PMC_MODE_SS) 192841abd7afSMatt Macy pmc_process_allproc(pm); 1929693cd307SMitchell Horne 1930d07f36b0SJoseph Koshy /* 1931d07f36b0SJoseph Koshy * Log the current set of kernel modules. 1932d07f36b0SJoseph Koshy */ 1933d07f36b0SJoseph Koshy kmbase = linker_hwpmc_list_objects(); 1934d07f36b0SJoseph Koshy for (km = kmbase; km->pm_file != NULL; km++) { 19354a3690dfSJohn Baldwin PMCDBG2(LOG,REG,1,"%s %p", (char *)km->pm_file, 1936d07f36b0SJoseph Koshy (void *)km->pm_address); 1937d07f36b0SJoseph Koshy pmclog_process_map_in(po, (pid_t)-1, km->pm_address, 1938d07f36b0SJoseph Koshy km->pm_file); 1939d07f36b0SJoseph Koshy } 19401ede983cSDag-Erling Smørgrav free(kmbase, M_LINKER); 1941d07f36b0SJoseph Koshy 1942d07f36b0SJoseph Koshy po->po_flags |= PMC_PO_INITIAL_MAPPINGS_DONE; 1943d07f36b0SJoseph Koshy } 1944d07f36b0SJoseph Koshy 1945d07f36b0SJoseph Koshy /* 1946d07f36b0SJoseph Koshy * Log the mappings for a single process. 1947d07f36b0SJoseph Koshy */ 1948d07f36b0SJoseph Koshy static void 1949d07f36b0SJoseph Koshy pmc_log_process_mappings(struct pmc_owner *po, struct proc *p) 1950d07f36b0SJoseph Koshy { 1951bf792d68SJoseph Koshy vm_map_t map; 1952bf792d68SJoseph Koshy vm_map_entry_t entry; 1953bf792d68SJoseph Koshy vm_object_t obj, lobj, tobj; 195401c35b67SMitchell Horne vm_offset_t last_end; 195501c35b67SMitchell Horne vm_offset_t start_addr; 195601c35b67SMitchell Horne struct vnode *vp, *last_vp; 195701c35b67SMitchell Horne struct vmspace *vm; 1958bf792d68SJoseph Koshy char *fullpath, *freepath; 195901c35b67SMitchell Horne u_int last_timestamp; 1960bf792d68SJoseph Koshy 1961bf792d68SJoseph Koshy last_vp = NULL; 1962bf792d68SJoseph Koshy last_end = (vm_offset_t)0; 1963bf792d68SJoseph Koshy fullpath = freepath = NULL; 1964bf792d68SJoseph Koshy 1965bf792d68SJoseph Koshy if ((vm = vmspace_acquire_ref(p)) == NULL) 1966bf792d68SJoseph Koshy return; 1967bf792d68SJoseph Koshy 1968bf792d68SJoseph Koshy map = &vm->vm_map; 1969bf792d68SJoseph Koshy vm_map_lock_read(map); 19702288078cSDoug Moore VM_MAP_ENTRY_FOREACH(entry, map) { 1971bf792d68SJoseph Koshy if (entry == NULL) { 19724a3690dfSJohn Baldwin PMCDBG2(LOG,OPS,2, "hwpmc: vm_map entry unexpectedly " 1973bf792d68SJoseph Koshy "NULL! pid=%d vm_map=%p\n", p->p_pid, map); 1974bf792d68SJoseph Koshy break; 1975bf792d68SJoseph Koshy } 1976bf792d68SJoseph Koshy 1977bf792d68SJoseph Koshy /* 1978bf792d68SJoseph Koshy * We only care about executable map entries. 1979bf792d68SJoseph Koshy */ 1980d5ee4074SMitchell Horne if ((entry->eflags & MAP_ENTRY_IS_SUB_MAP) != 0 || 1981d5ee4074SMitchell Horne (entry->protection & VM_PROT_EXECUTE) == 0 || 1982d5ee4074SMitchell Horne entry->object.vm_object == NULL) { 1983bf792d68SJoseph Koshy continue; 1984bf792d68SJoseph Koshy } 1985bf792d68SJoseph Koshy 1986bf792d68SJoseph Koshy obj = entry->object.vm_object; 198766c392dfSAlan Cox VM_OBJECT_RLOCK(obj); 1988bf792d68SJoseph Koshy 1989bf792d68SJoseph Koshy /* 199001c35b67SMitchell Horne * Walk the backing_object list to find the base (non-shadowed) 199101c35b67SMitchell Horne * vm_object. 1992bf792d68SJoseph Koshy */ 1993d5ee4074SMitchell Horne for (lobj = tobj = obj; tobj != NULL; 1994d5ee4074SMitchell Horne tobj = tobj->backing_object) { 1995bf792d68SJoseph Koshy if (tobj != obj) 199666c392dfSAlan Cox VM_OBJECT_RLOCK(tobj); 1997bf792d68SJoseph Koshy if (lobj != obj) 199866c392dfSAlan Cox VM_OBJECT_RUNLOCK(lobj); 1999bf792d68SJoseph Koshy lobj = tobj; 2000bf792d68SJoseph Koshy } 2001bf792d68SJoseph Koshy 2002bf792d68SJoseph Koshy /* 2003bf792d68SJoseph Koshy * At this point lobj is the base vm_object and it is locked. 2004bf792d68SJoseph Koshy */ 2005bf792d68SJoseph Koshy if (lobj == NULL) { 2006693cd307SMitchell Horne PMCDBG3(LOG,OPS,2, 2007693cd307SMitchell Horne "hwpmc: lobj unexpectedly NULL! pid=%d " 2008bf792d68SJoseph Koshy "vm_map=%p vm_obj=%p\n", p->p_pid, map, obj); 200966c392dfSAlan Cox VM_OBJECT_RUNLOCK(obj); 2010bf792d68SJoseph Koshy continue; 2011bf792d68SJoseph Koshy } 2012bf792d68SJoseph Koshy 201363e4c6cdSEric van Gyzen vp = vm_object_vnode(lobj); 201463e4c6cdSEric van Gyzen if (vp == NULL) { 2015bf792d68SJoseph Koshy if (lobj != obj) 201666c392dfSAlan Cox VM_OBJECT_RUNLOCK(lobj); 201766c392dfSAlan Cox VM_OBJECT_RUNLOCK(obj); 2018bf792d68SJoseph Koshy continue; 2019bf792d68SJoseph Koshy } 2020bf792d68SJoseph Koshy 2021bf792d68SJoseph Koshy /* 202201c35b67SMitchell Horne * Skip contiguous regions that point to the same vnode, so we 202301c35b67SMitchell Horne * don't emit redundant MAP-IN directives. 2024bf792d68SJoseph Koshy */ 202563e4c6cdSEric van Gyzen if (entry->start == last_end && vp == last_vp) { 2026bf792d68SJoseph Koshy last_end = entry->end; 2027bf792d68SJoseph Koshy if (lobj != obj) 202866c392dfSAlan Cox VM_OBJECT_RUNLOCK(lobj); 202966c392dfSAlan Cox VM_OBJECT_RUNLOCK(obj); 2030bf792d68SJoseph Koshy continue; 2031bf792d68SJoseph Koshy } 2032bf792d68SJoseph Koshy 2033bf792d68SJoseph Koshy /* 203401c35b67SMitchell Horne * We don't want to keep the proc's vm_map or this vm_object 203501c35b67SMitchell Horne * locked while we walk the pathname, since vn_fullpath() can 203601c35b67SMitchell Horne * sleep. However, if we drop the lock, it's possible for 203701c35b67SMitchell Horne * concurrent activity to modify the vm_map list. To protect 203801c35b67SMitchell Horne * against this, we save the vm_map timestamp before we release 203901c35b67SMitchell Horne * the lock, and check it after we reacquire the lock below. 2040bf792d68SJoseph Koshy */ 2041bf792d68SJoseph Koshy start_addr = entry->start; 2042bf792d68SJoseph Koshy last_end = entry->end; 2043bf792d68SJoseph Koshy last_timestamp = map->timestamp; 2044bf792d68SJoseph Koshy vm_map_unlock_read(map); 2045bf792d68SJoseph Koshy 2046bf792d68SJoseph Koshy vref(vp); 2047bf792d68SJoseph Koshy if (lobj != obj) 204866c392dfSAlan Cox VM_OBJECT_RUNLOCK(lobj); 204966c392dfSAlan Cox VM_OBJECT_RUNLOCK(obj); 2050bf792d68SJoseph Koshy 2051bf792d68SJoseph Koshy freepath = NULL; 2052bf792d68SJoseph Koshy pmc_getfilename(vp, &fullpath, &freepath); 2053bf792d68SJoseph Koshy last_vp = vp; 2054e9b5dc16SJoseph Koshy 2055bf792d68SJoseph Koshy vrele(vp); 2056e9b5dc16SJoseph Koshy 2057bf792d68SJoseph Koshy vp = NULL; 2058bf792d68SJoseph Koshy pmclog_process_map_in(po, p->p_pid, start_addr, fullpath); 2059d5ee4074SMitchell Horne if (freepath != NULL) 2060bf792d68SJoseph Koshy free(freepath, M_TEMP); 2061bf792d68SJoseph Koshy 2062bf792d68SJoseph Koshy vm_map_lock_read(map); 2063bf792d68SJoseph Koshy 2064bf792d68SJoseph Koshy /* 2065bf792d68SJoseph Koshy * If our saved timestamp doesn't match, this means 2066bf792d68SJoseph Koshy * that the vm_map was modified out from under us and 2067bf792d68SJoseph Koshy * we can't trust our current "entry" pointer. Do a 2068bf792d68SJoseph Koshy * new lookup for this entry. If there is no entry 2069bf792d68SJoseph Koshy * for this address range, vm_map_lookup_entry() will 2070bf792d68SJoseph Koshy * return the previous one, so we always want to go to 20712288078cSDoug Moore * the next entry on the next loop iteration. 2072bf792d68SJoseph Koshy * 2073bf792d68SJoseph Koshy * There is an edge condition here that can occur if 2074bf792d68SJoseph Koshy * there is no entry at or before this address. In 2075bf792d68SJoseph Koshy * this situation, vm_map_lookup_entry returns 2076bf792d68SJoseph Koshy * &map->header, which would cause our loop to abort 2077bf792d68SJoseph Koshy * without processing the rest of the map. However, 2078bf792d68SJoseph Koshy * in practice this will never happen for process 2079bf792d68SJoseph Koshy * vm_map. This is because the executable's text 2080bf792d68SJoseph Koshy * segment is the first mapping in the proc's address 2081bf792d68SJoseph Koshy * space, and this mapping is never removed until the 2082bf792d68SJoseph Koshy * process exits, so there will always be a non-header 2083bf792d68SJoseph Koshy * entry at or before the requested address for 2084bf792d68SJoseph Koshy * vm_map_lookup_entry to return. 2085bf792d68SJoseph Koshy */ 2086bf792d68SJoseph Koshy if (map->timestamp != last_timestamp) 2087bf792d68SJoseph Koshy vm_map_lookup_entry(map, last_end - 1, &entry); 2088bf792d68SJoseph Koshy } 2089bf792d68SJoseph Koshy 2090bf792d68SJoseph Koshy vm_map_unlock_read(map); 2091bf792d68SJoseph Koshy vmspace_free(vm); 2092bf792d68SJoseph Koshy return; 2093d07f36b0SJoseph Koshy } 2094d07f36b0SJoseph Koshy 2095d07f36b0SJoseph Koshy /* 2096d07f36b0SJoseph Koshy * Log mappings for all processes in the system. 2097d07f36b0SJoseph Koshy */ 2098d07f36b0SJoseph Koshy static void 2099d07f36b0SJoseph Koshy pmc_log_all_process_mappings(struct pmc_owner *po) 2100d07f36b0SJoseph Koshy { 2101d07f36b0SJoseph Koshy struct proc *p, *top; 2102d07f36b0SJoseph Koshy 2103d07f36b0SJoseph Koshy sx_assert(&pmc_sx, SX_XLOCKED); 2104d07f36b0SJoseph Koshy 2105d07f36b0SJoseph Koshy if ((p = pfind(1)) == NULL) 2106d07f36b0SJoseph Koshy panic("[pmc,%d] Cannot find init", __LINE__); 2107d07f36b0SJoseph Koshy 2108d07f36b0SJoseph Koshy PROC_UNLOCK(p); 2109d07f36b0SJoseph Koshy 2110d07f36b0SJoseph Koshy sx_slock(&proctree_lock); 2111d07f36b0SJoseph Koshy 2112d07f36b0SJoseph Koshy top = p; 2113d07f36b0SJoseph Koshy for (;;) { 2114d07f36b0SJoseph Koshy pmc_log_process_mappings(po, p); 2115d07f36b0SJoseph Koshy if (!LIST_EMPTY(&p->p_children)) 2116d07f36b0SJoseph Koshy p = LIST_FIRST(&p->p_children); 2117d07f36b0SJoseph Koshy else for (;;) { 2118d07f36b0SJoseph Koshy if (p == top) 2119d07f36b0SJoseph Koshy goto done; 2120d07f36b0SJoseph Koshy if (LIST_NEXT(p, p_sibling)) { 2121d07f36b0SJoseph Koshy p = LIST_NEXT(p, p_sibling); 2122d07f36b0SJoseph Koshy break; 2123d07f36b0SJoseph Koshy } 2124d07f36b0SJoseph Koshy p = p->p_pptr; 2125d07f36b0SJoseph Koshy } 2126d07f36b0SJoseph Koshy } 2127d07f36b0SJoseph Koshy done: 2128d07f36b0SJoseph Koshy sx_sunlock(&proctree_lock); 2129d07f36b0SJoseph Koshy } 2130d07f36b0SJoseph Koshy 2131680f1afdSJohn Baldwin #ifdef HWPMC_DEBUG 2132f263522aSJoseph Koshy const char *pmc_hooknames[] = { 213349874f6eSJoseph Koshy /* these strings correspond to PMC_FN_* in <sys/pmckern.h> */ 2134f263522aSJoseph Koshy "", 2135f263522aSJoseph Koshy "EXEC", 2136f263522aSJoseph Koshy "CSW-IN", 2137f263522aSJoseph Koshy "CSW-OUT", 213849874f6eSJoseph Koshy "SAMPLE", 213929f4e216SMark Johnston "UNUSED1", 214029f4e216SMark Johnston "UNUSED2", 214149874f6eSJoseph Koshy "MMAP", 2142d07f36b0SJoseph Koshy "MUNMAP", 2143f5f9340bSFabien Thomas "CALLCHAIN-NMI", 2144f5f9340bSFabien Thomas "CALLCHAIN-SOFT", 21456161b98cSMatt Macy "SOFTSAMPLING", 21466161b98cSMatt Macy "THR-CREATE", 21476161b98cSMatt Macy "THR-EXIT", 21485de96e33SMatt Macy "THR-USERRET", 2149ebfaf69cSMatt Macy "THR-CREATE-LOG", 2150ebfaf69cSMatt Macy "THR-EXIT-LOG", 2151ebfaf69cSMatt Macy "PROC-CREATE-LOG" 2152f263522aSJoseph Koshy }; 2153f263522aSJoseph Koshy #endif 2154f263522aSJoseph Koshy 215501c35b67SMitchell Horne /* 215601c35b67SMitchell Horne * The 'hook' invoked from the kernel proper 215701c35b67SMitchell Horne */ 2158f263522aSJoseph Koshy static int 2159f263522aSJoseph Koshy pmc_hook_handler(struct thread *td, int function, void *arg) 2160f263522aSJoseph Koshy { 21616161b98cSMatt Macy int cpu; 2162f263522aSJoseph Koshy 21634a3690dfSJohn Baldwin PMCDBG4(MOD,PMH,1, "hook td=%p func=%d \"%s\" arg=%p", td, function, 2164f263522aSJoseph Koshy pmc_hooknames[function], arg); 2165f263522aSJoseph Koshy 2166d5ee4074SMitchell Horne switch (function) { 2167f263522aSJoseph Koshy case PMC_FN_PROCESS_EXEC: 2168c4981694SMitchell Horne pmc_process_exec(td, (struct pmckern_procexec *)arg); 2169ebccf1e3SJoseph Koshy break; 2170ebccf1e3SJoseph Koshy 2171f263522aSJoseph Koshy case PMC_FN_CSW_IN: 2172f263522aSJoseph Koshy pmc_process_csw_in(td); 2173f263522aSJoseph Koshy break; 2174f263522aSJoseph Koshy 2175f263522aSJoseph Koshy case PMC_FN_CSW_OUT: 2176f263522aSJoseph Koshy pmc_process_csw_out(td); 2177f263522aSJoseph Koshy break; 2178f263522aSJoseph Koshy 2179f263522aSJoseph Koshy /* 2180f263522aSJoseph Koshy * Process accumulated PC samples. 2181f263522aSJoseph Koshy * 2182f263522aSJoseph Koshy * This function is expected to be called by hardclock() for 2183f263522aSJoseph Koshy * each CPU that has accumulated PC samples. 2184f263522aSJoseph Koshy * 2185f263522aSJoseph Koshy * This function is to be executed on the CPU whose samples 2186f263522aSJoseph Koshy * are being processed. 2187f263522aSJoseph Koshy */ 2188f263522aSJoseph Koshy case PMC_FN_DO_SAMPLES: 2189f263522aSJoseph Koshy /* 2190f263522aSJoseph Koshy * Clear the cpu specific bit in the CPU mask before 2191f263522aSJoseph Koshy * do the rest of the processing. If the NMI handler 2192f263522aSJoseph Koshy * gets invoked after the "atomic_clear_int()" call 2193f263522aSJoseph Koshy * below but before "pmc_process_samples()" gets 2194f263522aSJoseph Koshy * around to processing the interrupt, then we will 2195f263522aSJoseph Koshy * come back here at the next hardclock() tick (and 2196f263522aSJoseph Koshy * may find nothing to do if "pmc_process_samples()" 2197f263522aSJoseph Koshy * had already processed the interrupt). We don't 2198f263522aSJoseph Koshy * lose the interrupt sample. 2199f263522aSJoseph Koshy */ 2200e6b475e0SMatt Macy DPCPU_SET(pmc_sampled, 0); 22016161b98cSMatt Macy cpu = PCPU_GET(cpuid); 22026161b98cSMatt Macy pmc_process_samples(cpu, PMC_HR); 22036161b98cSMatt Macy pmc_process_samples(cpu, PMC_SR); 22045de96e33SMatt Macy pmc_process_samples(cpu, PMC_UR); 2205f263522aSJoseph Koshy break; 2206f263522aSJoseph Koshy 220749874f6eSJoseph Koshy case PMC_FN_MMAP: 220849874f6eSJoseph Koshy pmc_process_mmap(td, (struct pmckern_map_in *)arg); 220949874f6eSJoseph Koshy break; 221049874f6eSJoseph Koshy 221149874f6eSJoseph Koshy case PMC_FN_MUNMAP: 22126573d758SMatt Macy MPASS(in_epoch(global_epoch_preempt) || sx_xlocked(&pmc_sx)); 221349874f6eSJoseph Koshy pmc_process_munmap(td, (struct pmckern_map_out *)arg); 221449874f6eSJoseph Koshy break; 221549874f6eSJoseph Koshy 2216ebfaf69cSMatt Macy case PMC_FN_PROC_CREATE_LOG: 2217ebfaf69cSMatt Macy pmc_process_proccreate((struct proc *)arg); 2218ebfaf69cSMatt Macy break; 2219ebfaf69cSMatt Macy 2220d07f36b0SJoseph Koshy case PMC_FN_USER_CALLCHAIN: 2221d07f36b0SJoseph Koshy /* 2222d07f36b0SJoseph Koshy * Record a call chain. 2223d07f36b0SJoseph Koshy */ 22246fe00c78SJoseph Koshy KASSERT(td == curthread, ("[pmc,%d] td != curthread", 22256fe00c78SJoseph Koshy __LINE__)); 2226f5f9340bSFabien Thomas 2227f5f9340bSFabien Thomas pmc_capture_user_callchain(PCPU_GET(cpuid), PMC_HR, 2228d07f36b0SJoseph Koshy (struct trapframe *)arg); 22295de96e33SMatt Macy 22305de96e33SMatt Macy KASSERT(td->td_pinned == 1, 22315de96e33SMatt Macy ("[pmc,%d] invalid td_pinned value", __LINE__)); 22325de96e33SMatt Macy sched_unpin(); /* Can migrate safely now. */ 22335de96e33SMatt Macy 22346fe00c78SJoseph Koshy td->td_pflags &= ~TDP_CALLCHAIN; 2235d07f36b0SJoseph Koshy break; 2236d07f36b0SJoseph Koshy 2237f5f9340bSFabien Thomas case PMC_FN_USER_CALLCHAIN_SOFT: 2238f5f9340bSFabien Thomas /* 2239f5f9340bSFabien Thomas * Record a call chain. 2240f5f9340bSFabien Thomas */ 2241f5f9340bSFabien Thomas KASSERT(td == curthread, ("[pmc,%d] td != curthread", 2242f5f9340bSFabien Thomas __LINE__)); 22435de96e33SMatt Macy 22445de96e33SMatt Macy cpu = PCPU_GET(cpuid); 22455de96e33SMatt Macy pmc_capture_user_callchain(cpu, PMC_SR, 2246f5f9340bSFabien Thomas (struct trapframe *) arg); 22475de96e33SMatt Macy 22485de96e33SMatt Macy KASSERT(td->td_pinned == 1, 22495de96e33SMatt Macy ("[pmc,%d] invalid td_pinned value", __LINE__)); 22505de96e33SMatt Macy 22515de96e33SMatt Macy sched_unpin(); /* Can migrate safely now. */ 22525de96e33SMatt Macy 2253f5f9340bSFabien Thomas td->td_pflags &= ~TDP_CALLCHAIN; 2254f5f9340bSFabien Thomas break; 2255f5f9340bSFabien Thomas 2256f5f9340bSFabien Thomas case PMC_FN_SOFT_SAMPLING: 2257f5f9340bSFabien Thomas /* 2258f5f9340bSFabien Thomas * Call soft PMC sampling intr. 2259f5f9340bSFabien Thomas */ 2260f5f9340bSFabien Thomas pmc_soft_intr((struct pmckern_soft *)arg); 2261f5f9340bSFabien Thomas break; 2262f5f9340bSFabien Thomas 22636161b98cSMatt Macy case PMC_FN_THR_CREATE: 22646161b98cSMatt Macy pmc_process_thread_add(td); 2265ebfaf69cSMatt Macy pmc_process_threadcreate(td); 2266ebfaf69cSMatt Macy break; 2267ebfaf69cSMatt Macy 2268ebfaf69cSMatt Macy case PMC_FN_THR_CREATE_LOG: 2269ebfaf69cSMatt Macy pmc_process_threadcreate(td); 22706161b98cSMatt Macy break; 22716161b98cSMatt Macy 22726161b98cSMatt Macy case PMC_FN_THR_EXIT: 22736161b98cSMatt Macy KASSERT(td == curthread, ("[pmc,%d] td != curthread", 22746161b98cSMatt Macy __LINE__)); 22756161b98cSMatt Macy pmc_process_thread_delete(td); 2276ebfaf69cSMatt Macy pmc_process_threadexit(td); 22776161b98cSMatt Macy break; 2278ebfaf69cSMatt Macy case PMC_FN_THR_EXIT_LOG: 2279ebfaf69cSMatt Macy pmc_process_threadexit(td); 2280ebfaf69cSMatt Macy break; 22815de96e33SMatt Macy case PMC_FN_THR_USERRET: 22825de96e33SMatt Macy KASSERT(td == curthread, ("[pmc,%d] td != curthread", 22835de96e33SMatt Macy __LINE__)); 22845de96e33SMatt Macy pmc_process_thread_userret(td); 22855de96e33SMatt Macy break; 2286ebccf1e3SJoseph Koshy default: 2287680f1afdSJohn Baldwin #ifdef HWPMC_DEBUG 2288ebccf1e3SJoseph Koshy KASSERT(0, ("[pmc,%d] unknown hook %d\n", __LINE__, function)); 2289ebccf1e3SJoseph Koshy #endif 2290ebccf1e3SJoseph Koshy break; 2291ebccf1e3SJoseph Koshy } 2292ebccf1e3SJoseph Koshy 229352ebac7fSMitchell Horne return (0); 2294ebccf1e3SJoseph Koshy } 2295ebccf1e3SJoseph Koshy 2296ebccf1e3SJoseph Koshy /* 229701c35b67SMitchell Horne * Allocate a 'struct pmc_owner' descriptor in the owner hash table. 2298ebccf1e3SJoseph Koshy */ 2299ebccf1e3SJoseph Koshy static struct pmc_owner * 2300ebccf1e3SJoseph Koshy pmc_allocate_owner_descriptor(struct proc *p) 2301ebccf1e3SJoseph Koshy { 2302ebccf1e3SJoseph Koshy struct pmc_owner *po; 2303ebccf1e3SJoseph Koshy struct pmc_ownerhash *poh; 230401c35b67SMitchell Horne uint32_t hindex; 2305ebccf1e3SJoseph Koshy 2306ebccf1e3SJoseph Koshy hindex = PMC_HASH_PTR(p, pmc_ownerhashmask); 2307ebccf1e3SJoseph Koshy poh = &pmc_ownerhash[hindex]; 2308ebccf1e3SJoseph Koshy 230901c35b67SMitchell Horne /* Allocate space for N pointers and one descriptor struct. */ 2310e829eb6dSJoseph Koshy po = malloc(sizeof(struct pmc_owner), M_PMC, M_WAITOK | M_ZERO); 2311ebccf1e3SJoseph Koshy po->po_owner = p; 2312ebccf1e3SJoseph Koshy LIST_INSERT_HEAD(poh, po, po_next); /* insert into hash table */ 2313ebccf1e3SJoseph Koshy 2314f263522aSJoseph Koshy TAILQ_INIT(&po->po_logbuffers); 2315382d30cdSJoseph Koshy mtx_init(&po->po_mtx, "pmc-owner-mtx", "pmc-per-proc", MTX_SPIN); 2316f263522aSJoseph Koshy 23174a3690dfSJohn Baldwin PMCDBG4(OWN,ALL,1, "allocate-owner proc=%p (%d, %s) pmc-owner=%p", 2318ebccf1e3SJoseph Koshy p, p->p_pid, p->p_comm, po); 2319ebccf1e3SJoseph Koshy 232052ebac7fSMitchell Horne return (po); 2321ebccf1e3SJoseph Koshy } 2322ebccf1e3SJoseph Koshy 2323f263522aSJoseph Koshy static void 2324f263522aSJoseph Koshy pmc_destroy_owner_descriptor(struct pmc_owner *po) 2325f263522aSJoseph Koshy { 2326f263522aSJoseph Koshy 23274a3690dfSJohn Baldwin PMCDBG4(OWN,REL,1, "destroy-owner po=%p proc=%p (%d, %s)", 2328f263522aSJoseph Koshy po, po->po_owner, po->po_owner->p_pid, po->po_owner->p_comm); 2329f263522aSJoseph Koshy 2330f263522aSJoseph Koshy mtx_destroy(&po->po_mtx); 23311ede983cSDag-Erling Smørgrav free(po, M_PMC); 2332f263522aSJoseph Koshy } 2333f263522aSJoseph Koshy 2334ebccf1e3SJoseph Koshy /* 23356161b98cSMatt Macy * Allocate a thread descriptor from the free pool. 23366161b98cSMatt Macy * 23376161b98cSMatt Macy * NOTE: This *can* return NULL. 23386161b98cSMatt Macy */ 23396161b98cSMatt Macy static struct pmc_thread * 23406161b98cSMatt Macy pmc_thread_descriptor_pool_alloc(void) 23416161b98cSMatt Macy { 23426161b98cSMatt Macy struct pmc_thread *pt; 23436161b98cSMatt Macy 23446161b98cSMatt Macy mtx_lock_spin(&pmc_threadfreelist_mtx); 23456161b98cSMatt Macy if ((pt = LIST_FIRST(&pmc_threadfreelist)) != NULL) { 23466161b98cSMatt Macy LIST_REMOVE(pt, pt_next); 23476161b98cSMatt Macy pmc_threadfreelist_entries--; 23486161b98cSMatt Macy } 23496161b98cSMatt Macy mtx_unlock_spin(&pmc_threadfreelist_mtx); 23506161b98cSMatt Macy 23516161b98cSMatt Macy return (pt); 23526161b98cSMatt Macy } 23536161b98cSMatt Macy 23546161b98cSMatt Macy /* 23556161b98cSMatt Macy * Add a thread descriptor to the free pool. We use this instead of free() 23566161b98cSMatt Macy * to maintain a cache of free entries. Additionally, we can safely call 23576161b98cSMatt Macy * this function when we cannot call free(), such as in a critical section. 23586161b98cSMatt Macy */ 23596161b98cSMatt Macy static void 23606161b98cSMatt Macy pmc_thread_descriptor_pool_free(struct pmc_thread *pt) 23616161b98cSMatt Macy { 23626161b98cSMatt Macy 23636161b98cSMatt Macy if (pt == NULL) 23646161b98cSMatt Macy return; 23656161b98cSMatt Macy 23666161b98cSMatt Macy memset(pt, 0, THREADENTRY_SIZE); 23676161b98cSMatt Macy mtx_lock_spin(&pmc_threadfreelist_mtx); 23686161b98cSMatt Macy LIST_INSERT_HEAD(&pmc_threadfreelist, pt, pt_next); 23696161b98cSMatt Macy pmc_threadfreelist_entries++; 23706161b98cSMatt Macy if (pmc_threadfreelist_entries > pmc_threadfreelist_max) 23719b1d850bSMark Johnston taskqueue_enqueue(taskqueue_fast, &free_task); 23726161b98cSMatt Macy mtx_unlock_spin(&pmc_threadfreelist_mtx); 23736161b98cSMatt Macy } 23746161b98cSMatt Macy 23756161b98cSMatt Macy /* 23769b1d850bSMark Johnston * An asynchronous task to manage the free list. 23776161b98cSMatt Macy */ 23786161b98cSMatt Macy static void 23799b1d850bSMark Johnston pmc_thread_descriptor_pool_free_task(void *arg __unused, int pending __unused) 23806161b98cSMatt Macy { 23816161b98cSMatt Macy struct pmc_thread *pt; 23826161b98cSMatt Macy LIST_HEAD(, pmc_thread) tmplist; 23836161b98cSMatt Macy int delta; 23846161b98cSMatt Macy 23856161b98cSMatt Macy LIST_INIT(&tmplist); 23869893ab3fSMark Johnston 23876161b98cSMatt Macy /* Determine what changes, if any, we need to make. */ 23886161b98cSMatt Macy mtx_lock_spin(&pmc_threadfreelist_mtx); 23896161b98cSMatt Macy delta = pmc_threadfreelist_entries - pmc_threadfreelist_max; 23909893ab3fSMark Johnston while (delta > 0 && (pt = LIST_FIRST(&pmc_threadfreelist)) != NULL) { 23913de22849SMatt Macy delta--; 23929893ab3fSMark Johnston pmc_threadfreelist_entries--; 23936161b98cSMatt Macy LIST_REMOVE(pt, pt_next); 23946161b98cSMatt Macy LIST_INSERT_HEAD(&tmplist, pt, pt_next); 23956161b98cSMatt Macy } 23966161b98cSMatt Macy mtx_unlock_spin(&pmc_threadfreelist_mtx); 23976161b98cSMatt Macy 23986161b98cSMatt Macy /* If there are entries to free, free them. */ 23996161b98cSMatt Macy while (!LIST_EMPTY(&tmplist)) { 24003de22849SMatt Macy pt = LIST_FIRST(&tmplist); 24016161b98cSMatt Macy LIST_REMOVE(pt, pt_next); 24026161b98cSMatt Macy free(pt, M_PMC); 24036161b98cSMatt Macy } 24046161b98cSMatt Macy } 24056161b98cSMatt Macy 24066161b98cSMatt Macy /* 24076161b98cSMatt Macy * Drain the thread free pool, freeing all allocations. 24086161b98cSMatt Macy */ 24096161b98cSMatt Macy static void 2410555d2c93SDimitry Andric pmc_thread_descriptor_pool_drain(void) 24116161b98cSMatt Macy { 24126161b98cSMatt Macy struct pmc_thread *pt, *next; 24136161b98cSMatt Macy 24146161b98cSMatt Macy LIST_FOREACH_SAFE(pt, &pmc_threadfreelist, pt_next, next) { 24156161b98cSMatt Macy LIST_REMOVE(pt, pt_next); 24166161b98cSMatt Macy free(pt, M_PMC); 24176161b98cSMatt Macy } 24186161b98cSMatt Macy } 24196161b98cSMatt Macy 24206161b98cSMatt Macy /* 24216161b98cSMatt Macy * find the descriptor corresponding to thread 'td', adding or removing it 24226161b98cSMatt Macy * as specified by 'mode'. 24236161b98cSMatt Macy * 24246161b98cSMatt Macy * Note that this supports additional mode flags in addition to those 24256161b98cSMatt Macy * supported by pmc_find_process_descriptor(): 24266161b98cSMatt Macy * PMC_FLAG_NOWAIT: Causes the function to not wait for mallocs. 24276161b98cSMatt Macy * This makes it safe to call while holding certain other locks. 24286161b98cSMatt Macy */ 24296161b98cSMatt Macy static struct pmc_thread * 24306161b98cSMatt Macy pmc_find_thread_descriptor(struct pmc_process *pp, struct thread *td, 24316161b98cSMatt Macy uint32_t mode) 24326161b98cSMatt Macy { 24336161b98cSMatt Macy struct pmc_thread *pt = NULL, *ptnew = NULL; 24346161b98cSMatt Macy int wait_flag; 24356161b98cSMatt Macy 24366161b98cSMatt Macy KASSERT(td != NULL, ("[pmc,%d] called to add NULL td", __LINE__)); 24376161b98cSMatt Macy 24386161b98cSMatt Macy /* 24396161b98cSMatt Macy * Pre-allocate memory in the PMC_FLAG_ALLOCATE case prior to 24406161b98cSMatt Macy * acquiring the lock. 24416161b98cSMatt Macy */ 2442d5ee4074SMitchell Horne if ((mode & PMC_FLAG_ALLOCATE) != 0) { 24436161b98cSMatt Macy if ((ptnew = pmc_thread_descriptor_pool_alloc()) == NULL) { 244439446ce5SMatt Macy wait_flag = M_WAITOK; 2445693cd307SMitchell Horne if ((mode & PMC_FLAG_NOWAIT) != 0 || 2446693cd307SMitchell Horne in_epoch(global_epoch_preempt)) 244739446ce5SMatt Macy wait_flag = M_NOWAIT; 244839446ce5SMatt Macy 24496161b98cSMatt Macy ptnew = malloc(THREADENTRY_SIZE, M_PMC, 24506161b98cSMatt Macy wait_flag | M_ZERO); 24516161b98cSMatt Macy } 24526161b98cSMatt Macy } 24536161b98cSMatt Macy 24546161b98cSMatt Macy mtx_lock_spin(pp->pp_tdslock); 2455d5ee4074SMitchell Horne LIST_FOREACH(pt, &pp->pp_tds, pt_next) { 24566161b98cSMatt Macy if (pt->pt_td == td) 24576161b98cSMatt Macy break; 2458d5ee4074SMitchell Horne } 24596161b98cSMatt Macy 2460d5ee4074SMitchell Horne if ((mode & PMC_FLAG_REMOVE) != 0 && pt != NULL) 24616161b98cSMatt Macy LIST_REMOVE(pt, pt_next); 24626161b98cSMatt Macy 2463d5ee4074SMitchell Horne if ((mode & PMC_FLAG_ALLOCATE) != 0 && pt == NULL && ptnew != NULL) { 24646161b98cSMatt Macy pt = ptnew; 24656161b98cSMatt Macy ptnew = NULL; 24666161b98cSMatt Macy pt->pt_td = td; 24676161b98cSMatt Macy LIST_INSERT_HEAD(&pp->pp_tds, pt, pt_next); 24686161b98cSMatt Macy } 24696161b98cSMatt Macy 24706161b98cSMatt Macy mtx_unlock_spin(pp->pp_tdslock); 24716161b98cSMatt Macy 24726161b98cSMatt Macy if (ptnew != NULL) { 24736161b98cSMatt Macy free(ptnew, M_PMC); 24746161b98cSMatt Macy } 24756161b98cSMatt Macy 247652ebac7fSMitchell Horne return (pt); 24776161b98cSMatt Macy } 24786161b98cSMatt Macy 24796161b98cSMatt Macy /* 24806161b98cSMatt Macy * Try to add thread descriptors for each thread in a process. 24816161b98cSMatt Macy */ 24826161b98cSMatt Macy static void 24836161b98cSMatt Macy pmc_add_thread_descriptors_from_proc(struct proc *p, struct pmc_process *pp) 24846161b98cSMatt Macy { 24856161b98cSMatt Macy struct pmc_thread **tdlist; 248601c35b67SMitchell Horne struct thread *curtd; 24876161b98cSMatt Macy int i, tdcnt, tdlistsz; 24886161b98cSMatt Macy 24896161b98cSMatt Macy KASSERT(!PROC_LOCKED(p), ("[pmc,%d] proc unexpectedly locked", 24906161b98cSMatt Macy __LINE__)); 24916161b98cSMatt Macy tdcnt = 32; 24926161b98cSMatt Macy restart: 24936161b98cSMatt Macy tdlistsz = roundup2(tdcnt, 32); 24946161b98cSMatt Macy 24956161b98cSMatt Macy tdcnt = 0; 2496693cd307SMitchell Horne tdlist = malloc(sizeof(struct pmc_thread *) * tdlistsz, M_TEMP, 2497693cd307SMitchell Horne M_WAITOK); 24986161b98cSMatt Macy 24996161b98cSMatt Macy PROC_LOCK(p); 25006161b98cSMatt Macy FOREACH_THREAD_IN_PROC(p, curtd) 25016161b98cSMatt Macy tdcnt++; 25026161b98cSMatt Macy if (tdcnt >= tdlistsz) { 25036161b98cSMatt Macy PROC_UNLOCK(p); 25046161b98cSMatt Macy free(tdlist, M_TEMP); 25056161b98cSMatt Macy goto restart; 25066161b98cSMatt Macy } 2507693cd307SMitchell Horne 25086161b98cSMatt Macy /* 25096161b98cSMatt Macy * Try to add each thread to the list without sleeping. If unable, 25106161b98cSMatt Macy * add to a queue to retry after dropping the process lock. 25116161b98cSMatt Macy */ 25126161b98cSMatt Macy tdcnt = 0; 25136161b98cSMatt Macy FOREACH_THREAD_IN_PROC(p, curtd) { 25146161b98cSMatt Macy tdlist[tdcnt] = pmc_find_thread_descriptor(pp, curtd, 25156161b98cSMatt Macy PMC_FLAG_ALLOCATE | PMC_FLAG_NOWAIT); 25166161b98cSMatt Macy if (tdlist[tdcnt] == NULL) { 25176161b98cSMatt Macy PROC_UNLOCK(p); 25186161b98cSMatt Macy for (i = 0; i <= tdcnt; i++) 25196161b98cSMatt Macy pmc_thread_descriptor_pool_free(tdlist[i]); 25206161b98cSMatt Macy free(tdlist, M_TEMP); 25216161b98cSMatt Macy goto restart; 25226161b98cSMatt Macy } 25236161b98cSMatt Macy tdcnt++; 25246161b98cSMatt Macy } 25256161b98cSMatt Macy PROC_UNLOCK(p); 25266161b98cSMatt Macy free(tdlist, M_TEMP); 25276161b98cSMatt Macy } 25286161b98cSMatt Macy 25296161b98cSMatt Macy /* 253001c35b67SMitchell Horne * Find the descriptor corresponding to process 'p', adding or removing it 2531ebccf1e3SJoseph Koshy * as specified by 'mode'. 2532ebccf1e3SJoseph Koshy */ 2533ebccf1e3SJoseph Koshy static struct pmc_process * 2534ebccf1e3SJoseph Koshy pmc_find_process_descriptor(struct proc *p, uint32_t mode) 2535ebccf1e3SJoseph Koshy { 2536ebccf1e3SJoseph Koshy struct pmc_process *pp, *ppnew; 2537ebccf1e3SJoseph Koshy struct pmc_processhash *pph; 253801c35b67SMitchell Horne uint32_t hindex; 2539ebccf1e3SJoseph Koshy 2540ebccf1e3SJoseph Koshy hindex = PMC_HASH_PTR(p, pmc_processhashmask); 2541ebccf1e3SJoseph Koshy pph = &pmc_processhash[hindex]; 2542ebccf1e3SJoseph Koshy 2543ebccf1e3SJoseph Koshy ppnew = NULL; 2544ebccf1e3SJoseph Koshy 2545ebccf1e3SJoseph Koshy /* 25466161b98cSMatt Macy * Pre-allocate memory in the PMC_FLAG_ALLOCATE case since we 2547ebccf1e3SJoseph Koshy * cannot call malloc(9) once we hold a spin lock. 2548ebccf1e3SJoseph Koshy */ 2549d5ee4074SMitchell Horne if ((mode & PMC_FLAG_ALLOCATE) != 0) 25501ede983cSDag-Erling Smørgrav ppnew = malloc(sizeof(struct pmc_process) + md->pmd_npmc * 2551e829eb6dSJoseph Koshy sizeof(struct pmc_targetstate), M_PMC, M_WAITOK | M_ZERO); 2552ebccf1e3SJoseph Koshy 2553ebccf1e3SJoseph Koshy mtx_lock_spin(&pmc_processhash_mtx); 2554d5ee4074SMitchell Horne LIST_FOREACH(pp, pph, pp_next) { 2555ebccf1e3SJoseph Koshy if (pp->pp_proc == p) 2556ebccf1e3SJoseph Koshy break; 2557d5ee4074SMitchell Horne } 2558ebccf1e3SJoseph Koshy 2559d5ee4074SMitchell Horne if ((mode & PMC_FLAG_REMOVE) != 0 && pp != NULL) 2560ebccf1e3SJoseph Koshy LIST_REMOVE(pp, pp_next); 2561ebccf1e3SJoseph Koshy 2562d5ee4074SMitchell Horne if ((mode & PMC_FLAG_ALLOCATE) != 0 && pp == NULL && ppnew != NULL) { 2563ebccf1e3SJoseph Koshy ppnew->pp_proc = p; 25646161b98cSMatt Macy LIST_INIT(&ppnew->pp_tds); 25656161b98cSMatt Macy ppnew->pp_tdslock = mtx_pool_find(pmc_mtxpool, ppnew); 2566ebccf1e3SJoseph Koshy LIST_INSERT_HEAD(pph, ppnew, pp_next); 25676161b98cSMatt Macy mtx_unlock_spin(&pmc_processhash_mtx); 2568ebccf1e3SJoseph Koshy pp = ppnew; 2569ebccf1e3SJoseph Koshy ppnew = NULL; 25706161b98cSMatt Macy 25716161b98cSMatt Macy /* Add thread descriptors for this process' current threads. */ 25726161b98cSMatt Macy pmc_add_thread_descriptors_from_proc(p, pp); 2573693cd307SMitchell Horne } else 2574ebccf1e3SJoseph Koshy mtx_unlock_spin(&pmc_processhash_mtx); 2575ebccf1e3SJoseph Koshy 25766161b98cSMatt Macy if (ppnew != NULL) 25771ede983cSDag-Erling Smørgrav free(ppnew, M_PMC); 257852ebac7fSMitchell Horne return (pp); 2579ebccf1e3SJoseph Koshy } 2580ebccf1e3SJoseph Koshy 2581ebccf1e3SJoseph Koshy /* 258201c35b67SMitchell Horne * Remove a process descriptor from the process hash table. 2583ebccf1e3SJoseph Koshy */ 2584ebccf1e3SJoseph Koshy static void 2585ebccf1e3SJoseph Koshy pmc_remove_process_descriptor(struct pmc_process *pp) 2586ebccf1e3SJoseph Koshy { 2587ebccf1e3SJoseph Koshy KASSERT(pp->pp_refcnt == 0, 2588ebccf1e3SJoseph Koshy ("[pmc,%d] Removing process descriptor %p with count %d", 2589ebccf1e3SJoseph Koshy __LINE__, pp, pp->pp_refcnt)); 2590ebccf1e3SJoseph Koshy 2591ebccf1e3SJoseph Koshy mtx_lock_spin(&pmc_processhash_mtx); 2592ebccf1e3SJoseph Koshy LIST_REMOVE(pp, pp_next); 2593ebccf1e3SJoseph Koshy mtx_unlock_spin(&pmc_processhash_mtx); 2594ebccf1e3SJoseph Koshy } 2595ebccf1e3SJoseph Koshy 25966161b98cSMatt Macy /* 259701c35b67SMitchell Horne * Destroy a process descriptor. 25986161b98cSMatt Macy */ 25996161b98cSMatt Macy static void 26006161b98cSMatt Macy pmc_destroy_process_descriptor(struct pmc_process *pp) 26016161b98cSMatt Macy { 26026161b98cSMatt Macy struct pmc_thread *pmc_td; 26036161b98cSMatt Macy 26046161b98cSMatt Macy while ((pmc_td = LIST_FIRST(&pp->pp_tds)) != NULL) { 26056161b98cSMatt Macy LIST_REMOVE(pmc_td, pt_next); 26066161b98cSMatt Macy pmc_thread_descriptor_pool_free(pmc_td); 26076161b98cSMatt Macy } 26086161b98cSMatt Macy free(pp, M_PMC); 26096161b98cSMatt Macy } 26106161b98cSMatt Macy 2611ebccf1e3SJoseph Koshy /* 261201c35b67SMitchell Horne * Find an owner descriptor corresponding to proc 'p'. 2613ebccf1e3SJoseph Koshy */ 2614ebccf1e3SJoseph Koshy static struct pmc_owner * 2615ebccf1e3SJoseph Koshy pmc_find_owner_descriptor(struct proc *p) 2616ebccf1e3SJoseph Koshy { 2617ebccf1e3SJoseph Koshy struct pmc_owner *po; 2618ebccf1e3SJoseph Koshy struct pmc_ownerhash *poh; 261901c35b67SMitchell Horne uint32_t hindex; 2620ebccf1e3SJoseph Koshy 2621ebccf1e3SJoseph Koshy hindex = PMC_HASH_PTR(p, pmc_ownerhashmask); 2622ebccf1e3SJoseph Koshy poh = &pmc_ownerhash[hindex]; 2623ebccf1e3SJoseph Koshy 2624ebccf1e3SJoseph Koshy po = NULL; 2625d5ee4074SMitchell Horne LIST_FOREACH(po, poh, po_next) { 2626ebccf1e3SJoseph Koshy if (po->po_owner == p) 2627ebccf1e3SJoseph Koshy break; 2628d5ee4074SMitchell Horne } 2629ebccf1e3SJoseph Koshy 26304a3690dfSJohn Baldwin PMCDBG5(OWN,FND,1, "find-owner proc=%p (%d, %s) hindex=0x%x -> " 2631ebccf1e3SJoseph Koshy "pmc-owner=%p", p, p->p_pid, p->p_comm, hindex, po); 2632ebccf1e3SJoseph Koshy 263352ebac7fSMitchell Horne return (po); 2634ebccf1e3SJoseph Koshy } 2635ebccf1e3SJoseph Koshy 2636ebccf1e3SJoseph Koshy /* 263701c35b67SMitchell Horne * Allocate a pmc descriptor and initialize its fields. 2638ebccf1e3SJoseph Koshy */ 2639ebccf1e3SJoseph Koshy static struct pmc * 2640ebccf1e3SJoseph Koshy pmc_allocate_pmc_descriptor(void) 2641ebccf1e3SJoseph Koshy { 2642ebccf1e3SJoseph Koshy struct pmc *pmc; 2643ebccf1e3SJoseph Koshy 2644e829eb6dSJoseph Koshy pmc = malloc(sizeof(struct pmc), M_PMC, M_WAITOK | M_ZERO); 2645e6b475e0SMatt Macy pmc->pm_runcount = counter_u64_alloc(M_WAITOK); 2646693cd307SMitchell Horne pmc->pm_pcpu_state = malloc(sizeof(struct pmc_pcpu_state) * mp_ncpus, 2647693cd307SMitchell Horne M_PMC, M_WAITOK | M_ZERO); 26484a3690dfSJohn Baldwin PMCDBG1(PMC,ALL,1, "allocate-pmc -> pmc=%p", pmc); 2649ebccf1e3SJoseph Koshy 265052ebac7fSMitchell Horne return (pmc); 2651ebccf1e3SJoseph Koshy } 2652ebccf1e3SJoseph Koshy 2653ebccf1e3SJoseph Koshy /* 2654ebccf1e3SJoseph Koshy * Destroy a pmc descriptor. 2655ebccf1e3SJoseph Koshy */ 2656ebccf1e3SJoseph Koshy static void 2657ebccf1e3SJoseph Koshy pmc_destroy_pmc_descriptor(struct pmc *pm) 2658ebccf1e3SJoseph Koshy { 2659ebccf1e3SJoseph Koshy 2660ebccf1e3SJoseph Koshy KASSERT(pm->pm_state == PMC_STATE_DELETED || 2661ebccf1e3SJoseph Koshy pm->pm_state == PMC_STATE_FREE, 2662ebccf1e3SJoseph Koshy ("[pmc,%d] destroying non-deleted PMC", __LINE__)); 2663ebccf1e3SJoseph Koshy KASSERT(LIST_EMPTY(&pm->pm_targets), 2664ebccf1e3SJoseph Koshy ("[pmc,%d] destroying pmc with targets", __LINE__)); 2665ebccf1e3SJoseph Koshy KASSERT(pm->pm_owner == NULL, 2666ebccf1e3SJoseph Koshy ("[pmc,%d] destroying pmc attached to an owner", __LINE__)); 2667e6b475e0SMatt Macy KASSERT(counter_u64_fetch(pm->pm_runcount) == 0, 266801c35b67SMitchell Horne ("[pmc,%d] pmc has non-zero run count %ju", __LINE__, 266901c35b67SMitchell Horne (uintmax_t)counter_u64_fetch(pm->pm_runcount))); 267006796b67SMark Johnston 2671e6b475e0SMatt Macy counter_u64_free(pm->pm_runcount); 2672e6b475e0SMatt Macy free(pm->pm_pcpu_state, M_PMC); 267306796b67SMark Johnston free(pm, M_PMC); 2674ebccf1e3SJoseph Koshy } 2675ebccf1e3SJoseph Koshy 2676f263522aSJoseph Koshy static void 2677f263522aSJoseph Koshy pmc_wait_for_pmc_idle(struct pmc *pm) 2678f263522aSJoseph Koshy { 2679d9f1b8dbSMatt Macy #ifdef INVARIANTS 2680f263522aSJoseph Koshy volatile int maxloop; 2681f263522aSJoseph Koshy 2682122ccdc1SJoseph Koshy maxloop = 100 * pmc_cpu_max(); 2683f263522aSJoseph Koshy #endif 2684f263522aSJoseph Koshy /* 2685f263522aSJoseph Koshy * Loop (with a forced context switch) till the PMC's runcount 2686f263522aSJoseph Koshy * comes down to zero. 2687f263522aSJoseph Koshy */ 2688ebfaf69cSMatt Macy pmclog_flush(pm->pm_owner, 1); 2689e6b475e0SMatt Macy while (counter_u64_fetch(pm->pm_runcount) > 0) { 2690ebfaf69cSMatt Macy pmclog_flush(pm->pm_owner, 1); 2691d9f1b8dbSMatt Macy #ifdef INVARIANTS 2692f263522aSJoseph Koshy maxloop--; 2693f263522aSJoseph Koshy KASSERT(maxloop > 0, 269401c35b67SMitchell Horne ("[pmc,%d] (ri%d, rc%ju) waiting too long for " 269501c35b67SMitchell Horne "pmc to be free", __LINE__, PMC_TO_ROWINDEX(pm), 269601c35b67SMitchell Horne (uintmax_t)counter_u64_fetch(pm->pm_runcount))); 2697f263522aSJoseph Koshy #endif 2698f263522aSJoseph Koshy pmc_force_context_switch(); 2699f263522aSJoseph Koshy } 2700f263522aSJoseph Koshy } 2701f263522aSJoseph Koshy 2702ebccf1e3SJoseph Koshy /* 2703ebccf1e3SJoseph Koshy * This function does the following things: 2704ebccf1e3SJoseph Koshy * 2705ebccf1e3SJoseph Koshy * - detaches the PMC from hardware 2706ebccf1e3SJoseph Koshy * - unlinks all target threads that were attached to it 2707ebccf1e3SJoseph Koshy * - removes the PMC from its owner's list 270806796b67SMark Johnston * - destroys the PMC private mutex 2709ebccf1e3SJoseph Koshy * 271006796b67SMark Johnston * Once this function completes, the given pmc pointer can be freed by 271106796b67SMark Johnston * calling pmc_destroy_pmc_descriptor(). 2712ebccf1e3SJoseph Koshy */ 2713ebccf1e3SJoseph Koshy static void 2714ebccf1e3SJoseph Koshy pmc_release_pmc_descriptor(struct pmc *pm) 2715ebccf1e3SJoseph Koshy { 2716ebccf1e3SJoseph Koshy struct pmc_binding pb; 2717e829eb6dSJoseph Koshy struct pmc_classdep *pcd; 271801c35b67SMitchell Horne struct pmc_hw *phw __diagused; 271901c35b67SMitchell Horne struct pmc_owner *po; 272001c35b67SMitchell Horne struct pmc_process *pp; 2721e829eb6dSJoseph Koshy struct pmc_target *ptgt, *tmp; 272201c35b67SMitchell Horne enum pmc_mode mode; 272301c35b67SMitchell Horne u_int adjri, ri, cpu; 2724ebccf1e3SJoseph Koshy 2725ebccf1e3SJoseph Koshy sx_assert(&pmc_sx, SX_XLOCKED); 2726ebccf1e3SJoseph Koshy KASSERT(pm, ("[pmc,%d] null pmc", __LINE__)); 2727ebccf1e3SJoseph Koshy 2728c5153e19SJoseph Koshy ri = PMC_TO_ROWINDEX(pm); 2729e829eb6dSJoseph Koshy pcd = pmc_ri_to_classdep(md, ri, &adjri); 2730c5153e19SJoseph Koshy mode = PMC_TO_MODE(pm); 2731ebccf1e3SJoseph Koshy 27324a3690dfSJohn Baldwin PMCDBG3(PMC,REL,1, "release-pmc pmc=%p ri=%d mode=%d", pm, ri, 2733c5153e19SJoseph Koshy mode); 2734ebccf1e3SJoseph Koshy 2735ebccf1e3SJoseph Koshy /* 2736ebccf1e3SJoseph Koshy * First, we take the PMC off hardware. 2737ebccf1e3SJoseph Koshy */ 2738869f4a8bSWarner Losh cpu = 0; 2739c5153e19SJoseph Koshy if (PMC_IS_SYSTEM_MODE(mode)) { 2740ebccf1e3SJoseph Koshy /* 2741ebccf1e3SJoseph Koshy * A system mode PMC runs on a specific CPU. Switch 2742ebccf1e3SJoseph Koshy * to this CPU and turn hardware off. 2743ebccf1e3SJoseph Koshy */ 2744ebccf1e3SJoseph Koshy pmc_save_cpu_binding(&pb); 2745c5153e19SJoseph Koshy cpu = PMC_TO_CPU(pm); 2746ebccf1e3SJoseph Koshy pmc_select_cpu(cpu); 2747ebccf1e3SJoseph Koshy 2748f263522aSJoseph Koshy /* switch off non-stalled CPUs */ 2749e6b475e0SMatt Macy pm->pm_pcpu_state[cpu].pps_cpustate = 0; 2750f263522aSJoseph Koshy if (pm->pm_state == PMC_STATE_RUNNING && 2751e6b475e0SMatt Macy pm->pm_pcpu_state[cpu].pps_stalled == 0) { 2752f263522aSJoseph Koshy 2753ebccf1e3SJoseph Koshy phw = pmc_pcpu[cpu]->pc_hwpmcs[ri]; 2754ebccf1e3SJoseph Koshy 2755ebccf1e3SJoseph Koshy KASSERT(phw->phw_pmc == pm, 2756ebccf1e3SJoseph Koshy ("[pmc, %d] pmc ptr ri(%d) hw(%p) pm(%p)", 2757ebccf1e3SJoseph Koshy __LINE__, ri, phw->phw_pmc, pm)); 27584a3690dfSJohn Baldwin PMCDBG2(PMC,REL,2, "stopping cpu=%d ri=%d", cpu, ri); 2759ebccf1e3SJoseph Koshy 2760ebccf1e3SJoseph Koshy critical_enter(); 276101c35b67SMitchell Horne (void)pcd->pcd_stop_pmc(cpu, adjri, pm); 2762ebccf1e3SJoseph Koshy critical_exit(); 2763ebccf1e3SJoseph Koshy } 2764ebccf1e3SJoseph Koshy 27654a3690dfSJohn Baldwin PMCDBG2(PMC,REL,2, "decfg cpu=%d ri=%d", cpu, ri); 2766ebccf1e3SJoseph Koshy 2767ebccf1e3SJoseph Koshy critical_enter(); 276801c35b67SMitchell Horne (void)pcd->pcd_config_pmc(cpu, adjri, NULL); 2769ebccf1e3SJoseph Koshy critical_exit(); 2770ebccf1e3SJoseph Koshy 2771f263522aSJoseph Koshy /* adjust the global and process count of SS mode PMCs */ 2772f263522aSJoseph Koshy if (mode == PMC_MODE_SS && pm->pm_state == PMC_STATE_RUNNING) { 2773f263522aSJoseph Koshy po = pm->pm_owner; 2774f263522aSJoseph Koshy po->po_sscount--; 2775f263522aSJoseph Koshy if (po->po_sscount == 0) { 2776f263522aSJoseph Koshy atomic_subtract_rel_int(&pmc_ss_count, 1); 27770f00315cSMatt Macy CK_LIST_REMOVE(po, po_ssnext); 277870398c2fSMatt Macy epoch_wait_preempt(global_epoch_preempt); 2779f263522aSJoseph Koshy } 2780f263522aSJoseph Koshy } 2781ebccf1e3SJoseph Koshy pm->pm_state = PMC_STATE_DELETED; 2782ebccf1e3SJoseph Koshy 2783ebccf1e3SJoseph Koshy pmc_restore_cpu_binding(&pb); 2784ebccf1e3SJoseph Koshy 2785f263522aSJoseph Koshy /* 278601c35b67SMitchell Horne * We could have references to this PMC structure in the 278701c35b67SMitchell Horne * per-cpu sample queues. Wait for the queue to drain. 2788f263522aSJoseph Koshy */ 2789f263522aSJoseph Koshy pmc_wait_for_pmc_idle(pm); 2790f263522aSJoseph Koshy 2791c5153e19SJoseph Koshy } else if (PMC_IS_VIRTUAL_MODE(mode)) { 2792ebccf1e3SJoseph Koshy /* 279301c35b67SMitchell Horne * A virtual PMC could be running on multiple CPUs at a given 279401c35b67SMitchell Horne * instant. 2795ebccf1e3SJoseph Koshy * 279601c35b67SMitchell Horne * By marking its state as DELETED, we ensure that this PMC is 279701c35b67SMitchell Horne * never further scheduled on hardware. 2798ebccf1e3SJoseph Koshy * 2799ebccf1e3SJoseph Koshy * Then we wait till all CPUs are done with this PMC. 2800ebccf1e3SJoseph Koshy */ 2801ebccf1e3SJoseph Koshy pm->pm_state = PMC_STATE_DELETED; 2802ebccf1e3SJoseph Koshy 2803f263522aSJoseph Koshy /* Wait for the PMCs runcount to come to zero. */ 2804f263522aSJoseph Koshy pmc_wait_for_pmc_idle(pm); 2805ebccf1e3SJoseph Koshy 2806ebccf1e3SJoseph Koshy /* 280701c35b67SMitchell Horne * At this point the PMC is off all CPUs and cannot be freshly 280801c35b67SMitchell Horne * scheduled onto a CPU. It is now safe to unlink all targets 280901c35b67SMitchell Horne * from this PMC. If a process-record's refcount falls to zero, 281001c35b67SMitchell Horne * we remove it from the hash table. The module-wide SX lock 2811ebccf1e3SJoseph Koshy * protects us from races. 2812ebccf1e3SJoseph Koshy */ 2813ebccf1e3SJoseph Koshy LIST_FOREACH_SAFE(ptgt, &pm->pm_targets, pt_next, tmp) { 2814ebccf1e3SJoseph Koshy pp = ptgt->pt_process; 2815ebccf1e3SJoseph Koshy pmc_unlink_target_process(pm, pp); /* frees 'ptgt' */ 2816ebccf1e3SJoseph Koshy 28174a3690dfSJohn Baldwin PMCDBG1(PMC,REL,3, "pp->refcnt=%d", pp->pp_refcnt); 2818ebccf1e3SJoseph Koshy 2819ebccf1e3SJoseph Koshy /* 282001c35b67SMitchell Horne * If the target process record shows that no PMCs are 282101c35b67SMitchell Horne * attached to it, reclaim its space. 2822ebccf1e3SJoseph Koshy */ 2823ebccf1e3SJoseph Koshy if (pp->pp_refcnt == 0) { 2824ebccf1e3SJoseph Koshy pmc_remove_process_descriptor(pp); 28256161b98cSMatt Macy pmc_destroy_process_descriptor(pp); 2826ebccf1e3SJoseph Koshy } 2827ebccf1e3SJoseph Koshy } 2828ebccf1e3SJoseph Koshy 2829ebccf1e3SJoseph Koshy cpu = curthread->td_oncpu; /* setup cpu for pmd_release() */ 2830ebccf1e3SJoseph Koshy } 2831ebccf1e3SJoseph Koshy 2832ebccf1e3SJoseph Koshy /* 283301c35b67SMitchell Horne * Release any MD resources. 2834ebccf1e3SJoseph Koshy */ 2835e829eb6dSJoseph Koshy (void)pcd->pcd_release_pmc(cpu, adjri, pm); 2836ebccf1e3SJoseph Koshy 2837ebccf1e3SJoseph Koshy /* 283801c35b67SMitchell Horne * Update row disposition. 2839ebccf1e3SJoseph Koshy */ 2840c5153e19SJoseph Koshy if (PMC_IS_SYSTEM_MODE(PMC_TO_MODE(pm))) 2841ebccf1e3SJoseph Koshy PMC_UNMARK_ROW_STANDALONE(ri); 2842ebccf1e3SJoseph Koshy else 2843ebccf1e3SJoseph Koshy PMC_UNMARK_ROW_THREAD(ri); 2844ebccf1e3SJoseph Koshy 284501c35b67SMitchell Horne /* Unlink from the owner's list. */ 2846d5ee4074SMitchell Horne if (pm->pm_owner != NULL) { 2847f263522aSJoseph Koshy LIST_REMOVE(pm, pm_next); 2848f263522aSJoseph Koshy pm->pm_owner = NULL; 2849f263522aSJoseph Koshy } 2850ebccf1e3SJoseph Koshy } 2851ebccf1e3SJoseph Koshy 2852ebccf1e3SJoseph Koshy /* 2853ebccf1e3SJoseph Koshy * Register an owner and a pmc. 2854ebccf1e3SJoseph Koshy */ 2855ebccf1e3SJoseph Koshy static int 2856ebccf1e3SJoseph Koshy pmc_register_owner(struct proc *p, struct pmc *pmc) 2857ebccf1e3SJoseph Koshy { 2858ebccf1e3SJoseph Koshy struct pmc_owner *po; 2859ebccf1e3SJoseph Koshy 2860ebccf1e3SJoseph Koshy sx_assert(&pmc_sx, SX_XLOCKED); 2861ebccf1e3SJoseph Koshy 2862d5ee4074SMitchell Horne if ((po = pmc_find_owner_descriptor(p)) == NULL) { 2863f263522aSJoseph Koshy if ((po = pmc_allocate_owner_descriptor(p)) == NULL) 286452ebac7fSMitchell Horne return (ENOMEM); 2865d5ee4074SMitchell Horne } 2866ebccf1e3SJoseph Koshy 2867ebccf1e3SJoseph Koshy KASSERT(pmc->pm_owner == NULL, 2868ebccf1e3SJoseph Koshy ("[pmc,%d] attempting to own an initialized PMC", __LINE__)); 2869ebccf1e3SJoseph Koshy pmc->pm_owner = po; 2870ebccf1e3SJoseph Koshy 2871f263522aSJoseph Koshy LIST_INSERT_HEAD(&po->po_pmcs, pmc, pm_next); 2872ebccf1e3SJoseph Koshy 2873ebccf1e3SJoseph Koshy PROC_LOCK(p); 2874ebccf1e3SJoseph Koshy p->p_flag |= P_HWPMC; 2875ebccf1e3SJoseph Koshy PROC_UNLOCK(p); 2876ebccf1e3SJoseph Koshy 2877d5ee4074SMitchell Horne if ((po->po_flags & PMC_PO_OWNS_LOGFILE) != 0) 2878f263522aSJoseph Koshy pmclog_process_pmcallocate(pmc); 2879f263522aSJoseph Koshy 28804a3690dfSJohn Baldwin PMCDBG2(PMC,REG,1, "register-owner pmc-owner=%p pmc=%p", 2881f263522aSJoseph Koshy po, pmc); 2882ebccf1e3SJoseph Koshy 288352ebac7fSMitchell Horne return (0); 2884ebccf1e3SJoseph Koshy } 2885ebccf1e3SJoseph Koshy 2886ebccf1e3SJoseph Koshy /* 2887ebccf1e3SJoseph Koshy * Return the current row disposition: 2888ebccf1e3SJoseph Koshy * == 0 => FREE 2889ebccf1e3SJoseph Koshy * > 0 => PROCESS MODE 2890ebccf1e3SJoseph Koshy * < 0 => SYSTEM MODE 2891ebccf1e3SJoseph Koshy */ 2892ebccf1e3SJoseph Koshy int 2893ebccf1e3SJoseph Koshy pmc_getrowdisp(int ri) 2894ebccf1e3SJoseph Koshy { 289552ebac7fSMitchell Horne return (pmc_pmcdisp[ri]); 2896ebccf1e3SJoseph Koshy } 2897ebccf1e3SJoseph Koshy 2898ebccf1e3SJoseph Koshy /* 2899ebccf1e3SJoseph Koshy * Check if a PMC at row index 'ri' can be allocated to the current 2900ebccf1e3SJoseph Koshy * process. 2901ebccf1e3SJoseph Koshy * 2902ebccf1e3SJoseph Koshy * Allocation can fail if: 2903ebccf1e3SJoseph Koshy * - the current process is already being profiled by a PMC at index 'ri', 2904ebccf1e3SJoseph Koshy * attached to it via OP_PMCATTACH. 2905ebccf1e3SJoseph Koshy * - the current process has already allocated a PMC at index 'ri' 2906ebccf1e3SJoseph Koshy * via OP_ALLOCATE. 2907ebccf1e3SJoseph Koshy */ 2908c514a571SMitchell Horne static bool 2909c5153e19SJoseph Koshy pmc_can_allocate_rowindex(struct proc *p, unsigned int ri, int cpu) 2910ebccf1e3SJoseph Koshy { 2911c5153e19SJoseph Koshy struct pmc *pm; 2912ebccf1e3SJoseph Koshy struct pmc_owner *po; 2913ebccf1e3SJoseph Koshy struct pmc_process *pp; 291401c35b67SMitchell Horne enum pmc_mode mode; 2915ebccf1e3SJoseph Koshy 29164a3690dfSJohn Baldwin PMCDBG5(PMC,ALR,1, "can-allocate-rowindex proc=%p (%d, %s) ri=%d " 2917c5153e19SJoseph Koshy "cpu=%d", p, p->p_pid, p->p_comm, ri, cpu); 2918ebccf1e3SJoseph Koshy 2919c5153e19SJoseph Koshy /* 2920c5153e19SJoseph Koshy * We shouldn't have already allocated a process-mode PMC at 2921c5153e19SJoseph Koshy * row index 'ri'. 2922c5153e19SJoseph Koshy * 2923c5153e19SJoseph Koshy * We shouldn't have allocated a system-wide PMC on the same 2924c5153e19SJoseph Koshy * CPU and same RI. 2925c5153e19SJoseph Koshy */ 2926d5ee4074SMitchell Horne if ((po = pmc_find_owner_descriptor(p)) != NULL) { 2927f263522aSJoseph Koshy LIST_FOREACH(pm, &po->po_pmcs, pm_next) { 2928c5153e19SJoseph Koshy if (PMC_TO_ROWINDEX(pm) == ri) { 2929c5153e19SJoseph Koshy mode = PMC_TO_MODE(pm); 2930c5153e19SJoseph Koshy if (PMC_IS_VIRTUAL_MODE(mode)) 2931c514a571SMitchell Horne return (false); 2932c5153e19SJoseph Koshy if (PMC_IS_SYSTEM_MODE(mode) && 2933d5ee4074SMitchell Horne PMC_TO_CPU(pm) == cpu) 2934c514a571SMitchell Horne return (false); 2935d5ee4074SMitchell Horne } 2936c5153e19SJoseph Koshy } 2937c5153e19SJoseph Koshy } 2938ebccf1e3SJoseph Koshy 2939c5153e19SJoseph Koshy /* 2940c5153e19SJoseph Koshy * We also shouldn't be the target of any PMC at this index 2941c5153e19SJoseph Koshy * since otherwise a PMC_ATTACH to ourselves will fail. 2942c5153e19SJoseph Koshy */ 2943ebccf1e3SJoseph Koshy if ((pp = pmc_find_process_descriptor(p, 0)) != NULL) 2944d5ee4074SMitchell Horne if (pp->pp_pmcs[ri].pp_pmc != NULL) 2945c514a571SMitchell Horne return (false); 2946ebccf1e3SJoseph Koshy 29474a3690dfSJohn Baldwin PMCDBG4(PMC,ALR,2, "can-allocate-rowindex proc=%p (%d, %s) ri=%d ok", 2948ebccf1e3SJoseph Koshy p, p->p_pid, p->p_comm, ri); 2949c514a571SMitchell Horne return (true); 2950ebccf1e3SJoseph Koshy } 2951ebccf1e3SJoseph Koshy 2952ebccf1e3SJoseph Koshy /* 2953ebccf1e3SJoseph Koshy * Check if a given PMC at row index 'ri' can be currently used in 2954ebccf1e3SJoseph Koshy * mode 'mode'. 2955ebccf1e3SJoseph Koshy */ 2956c514a571SMitchell Horne static bool 2957ebccf1e3SJoseph Koshy pmc_can_allocate_row(int ri, enum pmc_mode mode) 2958ebccf1e3SJoseph Koshy { 2959ebccf1e3SJoseph Koshy enum pmc_disp disp; 2960ebccf1e3SJoseph Koshy 2961ebccf1e3SJoseph Koshy sx_assert(&pmc_sx, SX_XLOCKED); 2962ebccf1e3SJoseph Koshy 29634a3690dfSJohn Baldwin PMCDBG2(PMC,ALR,1, "can-allocate-row ri=%d mode=%d", ri, mode); 2964ebccf1e3SJoseph Koshy 2965ebccf1e3SJoseph Koshy if (PMC_IS_SYSTEM_MODE(mode)) 2966ebccf1e3SJoseph Koshy disp = PMC_DISP_STANDALONE; 2967ebccf1e3SJoseph Koshy else 2968ebccf1e3SJoseph Koshy disp = PMC_DISP_THREAD; 2969ebccf1e3SJoseph Koshy 2970ebccf1e3SJoseph Koshy /* 2971ebccf1e3SJoseph Koshy * check disposition for PMC row 'ri': 2972ebccf1e3SJoseph Koshy * 2973ebccf1e3SJoseph Koshy * Expected disposition Row-disposition Result 2974ebccf1e3SJoseph Koshy * 2975ebccf1e3SJoseph Koshy * STANDALONE STANDALONE or FREE proceed 2976ebccf1e3SJoseph Koshy * STANDALONE THREAD fail 2977ebccf1e3SJoseph Koshy * THREAD THREAD or FREE proceed 2978ebccf1e3SJoseph Koshy * THREAD STANDALONE fail 2979ebccf1e3SJoseph Koshy */ 2980ebccf1e3SJoseph Koshy if (!PMC_ROW_DISP_IS_FREE(ri) && 2981ebccf1e3SJoseph Koshy !(disp == PMC_DISP_THREAD && PMC_ROW_DISP_IS_THREAD(ri)) && 2982ebccf1e3SJoseph Koshy !(disp == PMC_DISP_STANDALONE && PMC_ROW_DISP_IS_STANDALONE(ri))) 2983c514a571SMitchell Horne return (false); 2984ebccf1e3SJoseph Koshy 2985ebccf1e3SJoseph Koshy /* 2986ebccf1e3SJoseph Koshy * All OK 2987ebccf1e3SJoseph Koshy */ 29884a3690dfSJohn Baldwin PMCDBG2(PMC,ALR,2, "can-allocate-row ri=%d mode=%d ok", ri, mode); 2989c514a571SMitchell Horne return (true); 2990ebccf1e3SJoseph Koshy } 2991ebccf1e3SJoseph Koshy 2992ebccf1e3SJoseph Koshy /* 2993c5153e19SJoseph Koshy * Find a PMC descriptor with user handle 'pmcid' for thread 'td'. 2994ebccf1e3SJoseph Koshy */ 2995ebccf1e3SJoseph Koshy static struct pmc * 2996ebccf1e3SJoseph Koshy pmc_find_pmc_descriptor_in_process(struct pmc_owner *po, pmc_id_t pmcid) 2997ebccf1e3SJoseph Koshy { 2998f263522aSJoseph Koshy struct pmc *pm; 2999ebccf1e3SJoseph Koshy 3000c5153e19SJoseph Koshy KASSERT(PMC_ID_TO_ROWINDEX(pmcid) < md->pmd_npmc, 3001c5153e19SJoseph Koshy ("[pmc,%d] Illegal pmc index %d (max %d)", __LINE__, 3002c5153e19SJoseph Koshy PMC_ID_TO_ROWINDEX(pmcid), md->pmd_npmc)); 3003ebccf1e3SJoseph Koshy 3004d5ee4074SMitchell Horne LIST_FOREACH(pm, &po->po_pmcs, pm_next) { 3005f263522aSJoseph Koshy if (pm->pm_id == pmcid) 3006d5ee4074SMitchell Horne return (pm); 3007d5ee4074SMitchell Horne } 3008ebccf1e3SJoseph Koshy 300952ebac7fSMitchell Horne return (NULL); 3010ebccf1e3SJoseph Koshy } 3011ebccf1e3SJoseph Koshy 3012ebccf1e3SJoseph Koshy static int 3013ebccf1e3SJoseph Koshy pmc_find_pmc(pmc_id_t pmcid, struct pmc **pmc) 3014ebccf1e3SJoseph Koshy { 3015e6f47577SBjoern A. Zeeb struct pmc *pm, *opm; 3016ebccf1e3SJoseph Koshy struct pmc_owner *po; 3017e6f47577SBjoern A. Zeeb struct pmc_process *pp; 3018ebccf1e3SJoseph Koshy 30194a3690dfSJohn Baldwin PMCDBG1(PMC,FND,1, "find-pmc id=%d", pmcid); 3020d2cd6388SKonstantin Belousov if (PMC_ID_TO_ROWINDEX(pmcid) >= md->pmd_npmc) 3021d2cd6388SKonstantin Belousov return (EINVAL); 3022ebccf1e3SJoseph Koshy 3023e6f47577SBjoern A. Zeeb if ((po = pmc_find_owner_descriptor(curthread->td_proc)) == NULL) { 3024e6f47577SBjoern A. Zeeb /* 3025e6f47577SBjoern A. Zeeb * In case of PMC_F_DESCENDANTS child processes we will not find 3026e6f47577SBjoern A. Zeeb * the current process in the owners hash list. Find the owner 3027e6f47577SBjoern A. Zeeb * process first and from there lookup the po. 3028e6f47577SBjoern A. Zeeb */ 3029d5ee4074SMitchell Horne pp = pmc_find_process_descriptor(curthread->td_proc, 3030d5ee4074SMitchell Horne PMC_FLAG_NONE); 3031d5ee4074SMitchell Horne if (pp == NULL) 303252ebac7fSMitchell Horne return (ESRCH); 3033e6f47577SBjoern A. Zeeb opm = pp->pp_pmcs[PMC_ID_TO_ROWINDEX(pmcid)].pp_pmc; 3034e6f47577SBjoern A. Zeeb if (opm == NULL) 303552ebac7fSMitchell Horne return (ESRCH); 3036d5ee4074SMitchell Horne if ((opm->pm_flags & 3037d5ee4074SMitchell Horne (PMC_F_ATTACHED_TO_OWNER | PMC_F_DESCENDANTS)) != 3038d5ee4074SMitchell Horne (PMC_F_ATTACHED_TO_OWNER | PMC_F_DESCENDANTS)) 303952ebac7fSMitchell Horne return (ESRCH); 3040d5ee4074SMitchell Horne 3041e6f47577SBjoern A. Zeeb po = opm->pm_owner; 3042e6f47577SBjoern A. Zeeb } 3043ebccf1e3SJoseph Koshy 3044ebccf1e3SJoseph Koshy if ((pm = pmc_find_pmc_descriptor_in_process(po, pmcid)) == NULL) 304552ebac7fSMitchell Horne return (EINVAL); 3046ebccf1e3SJoseph Koshy 30474a3690dfSJohn Baldwin PMCDBG2(PMC,FND,2, "find-pmc id=%d -> pmc=%p", pmcid, pm); 3048ebccf1e3SJoseph Koshy 3049ebccf1e3SJoseph Koshy *pmc = pm; 305052ebac7fSMitchell Horne return (0); 3051ebccf1e3SJoseph Koshy } 3052ebccf1e3SJoseph Koshy 3053ebccf1e3SJoseph Koshy /* 3054ebccf1e3SJoseph Koshy * Start a PMC. 3055ebccf1e3SJoseph Koshy */ 3056ebccf1e3SJoseph Koshy static int 3057ebccf1e3SJoseph Koshy pmc_start(struct pmc *pm) 3058ebccf1e3SJoseph Koshy { 3059ebccf1e3SJoseph Koshy struct pmc_binding pb; 3060e829eb6dSJoseph Koshy struct pmc_classdep *pcd; 306101c35b67SMitchell Horne struct pmc_owner *po; 3062d5ee4074SMitchell Horne pmc_value_t v; 306301c35b67SMitchell Horne enum pmc_mode mode; 3064e829eb6dSJoseph Koshy int adjri, error, cpu, ri; 3065ebccf1e3SJoseph Koshy 3066ebccf1e3SJoseph Koshy KASSERT(pm != NULL, 3067ebccf1e3SJoseph Koshy ("[pmc,%d] null pm", __LINE__)); 3068ebccf1e3SJoseph Koshy 3069c5153e19SJoseph Koshy mode = PMC_TO_MODE(pm); 3070c5153e19SJoseph Koshy ri = PMC_TO_ROWINDEX(pm); 3071e829eb6dSJoseph Koshy pcd = pmc_ri_to_classdep(md, ri, &adjri); 3072e829eb6dSJoseph Koshy 3073c5153e19SJoseph Koshy error = 0; 307401c35b67SMitchell Horne po = pm->pm_owner; 3075c5153e19SJoseph Koshy 30764a3690dfSJohn Baldwin PMCDBG3(PMC,OPS,1, "start pmc=%p mode=%d ri=%d", pm, mode, ri); 3077ebccf1e3SJoseph Koshy 3078f263522aSJoseph Koshy po = pm->pm_owner; 3079ebccf1e3SJoseph Koshy 3080d07f36b0SJoseph Koshy /* 3081d07f36b0SJoseph Koshy * Disallow PMCSTART if a logfile is required but has not been 3082d07f36b0SJoseph Koshy * configured yet. 3083d07f36b0SJoseph Koshy */ 3084d5ee4074SMitchell Horne if ((pm->pm_flags & PMC_F_NEEDS_LOGFILE) != 0 && 3085d07f36b0SJoseph Koshy (po->po_flags & PMC_PO_OWNS_LOGFILE) == 0) 3086e829eb6dSJoseph Koshy return (EDOOFUS); /* programming error */ 3087d07f36b0SJoseph Koshy 3088d07f36b0SJoseph Koshy /* 3089d07f36b0SJoseph Koshy * If this is a sampling mode PMC, log mapping information for 3090d07f36b0SJoseph Koshy * the kernel modules that are currently loaded. 3091d07f36b0SJoseph Koshy */ 3092d07f36b0SJoseph Koshy if (PMC_IS_SAMPLING_MODE(PMC_TO_MODE(pm))) 3093d07f36b0SJoseph Koshy pmc_log_kernel_mappings(pm); 3094d07f36b0SJoseph Koshy 3095c5153e19SJoseph Koshy if (PMC_IS_VIRTUAL_MODE(mode)) { 3096ebccf1e3SJoseph Koshy /* 3097f263522aSJoseph Koshy * If a PMCATTACH has never been done on this PMC, 3098f263522aSJoseph Koshy * attach it to its owner process. 3099ebccf1e3SJoseph Koshy */ 3100d5ee4074SMitchell Horne if (LIST_EMPTY(&pm->pm_targets)) { 3101d5ee4074SMitchell Horne error = (pm->pm_flags & PMC_F_ATTACH_DONE) != 0 ? 3102d5ee4074SMitchell Horne ESRCH : pmc_attach_process(po->po_owner, pm); 3103d5ee4074SMitchell Horne } 3104f263522aSJoseph Koshy 3105f263522aSJoseph Koshy /* 3106c5153e19SJoseph Koshy * If the PMC is attached to its owner, then force a context 3107c5153e19SJoseph Koshy * switch to ensure that the MD state gets set correctly. 3108c5153e19SJoseph Koshy */ 3109f263522aSJoseph Koshy if (error == 0) { 3110f263522aSJoseph Koshy pm->pm_state = PMC_STATE_RUNNING; 3111d5ee4074SMitchell Horne if ((pm->pm_flags & PMC_F_ATTACHED_TO_OWNER) != 0) 3112f263522aSJoseph Koshy pmc_force_context_switch(); 3113f263522aSJoseph Koshy } 3114ebccf1e3SJoseph Koshy 3115e829eb6dSJoseph Koshy return (error); 3116f263522aSJoseph Koshy } 3117ebccf1e3SJoseph Koshy 3118f263522aSJoseph Koshy /* 3119f263522aSJoseph Koshy * A system-wide PMC. 3120d07f36b0SJoseph Koshy * 3121f263522aSJoseph Koshy * Add the owner to the global list if this is a system-wide 3122f263522aSJoseph Koshy * sampling PMC. 3123f263522aSJoseph Koshy */ 3124f263522aSJoseph Koshy if (mode == PMC_MODE_SS) { 3125bf792d68SJoseph Koshy /* 3126bf792d68SJoseph Koshy * Log mapping information for all existing processes in the 3127bf792d68SJoseph Koshy * system. Subsequent mappings are logged as they happen; 3128bf792d68SJoseph Koshy * see pmc_process_mmap(). 3129bf792d68SJoseph Koshy */ 3130bf792d68SJoseph Koshy if (po->po_logprocmaps == 0) { 3131d07f36b0SJoseph Koshy pmc_log_all_process_mappings(po); 3132bf792d68SJoseph Koshy po->po_logprocmaps = 1; 3133bf792d68SJoseph Koshy } 31348fa7df36SMatt Macy po->po_sscount++; 31358fa7df36SMatt Macy if (po->po_sscount == 1) { 31368fa7df36SMatt Macy atomic_add_rel_int(&pmc_ss_count, 1); 31378fa7df36SMatt Macy CK_LIST_INSERT_HEAD(&pmc_ss_owners, po, po_ssnext); 31388fa7df36SMatt Macy PMCDBG1(PMC,OPS,1, "po=%p in global list", po); 31398fa7df36SMatt Macy } 314004001891SRyan Stone } 314149874f6eSJoseph Koshy 3142ebccf1e3SJoseph Koshy /* 3143f263522aSJoseph Koshy * Move to the CPU associated with this 3144ebccf1e3SJoseph Koshy * PMC, and start the hardware. 3145ebccf1e3SJoseph Koshy */ 3146ebccf1e3SJoseph Koshy pmc_save_cpu_binding(&pb); 3147c5153e19SJoseph Koshy cpu = PMC_TO_CPU(pm); 3148122ccdc1SJoseph Koshy if (!pmc_cpu_is_active(cpu)) 3149e829eb6dSJoseph Koshy return (ENXIO); 3150ebccf1e3SJoseph Koshy pmc_select_cpu(cpu); 3151ebccf1e3SJoseph Koshy 3152ebccf1e3SJoseph Koshy /* 3153ebccf1e3SJoseph Koshy * global PMCs are configured at allocation time 3154ebccf1e3SJoseph Koshy * so write out the initial value and start the PMC. 3155ebccf1e3SJoseph Koshy */ 3156f263522aSJoseph Koshy pm->pm_state = PMC_STATE_RUNNING; 3157f263522aSJoseph Koshy 3158c5153e19SJoseph Koshy critical_enter(); 3159d5ee4074SMitchell Horne v = PMC_IS_SAMPLING_MODE(mode) ? pm->pm_sc.pm_reloadcount : 3160d5ee4074SMitchell Horne pm->pm_sc.pm_initial; 3161d5ee4074SMitchell Horne if ((error = pcd->pcd_write_pmc(cpu, adjri, pm, v)) == 0) { 3162a3924968SJonathan T. Looney /* If a sampling mode PMC, reset stalled state. */ 3163a3924968SJonathan T. Looney if (PMC_IS_SAMPLING_MODE(mode)) 3164e6b475e0SMatt Macy pm->pm_pcpu_state[cpu].pps_stalled = 0; 3165a3924968SJonathan T. Looney 3166a3924968SJonathan T. Looney /* Indicate that we desire this to run. Start it. */ 3167e6b475e0SMatt Macy pm->pm_pcpu_state[cpu].pps_cpustate = 1; 316839f92a76SMitchell Horne error = pcd->pcd_start_pmc(cpu, adjri, pm); 3169a3924968SJonathan T. Looney } 3170c5153e19SJoseph Koshy critical_exit(); 3171ebccf1e3SJoseph Koshy 3172ebccf1e3SJoseph Koshy pmc_restore_cpu_binding(&pb); 3173e829eb6dSJoseph Koshy return (error); 3174ebccf1e3SJoseph Koshy } 3175ebccf1e3SJoseph Koshy 3176ebccf1e3SJoseph Koshy /* 3177ebccf1e3SJoseph Koshy * Stop a PMC. 3178ebccf1e3SJoseph Koshy */ 3179ebccf1e3SJoseph Koshy static int 3180ebccf1e3SJoseph Koshy pmc_stop(struct pmc *pm) 3181ebccf1e3SJoseph Koshy { 3182ebccf1e3SJoseph Koshy struct pmc_binding pb; 3183e829eb6dSJoseph Koshy struct pmc_classdep *pcd; 318401c35b67SMitchell Horne struct pmc_owner *po; 3185e829eb6dSJoseph Koshy int adjri, cpu, error, ri; 3186ebccf1e3SJoseph Koshy 3187ebccf1e3SJoseph Koshy KASSERT(pm != NULL, ("[pmc,%d] null pmc", __LINE__)); 3188ebccf1e3SJoseph Koshy 3189693cd307SMitchell Horne PMCDBG3(PMC,OPS,1, "stop pmc=%p mode=%d ri=%d", pm, PMC_TO_MODE(pm), 3190693cd307SMitchell Horne PMC_TO_ROWINDEX(pm)); 3191ebccf1e3SJoseph Koshy 3192ebccf1e3SJoseph Koshy pm->pm_state = PMC_STATE_STOPPED; 3193ebccf1e3SJoseph Koshy 3194ebccf1e3SJoseph Koshy /* 319501c35b67SMitchell Horne * If the PMC is a virtual mode one, changing the state to non-RUNNING 319601c35b67SMitchell Horne * is enough to ensure that the PMC never gets scheduled. 3197ebccf1e3SJoseph Koshy * 319801c35b67SMitchell Horne * If this PMC is current running on a CPU, then it will handled 319901c35b67SMitchell Horne * correctly at the time its target process is context switched out. 3200ebccf1e3SJoseph Koshy */ 3201c5153e19SJoseph Koshy if (PMC_IS_VIRTUAL_MODE(PMC_TO_MODE(pm))) 320252ebac7fSMitchell Horne return (0); 3203ebccf1e3SJoseph Koshy 3204ebccf1e3SJoseph Koshy /* 320501c35b67SMitchell Horne * A system-mode PMC. Move to the CPU associated with this PMC, and 320601c35b67SMitchell Horne * stop the hardware. We update the 'initial count' so that a 320701c35b67SMitchell Horne * subsequent PMCSTART will resume counting from the current hardware 320801c35b67SMitchell Horne * count. 3209ebccf1e3SJoseph Koshy */ 3210ebccf1e3SJoseph Koshy pmc_save_cpu_binding(&pb); 3211ebccf1e3SJoseph Koshy 3212c5153e19SJoseph Koshy cpu = PMC_TO_CPU(pm); 3213122ccdc1SJoseph Koshy KASSERT(cpu >= 0 && cpu < pmc_cpu_max(), 3214c5153e19SJoseph Koshy ("[pmc,%d] illegal cpu=%d", __LINE__, cpu)); 3215122ccdc1SJoseph Koshy if (!pmc_cpu_is_active(cpu)) 321652ebac7fSMitchell Horne return (ENXIO); 3217ebccf1e3SJoseph Koshy 3218ebccf1e3SJoseph Koshy pmc_select_cpu(cpu); 3219ebccf1e3SJoseph Koshy 3220c5153e19SJoseph Koshy ri = PMC_TO_ROWINDEX(pm); 3221e829eb6dSJoseph Koshy pcd = pmc_ri_to_classdep(md, ri, &adjri); 3222c5153e19SJoseph Koshy 3223e6b475e0SMatt Macy pm->pm_pcpu_state[cpu].pps_cpustate = 0; 3224c5153e19SJoseph Koshy critical_enter(); 3225d5ee4074SMitchell Horne if ((error = pcd->pcd_stop_pmc(cpu, adjri, pm)) == 0) { 322639f92a76SMitchell Horne error = pcd->pcd_read_pmc(cpu, adjri, pm, 322739f92a76SMitchell Horne &pm->pm_sc.pm_initial); 3228d5ee4074SMitchell Horne } 3229c5153e19SJoseph Koshy critical_exit(); 3230ebccf1e3SJoseph Koshy 3231ebccf1e3SJoseph Koshy pmc_restore_cpu_binding(&pb); 3232ebccf1e3SJoseph Koshy 323301c35b67SMitchell Horne /* Remove this owner from the global list of SS PMC owners. */ 3234f263522aSJoseph Koshy po = pm->pm_owner; 3235f263522aSJoseph Koshy if (PMC_TO_MODE(pm) == PMC_MODE_SS) { 3236f263522aSJoseph Koshy po->po_sscount--; 3237f263522aSJoseph Koshy if (po->po_sscount == 0) { 3238f263522aSJoseph Koshy atomic_subtract_rel_int(&pmc_ss_count, 1); 32390f00315cSMatt Macy CK_LIST_REMOVE(po, po_ssnext); 324070398c2fSMatt Macy epoch_wait_preempt(global_epoch_preempt); 32414a3690dfSJohn Baldwin PMCDBG1(PMC,OPS,2,"po=%p removed from global list", po); 3242f263522aSJoseph Koshy } 3243f263522aSJoseph Koshy } 3244f263522aSJoseph Koshy 3245e829eb6dSJoseph Koshy return (error); 3246ebccf1e3SJoseph Koshy } 3247ebccf1e3SJoseph Koshy 3248ba32b203SMatt Macy static struct pmc_classdep * 3249ba32b203SMatt Macy pmc_class_to_classdep(enum pmc_class class) 3250ba32b203SMatt Macy { 3251ba32b203SMatt Macy int n; 3252ba32b203SMatt Macy 3253d5ee4074SMitchell Horne for (n = 0; n < md->pmd_nclass; n++) { 3254ba32b203SMatt Macy if (md->pmd_classdep[n].pcd_class == class) 3255ba32b203SMatt Macy return (&md->pmd_classdep[n]); 3256d5ee4074SMitchell Horne } 3257ba32b203SMatt Macy return (NULL); 3258ba32b203SMatt Macy } 3259ebccf1e3SJoseph Koshy 32605de96e33SMatt Macy #if defined(HWPMC_DEBUG) && defined(KTR) 3261ebccf1e3SJoseph Koshy static const char *pmc_op_to_name[] = { 3262ebccf1e3SJoseph Koshy #undef __PMC_OP 3263ebccf1e3SJoseph Koshy #define __PMC_OP(N, D) #N , 3264ebccf1e3SJoseph Koshy __PMC_OPS() 3265ebccf1e3SJoseph Koshy NULL 3266ebccf1e3SJoseph Koshy }; 3267ebccf1e3SJoseph Koshy #endif 3268ebccf1e3SJoseph Koshy 3269ebccf1e3SJoseph Koshy /* 3270ebccf1e3SJoseph Koshy * The syscall interface 3271ebccf1e3SJoseph Koshy */ 3272ebccf1e3SJoseph Koshy 3273ebccf1e3SJoseph Koshy #define PMC_GET_SX_XLOCK(...) do { \ 3274ebccf1e3SJoseph Koshy sx_xlock(&pmc_sx); \ 3275ebccf1e3SJoseph Koshy if (pmc_hook == NULL) { \ 3276ebccf1e3SJoseph Koshy sx_xunlock(&pmc_sx); \ 3277ebccf1e3SJoseph Koshy return __VA_ARGS__; \ 3278ebccf1e3SJoseph Koshy } \ 3279ebccf1e3SJoseph Koshy } while (0) 3280ebccf1e3SJoseph Koshy 3281ebccf1e3SJoseph Koshy #define PMC_DOWNGRADE_SX() do { \ 3282ebccf1e3SJoseph Koshy sx_downgrade(&pmc_sx); \ 328301c35b67SMitchell Horne is_sx_downgraded = true; \ 3284ebccf1e3SJoseph Koshy } while (0) 3285ebccf1e3SJoseph Koshy 3286a133f642SMitchell Horne /* 3287c514a571SMitchell Horne * Main body of PMC_OP_PMCALLOCATE. 3288c514a571SMitchell Horne */ 3289c514a571SMitchell Horne static int 3290c514a571SMitchell Horne pmc_do_op_pmcallocate(struct thread *td, struct pmc_op_pmcallocate *pa) 3291c514a571SMitchell Horne { 3292c514a571SMitchell Horne struct proc *p; 3293c514a571SMitchell Horne struct pmc *pmc; 3294c514a571SMitchell Horne struct pmc_binding pb; 3295c514a571SMitchell Horne struct pmc_classdep *pcd; 3296c514a571SMitchell Horne struct pmc_hw *phw; 3297c514a571SMitchell Horne enum pmc_mode mode; 3298c514a571SMitchell Horne enum pmc_class class; 3299c514a571SMitchell Horne uint32_t caps; 3300c514a571SMitchell Horne u_int cpu; 3301c514a571SMitchell Horne int adjri, n; 3302c514a571SMitchell Horne int error; 3303c514a571SMitchell Horne 3304c514a571SMitchell Horne class = pa->pm_class; 3305c514a571SMitchell Horne caps = pa->pm_caps; 3306c514a571SMitchell Horne mode = pa->pm_mode; 3307c514a571SMitchell Horne cpu = pa->pm_cpu; 3308c514a571SMitchell Horne 3309c514a571SMitchell Horne p = td->td_proc; 3310c514a571SMitchell Horne 3311c514a571SMitchell Horne /* Requested mode must exist. */ 3312c514a571SMitchell Horne if ((mode != PMC_MODE_SS && mode != PMC_MODE_SC && 3313c514a571SMitchell Horne mode != PMC_MODE_TS && mode != PMC_MODE_TC)) 3314c514a571SMitchell Horne return (EINVAL); 3315c514a571SMitchell Horne 3316c514a571SMitchell Horne /* Requested CPU must be valid. */ 3317c514a571SMitchell Horne if (cpu != PMC_CPU_ANY && cpu >= pmc_cpu_max()) 3318c514a571SMitchell Horne return (EINVAL); 3319c514a571SMitchell Horne 3320c514a571SMitchell Horne /* 3321c514a571SMitchell Horne * Virtual PMCs should only ask for a default CPU. 3322c514a571SMitchell Horne * System mode PMCs need to specify a non-default CPU. 3323c514a571SMitchell Horne */ 3324c514a571SMitchell Horne if ((PMC_IS_VIRTUAL_MODE(mode) && cpu != PMC_CPU_ANY) || 3325c514a571SMitchell Horne (PMC_IS_SYSTEM_MODE(mode) && cpu == PMC_CPU_ANY)) 3326c514a571SMitchell Horne return (EINVAL); 3327c514a571SMitchell Horne 3328c514a571SMitchell Horne /* 3329c514a571SMitchell Horne * Check that an inactive CPU is not being asked for. 3330c514a571SMitchell Horne */ 3331c514a571SMitchell Horne if (PMC_IS_SYSTEM_MODE(mode) && !pmc_cpu_is_active(cpu)) 3332c514a571SMitchell Horne return (ENXIO); 3333c514a571SMitchell Horne 3334c514a571SMitchell Horne /* 3335c514a571SMitchell Horne * Refuse an allocation for a system-wide PMC if this process has been 3336c514a571SMitchell Horne * jailed, or if this process lacks super-user credentials and the 3337c514a571SMitchell Horne * sysctl tunable 'security.bsd.unprivileged_syspmcs' is zero. 3338c514a571SMitchell Horne */ 3339c514a571SMitchell Horne if (PMC_IS_SYSTEM_MODE(mode)) { 3340c514a571SMitchell Horne if (jailed(td->td_ucred)) 3341c514a571SMitchell Horne return (EPERM); 3342c514a571SMitchell Horne if (!pmc_unprivileged_syspmcs) { 3343c514a571SMitchell Horne error = priv_check(td, PRIV_PMC_SYSTEM); 3344c514a571SMitchell Horne if (error != 0) 3345c514a571SMitchell Horne return (error); 3346c514a571SMitchell Horne } 3347c514a571SMitchell Horne } 3348c514a571SMitchell Horne 3349c514a571SMitchell Horne /* 3350c514a571SMitchell Horne * Look for valid values for 'pm_flags'. 3351c514a571SMitchell Horne */ 3352c514a571SMitchell Horne if ((pa->pm_flags & ~(PMC_F_DESCENDANTS | PMC_F_LOG_PROCCSW | 3353c514a571SMitchell Horne PMC_F_LOG_PROCEXIT | PMC_F_CALLCHAIN | PMC_F_USERCALLCHAIN)) != 0) 3354c514a571SMitchell Horne return (EINVAL); 3355c514a571SMitchell Horne 3356c514a571SMitchell Horne /* PMC_F_USERCALLCHAIN is only valid with PMC_F_CALLCHAIN. */ 3357c514a571SMitchell Horne if ((pa->pm_flags & (PMC_F_CALLCHAIN | PMC_F_USERCALLCHAIN)) == 3358c514a571SMitchell Horne PMC_F_USERCALLCHAIN) 3359c514a571SMitchell Horne return (EINVAL); 3360c514a571SMitchell Horne 3361c514a571SMitchell Horne /* PMC_F_USERCALLCHAIN is only valid for sampling mode. */ 3362c514a571SMitchell Horne if ((pa->pm_flags & PMC_F_USERCALLCHAIN) != 0 && mode != PMC_MODE_TS && 3363c514a571SMitchell Horne mode != PMC_MODE_SS) 3364c514a571SMitchell Horne return (EINVAL); 3365c514a571SMitchell Horne 3366c514a571SMitchell Horne /* Process logging options are not allowed for system PMCs. */ 3367c514a571SMitchell Horne if (PMC_IS_SYSTEM_MODE(mode) && 3368c514a571SMitchell Horne (pa->pm_flags & (PMC_F_LOG_PROCCSW | PMC_F_LOG_PROCEXIT)) != 0) 3369c514a571SMitchell Horne return (EINVAL); 3370c514a571SMitchell Horne 3371c514a571SMitchell Horne /* 3372c514a571SMitchell Horne * All sampling mode PMCs need to be able to interrupt the CPU. 3373c514a571SMitchell Horne */ 3374c514a571SMitchell Horne if (PMC_IS_SAMPLING_MODE(mode)) 3375c514a571SMitchell Horne caps |= PMC_CAP_INTERRUPT; 3376c514a571SMitchell Horne 3377c514a571SMitchell Horne /* A valid class specifier should have been passed in. */ 3378c514a571SMitchell Horne pcd = pmc_class_to_classdep(class); 3379c514a571SMitchell Horne if (pcd == NULL) 3380c514a571SMitchell Horne return (EINVAL); 3381c514a571SMitchell Horne 3382c514a571SMitchell Horne /* The requested PMC capabilities should be feasible. */ 3383c514a571SMitchell Horne if ((pcd->pcd_caps & caps) != caps) 3384c514a571SMitchell Horne return (EOPNOTSUPP); 3385c514a571SMitchell Horne 3386c514a571SMitchell Horne PMCDBG4(PMC,ALL,2, "event=%d caps=0x%x mode=%d cpu=%d", pa->pm_ev, 3387c514a571SMitchell Horne caps, mode, cpu); 3388c514a571SMitchell Horne 3389c514a571SMitchell Horne pmc = pmc_allocate_pmc_descriptor(); 3390c514a571SMitchell Horne pmc->pm_id = PMC_ID_MAKE_ID(cpu, pa->pm_mode, class, PMC_ID_INVALID); 3391c514a571SMitchell Horne pmc->pm_event = pa->pm_ev; 3392c514a571SMitchell Horne pmc->pm_state = PMC_STATE_FREE; 3393c514a571SMitchell Horne pmc->pm_caps = caps; 3394c514a571SMitchell Horne pmc->pm_flags = pa->pm_flags; 3395c514a571SMitchell Horne 3396c514a571SMitchell Horne /* XXX set lower bound on sampling for process counters */ 3397c514a571SMitchell Horne if (PMC_IS_SAMPLING_MODE(mode)) { 3398c514a571SMitchell Horne /* 3399c514a571SMitchell Horne * Don't permit requested sample rate to be less than 3400c514a571SMitchell Horne * pmc_mincount. 3401c514a571SMitchell Horne */ 3402c514a571SMitchell Horne if (pa->pm_count < MAX(1, pmc_mincount)) 3403c514a571SMitchell Horne log(LOG_WARNING, "pmcallocate: passed sample " 3404c514a571SMitchell Horne "rate %ju - setting to %u\n", 3405c514a571SMitchell Horne (uintmax_t)pa->pm_count, 3406c514a571SMitchell Horne MAX(1, pmc_mincount)); 3407c514a571SMitchell Horne pmc->pm_sc.pm_reloadcount = MAX(MAX(1, pmc_mincount), 3408c514a571SMitchell Horne pa->pm_count); 3409c514a571SMitchell Horne } else 3410c514a571SMitchell Horne pmc->pm_sc.pm_initial = pa->pm_count; 3411c514a571SMitchell Horne 3412c514a571SMitchell Horne /* switch thread to CPU 'cpu' */ 3413c514a571SMitchell Horne pmc_save_cpu_binding(&pb); 3414c514a571SMitchell Horne 3415c514a571SMitchell Horne #define PMC_IS_SHAREABLE_PMC(cpu, n) \ 3416c514a571SMitchell Horne (pmc_pcpu[(cpu)]->pc_hwpmcs[(n)]->phw_state & \ 3417c514a571SMitchell Horne PMC_PHW_FLAG_IS_SHAREABLE) 3418c514a571SMitchell Horne #define PMC_IS_UNALLOCATED(cpu, n) \ 3419c514a571SMitchell Horne (pmc_pcpu[(cpu)]->pc_hwpmcs[(n)]->phw_pmc == NULL) 3420c514a571SMitchell Horne 3421c514a571SMitchell Horne if (PMC_IS_SYSTEM_MODE(mode)) { 3422c514a571SMitchell Horne pmc_select_cpu(cpu); 3423c514a571SMitchell Horne for (n = pcd->pcd_ri; n < md->pmd_npmc; n++) { 3424c514a571SMitchell Horne pcd = pmc_ri_to_classdep(md, n, &adjri); 3425c514a571SMitchell Horne 3426c514a571SMitchell Horne if (!pmc_can_allocate_row(n, mode) || 3427c514a571SMitchell Horne !pmc_can_allocate_rowindex(p, n, cpu)) 3428c514a571SMitchell Horne continue; 3429c514a571SMitchell Horne if (!PMC_IS_UNALLOCATED(cpu, n) && 3430c514a571SMitchell Horne !PMC_IS_SHAREABLE_PMC(cpu, n)) 3431c514a571SMitchell Horne continue; 3432c514a571SMitchell Horne 3433c514a571SMitchell Horne if (pcd->pcd_allocate_pmc(cpu, adjri, pmc, pa) == 0) { 3434c514a571SMitchell Horne /* Success. */ 3435c514a571SMitchell Horne break; 3436c514a571SMitchell Horne } 3437c514a571SMitchell Horne } 3438c514a571SMitchell Horne } else { 3439c514a571SMitchell Horne /* Process virtual mode */ 3440c514a571SMitchell Horne for (n = pcd->pcd_ri; n < md->pmd_npmc; n++) { 3441c514a571SMitchell Horne pcd = pmc_ri_to_classdep(md, n, &adjri); 3442c514a571SMitchell Horne 3443c514a571SMitchell Horne if (!pmc_can_allocate_row(n, mode) || 3444c514a571SMitchell Horne !pmc_can_allocate_rowindex(p, n, PMC_CPU_ANY)) 3445c514a571SMitchell Horne continue; 3446c514a571SMitchell Horne 3447c514a571SMitchell Horne if (pcd->pcd_allocate_pmc(td->td_oncpu, adjri, pmc, 3448c514a571SMitchell Horne pa) == 0) { 3449c514a571SMitchell Horne /* Success. */ 3450c514a571SMitchell Horne break; 3451c514a571SMitchell Horne } 3452c514a571SMitchell Horne } 3453c514a571SMitchell Horne } 3454c514a571SMitchell Horne 3455c514a571SMitchell Horne #undef PMC_IS_UNALLOCATED 3456c514a571SMitchell Horne #undef PMC_IS_SHAREABLE_PMC 3457c514a571SMitchell Horne 3458c514a571SMitchell Horne pmc_restore_cpu_binding(&pb); 3459c514a571SMitchell Horne 3460c514a571SMitchell Horne if (n == md->pmd_npmc) { 3461c514a571SMitchell Horne pmc_destroy_pmc_descriptor(pmc); 3462c514a571SMitchell Horne return (EINVAL); 3463c514a571SMitchell Horne } 3464c514a571SMitchell Horne 3465c514a571SMitchell Horne /* Fill in the correct value in the ID field. */ 3466c514a571SMitchell Horne pmc->pm_id = PMC_ID_MAKE_ID(cpu, mode, class, n); 3467c514a571SMitchell Horne 3468c514a571SMitchell Horne PMCDBG5(PMC,ALL,2, "ev=%d class=%d mode=%d n=%d -> pmcid=%x", 3469c514a571SMitchell Horne pmc->pm_event, class, mode, n, pmc->pm_id); 3470c514a571SMitchell Horne 3471c514a571SMitchell Horne /* Process mode PMCs with logging enabled need log files. */ 3472c514a571SMitchell Horne if ((pmc->pm_flags & (PMC_F_LOG_PROCEXIT | PMC_F_LOG_PROCCSW)) != 0) 3473c514a571SMitchell Horne pmc->pm_flags |= PMC_F_NEEDS_LOGFILE; 3474c514a571SMitchell Horne 3475c514a571SMitchell Horne /* All system mode sampling PMCs require a log file. */ 3476c514a571SMitchell Horne if (PMC_IS_SAMPLING_MODE(mode) && PMC_IS_SYSTEM_MODE(mode)) 3477c514a571SMitchell Horne pmc->pm_flags |= PMC_F_NEEDS_LOGFILE; 3478c514a571SMitchell Horne 3479c514a571SMitchell Horne /* 3480c514a571SMitchell Horne * Configure global pmc's immediately. 3481c514a571SMitchell Horne */ 3482c514a571SMitchell Horne if (PMC_IS_SYSTEM_MODE(PMC_TO_MODE(pmc))) { 3483c514a571SMitchell Horne pmc_save_cpu_binding(&pb); 3484c514a571SMitchell Horne pmc_select_cpu(cpu); 3485c514a571SMitchell Horne 3486c514a571SMitchell Horne phw = pmc_pcpu[cpu]->pc_hwpmcs[n]; 3487c514a571SMitchell Horne pcd = pmc_ri_to_classdep(md, n, &adjri); 3488c514a571SMitchell Horne 3489c514a571SMitchell Horne if ((phw->phw_state & PMC_PHW_FLAG_IS_ENABLED) == 0 || 3490c514a571SMitchell Horne (error = pcd->pcd_config_pmc(cpu, adjri, pmc)) != 0) { 3491c514a571SMitchell Horne (void)pcd->pcd_release_pmc(cpu, adjri, pmc); 3492c514a571SMitchell Horne pmc_destroy_pmc_descriptor(pmc); 3493c514a571SMitchell Horne pmc_restore_cpu_binding(&pb); 3494c514a571SMitchell Horne return (EPERM); 3495c514a571SMitchell Horne } 3496c514a571SMitchell Horne 3497c514a571SMitchell Horne pmc_restore_cpu_binding(&pb); 3498c514a571SMitchell Horne } 3499c514a571SMitchell Horne 3500c514a571SMitchell Horne pmc->pm_state = PMC_STATE_ALLOCATED; 3501c514a571SMitchell Horne pmc->pm_class = class; 3502c514a571SMitchell Horne 3503c514a571SMitchell Horne /* 3504c514a571SMitchell Horne * Mark row disposition. 3505c514a571SMitchell Horne */ 3506c514a571SMitchell Horne if (PMC_IS_SYSTEM_MODE(mode)) 3507c514a571SMitchell Horne PMC_MARK_ROW_STANDALONE(n); 3508c514a571SMitchell Horne else 3509c514a571SMitchell Horne PMC_MARK_ROW_THREAD(n); 3510c514a571SMitchell Horne 3511c514a571SMitchell Horne /* 3512c514a571SMitchell Horne * Register this PMC with the current thread as its owner. 3513c514a571SMitchell Horne */ 3514c514a571SMitchell Horne error = pmc_register_owner(p, pmc); 3515c514a571SMitchell Horne if (error != 0) { 3516c514a571SMitchell Horne pmc_release_pmc_descriptor(pmc); 3517c514a571SMitchell Horne pmc_destroy_pmc_descriptor(pmc); 3518c514a571SMitchell Horne return (error); 3519c514a571SMitchell Horne } 3520c514a571SMitchell Horne 3521c514a571SMitchell Horne /* 3522c514a571SMitchell Horne * Return the allocated index. 3523c514a571SMitchell Horne */ 3524c514a571SMitchell Horne pa->pm_pmcid = pmc->pm_id; 3525c514a571SMitchell Horne return (0); 3526c514a571SMitchell Horne } 3527c514a571SMitchell Horne 3528c514a571SMitchell Horne /* 3529a133f642SMitchell Horne * Main body of PMC_OP_PMCATTACH. 3530a133f642SMitchell Horne */ 3531a133f642SMitchell Horne static int 3532a133f642SMitchell Horne pmc_do_op_pmcattach(struct thread *td, struct pmc_op_pmcattach a) 3533a133f642SMitchell Horne { 3534a133f642SMitchell Horne struct pmc *pm; 3535a133f642SMitchell Horne struct proc *p; 3536a133f642SMitchell Horne int error; 3537a133f642SMitchell Horne 3538a133f642SMitchell Horne sx_assert(&pmc_sx, SX_XLOCKED); 3539a133f642SMitchell Horne 3540a133f642SMitchell Horne if (a.pm_pid < 0) { 3541a133f642SMitchell Horne return (EINVAL); 3542a133f642SMitchell Horne } else if (a.pm_pid == 0) { 3543a133f642SMitchell Horne a.pm_pid = td->td_proc->p_pid; 3544a133f642SMitchell Horne } 3545a133f642SMitchell Horne 3546a133f642SMitchell Horne error = pmc_find_pmc(a.pm_pmc, &pm); 3547a133f642SMitchell Horne if (error != 0) 3548a133f642SMitchell Horne return (error); 3549a133f642SMitchell Horne 3550a133f642SMitchell Horne if (PMC_IS_SYSTEM_MODE(PMC_TO_MODE(pm))) 3551a133f642SMitchell Horne return (EINVAL); 3552a133f642SMitchell Horne 3553a133f642SMitchell Horne /* PMCs may be (re)attached only when allocated or stopped */ 3554a133f642SMitchell Horne if (pm->pm_state == PMC_STATE_RUNNING) { 3555a133f642SMitchell Horne return (EBUSY); 3556a133f642SMitchell Horne } else if (pm->pm_state != PMC_STATE_ALLOCATED && 3557a133f642SMitchell Horne pm->pm_state != PMC_STATE_STOPPED) { 3558a133f642SMitchell Horne return (EINVAL); 3559a133f642SMitchell Horne } 3560a133f642SMitchell Horne 3561a133f642SMitchell Horne /* lookup pid */ 3562a133f642SMitchell Horne if ((p = pfind(a.pm_pid)) == NULL) 3563a133f642SMitchell Horne return (ESRCH); 3564a133f642SMitchell Horne 3565a133f642SMitchell Horne /* 3566a133f642SMitchell Horne * Ignore processes that are working on exiting. 3567a133f642SMitchell Horne */ 3568a133f642SMitchell Horne if ((p->p_flag & P_WEXIT) != 0) { 3569a133f642SMitchell Horne PROC_UNLOCK(p); /* pfind() returns a locked process */ 3570a133f642SMitchell Horne return (ESRCH); 3571a133f642SMitchell Horne } 3572a133f642SMitchell Horne 3573a133f642SMitchell Horne /* 3574a133f642SMitchell Horne * We are allowed to attach a PMC to a process if we can debug it. 3575a133f642SMitchell Horne */ 3576a133f642SMitchell Horne error = p_candebug(curthread, p); 3577a133f642SMitchell Horne 3578a133f642SMitchell Horne PROC_UNLOCK(p); 3579a133f642SMitchell Horne 3580a133f642SMitchell Horne if (error == 0) 3581a133f642SMitchell Horne error = pmc_attach_process(p, pm); 3582a133f642SMitchell Horne 3583a133f642SMitchell Horne return (error); 3584a133f642SMitchell Horne } 3585a133f642SMitchell Horne 3586a133f642SMitchell Horne /* 3587a133f642SMitchell Horne * Main body of PMC_OP_PMCDETACH. 3588a133f642SMitchell Horne */ 3589a133f642SMitchell Horne static int 3590a133f642SMitchell Horne pmc_do_op_pmcdetach(struct thread *td, struct pmc_op_pmcattach a) 3591a133f642SMitchell Horne { 3592a133f642SMitchell Horne struct pmc *pm; 3593a133f642SMitchell Horne struct proc *p; 3594a133f642SMitchell Horne int error; 3595a133f642SMitchell Horne 3596a133f642SMitchell Horne if (a.pm_pid < 0) { 3597a133f642SMitchell Horne return (EINVAL); 3598a133f642SMitchell Horne } else if (a.pm_pid == 0) 3599a133f642SMitchell Horne a.pm_pid = td->td_proc->p_pid; 3600a133f642SMitchell Horne 3601a133f642SMitchell Horne error = pmc_find_pmc(a.pm_pmc, &pm); 3602a133f642SMitchell Horne if (error != 0) 3603a133f642SMitchell Horne return (error); 3604a133f642SMitchell Horne 3605a133f642SMitchell Horne if ((p = pfind(a.pm_pid)) == NULL) 3606a133f642SMitchell Horne return (ESRCH); 3607a133f642SMitchell Horne 3608a133f642SMitchell Horne /* 3609a133f642SMitchell Horne * Treat processes that are in the process of exiting as if they were 3610a133f642SMitchell Horne * not present. 3611a133f642SMitchell Horne */ 3612a133f642SMitchell Horne if ((p->p_flag & P_WEXIT) != 0) { 3613a133f642SMitchell Horne PROC_UNLOCK(p); 3614a133f642SMitchell Horne return (ESRCH); 3615a133f642SMitchell Horne } 3616a133f642SMitchell Horne 3617a133f642SMitchell Horne PROC_UNLOCK(p); /* pfind() returns a locked process */ 3618a133f642SMitchell Horne 3619a133f642SMitchell Horne if (error == 0) 3620a133f642SMitchell Horne error = pmc_detach_process(p, pm); 3621a133f642SMitchell Horne 3622a133f642SMitchell Horne return (error); 3623a133f642SMitchell Horne } 3624a133f642SMitchell Horne 3625*f4fac946SMitchell Horne /* 3626*f4fac946SMitchell Horne * Main body of PMC_OP_PMCRELEASE. 3627*f4fac946SMitchell Horne */ 3628*f4fac946SMitchell Horne static int 3629*f4fac946SMitchell Horne pmc_do_op_pmcrelease(pmc_id_t pmcid) 3630*f4fac946SMitchell Horne { 3631*f4fac946SMitchell Horne struct pmc_owner *po; 3632*f4fac946SMitchell Horne struct pmc *pm; 3633*f4fac946SMitchell Horne int error; 3634*f4fac946SMitchell Horne 3635*f4fac946SMitchell Horne /* 3636*f4fac946SMitchell Horne * Find PMC pointer for the named PMC. 3637*f4fac946SMitchell Horne * 3638*f4fac946SMitchell Horne * Use pmc_release_pmc_descriptor() to switch off the 3639*f4fac946SMitchell Horne * PMC, remove all its target threads, and remove the 3640*f4fac946SMitchell Horne * PMC from its owner's list. 3641*f4fac946SMitchell Horne * 3642*f4fac946SMitchell Horne * Remove the owner record if this is the last PMC 3643*f4fac946SMitchell Horne * owned. 3644*f4fac946SMitchell Horne * 3645*f4fac946SMitchell Horne * Free up space. 3646*f4fac946SMitchell Horne */ 3647*f4fac946SMitchell Horne error = pmc_find_pmc(pmcid, &pm); 3648*f4fac946SMitchell Horne if (error != 0) 3649*f4fac946SMitchell Horne return (error); 3650*f4fac946SMitchell Horne 3651*f4fac946SMitchell Horne po = pm->pm_owner; 3652*f4fac946SMitchell Horne pmc_release_pmc_descriptor(pm); 3653*f4fac946SMitchell Horne pmc_maybe_remove_owner(po); 3654*f4fac946SMitchell Horne pmc_destroy_pmc_descriptor(pm); 3655*f4fac946SMitchell Horne 3656*f4fac946SMitchell Horne return (error); 3657*f4fac946SMitchell Horne } 3658*f4fac946SMitchell Horne 3659ebccf1e3SJoseph Koshy static int 3660ebccf1e3SJoseph Koshy pmc_syscall_handler(struct thread *td, void *syscall_args) 3661ebccf1e3SJoseph Koshy { 3662ebccf1e3SJoseph Koshy struct pmc_syscall_args *c; 366320b555e1SKonstantin Belousov void *pmclog_proc_handle; 3664ebccf1e3SJoseph Koshy void *arg; 366501c35b67SMitchell Horne int error, op; 366601c35b67SMitchell Horne bool is_sx_downgraded; 3667ebccf1e3SJoseph Koshy 3668ebccf1e3SJoseph Koshy c = (struct pmc_syscall_args *)syscall_args; 3669ebccf1e3SJoseph Koshy op = c->pmop_code; 3670ebccf1e3SJoseph Koshy arg = c->pmop_data; 3671693cd307SMitchell Horne 36720f00315cSMatt Macy /* PMC isn't set up yet */ 36730f00315cSMatt Macy if (pmc_hook == NULL) 36740f00315cSMatt Macy return (EINVAL); 3675693cd307SMitchell Horne 367620b555e1SKonstantin Belousov if (op == PMC_OP_CONFIGURELOG) { 367720b555e1SKonstantin Belousov /* 367820b555e1SKonstantin Belousov * We cannot create the logging process inside 367920b555e1SKonstantin Belousov * pmclog_configure_log() because there is a LOR 368020b555e1SKonstantin Belousov * between pmc_sx and process structure locks. 368120b555e1SKonstantin Belousov * Instead, pre-create the process and ignite the loop 368220b555e1SKonstantin Belousov * if everything is fine, otherwise direct the process 368320b555e1SKonstantin Belousov * to exit. 368420b555e1SKonstantin Belousov */ 368520b555e1SKonstantin Belousov error = pmclog_proc_create(td, &pmclog_proc_handle); 368620b555e1SKonstantin Belousov if (error != 0) 368720b555e1SKonstantin Belousov goto done_syscall; 368820b555e1SKonstantin Belousov } 368920b555e1SKonstantin Belousov 369020b555e1SKonstantin Belousov PMC_GET_SX_XLOCK(ENOSYS); 369101c35b67SMitchell Horne is_sx_downgraded = false; 36924a3690dfSJohn Baldwin PMCDBG3(MOD,PMS,1, "syscall op=%d \"%s\" arg=%p", op, 3693ebccf1e3SJoseph Koshy pmc_op_to_name[op], arg); 3694ebccf1e3SJoseph Koshy 3695ebccf1e3SJoseph Koshy error = 0; 3696e6b475e0SMatt Macy counter_u64_add(pmc_stats.pm_syscalls, 1); 3697ebccf1e3SJoseph Koshy 3698cf9ef806SKonstantin Belousov switch (op) { 3699ebccf1e3SJoseph Koshy 3700ebccf1e3SJoseph Koshy 3701ebccf1e3SJoseph Koshy /* 3702ebccf1e3SJoseph Koshy * Configure a log file. 3703ebccf1e3SJoseph Koshy * 3704ebccf1e3SJoseph Koshy * XXX This OP will be reworked. 3705ebccf1e3SJoseph Koshy */ 3706ebccf1e3SJoseph Koshy 3707ebccf1e3SJoseph Koshy case PMC_OP_CONFIGURELOG: 3708ebccf1e3SJoseph Koshy { 370949874f6eSJoseph Koshy struct proc *p; 3710fc9a2b80SJoseph Koshy struct pmc *pm; 3711ebccf1e3SJoseph Koshy struct pmc_owner *po; 3712ebccf1e3SJoseph Koshy struct pmc_op_configurelog cl; 3713ebccf1e3SJoseph Koshy 371420b555e1SKonstantin Belousov if ((error = copyin(arg, &cl, sizeof(cl))) != 0) { 371520b555e1SKonstantin Belousov pmclog_proc_ignite(pmclog_proc_handle, NULL); 3716ebccf1e3SJoseph Koshy break; 371720b555e1SKonstantin Belousov } 3718ebccf1e3SJoseph Koshy 37198e63e787SJessica Clarke /* No flags currently implemented */ 37208e63e787SJessica Clarke if (cl.pm_flags != 0) { 37218e63e787SJessica Clarke error = EINVAL; 37228e63e787SJessica Clarke break; 37238e63e787SJessica Clarke } 37248e63e787SJessica Clarke 3725ebccf1e3SJoseph Koshy /* mark this process as owning a log file */ 3726ebccf1e3SJoseph Koshy p = td->td_proc; 3727ebccf1e3SJoseph Koshy if ((po = pmc_find_owner_descriptor(p)) == NULL) 3728f263522aSJoseph Koshy if ((po = pmc_allocate_owner_descriptor(p)) == NULL) { 372920b555e1SKonstantin Belousov pmclog_proc_ignite(pmclog_proc_handle, NULL); 3730f263522aSJoseph Koshy error = ENOMEM; 3731ebccf1e3SJoseph Koshy break; 3732f263522aSJoseph Koshy } 3733ebccf1e3SJoseph Koshy 3734f263522aSJoseph Koshy /* 3735f263522aSJoseph Koshy * If a valid fd was passed in, try to configure that, 3736f263522aSJoseph Koshy * otherwise if 'fd' was less than zero and there was 3737f263522aSJoseph Koshy * a log file configured, flush its buffers and 3738f263522aSJoseph Koshy * de-configure it. 3739f263522aSJoseph Koshy */ 3740ca2d94beSAttilio Rao if (cl.pm_logfd >= 0) { 37410cfab8ddSJoseph Koshy error = pmclog_configure_log(md, po, cl.pm_logfd); 374220b555e1SKonstantin Belousov pmclog_proc_ignite(pmclog_proc_handle, error == 0 ? 374320b555e1SKonstantin Belousov po : NULL); 3744ca2d94beSAttilio Rao } else if (po->po_flags & PMC_PO_OWNS_LOGFILE) { 374520b555e1SKonstantin Belousov pmclog_proc_ignite(pmclog_proc_handle, NULL); 3746dceed24aSFabien Thomas error = pmclog_close(po); 3747fc9a2b80SJoseph Koshy if (error == 0) { 3748fc9a2b80SJoseph Koshy LIST_FOREACH(pm, &po->po_pmcs, pm_next) 374966f3bc78SJoseph Koshy if (pm->pm_flags & PMC_F_NEEDS_LOGFILE && 375066f3bc78SJoseph Koshy pm->pm_state == PMC_STATE_RUNNING) 3751fc9a2b80SJoseph Koshy pmc_stop(pm); 3752f263522aSJoseph Koshy error = pmclog_deconfigure_log(po); 3753fc9a2b80SJoseph Koshy } 375420b555e1SKonstantin Belousov } else { 375520b555e1SKonstantin Belousov pmclog_proc_ignite(pmclog_proc_handle, NULL); 3756f263522aSJoseph Koshy error = EINVAL; 375720b555e1SKonstantin Belousov } 3758ebccf1e3SJoseph Koshy } 3759ebccf1e3SJoseph Koshy break; 3760ebccf1e3SJoseph Koshy 3761ebccf1e3SJoseph Koshy /* 3762f263522aSJoseph Koshy * Flush a log file. 3763f263522aSJoseph Koshy */ 3764f263522aSJoseph Koshy 3765f263522aSJoseph Koshy case PMC_OP_FLUSHLOG: 3766f263522aSJoseph Koshy { 3767f263522aSJoseph Koshy struct pmc_owner *po; 3768f263522aSJoseph Koshy 3769f263522aSJoseph Koshy sx_assert(&pmc_sx, SX_XLOCKED); 3770f263522aSJoseph Koshy 3771f263522aSJoseph Koshy if ((po = pmc_find_owner_descriptor(td->td_proc)) == NULL) { 3772f263522aSJoseph Koshy error = EINVAL; 3773f263522aSJoseph Koshy break; 3774f263522aSJoseph Koshy } 3775f263522aSJoseph Koshy 3776ebfaf69cSMatt Macy error = pmclog_flush(po, 0); 3777f263522aSJoseph Koshy } 3778f263522aSJoseph Koshy break; 3779f263522aSJoseph Koshy 3780f263522aSJoseph Koshy /* 3781dceed24aSFabien Thomas * Close a log file. 3782dceed24aSFabien Thomas */ 3783dceed24aSFabien Thomas 3784dceed24aSFabien Thomas case PMC_OP_CLOSELOG: 3785dceed24aSFabien Thomas { 3786dceed24aSFabien Thomas struct pmc_owner *po; 3787dceed24aSFabien Thomas 3788dceed24aSFabien Thomas sx_assert(&pmc_sx, SX_XLOCKED); 3789dceed24aSFabien Thomas 3790dceed24aSFabien Thomas if ((po = pmc_find_owner_descriptor(td->td_proc)) == NULL) { 3791dceed24aSFabien Thomas error = EINVAL; 3792dceed24aSFabien Thomas break; 3793dceed24aSFabien Thomas } 3794dceed24aSFabien Thomas 3795dceed24aSFabien Thomas error = pmclog_close(po); 3796dceed24aSFabien Thomas } 3797dceed24aSFabien Thomas break; 3798dceed24aSFabien Thomas 3799dceed24aSFabien Thomas /* 3800ebccf1e3SJoseph Koshy * Retrieve hardware configuration. 3801ebccf1e3SJoseph Koshy */ 3802ebccf1e3SJoseph Koshy 3803ebccf1e3SJoseph Koshy case PMC_OP_GETCPUINFO: /* CPU information */ 3804ebccf1e3SJoseph Koshy { 3805ebccf1e3SJoseph Koshy struct pmc_op_getcpuinfo gci; 3806e829eb6dSJoseph Koshy struct pmc_classinfo *pci; 3807e829eb6dSJoseph Koshy struct pmc_classdep *pcd; 3808e829eb6dSJoseph Koshy int cl; 3809ebccf1e3SJoseph Koshy 38108f77f60fSMark Johnston memset(&gci, 0, sizeof(gci)); 3811ebccf1e3SJoseph Koshy gci.pm_cputype = md->pmd_cputype; 3812122ccdc1SJoseph Koshy gci.pm_ncpu = pmc_cpu_max(); 3813ebccf1e3SJoseph Koshy gci.pm_npmc = md->pmd_npmc; 3814ebccf1e3SJoseph Koshy gci.pm_nclass = md->pmd_nclass; 3815e829eb6dSJoseph Koshy pci = gci.pm_classes; 3816e829eb6dSJoseph Koshy pcd = md->pmd_classdep; 3817e829eb6dSJoseph Koshy for (cl = 0; cl < md->pmd_nclass; cl++, pci++, pcd++) { 3818e829eb6dSJoseph Koshy pci->pm_caps = pcd->pcd_caps; 3819e829eb6dSJoseph Koshy pci->pm_class = pcd->pcd_class; 3820e829eb6dSJoseph Koshy pci->pm_width = pcd->pcd_width; 3821e829eb6dSJoseph Koshy pci->pm_num = pcd->pcd_num; 3822e829eb6dSJoseph Koshy } 3823ebccf1e3SJoseph Koshy error = copyout(&gci, arg, sizeof(gci)); 3824ebccf1e3SJoseph Koshy } 3825ebccf1e3SJoseph Koshy break; 3826ebccf1e3SJoseph Koshy 3827f5f9340bSFabien Thomas /* 3828f5f9340bSFabien Thomas * Retrieve soft events list. 3829f5f9340bSFabien Thomas */ 3830f5f9340bSFabien Thomas case PMC_OP_GETDYNEVENTINFO: 3831f5f9340bSFabien Thomas { 3832f5f9340bSFabien Thomas enum pmc_class cl; 3833f5f9340bSFabien Thomas enum pmc_event ev; 3834f5f9340bSFabien Thomas struct pmc_op_getdyneventinfo *gei; 3835f5f9340bSFabien Thomas struct pmc_dyn_event_descr dev; 3836f5f9340bSFabien Thomas struct pmc_soft *ps; 3837f5f9340bSFabien Thomas uint32_t nevent; 3838f5f9340bSFabien Thomas 3839f5f9340bSFabien Thomas sx_assert(&pmc_sx, SX_LOCKED); 3840f5f9340bSFabien Thomas 3841f5f9340bSFabien Thomas gei = (struct pmc_op_getdyneventinfo *) arg; 3842f5f9340bSFabien Thomas 3843f5f9340bSFabien Thomas if ((error = copyin(&gei->pm_class, &cl, sizeof(cl))) != 0) 3844f5f9340bSFabien Thomas break; 3845f5f9340bSFabien Thomas 3846f5f9340bSFabien Thomas /* Only SOFT class is dynamic. */ 3847f5f9340bSFabien Thomas if (cl != PMC_CLASS_SOFT) { 3848f5f9340bSFabien Thomas error = EINVAL; 3849f5f9340bSFabien Thomas break; 3850f5f9340bSFabien Thomas } 3851f5f9340bSFabien Thomas 3852f5f9340bSFabien Thomas nevent = 0; 3853ca57f64fSSean Bruno for (ev = PMC_EV_SOFT_FIRST; (int)ev <= PMC_EV_SOFT_LAST; ev++) { 3854f5f9340bSFabien Thomas ps = pmc_soft_ev_acquire(ev); 3855f5f9340bSFabien Thomas if (ps == NULL) 3856f5f9340bSFabien Thomas continue; 3857f5f9340bSFabien Thomas bcopy(&ps->ps_ev, &dev, sizeof(dev)); 3858f5f9340bSFabien Thomas pmc_soft_ev_release(ps); 3859f5f9340bSFabien Thomas 3860f5f9340bSFabien Thomas error = copyout(&dev, 3861f5f9340bSFabien Thomas &gei->pm_events[nevent], 3862f5f9340bSFabien Thomas sizeof(struct pmc_dyn_event_descr)); 3863f5f9340bSFabien Thomas if (error != 0) 3864f5f9340bSFabien Thomas break; 3865f5f9340bSFabien Thomas nevent++; 3866f5f9340bSFabien Thomas } 3867f5f9340bSFabien Thomas if (error != 0) 3868f5f9340bSFabien Thomas break; 3869f5f9340bSFabien Thomas 3870f5f9340bSFabien Thomas error = copyout(&nevent, &gei->pm_nevent, 3871f5f9340bSFabien Thomas sizeof(nevent)); 3872f5f9340bSFabien Thomas } 3873f5f9340bSFabien Thomas break; 3874ebccf1e3SJoseph Koshy 3875ebccf1e3SJoseph Koshy /* 3876ebccf1e3SJoseph Koshy * Get module statistics 3877ebccf1e3SJoseph Koshy */ 3878ebccf1e3SJoseph Koshy 3879ebccf1e3SJoseph Koshy case PMC_OP_GETDRIVERSTATS: 3880ebccf1e3SJoseph Koshy { 3881ebccf1e3SJoseph Koshy struct pmc_op_getdriverstats gms; 3882e6b475e0SMatt Macy #define CFETCH(a, b, field) a.field = counter_u64_fetch(b.field) 3883e6b475e0SMatt Macy CFETCH(gms, pmc_stats, pm_intr_ignored); 3884e6b475e0SMatt Macy CFETCH(gms, pmc_stats, pm_intr_processed); 3885e6b475e0SMatt Macy CFETCH(gms, pmc_stats, pm_intr_bufferfull); 3886e6b475e0SMatt Macy CFETCH(gms, pmc_stats, pm_syscalls); 3887e6b475e0SMatt Macy CFETCH(gms, pmc_stats, pm_syscall_errors); 3888e6b475e0SMatt Macy CFETCH(gms, pmc_stats, pm_buffer_requests); 3889e6b475e0SMatt Macy CFETCH(gms, pmc_stats, pm_buffer_requests_failed); 3890e6b475e0SMatt Macy CFETCH(gms, pmc_stats, pm_log_sweeps); 3891e6b475e0SMatt Macy #undef CFETCH 3892ebccf1e3SJoseph Koshy error = copyout(&gms, arg, sizeof(gms)); 3893ebccf1e3SJoseph Koshy } 3894ebccf1e3SJoseph Koshy break; 3895ebccf1e3SJoseph Koshy 3896ebccf1e3SJoseph Koshy 3897ebccf1e3SJoseph Koshy /* 3898ebccf1e3SJoseph Koshy * Retrieve module version number 3899ebccf1e3SJoseph Koshy */ 3900ebccf1e3SJoseph Koshy 3901ebccf1e3SJoseph Koshy case PMC_OP_GETMODULEVERSION: 3902ebccf1e3SJoseph Koshy { 3903f263522aSJoseph Koshy uint32_t cv, modv; 3904f263522aSJoseph Koshy 3905f263522aSJoseph Koshy /* retrieve the client's idea of the ABI version */ 3906f263522aSJoseph Koshy if ((error = copyin(arg, &cv, sizeof(uint32_t))) != 0) 3907f263522aSJoseph Koshy break; 3908f263522aSJoseph Koshy /* don't service clients newer than our driver */ 3909f263522aSJoseph Koshy modv = PMC_VERSION; 3910f263522aSJoseph Koshy if ((cv & 0xFFFF0000) > (modv & 0xFFFF0000)) { 3911f263522aSJoseph Koshy error = EPROGMISMATCH; 3912f263522aSJoseph Koshy break; 3913f263522aSJoseph Koshy } 3914f263522aSJoseph Koshy error = copyout(&modv, arg, sizeof(int)); 3915ebccf1e3SJoseph Koshy } 3916ebccf1e3SJoseph Koshy break; 3917ebccf1e3SJoseph Koshy 3918ebccf1e3SJoseph Koshy 3919ebccf1e3SJoseph Koshy /* 3920ebccf1e3SJoseph Koshy * Retrieve the state of all the PMCs on a given 3921ebccf1e3SJoseph Koshy * CPU. 3922ebccf1e3SJoseph Koshy */ 3923ebccf1e3SJoseph Koshy 3924ebccf1e3SJoseph Koshy case PMC_OP_GETPMCINFO: 3925ebccf1e3SJoseph Koshy { 3926e829eb6dSJoseph Koshy int ari; 3927ebccf1e3SJoseph Koshy struct pmc *pm; 3928e829eb6dSJoseph Koshy size_t pmcinfo_size; 3929e829eb6dSJoseph Koshy uint32_t cpu, n, npmc; 3930ebccf1e3SJoseph Koshy struct pmc_owner *po; 3931ebccf1e3SJoseph Koshy struct pmc_binding pb; 3932e829eb6dSJoseph Koshy struct pmc_classdep *pcd; 3933e829eb6dSJoseph Koshy struct pmc_info *p, *pmcinfo; 3934e829eb6dSJoseph Koshy struct pmc_op_getpmcinfo *gpi; 3935ebccf1e3SJoseph Koshy 3936ebccf1e3SJoseph Koshy PMC_DOWNGRADE_SX(); 3937ebccf1e3SJoseph Koshy 3938ebccf1e3SJoseph Koshy gpi = (struct pmc_op_getpmcinfo *) arg; 3939ebccf1e3SJoseph Koshy 3940ebccf1e3SJoseph Koshy if ((error = copyin(&gpi->pm_cpu, &cpu, sizeof(cpu))) != 0) 3941ebccf1e3SJoseph Koshy break; 3942ebccf1e3SJoseph Koshy 3943122ccdc1SJoseph Koshy if (cpu >= pmc_cpu_max()) { 3944ebccf1e3SJoseph Koshy error = EINVAL; 3945ebccf1e3SJoseph Koshy break; 3946ebccf1e3SJoseph Koshy } 3947ebccf1e3SJoseph Koshy 3948122ccdc1SJoseph Koshy if (!pmc_cpu_is_active(cpu)) { 3949ebccf1e3SJoseph Koshy error = ENXIO; 3950ebccf1e3SJoseph Koshy break; 3951ebccf1e3SJoseph Koshy } 3952ebccf1e3SJoseph Koshy 3953ebccf1e3SJoseph Koshy /* switch to CPU 'cpu' */ 3954ebccf1e3SJoseph Koshy pmc_save_cpu_binding(&pb); 3955ebccf1e3SJoseph Koshy pmc_select_cpu(cpu); 3956ebccf1e3SJoseph Koshy 3957ebccf1e3SJoseph Koshy npmc = md->pmd_npmc; 3958ebccf1e3SJoseph Koshy 3959ebccf1e3SJoseph Koshy pmcinfo_size = npmc * sizeof(struct pmc_info); 39608f77f60fSMark Johnston pmcinfo = malloc(pmcinfo_size, M_PMC, M_WAITOK | M_ZERO); 3961ebccf1e3SJoseph Koshy 3962ebccf1e3SJoseph Koshy p = pmcinfo; 3963ebccf1e3SJoseph Koshy 3964ebccf1e3SJoseph Koshy for (n = 0; n < md->pmd_npmc; n++, p++) { 3965ebccf1e3SJoseph Koshy 3966e829eb6dSJoseph Koshy pcd = pmc_ri_to_classdep(md, n, &ari); 3967e829eb6dSJoseph Koshy 3968e829eb6dSJoseph Koshy KASSERT(pcd != NULL, 3969e829eb6dSJoseph Koshy ("[pmc,%d] null pcd ri=%d", __LINE__, n)); 3970e829eb6dSJoseph Koshy 3971e829eb6dSJoseph Koshy if ((error = pcd->pcd_describe(cpu, ari, p, &pm)) != 0) 3972ebccf1e3SJoseph Koshy break; 3973ebccf1e3SJoseph Koshy 3974ebccf1e3SJoseph Koshy if (PMC_ROW_DISP_IS_STANDALONE(n)) 3975ebccf1e3SJoseph Koshy p->pm_rowdisp = PMC_DISP_STANDALONE; 3976ebccf1e3SJoseph Koshy else if (PMC_ROW_DISP_IS_THREAD(n)) 3977ebccf1e3SJoseph Koshy p->pm_rowdisp = PMC_DISP_THREAD; 3978ebccf1e3SJoseph Koshy else 3979ebccf1e3SJoseph Koshy p->pm_rowdisp = PMC_DISP_FREE; 3980ebccf1e3SJoseph Koshy 3981ebccf1e3SJoseph Koshy p->pm_ownerpid = -1; 3982ebccf1e3SJoseph Koshy 3983ebccf1e3SJoseph Koshy if (pm == NULL) /* no PMC associated */ 3984ebccf1e3SJoseph Koshy continue; 3985ebccf1e3SJoseph Koshy 3986ebccf1e3SJoseph Koshy po = pm->pm_owner; 3987ebccf1e3SJoseph Koshy 3988ebccf1e3SJoseph Koshy KASSERT(po->po_owner != NULL, 3989ebccf1e3SJoseph Koshy ("[pmc,%d] pmc_owner had a null proc pointer", 3990ebccf1e3SJoseph Koshy __LINE__)); 3991ebccf1e3SJoseph Koshy 3992ebccf1e3SJoseph Koshy p->pm_ownerpid = po->po_owner->p_pid; 3993c5153e19SJoseph Koshy p->pm_mode = PMC_TO_MODE(pm); 3994ebccf1e3SJoseph Koshy p->pm_event = pm->pm_event; 3995ebccf1e3SJoseph Koshy p->pm_flags = pm->pm_flags; 3996ebccf1e3SJoseph Koshy 3997c5153e19SJoseph Koshy if (PMC_IS_SAMPLING_MODE(PMC_TO_MODE(pm))) 3998ebccf1e3SJoseph Koshy p->pm_reloadcount = 3999ebccf1e3SJoseph Koshy pm->pm_sc.pm_reloadcount; 4000ebccf1e3SJoseph Koshy } 4001ebccf1e3SJoseph Koshy 4002ebccf1e3SJoseph Koshy pmc_restore_cpu_binding(&pb); 4003ebccf1e3SJoseph Koshy 4004ebccf1e3SJoseph Koshy /* now copy out the PMC info collected */ 4005ebccf1e3SJoseph Koshy if (error == 0) 4006ebccf1e3SJoseph Koshy error = copyout(pmcinfo, &gpi->pm_pmcs, pmcinfo_size); 4007ebccf1e3SJoseph Koshy 40081ede983cSDag-Erling Smørgrav free(pmcinfo, M_PMC); 4009ebccf1e3SJoseph Koshy } 4010ebccf1e3SJoseph Koshy break; 4011ebccf1e3SJoseph Koshy 4012ebccf1e3SJoseph Koshy 4013ebccf1e3SJoseph Koshy /* 4014ebccf1e3SJoseph Koshy * Set the administrative state of a PMC. I.e. whether 4015ebccf1e3SJoseph Koshy * the PMC is to be used or not. 4016ebccf1e3SJoseph Koshy */ 4017ebccf1e3SJoseph Koshy 4018ebccf1e3SJoseph Koshy case PMC_OP_PMCADMIN: 4019ebccf1e3SJoseph Koshy { 4020ebccf1e3SJoseph Koshy int cpu, ri; 4021ebccf1e3SJoseph Koshy enum pmc_state request; 4022ebccf1e3SJoseph Koshy struct pmc_cpu *pc; 4023ebccf1e3SJoseph Koshy struct pmc_hw *phw; 4024ebccf1e3SJoseph Koshy struct pmc_op_pmcadmin pma; 4025ebccf1e3SJoseph Koshy struct pmc_binding pb; 4026ebccf1e3SJoseph Koshy 4027ebccf1e3SJoseph Koshy sx_assert(&pmc_sx, SX_XLOCKED); 4028ebccf1e3SJoseph Koshy 4029ebccf1e3SJoseph Koshy KASSERT(td == curthread, 4030ebccf1e3SJoseph Koshy ("[pmc,%d] td != curthread", __LINE__)); 4031ebccf1e3SJoseph Koshy 4032acd3428bSRobert Watson error = priv_check(td, PRIV_PMC_MANAGE); 4033acd3428bSRobert Watson if (error) 4034ebccf1e3SJoseph Koshy break; 4035ebccf1e3SJoseph Koshy 4036ebccf1e3SJoseph Koshy if ((error = copyin(arg, &pma, sizeof(pma))) != 0) 4037ebccf1e3SJoseph Koshy break; 4038ebccf1e3SJoseph Koshy 4039ebccf1e3SJoseph Koshy cpu = pma.pm_cpu; 4040ebccf1e3SJoseph Koshy 4041122ccdc1SJoseph Koshy if (cpu < 0 || cpu >= (int) pmc_cpu_max()) { 4042ebccf1e3SJoseph Koshy error = EINVAL; 4043ebccf1e3SJoseph Koshy break; 4044ebccf1e3SJoseph Koshy } 4045ebccf1e3SJoseph Koshy 4046122ccdc1SJoseph Koshy if (!pmc_cpu_is_active(cpu)) { 4047ebccf1e3SJoseph Koshy error = ENXIO; 4048ebccf1e3SJoseph Koshy break; 4049ebccf1e3SJoseph Koshy } 4050ebccf1e3SJoseph Koshy 4051ebccf1e3SJoseph Koshy request = pma.pm_state; 4052ebccf1e3SJoseph Koshy 4053ebccf1e3SJoseph Koshy if (request != PMC_STATE_DISABLED && 4054ebccf1e3SJoseph Koshy request != PMC_STATE_FREE) { 4055ebccf1e3SJoseph Koshy error = EINVAL; 4056ebccf1e3SJoseph Koshy break; 4057ebccf1e3SJoseph Koshy } 4058ebccf1e3SJoseph Koshy 4059ebccf1e3SJoseph Koshy ri = pma.pm_pmc; /* pmc id == row index */ 4060ebccf1e3SJoseph Koshy if (ri < 0 || ri >= (int) md->pmd_npmc) { 4061ebccf1e3SJoseph Koshy error = EINVAL; 4062ebccf1e3SJoseph Koshy break; 4063ebccf1e3SJoseph Koshy } 4064ebccf1e3SJoseph Koshy 4065ebccf1e3SJoseph Koshy /* 4066ebccf1e3SJoseph Koshy * We can't disable a PMC with a row-index allocated 4067ebccf1e3SJoseph Koshy * for process virtual PMCs. 4068ebccf1e3SJoseph Koshy */ 4069ebccf1e3SJoseph Koshy 4070ebccf1e3SJoseph Koshy if (PMC_ROW_DISP_IS_THREAD(ri) && 4071ebccf1e3SJoseph Koshy request == PMC_STATE_DISABLED) { 4072ebccf1e3SJoseph Koshy error = EBUSY; 4073ebccf1e3SJoseph Koshy break; 4074ebccf1e3SJoseph Koshy } 4075ebccf1e3SJoseph Koshy 4076ebccf1e3SJoseph Koshy /* 4077ebccf1e3SJoseph Koshy * otherwise, this PMC on this CPU is either free or 4078ebccf1e3SJoseph Koshy * in system-wide mode. 4079ebccf1e3SJoseph Koshy */ 4080ebccf1e3SJoseph Koshy 4081ebccf1e3SJoseph Koshy pmc_save_cpu_binding(&pb); 4082ebccf1e3SJoseph Koshy pmc_select_cpu(cpu); 4083ebccf1e3SJoseph Koshy 4084ebccf1e3SJoseph Koshy pc = pmc_pcpu[cpu]; 4085ebccf1e3SJoseph Koshy phw = pc->pc_hwpmcs[ri]; 4086ebccf1e3SJoseph Koshy 4087ebccf1e3SJoseph Koshy /* 4088ebccf1e3SJoseph Koshy * XXX do we need some kind of 'forced' disable? 4089ebccf1e3SJoseph Koshy */ 4090ebccf1e3SJoseph Koshy 4091ebccf1e3SJoseph Koshy if (phw->phw_pmc == NULL) { 4092ebccf1e3SJoseph Koshy if (request == PMC_STATE_DISABLED && 4093ebccf1e3SJoseph Koshy (phw->phw_state & PMC_PHW_FLAG_IS_ENABLED)) { 4094ebccf1e3SJoseph Koshy phw->phw_state &= ~PMC_PHW_FLAG_IS_ENABLED; 4095ebccf1e3SJoseph Koshy PMC_MARK_ROW_STANDALONE(ri); 4096ebccf1e3SJoseph Koshy } else if (request == PMC_STATE_FREE && 4097ebccf1e3SJoseph Koshy (phw->phw_state & PMC_PHW_FLAG_IS_ENABLED) == 0) { 4098ebccf1e3SJoseph Koshy phw->phw_state |= PMC_PHW_FLAG_IS_ENABLED; 4099ebccf1e3SJoseph Koshy PMC_UNMARK_ROW_STANDALONE(ri); 4100ebccf1e3SJoseph Koshy } 4101ebccf1e3SJoseph Koshy /* other cases are a no-op */ 4102ebccf1e3SJoseph Koshy } else 4103ebccf1e3SJoseph Koshy error = EBUSY; 4104ebccf1e3SJoseph Koshy 4105ebccf1e3SJoseph Koshy pmc_restore_cpu_binding(&pb); 4106ebccf1e3SJoseph Koshy } 4107ebccf1e3SJoseph Koshy break; 4108ebccf1e3SJoseph Koshy 4109ebccf1e3SJoseph Koshy 4110ebccf1e3SJoseph Koshy /* 4111ebccf1e3SJoseph Koshy * Allocate a PMC. 4112ebccf1e3SJoseph Koshy */ 4113ebccf1e3SJoseph Koshy case PMC_OP_PMCALLOCATE: 4114ebccf1e3SJoseph Koshy { 4115e829eb6dSJoseph Koshy struct pmc_op_pmcallocate pa; 4116ebccf1e3SJoseph Koshy 4117c514a571SMitchell Horne error = copyin(arg, &pa, sizeof(pa)); 4118c514a571SMitchell Horne if (error != 0) 4119ebccf1e3SJoseph Koshy break; 4120ebccf1e3SJoseph Koshy 4121c514a571SMitchell Horne error = pmc_do_op_pmcallocate(td, &pa); 4122c514a571SMitchell Horne if (error != 0) 4123ebccf1e3SJoseph Koshy break; 4124ebccf1e3SJoseph Koshy 4125ebccf1e3SJoseph Koshy error = copyout(&pa, arg, sizeof(pa)); 4126ebccf1e3SJoseph Koshy } 4127ebccf1e3SJoseph Koshy break; 4128ebccf1e3SJoseph Koshy 4129ebccf1e3SJoseph Koshy /* 4130ebccf1e3SJoseph Koshy * Attach a PMC to a process. 4131ebccf1e3SJoseph Koshy */ 4132ebccf1e3SJoseph Koshy case PMC_OP_PMCATTACH: 4133ebccf1e3SJoseph Koshy { 4134ebccf1e3SJoseph Koshy struct pmc_op_pmcattach a; 4135ebccf1e3SJoseph Koshy 4136a133f642SMitchell Horne error = copyin(arg, &a, sizeof(a)); 4137a133f642SMitchell Horne if (error != 0) 4138ebccf1e3SJoseph Koshy break; 4139ebccf1e3SJoseph Koshy 4140a133f642SMitchell Horne error = pmc_do_op_pmcattach(td, a); 4141ebccf1e3SJoseph Koshy } 4142ebccf1e3SJoseph Koshy break; 4143ebccf1e3SJoseph Koshy 4144ebccf1e3SJoseph Koshy /* 4145ebccf1e3SJoseph Koshy * Detach an attached PMC from a process. 4146ebccf1e3SJoseph Koshy */ 4147ebccf1e3SJoseph Koshy case PMC_OP_PMCDETACH: 4148ebccf1e3SJoseph Koshy { 4149ebccf1e3SJoseph Koshy struct pmc_op_pmcattach a; 4150ebccf1e3SJoseph Koshy 4151a133f642SMitchell Horne error = copyin(arg, &a, sizeof(a)); 4152a133f642SMitchell Horne if (error != 0) 4153ebccf1e3SJoseph Koshy break; 4154ebccf1e3SJoseph Koshy 4155a133f642SMitchell Horne error = pmc_do_op_pmcdetach(td, a); 4156ebccf1e3SJoseph Koshy } 4157ebccf1e3SJoseph Koshy break; 4158ebccf1e3SJoseph Koshy 4159ebccf1e3SJoseph Koshy 4160ebccf1e3SJoseph Koshy /* 4161f263522aSJoseph Koshy * Retrieve the MSR number associated with the counter 4162f263522aSJoseph Koshy * 'pmc_id'. This allows processes to directly use RDPMC 4163f263522aSJoseph Koshy * instructions to read their PMCs, without the overhead of a 4164f263522aSJoseph Koshy * system call. 4165f263522aSJoseph Koshy */ 4166f263522aSJoseph Koshy 4167f263522aSJoseph Koshy case PMC_OP_PMCGETMSR: 4168f263522aSJoseph Koshy { 4169e829eb6dSJoseph Koshy int adjri, ri; 4170f263522aSJoseph Koshy struct pmc *pm; 4171f263522aSJoseph Koshy struct pmc_target *pt; 4172f263522aSJoseph Koshy struct pmc_op_getmsr gm; 4173e829eb6dSJoseph Koshy struct pmc_classdep *pcd; 4174f263522aSJoseph Koshy 4175f263522aSJoseph Koshy PMC_DOWNGRADE_SX(); 4176f263522aSJoseph Koshy 4177f263522aSJoseph Koshy if ((error = copyin(arg, &gm, sizeof(gm))) != 0) 4178f263522aSJoseph Koshy break; 4179f263522aSJoseph Koshy 4180f263522aSJoseph Koshy if ((error = pmc_find_pmc(gm.pm_pmcid, &pm)) != 0) 4181f263522aSJoseph Koshy break; 4182f263522aSJoseph Koshy 4183f263522aSJoseph Koshy /* 4184f263522aSJoseph Koshy * The allocated PMC has to be a process virtual PMC, 4185f263522aSJoseph Koshy * i.e., of type MODE_T[CS]. Global PMCs can only be 4186f263522aSJoseph Koshy * read using the PMCREAD operation since they may be 4187f263522aSJoseph Koshy * allocated on a different CPU than the one we could 4188f263522aSJoseph Koshy * be running on at the time of the RDPMC instruction. 4189f263522aSJoseph Koshy * 4190f263522aSJoseph Koshy * The GETMSR operation is not allowed for PMCs that 4191f263522aSJoseph Koshy * are inherited across processes. 4192f263522aSJoseph Koshy */ 4193f263522aSJoseph Koshy 4194f263522aSJoseph Koshy if (!PMC_IS_VIRTUAL_MODE(PMC_TO_MODE(pm)) || 4195f263522aSJoseph Koshy (pm->pm_flags & PMC_F_DESCENDANTS)) { 4196f263522aSJoseph Koshy error = EINVAL; 4197f263522aSJoseph Koshy break; 4198f263522aSJoseph Koshy } 4199f263522aSJoseph Koshy 4200f263522aSJoseph Koshy /* 4201f263522aSJoseph Koshy * It only makes sense to use a RDPMC (or its 4202f263522aSJoseph Koshy * equivalent instruction on non-x86 architectures) on 4203f263522aSJoseph Koshy * a process that has allocated and attached a PMC to 4204f263522aSJoseph Koshy * itself. Conversely the PMC is only allowed to have 4205f263522aSJoseph Koshy * one process attached to it -- its owner. 4206f263522aSJoseph Koshy */ 4207f263522aSJoseph Koshy 4208f263522aSJoseph Koshy if ((pt = LIST_FIRST(&pm->pm_targets)) == NULL || 4209f263522aSJoseph Koshy LIST_NEXT(pt, pt_next) != NULL || 4210f263522aSJoseph Koshy pt->pt_process->pp_proc != pm->pm_owner->po_owner) { 4211f263522aSJoseph Koshy error = EINVAL; 4212f263522aSJoseph Koshy break; 4213f263522aSJoseph Koshy } 4214f263522aSJoseph Koshy 4215f263522aSJoseph Koshy ri = PMC_TO_ROWINDEX(pm); 4216e829eb6dSJoseph Koshy pcd = pmc_ri_to_classdep(md, ri, &adjri); 4217f263522aSJoseph Koshy 4218e829eb6dSJoseph Koshy /* PMC class has no 'GETMSR' support */ 4219e829eb6dSJoseph Koshy if (pcd->pcd_get_msr == NULL) { 4220e829eb6dSJoseph Koshy error = ENOSYS; 4221e829eb6dSJoseph Koshy break; 4222e829eb6dSJoseph Koshy } 4223e829eb6dSJoseph Koshy 4224e829eb6dSJoseph Koshy if ((error = (*pcd->pcd_get_msr)(adjri, &gm.pm_msr)) < 0) 4225f263522aSJoseph Koshy break; 4226f263522aSJoseph Koshy 4227f263522aSJoseph Koshy if ((error = copyout(&gm, arg, sizeof(gm))) < 0) 4228f263522aSJoseph Koshy break; 4229f263522aSJoseph Koshy 4230f263522aSJoseph Koshy /* 4231f263522aSJoseph Koshy * Mark our process as using MSRs. Update machine 4232f263522aSJoseph Koshy * state using a forced context switch. 4233f263522aSJoseph Koshy */ 4234f263522aSJoseph Koshy 4235f263522aSJoseph Koshy pt->pt_process->pp_flags |= PMC_PP_ENABLE_MSR_ACCESS; 4236f263522aSJoseph Koshy pmc_force_context_switch(); 4237f263522aSJoseph Koshy 4238f263522aSJoseph Koshy } 4239f263522aSJoseph Koshy break; 4240f263522aSJoseph Koshy 4241f263522aSJoseph Koshy /* 4242*f4fac946SMitchell Horne * Release an allocated PMC. 4243ebccf1e3SJoseph Koshy */ 4244ebccf1e3SJoseph Koshy case PMC_OP_PMCRELEASE: 4245ebccf1e3SJoseph Koshy { 4246ebccf1e3SJoseph Koshy struct pmc_op_simple sp; 4247ebccf1e3SJoseph Koshy 4248*f4fac946SMitchell Horne error = copyin(arg, &sp, sizeof(sp)); 4249*f4fac946SMitchell Horne if (error != 0) 4250ebccf1e3SJoseph Koshy break; 4251ebccf1e3SJoseph Koshy 4252*f4fac946SMitchell Horne error = pmc_do_op_pmcrelease(sp.pm_pmcid); 4253ebccf1e3SJoseph Koshy } 4254ebccf1e3SJoseph Koshy break; 4255ebccf1e3SJoseph Koshy 4256ebccf1e3SJoseph Koshy 4257ebccf1e3SJoseph Koshy /* 4258ebccf1e3SJoseph Koshy * Read and/or write a PMC. 4259ebccf1e3SJoseph Koshy */ 4260ebccf1e3SJoseph Koshy 4261ebccf1e3SJoseph Koshy case PMC_OP_PMCRW: 4262ebccf1e3SJoseph Koshy { 4263e829eb6dSJoseph Koshy int adjri; 4264ebccf1e3SJoseph Koshy struct pmc *pm; 4265e829eb6dSJoseph Koshy uint32_t cpu, ri; 4266ebccf1e3SJoseph Koshy pmc_value_t oldvalue; 4267e829eb6dSJoseph Koshy struct pmc_binding pb; 4268e829eb6dSJoseph Koshy struct pmc_op_pmcrw prw; 4269e829eb6dSJoseph Koshy struct pmc_classdep *pcd; 4270e829eb6dSJoseph Koshy struct pmc_op_pmcrw *pprw; 4271ebccf1e3SJoseph Koshy 4272ebccf1e3SJoseph Koshy PMC_DOWNGRADE_SX(); 4273ebccf1e3SJoseph Koshy 4274ebccf1e3SJoseph Koshy if ((error = copyin(arg, &prw, sizeof(prw))) != 0) 4275ebccf1e3SJoseph Koshy break; 4276ebccf1e3SJoseph Koshy 42774a3690dfSJohn Baldwin PMCDBG2(PMC,OPS,1, "rw id=%d flags=0x%x", prw.pm_pmcid, 4278ebccf1e3SJoseph Koshy prw.pm_flags); 4279ebccf1e3SJoseph Koshy 4280ebccf1e3SJoseph Koshy /* must have at least one flag set */ 4281ebccf1e3SJoseph Koshy if ((prw.pm_flags & (PMC_F_OLDVALUE|PMC_F_NEWVALUE)) == 0) { 4282ebccf1e3SJoseph Koshy error = EINVAL; 4283ebccf1e3SJoseph Koshy break; 4284ebccf1e3SJoseph Koshy } 4285ebccf1e3SJoseph Koshy 4286ebccf1e3SJoseph Koshy /* locate pmc descriptor */ 4287ebccf1e3SJoseph Koshy if ((error = pmc_find_pmc(prw.pm_pmcid, &pm)) != 0) 4288ebccf1e3SJoseph Koshy break; 4289ebccf1e3SJoseph Koshy 4290ebccf1e3SJoseph Koshy /* Can't read a PMC that hasn't been started. */ 4291ebccf1e3SJoseph Koshy if (pm->pm_state != PMC_STATE_ALLOCATED && 4292ebccf1e3SJoseph Koshy pm->pm_state != PMC_STATE_STOPPED && 4293ebccf1e3SJoseph Koshy pm->pm_state != PMC_STATE_RUNNING) { 4294ebccf1e3SJoseph Koshy error = EINVAL; 4295ebccf1e3SJoseph Koshy break; 4296ebccf1e3SJoseph Koshy } 4297ebccf1e3SJoseph Koshy 4298ebccf1e3SJoseph Koshy /* writing a new value is allowed only for 'STOPPED' pmcs */ 4299ebccf1e3SJoseph Koshy if (pm->pm_state == PMC_STATE_RUNNING && 4300ebccf1e3SJoseph Koshy (prw.pm_flags & PMC_F_NEWVALUE)) { 4301ebccf1e3SJoseph Koshy error = EBUSY; 4302ebccf1e3SJoseph Koshy break; 4303ebccf1e3SJoseph Koshy } 4304ebccf1e3SJoseph Koshy 4305c5153e19SJoseph Koshy if (PMC_IS_VIRTUAL_MODE(PMC_TO_MODE(pm))) { 4306ebccf1e3SJoseph Koshy 4307c5153e19SJoseph Koshy /* 4308c5153e19SJoseph Koshy * If this PMC is attached to its owner (i.e., 4309c5153e19SJoseph Koshy * the process requesting this operation) and 4310c5153e19SJoseph Koshy * is running, then attempt to get an 4311c5153e19SJoseph Koshy * upto-date reading from hardware for a READ. 4312c5153e19SJoseph Koshy * Writes are only allowed when the PMC is 4313c5153e19SJoseph Koshy * stopped, so only update the saved value 4314c5153e19SJoseph Koshy * field. 4315c5153e19SJoseph Koshy * 4316c5153e19SJoseph Koshy * If the PMC is not running, or is not 4317c5153e19SJoseph Koshy * attached to its owner, read/write to the 4318c5153e19SJoseph Koshy * savedvalue field. 4319c5153e19SJoseph Koshy */ 4320c5153e19SJoseph Koshy 4321c5153e19SJoseph Koshy ri = PMC_TO_ROWINDEX(pm); 4322e829eb6dSJoseph Koshy pcd = pmc_ri_to_classdep(md, ri, &adjri); 4323c5153e19SJoseph Koshy 4324ebccf1e3SJoseph Koshy mtx_pool_lock_spin(pmc_mtxpool, pm); 4325c5153e19SJoseph Koshy cpu = curthread->td_oncpu; 4326c5153e19SJoseph Koshy 4327c5153e19SJoseph Koshy if (prw.pm_flags & PMC_F_OLDVALUE) { 4328c5153e19SJoseph Koshy if ((pm->pm_flags & PMC_F_ATTACHED_TO_OWNER) && 4329c5153e19SJoseph Koshy (pm->pm_state == PMC_STATE_RUNNING)) 4330e829eb6dSJoseph Koshy error = (*pcd->pcd_read_pmc)(cpu, adjri, 433139f92a76SMitchell Horne pm, &oldvalue); 4332c5153e19SJoseph Koshy else 4333ebccf1e3SJoseph Koshy oldvalue = pm->pm_gv.pm_savedvalue; 4334c5153e19SJoseph Koshy } 4335ebccf1e3SJoseph Koshy if (prw.pm_flags & PMC_F_NEWVALUE) 4336ebccf1e3SJoseph Koshy pm->pm_gv.pm_savedvalue = prw.pm_value; 4337c5153e19SJoseph Koshy 4338ebccf1e3SJoseph Koshy mtx_pool_unlock_spin(pmc_mtxpool, pm); 4339ebccf1e3SJoseph Koshy 4340ebccf1e3SJoseph Koshy } else { /* System mode PMCs */ 4341c5153e19SJoseph Koshy cpu = PMC_TO_CPU(pm); 4342c5153e19SJoseph Koshy ri = PMC_TO_ROWINDEX(pm); 4343e829eb6dSJoseph Koshy pcd = pmc_ri_to_classdep(md, ri, &adjri); 4344ebccf1e3SJoseph Koshy 4345122ccdc1SJoseph Koshy if (!pmc_cpu_is_active(cpu)) { 4346ebccf1e3SJoseph Koshy error = ENXIO; 4347ebccf1e3SJoseph Koshy break; 4348ebccf1e3SJoseph Koshy } 4349ebccf1e3SJoseph Koshy 4350ebccf1e3SJoseph Koshy /* move this thread to CPU 'cpu' */ 4351ebccf1e3SJoseph Koshy pmc_save_cpu_binding(&pb); 4352ebccf1e3SJoseph Koshy pmc_select_cpu(cpu); 4353ebccf1e3SJoseph Koshy 4354c5153e19SJoseph Koshy critical_enter(); 4355ebccf1e3SJoseph Koshy /* save old value */ 435639f92a76SMitchell Horne if (prw.pm_flags & PMC_F_OLDVALUE) { 4357e829eb6dSJoseph Koshy if ((error = (*pcd->pcd_read_pmc)(cpu, adjri, 435839f92a76SMitchell Horne pm, &oldvalue))) 4359ebccf1e3SJoseph Koshy goto error; 436039f92a76SMitchell Horne } 4361ebccf1e3SJoseph Koshy /* write out new value */ 4362ebccf1e3SJoseph Koshy if (prw.pm_flags & PMC_F_NEWVALUE) 436339f92a76SMitchell Horne error = (*pcd->pcd_write_pmc)(cpu, adjri, pm, 4364ebccf1e3SJoseph Koshy prw.pm_value); 4365ebccf1e3SJoseph Koshy error: 4366c5153e19SJoseph Koshy critical_exit(); 4367ebccf1e3SJoseph Koshy pmc_restore_cpu_binding(&pb); 4368ebccf1e3SJoseph Koshy if (error) 4369ebccf1e3SJoseph Koshy break; 4370ebccf1e3SJoseph Koshy } 4371ebccf1e3SJoseph Koshy 4372ebccf1e3SJoseph Koshy pprw = (struct pmc_op_pmcrw *) arg; 4373ebccf1e3SJoseph Koshy 4374680f1afdSJohn Baldwin #ifdef HWPMC_DEBUG 4375ebccf1e3SJoseph Koshy if (prw.pm_flags & PMC_F_NEWVALUE) 43764a3690dfSJohn Baldwin PMCDBG3(PMC,OPS,2, "rw id=%d new %jx -> old %jx", 4377ebccf1e3SJoseph Koshy ri, prw.pm_value, oldvalue); 43789d0a2685SJoseph Koshy else if (prw.pm_flags & PMC_F_OLDVALUE) 43794a3690dfSJohn Baldwin PMCDBG2(PMC,OPS,2, "rw id=%d -> old %jx", ri, oldvalue); 4380ebccf1e3SJoseph Koshy #endif 4381ebccf1e3SJoseph Koshy /* return old value if requested */ 4382ebccf1e3SJoseph Koshy if (prw.pm_flags & PMC_F_OLDVALUE) 4383ebccf1e3SJoseph Koshy if ((error = copyout(&oldvalue, &pprw->pm_value, 4384ebccf1e3SJoseph Koshy sizeof(prw.pm_value)))) 4385ebccf1e3SJoseph Koshy break; 4386ebccf1e3SJoseph Koshy } 4387ebccf1e3SJoseph Koshy break; 4388ebccf1e3SJoseph Koshy 4389ebccf1e3SJoseph Koshy 4390ebccf1e3SJoseph Koshy /* 4391ebccf1e3SJoseph Koshy * Set the sampling rate for a sampling mode PMC and the 4392ebccf1e3SJoseph Koshy * initial count for a counting mode PMC. 4393ebccf1e3SJoseph Koshy */ 4394ebccf1e3SJoseph Koshy 4395ebccf1e3SJoseph Koshy case PMC_OP_PMCSETCOUNT: 4396ebccf1e3SJoseph Koshy { 4397ebccf1e3SJoseph Koshy struct pmc *pm; 4398ebccf1e3SJoseph Koshy struct pmc_op_pmcsetcount sc; 4399ebccf1e3SJoseph Koshy 4400ebccf1e3SJoseph Koshy PMC_DOWNGRADE_SX(); 4401ebccf1e3SJoseph Koshy 4402ebccf1e3SJoseph Koshy if ((error = copyin(arg, &sc, sizeof(sc))) != 0) 4403ebccf1e3SJoseph Koshy break; 4404ebccf1e3SJoseph Koshy 4405ebccf1e3SJoseph Koshy if ((error = pmc_find_pmc(sc.pm_pmcid, &pm)) != 0) 4406ebccf1e3SJoseph Koshy break; 4407ebccf1e3SJoseph Koshy 4408ebccf1e3SJoseph Koshy if (pm->pm_state == PMC_STATE_RUNNING) { 4409ebccf1e3SJoseph Koshy error = EBUSY; 4410ebccf1e3SJoseph Koshy break; 4411ebccf1e3SJoseph Koshy } 4412ebccf1e3SJoseph Koshy 44130204d85aSMatt Macy if (PMC_IS_SAMPLING_MODE(PMC_TO_MODE(pm))) { 44140204d85aSMatt Macy /* 4415ca341f3cSJohn Baldwin * Don't permit requested sample rate to be 4416ca341f3cSJohn Baldwin * less than pmc_mincount. 44170204d85aSMatt Macy */ 4418ca341f3cSJohn Baldwin if (sc.pm_count < MAX(1, pmc_mincount)) 4419ca341f3cSJohn Baldwin log(LOG_WARNING, "pmcsetcount: passed sample " 4420ca341f3cSJohn Baldwin "rate %ju - setting to %u\n", 4421ca341f3cSJohn Baldwin (uintmax_t)sc.pm_count, 4422ca341f3cSJohn Baldwin MAX(1, pmc_mincount)); 4423ca341f3cSJohn Baldwin pm->pm_sc.pm_reloadcount = MAX(MAX(1, pmc_mincount), 4424ca341f3cSJohn Baldwin sc.pm_count); 44250204d85aSMatt Macy } else 4426ebccf1e3SJoseph Koshy pm->pm_sc.pm_initial = sc.pm_count; 4427ebccf1e3SJoseph Koshy } 4428ebccf1e3SJoseph Koshy break; 4429ebccf1e3SJoseph Koshy 4430ebccf1e3SJoseph Koshy 4431ebccf1e3SJoseph Koshy /* 4432ebccf1e3SJoseph Koshy * Start a PMC. 4433ebccf1e3SJoseph Koshy */ 4434ebccf1e3SJoseph Koshy 4435ebccf1e3SJoseph Koshy case PMC_OP_PMCSTART: 4436ebccf1e3SJoseph Koshy { 4437ebccf1e3SJoseph Koshy pmc_id_t pmcid; 4438ebccf1e3SJoseph Koshy struct pmc *pm; 4439ebccf1e3SJoseph Koshy struct pmc_op_simple sp; 4440ebccf1e3SJoseph Koshy 4441ebccf1e3SJoseph Koshy sx_assert(&pmc_sx, SX_XLOCKED); 4442ebccf1e3SJoseph Koshy 4443ebccf1e3SJoseph Koshy if ((error = copyin(arg, &sp, sizeof(sp))) != 0) 4444ebccf1e3SJoseph Koshy break; 4445ebccf1e3SJoseph Koshy 4446ebccf1e3SJoseph Koshy pmcid = sp.pm_pmcid; 4447ebccf1e3SJoseph Koshy 4448ebccf1e3SJoseph Koshy if ((error = pmc_find_pmc(pmcid, &pm)) != 0) 4449ebccf1e3SJoseph Koshy break; 4450ebccf1e3SJoseph Koshy 4451c5153e19SJoseph Koshy KASSERT(pmcid == pm->pm_id, 4452c5153e19SJoseph Koshy ("[pmc,%d] pmcid %x != id %x", __LINE__, 4453c5153e19SJoseph Koshy pm->pm_id, pmcid)); 4454ebccf1e3SJoseph Koshy 4455ebccf1e3SJoseph Koshy if (pm->pm_state == PMC_STATE_RUNNING) /* already running */ 4456ebccf1e3SJoseph Koshy break; 4457ebccf1e3SJoseph Koshy else if (pm->pm_state != PMC_STATE_STOPPED && 4458ebccf1e3SJoseph Koshy pm->pm_state != PMC_STATE_ALLOCATED) { 4459ebccf1e3SJoseph Koshy error = EINVAL; 4460ebccf1e3SJoseph Koshy break; 4461ebccf1e3SJoseph Koshy } 4462ebccf1e3SJoseph Koshy 4463ebccf1e3SJoseph Koshy error = pmc_start(pm); 4464ebccf1e3SJoseph Koshy } 4465ebccf1e3SJoseph Koshy break; 4466ebccf1e3SJoseph Koshy 4467ebccf1e3SJoseph Koshy 4468ebccf1e3SJoseph Koshy /* 4469ebccf1e3SJoseph Koshy * Stop a PMC. 4470ebccf1e3SJoseph Koshy */ 4471ebccf1e3SJoseph Koshy 4472ebccf1e3SJoseph Koshy case PMC_OP_PMCSTOP: 4473ebccf1e3SJoseph Koshy { 4474ebccf1e3SJoseph Koshy pmc_id_t pmcid; 4475ebccf1e3SJoseph Koshy struct pmc *pm; 4476ebccf1e3SJoseph Koshy struct pmc_op_simple sp; 4477ebccf1e3SJoseph Koshy 4478ebccf1e3SJoseph Koshy PMC_DOWNGRADE_SX(); 4479ebccf1e3SJoseph Koshy 4480ebccf1e3SJoseph Koshy if ((error = copyin(arg, &sp, sizeof(sp))) != 0) 4481ebccf1e3SJoseph Koshy break; 4482ebccf1e3SJoseph Koshy 4483ebccf1e3SJoseph Koshy pmcid = sp.pm_pmcid; 4484ebccf1e3SJoseph Koshy 4485ebccf1e3SJoseph Koshy /* 4486ebccf1e3SJoseph Koshy * Mark the PMC as inactive and invoke the MD stop 4487ebccf1e3SJoseph Koshy * routines if needed. 4488ebccf1e3SJoseph Koshy */ 4489ebccf1e3SJoseph Koshy 4490ebccf1e3SJoseph Koshy if ((error = pmc_find_pmc(pmcid, &pm)) != 0) 4491ebccf1e3SJoseph Koshy break; 4492ebccf1e3SJoseph Koshy 4493c5153e19SJoseph Koshy KASSERT(pmcid == pm->pm_id, 4494c5153e19SJoseph Koshy ("[pmc,%d] pmc id %x != pmcid %x", __LINE__, 4495c5153e19SJoseph Koshy pm->pm_id, pmcid)); 4496ebccf1e3SJoseph Koshy 4497ebccf1e3SJoseph Koshy if (pm->pm_state == PMC_STATE_STOPPED) /* already stopped */ 4498ebccf1e3SJoseph Koshy break; 4499ebccf1e3SJoseph Koshy else if (pm->pm_state != PMC_STATE_RUNNING) { 4500ebccf1e3SJoseph Koshy error = EINVAL; 4501ebccf1e3SJoseph Koshy break; 4502ebccf1e3SJoseph Koshy } 4503ebccf1e3SJoseph Koshy 4504ebccf1e3SJoseph Koshy error = pmc_stop(pm); 4505ebccf1e3SJoseph Koshy } 4506ebccf1e3SJoseph Koshy break; 4507ebccf1e3SJoseph Koshy 4508ebccf1e3SJoseph Koshy 4509ebccf1e3SJoseph Koshy /* 4510fbf1556dSJoseph Koshy * Write a user supplied value to the log file. 4511ebccf1e3SJoseph Koshy */ 4512ebccf1e3SJoseph Koshy 4513ebccf1e3SJoseph Koshy case PMC_OP_WRITELOG: 4514ebccf1e3SJoseph Koshy { 4515f263522aSJoseph Koshy struct pmc_op_writelog wl; 4516f263522aSJoseph Koshy struct pmc_owner *po; 4517ebccf1e3SJoseph Koshy 4518ebccf1e3SJoseph Koshy PMC_DOWNGRADE_SX(); 4519ebccf1e3SJoseph Koshy 4520f263522aSJoseph Koshy if ((error = copyin(arg, &wl, sizeof(wl))) != 0) 4521ebccf1e3SJoseph Koshy break; 4522ebccf1e3SJoseph Koshy 4523f263522aSJoseph Koshy if ((po = pmc_find_owner_descriptor(td->td_proc)) == NULL) { 4524ebccf1e3SJoseph Koshy error = EINVAL; 4525ebccf1e3SJoseph Koshy break; 4526ebccf1e3SJoseph Koshy } 4527ebccf1e3SJoseph Koshy 4528f263522aSJoseph Koshy if ((po->po_flags & PMC_PO_OWNS_LOGFILE) == 0) { 4529c5153e19SJoseph Koshy error = EINVAL; 4530c5153e19SJoseph Koshy break; 4531c5153e19SJoseph Koshy } 4532c5153e19SJoseph Koshy 4533f263522aSJoseph Koshy error = pmclog_process_userlog(po, &wl); 4534ebccf1e3SJoseph Koshy } 4535ebccf1e3SJoseph Koshy break; 4536f263522aSJoseph Koshy 4537ebccf1e3SJoseph Koshy 4538ebccf1e3SJoseph Koshy default: 4539ebccf1e3SJoseph Koshy error = EINVAL; 4540ebccf1e3SJoseph Koshy break; 4541ebccf1e3SJoseph Koshy } 4542ebccf1e3SJoseph Koshy 4543ebccf1e3SJoseph Koshy if (is_sx_downgraded) 4544ebccf1e3SJoseph Koshy sx_sunlock(&pmc_sx); 4545ebccf1e3SJoseph Koshy else 4546ebccf1e3SJoseph Koshy sx_xunlock(&pmc_sx); 454720b555e1SKonstantin Belousov done_syscall: 4548ebccf1e3SJoseph Koshy if (error) 4549e6b475e0SMatt Macy counter_u64_add(pmc_stats.pm_syscall_errors, 1); 4550ebccf1e3SJoseph Koshy 4551cf9ef806SKonstantin Belousov return (error); 4552ebccf1e3SJoseph Koshy } 4553ebccf1e3SJoseph Koshy 4554ebccf1e3SJoseph Koshy /* 4555ebccf1e3SJoseph Koshy * Helper functions 4556ebccf1e3SJoseph Koshy */ 4557ebccf1e3SJoseph Koshy 4558ebccf1e3SJoseph Koshy /* 4559d07f36b0SJoseph Koshy * Mark the thread as needing callchain capture and post an AST. The 4560d07f36b0SJoseph Koshy * actual callchain capture will be done in a context where it is safe 4561d07f36b0SJoseph Koshy * to take page faults. 4562d07f36b0SJoseph Koshy */ 4563d07f36b0SJoseph Koshy static void 45646fe00c78SJoseph Koshy pmc_post_callchain_callback(void) 4565d07f36b0SJoseph Koshy { 4566d07f36b0SJoseph Koshy struct thread *td; 4567d07f36b0SJoseph Koshy 4568d07f36b0SJoseph Koshy td = curthread; 4569d07f36b0SJoseph Koshy 45700e031404SFabien Thomas /* 45710e031404SFabien Thomas * If there is multiple PMCs for the same interrupt ignore new post 45720e031404SFabien Thomas */ 4573d5ee4074SMitchell Horne if ((td->td_pflags & TDP_CALLCHAIN) != 0) 45740e031404SFabien Thomas return; 45756fe00c78SJoseph Koshy 4576d07f36b0SJoseph Koshy /* 45776fe00c78SJoseph Koshy * Mark this thread as needing callchain capture. 45786fe00c78SJoseph Koshy * `td->td_pflags' will be safe to touch because this thread 45796fe00c78SJoseph Koshy * was in user space when it was interrupted. 4580d07f36b0SJoseph Koshy */ 4581d07f36b0SJoseph Koshy td->td_pflags |= TDP_CALLCHAIN; 4582d07f36b0SJoseph Koshy 4583d07f36b0SJoseph Koshy /* 45846fe00c78SJoseph Koshy * Don't let this thread migrate between CPUs until callchain 45856fe00c78SJoseph Koshy * capture completes. 4586d07f36b0SJoseph Koshy */ 45876fe00c78SJoseph Koshy sched_pin(); 4588d07f36b0SJoseph Koshy 4589d07f36b0SJoseph Koshy return; 4590d07f36b0SJoseph Koshy } 4591d07f36b0SJoseph Koshy 4592d07f36b0SJoseph Koshy /* 4593d07f36b0SJoseph Koshy * Find a free slot in the per-cpu array of samples and capture the 4594d07f36b0SJoseph Koshy * current callchain there. If a sample was successfully added, a bit 4595d07f36b0SJoseph Koshy * is set in mask 'pmc_cpumask' denoting that the DO_SAMPLES hook 4596d07f36b0SJoseph Koshy * needs to be invoked from the clock handler. 4597f263522aSJoseph Koshy * 4598f263522aSJoseph Koshy * This function is meant to be called from an NMI handler. It cannot 4599f263522aSJoseph Koshy * use any of the locking primitives supplied by the OS. 4600ebccf1e3SJoseph Koshy */ 46015de96e33SMatt Macy static int 4602d9f1b8dbSMatt Macy pmc_add_sample(ring_type_t ring, struct pmc *pm, struct trapframe *tf) 4603ebccf1e3SJoseph Koshy { 4604f263522aSJoseph Koshy struct pmc_sample *ps; 4605f263522aSJoseph Koshy struct pmc_samplebuffer *psb; 460601c35b67SMitchell Horne struct thread *td; 460701c35b67SMitchell Horne int error, cpu, callchaindepth; 460801c35b67SMitchell Horne bool inuserspace; 4609ebccf1e3SJoseph Koshy 4610f263522aSJoseph Koshy error = 0; 4611ebccf1e3SJoseph Koshy 4612d07f36b0SJoseph Koshy /* 4613d07f36b0SJoseph Koshy * Allocate space for a sample buffer. 4614d07f36b0SJoseph Koshy */ 4615eb7c9019SMatt Macy cpu = curcpu; 4616f5f9340bSFabien Thomas psb = pmc_pcpu[cpu]->pc_sb[ring]; 4617eb7c9019SMatt Macy inuserspace = TRAPF_USERMODE(tf); 4618d9f1b8dbSMatt Macy ps = PMC_PROD_SAMPLE(psb); 4619d9f1b8dbSMatt Macy if (psb->ps_considx != psb->ps_prodidx && 4620d9f1b8dbSMatt Macy ps->ps_nsamples) { /* in use, reader hasn't caught up */ 4621e6b475e0SMatt Macy pm->pm_pcpu_state[cpu].pps_stalled = 1; 4622e6b475e0SMatt Macy counter_u64_add(pmc_stats.pm_intr_bufferfull, 1); 46234a3690dfSJohn Baldwin PMCDBG6(SAM,INT,1,"(spc) cpu=%d pm=%p tf=%p um=%d wr=%d rd=%d", 462401c35b67SMitchell Horne cpu, pm, tf, inuserspace, 4625d9f1b8dbSMatt Macy (int)(psb->ps_prodidx & pmc_sample_mask), 4626d9f1b8dbSMatt Macy (int)(psb->ps_considx & pmc_sample_mask)); 4627c66ea2eeSJonathan T. Looney callchaindepth = 1; 4628f263522aSJoseph Koshy error = ENOMEM; 4629f263522aSJoseph Koshy goto done; 4630ebccf1e3SJoseph Koshy } 4631ebccf1e3SJoseph Koshy 4632d07f36b0SJoseph Koshy /* Fill in entry. */ 4633693cd307SMitchell Horne PMCDBG6(SAM,INT,1,"cpu=%d pm=%p tf=%p um=%d wr=%d rd=%d", cpu, pm, tf, 4634693cd307SMitchell Horne inuserspace, (int)(psb->ps_prodidx & pmc_sample_mask), 4635d9f1b8dbSMatt Macy (int)(psb->ps_considx & pmc_sample_mask)); 4636f5f9340bSFabien Thomas 4637cf823003SMatt Macy td = curthread; 4638f263522aSJoseph Koshy ps->ps_pmc = pm; 46396fe00c78SJoseph Koshy ps->ps_td = td; 4640cf823003SMatt Macy ps->ps_pid = td->td_proc->p_pid; 4641cf823003SMatt Macy ps->ps_tid = td->td_tid; 4642f992dd4bSMatt Macy ps->ps_tsc = pmc_rdtsc(); 4643d9f1b8dbSMatt Macy ps->ps_ticks = ticks; 4644cf823003SMatt Macy ps->ps_cpu = cpu; 4645d07f36b0SJoseph Koshy ps->ps_flags = inuserspace ? PMC_CC_F_USERSPACE : 0; 4646d07f36b0SJoseph Koshy 4647d07f36b0SJoseph Koshy callchaindepth = (pm->pm_flags & PMC_F_CALLCHAIN) ? 4648d07f36b0SJoseph Koshy pmc_callchaindepth : 1; 4649d07f36b0SJoseph Koshy 4650d9f1b8dbSMatt Macy MPASS(ps->ps_pc != NULL); 4651d5ee4074SMitchell Horne if (callchaindepth == 1) { 4652d07f36b0SJoseph Koshy ps->ps_pc[0] = PMC_TRAPFRAME_TO_PC(tf); 4653d5ee4074SMitchell Horne } else { 4654d07f36b0SJoseph Koshy /* 465501c35b67SMitchell Horne * Kernel stack traversals can be done immediately, while we 465601c35b67SMitchell Horne * defer to an AST for user space traversals. 4657d07f36b0SJoseph Koshy */ 4658f5f9340bSFabien Thomas if (!inuserspace) { 4659693cd307SMitchell Horne callchaindepth = pmc_save_kernel_callchain(ps->ps_pc, 4660d07f36b0SJoseph Koshy callchaindepth, tf); 4661f5f9340bSFabien Thomas } else { 46626fe00c78SJoseph Koshy pmc_post_callchain_callback(); 4663d9f1b8dbSMatt Macy callchaindepth = PMC_USER_CALLCHAIN_PENDING; 4664d07f36b0SJoseph Koshy } 4665d07f36b0SJoseph Koshy } 4666d07f36b0SJoseph Koshy 4667d5ee4074SMitchell Horne ps->ps_nsamples = callchaindepth; /* mark entry as in-use */ 46685de96e33SMatt Macy if (ring == PMC_UR) { 4669d5ee4074SMitchell Horne ps->ps_nsamples_actual = callchaindepth; 4670d9f1b8dbSMatt Macy ps->ps_nsamples = PMC_USER_CALLCHAIN_PENDING; 4671d5ee4074SMitchell Horne } 4672f263522aSJoseph Koshy 4673d9f1b8dbSMatt Macy KASSERT(counter_u64_fetch(pm->pm_runcount) >= 0, 467401c35b67SMitchell Horne ("[pmc,%d] pm=%p runcount %ju", __LINE__, pm, 467501c35b67SMitchell Horne (uintmax_t)counter_u64_fetch(pm->pm_runcount))); 4676d9f1b8dbSMatt Macy 4677d9f1b8dbSMatt Macy counter_u64_add(pm->pm_runcount, 1); /* hold onto PMC */ 4678d9f1b8dbSMatt Macy /* increment write pointer */ 4679d9f1b8dbSMatt Macy psb->ps_prodidx++; 4680f263522aSJoseph Koshy done: 4681f263522aSJoseph Koshy /* mark CPU as needing processing */ 4682d9f1b8dbSMatt Macy if (callchaindepth != PMC_USER_CALLCHAIN_PENDING) 4683e6b475e0SMatt Macy DPCPU_SET(pmc_sampled, 1); 4684f263522aSJoseph Koshy 4685d07f36b0SJoseph Koshy return (error); 4686d07f36b0SJoseph Koshy } 4687d07f36b0SJoseph Koshy 4688d07f36b0SJoseph Koshy /* 46895de96e33SMatt Macy * Interrupt processing. 46905de96e33SMatt Macy * 469101c35b67SMitchell Horne * This function may be called from an NMI handler. It cannot use any of the 469201c35b67SMitchell Horne * locking primitives supplied by the OS. 46935de96e33SMatt Macy */ 46945de96e33SMatt Macy int 4695eb7c9019SMatt Macy pmc_process_interrupt(int ring, struct pmc *pm, struct trapframe *tf) 46965de96e33SMatt Macy { 46975de96e33SMatt Macy struct thread *td; 46985de96e33SMatt Macy 46995de96e33SMatt Macy td = curthread; 47005de96e33SMatt Macy if ((pm->pm_flags & PMC_F_USERCALLCHAIN) && 4701d5ee4074SMitchell Horne (td->td_proc->p_flag & P_KPROC) == 0 && !TRAPF_USERMODE(tf)) { 4702a9336cefSMark Johnston atomic_add_int(&td->td_pmcpend, 1); 4703eb7c9019SMatt Macy return (pmc_add_sample(PMC_UR, pm, tf)); 47045de96e33SMatt Macy } 4705eb7c9019SMatt Macy return (pmc_add_sample(ring, pm, tf)); 47065de96e33SMatt Macy } 47075de96e33SMatt Macy 47085de96e33SMatt Macy /* 4709d07f36b0SJoseph Koshy * Capture a user call chain. This function will be called from ast() 4710d07f36b0SJoseph Koshy * before control returns to userland and before the process gets 4711d07f36b0SJoseph Koshy * rescheduled. 4712d07f36b0SJoseph Koshy */ 4713d07f36b0SJoseph Koshy static void 4714f5f9340bSFabien Thomas pmc_capture_user_callchain(int cpu, int ring, struct trapframe *tf) 4715d07f36b0SJoseph Koshy { 4716d07f36b0SJoseph Koshy struct pmc *pm; 4717d9f1b8dbSMatt Macy struct pmc_sample *ps; 4718d07f36b0SJoseph Koshy struct pmc_samplebuffer *psb; 471901c35b67SMitchell Horne struct thread *td; 4720d9f1b8dbSMatt Macy uint64_t considx, prodidx; 4721d9f1b8dbSMatt Macy int nsamples, nrecords, pass, iter; 472201c35b67SMitchell Horne int start_ticks __diagused; 472301c35b67SMitchell Horne 4724f5f9340bSFabien Thomas psb = pmc_pcpu[cpu]->pc_sb[ring]; 47256fe00c78SJoseph Koshy td = curthread; 472601c35b67SMitchell Horne nrecords = INT_MAX; 472701c35b67SMitchell Horne pass = 0; 472801c35b67SMitchell Horne start_ticks = ticks; 47296fe00c78SJoseph Koshy 47306fe00c78SJoseph Koshy KASSERT(td->td_pflags & TDP_CALLCHAIN, 47316fe00c78SJoseph Koshy ("[pmc,%d] Retrieving callchain for thread that doesn't want it", 47326fe00c78SJoseph Koshy __LINE__)); 47335de96e33SMatt Macy restart: 47345de96e33SMatt Macy if (ring == PMC_UR) 47355de96e33SMatt Macy nrecords = atomic_readandclear_32(&td->td_pmcpend); 4736d07f36b0SJoseph Koshy 4737d9f1b8dbSMatt Macy for (iter = 0, considx = psb->ps_considx, prodidx = psb->ps_prodidx; 4738d9f1b8dbSMatt Macy considx < prodidx && iter < pmc_nsamples; considx++, iter++) { 4739d9f1b8dbSMatt Macy ps = PMC_CONS_SAMPLE_OFF(psb, considx); 4740d9f1b8dbSMatt Macy 4741d07f36b0SJoseph Koshy /* 474201c35b67SMitchell Horne * Iterate through all deferred callchain requests. Walk from 474301c35b67SMitchell Horne * the current read pointer to the current write pointer. 4744d07f36b0SJoseph Koshy */ 47457bc7e3cdSAndrew Turner #ifdef INVARIANTS 47465de96e33SMatt Macy if (ps->ps_nsamples == PMC_SAMPLE_FREE) { 4747d9f1b8dbSMatt Macy continue; 47485de96e33SMatt Macy } 47497bc7e3cdSAndrew Turner #endif 4750d9f1b8dbSMatt Macy if (ps->ps_td != td || 47511bb4eefaSMatt Macy ps->ps_nsamples != PMC_USER_CALLCHAIN_PENDING || 4752d9f1b8dbSMatt Macy ps->ps_pmc->pm_state != PMC_STATE_RUNNING) 4753d9f1b8dbSMatt Macy continue; 47546fe00c78SJoseph Koshy 47556fe00c78SJoseph Koshy KASSERT(ps->ps_cpu == cpu, 47566fe00c78SJoseph Koshy ("[pmc,%d] cpu mismatch ps_cpu=%d pcpu=%d", __LINE__, 47576fe00c78SJoseph Koshy ps->ps_cpu, PCPU_GET(cpuid))); 4758d07f36b0SJoseph Koshy 4759d07f36b0SJoseph Koshy pm = ps->ps_pmc; 4760d07f36b0SJoseph Koshy KASSERT(pm->pm_flags & PMC_F_CALLCHAIN, 4761d07f36b0SJoseph Koshy ("[pmc,%d] Retrieving callchain for PMC that doesn't " 4762d07f36b0SJoseph Koshy "want it", __LINE__)); 4763e6b475e0SMatt Macy KASSERT(counter_u64_fetch(pm->pm_runcount) > 0, 476401c35b67SMitchell Horne ("[pmc,%d] runcount %ju", __LINE__, 476501c35b67SMitchell Horne (uintmax_t)counter_u64_fetch(pm->pm_runcount))); 47666fe00c78SJoseph Koshy 47675de96e33SMatt Macy if (ring == PMC_UR) { 47685de96e33SMatt Macy nsamples = ps->ps_nsamples_actual; 47695de96e33SMatt Macy counter_u64_add(pmc_stats.pm_merges, 1); 47705de96e33SMatt Macy } else 47715de96e33SMatt Macy nsamples = 0; 47725de96e33SMatt Macy 4773d07f36b0SJoseph Koshy /* 4774d07f36b0SJoseph Koshy * Retrieve the callchain and mark the sample buffer 4775d07f36b0SJoseph Koshy * as 'processable' by the timer tick sweep code. 4776d07f36b0SJoseph Koshy */ 47775de96e33SMatt Macy if (__predict_true(nsamples < pmc_callchaindepth - 1)) 47785de96e33SMatt Macy nsamples += pmc_save_user_callchain(ps->ps_pc + nsamples, 47795de96e33SMatt Macy pmc_callchaindepth - nsamples - 1, tf); 4780d9f1b8dbSMatt Macy 4781d9f1b8dbSMatt Macy /* 4782d9f1b8dbSMatt Macy * We have to prevent hardclock from potentially overwriting 4783d9f1b8dbSMatt Macy * this sample between when we read the value and when we set 478401c35b67SMitchell Horne * it. 4785d9f1b8dbSMatt Macy */ 4786d9f1b8dbSMatt Macy spinlock_enter(); 4787693cd307SMitchell Horne 4788d9f1b8dbSMatt Macy /* 478901c35b67SMitchell Horne * Verify that the sample hasn't been dropped in the meantime. 4790d9f1b8dbSMatt Macy */ 4791d9f1b8dbSMatt Macy if (ps->ps_nsamples == PMC_USER_CALLCHAIN_PENDING) { 47925de96e33SMatt Macy ps->ps_nsamples = nsamples; 4793d9f1b8dbSMatt Macy /* 479401c35b67SMitchell Horne * If we couldn't get a sample, simply drop the 479501c35b67SMitchell Horne * reference. 4796d9f1b8dbSMatt Macy */ 4797d9f1b8dbSMatt Macy if (nsamples == 0) 4798d9f1b8dbSMatt Macy counter_u64_add(pm->pm_runcount, -1); 4799d9f1b8dbSMatt Macy } 4800d9f1b8dbSMatt Macy spinlock_exit(); 48015de96e33SMatt Macy if (nrecords-- == 1) 48025de96e33SMatt Macy break; 4803d9f1b8dbSMatt Macy } 48045de96e33SMatt Macy if (__predict_false(ring == PMC_UR && td->td_pmcpend)) { 48055de96e33SMatt Macy if (pass == 0) { 48065de96e33SMatt Macy pass = 1; 48075de96e33SMatt Macy goto restart; 48085de96e33SMatt Macy } 48095de96e33SMatt Macy /* only collect samples for this part once */ 48105de96e33SMatt Macy td->td_pmcpend = 0; 48115de96e33SMatt Macy } 4812d07f36b0SJoseph Koshy 48136cb40391SZbigniew Bodek #ifdef INVARIANTS 4814d9f1b8dbSMatt Macy if ((ticks - start_ticks) > hz) 4815d9f1b8dbSMatt Macy log(LOG_ERR, "%s took %d ticks\n", __func__, (ticks - start_ticks)); 48166cb40391SZbigniew Bodek #endif 4817c66ea2eeSJonathan T. Looney /* mark CPU as needing processing */ 4818e6b475e0SMatt Macy DPCPU_SET(pmc_sampled, 1); 4819f263522aSJoseph Koshy } 4820f263522aSJoseph Koshy 4821ebccf1e3SJoseph Koshy /* 4822f263522aSJoseph Koshy * Process saved PC samples. 4823ebccf1e3SJoseph Koshy */ 4824ebccf1e3SJoseph Koshy static void 4825d9f1b8dbSMatt Macy pmc_process_samples(int cpu, ring_type_t ring) 4826ebccf1e3SJoseph Koshy { 4827f263522aSJoseph Koshy struct pmc *pm; 4828f263522aSJoseph Koshy struct thread *td; 4829f263522aSJoseph Koshy struct pmc_owner *po; 4830f263522aSJoseph Koshy struct pmc_sample *ps; 4831e829eb6dSJoseph Koshy struct pmc_classdep *pcd; 4832f263522aSJoseph Koshy struct pmc_samplebuffer *psb; 4833aee6e7dcSMateusz Guzik uint64_t delta __diagused; 483401c35b67SMitchell Horne int adjri, n; 4835ebccf1e3SJoseph Koshy 4836f263522aSJoseph Koshy KASSERT(PCPU_GET(cpuid) == cpu, 4837f263522aSJoseph Koshy ("[pmc,%d] not on the correct CPU pcpu=%d cpu=%d", __LINE__, 4838f263522aSJoseph Koshy PCPU_GET(cpuid), cpu)); 4839ebccf1e3SJoseph Koshy 4840f5f9340bSFabien Thomas psb = pmc_pcpu[cpu]->pc_sb[ring]; 4841d9f1b8dbSMatt Macy delta = psb->ps_prodidx - psb->ps_considx; 4842d9f1b8dbSMatt Macy MPASS(delta <= pmc_nsamples); 4843d9f1b8dbSMatt Macy MPASS(psb->ps_considx <= psb->ps_prodidx); 4844d9f1b8dbSMatt Macy for (n = 0; psb->ps_considx < psb->ps_prodidx; psb->ps_considx++, n++) { 4845d9f1b8dbSMatt Macy ps = PMC_CONS_SAMPLE(psb); 4846f263522aSJoseph Koshy 4847d9f1b8dbSMatt Macy if (__predict_false(ps->ps_nsamples == PMC_SAMPLE_FREE)) 4848d9f1b8dbSMatt Macy continue; 484901c35b67SMitchell Horne 4850d9f1b8dbSMatt Macy /* skip non-running samples */ 485101c35b67SMitchell Horne pm = ps->ps_pmc; 4852d9f1b8dbSMatt Macy if (pm->pm_state != PMC_STATE_RUNNING) 4853d9f1b8dbSMatt Macy goto entrydone; 48546fe00c78SJoseph Koshy 4855e6b475e0SMatt Macy KASSERT(counter_u64_fetch(pm->pm_runcount) > 0, 485601c35b67SMitchell Horne ("[pmc,%d] pm=%p runcount %ju", __LINE__, pm, 485701c35b67SMitchell Horne (uintmax_t)counter_u64_fetch(pm->pm_runcount))); 4858f263522aSJoseph Koshy KASSERT(PMC_IS_SAMPLING_MODE(PMC_TO_MODE(pm)), 4859f263522aSJoseph Koshy ("[pmc,%d] pmc=%p non-sampling mode=%d", __LINE__, 4860f263522aSJoseph Koshy pm, PMC_TO_MODE(pm))); 4861f263522aSJoseph Koshy 486201c35b67SMitchell Horne po = pm->pm_owner; 4863f263522aSJoseph Koshy 4864f5f9340bSFabien Thomas /* If there is a pending AST wait for completion */ 4865d9f1b8dbSMatt Macy if (ps->ps_nsamples == PMC_USER_CALLCHAIN_PENDING) { 486601c35b67SMitchell Horne /* 486701c35b67SMitchell Horne * If we've been waiting more than 1 tick to 4868acf50a7fSMatt Macy * collect a callchain for this record then 4869acf50a7fSMatt Macy * drop it and move on. 4870acf50a7fSMatt Macy */ 4871acf50a7fSMatt Macy if (ticks - ps->ps_ticks > 1) { 4872d9f1b8dbSMatt Macy /* 487301c35b67SMitchell Horne * Track how often we hit this as it will 4874d9f1b8dbSMatt Macy * preferentially lose user samples 487501c35b67SMitchell Horne * for long running system calls. 4876d9f1b8dbSMatt Macy */ 4877d9f1b8dbSMatt Macy counter_u64_add(pmc_stats.pm_overwrites, 1); 4878d9f1b8dbSMatt Macy goto entrydone; 4879d9f1b8dbSMatt Macy } 4880f5f9340bSFabien Thomas /* Need a rescan at a later time. */ 4881e6b475e0SMatt Macy DPCPU_SET(pmc_sampled, 1); 4882f5f9340bSFabien Thomas break; 4883f5f9340bSFabien Thomas } 4884f5f9340bSFabien Thomas 48854a3690dfSJohn Baldwin PMCDBG6(SAM,OPS,1,"cpu=%d pm=%p n=%d fl=%x wr=%d rd=%d", cpu, 4886d07f36b0SJoseph Koshy pm, ps->ps_nsamples, ps->ps_flags, 4887d9f1b8dbSMatt Macy (int)(psb->ps_prodidx & pmc_sample_mask), 4888d9f1b8dbSMatt Macy (int)(psb->ps_considx & pmc_sample_mask)); 4889f263522aSJoseph Koshy 4890f263522aSJoseph Koshy /* 4891f263522aSJoseph Koshy * If this is a process-mode PMC that is attached to 4892f263522aSJoseph Koshy * its owner, and if the PC is in user mode, update 4893f263522aSJoseph Koshy * profiling statistics like timer-based profiling 4894f263522aSJoseph Koshy * would have done. 48955de96e33SMatt Macy * 48965de96e33SMatt Macy * Otherwise, this is either a sampling-mode PMC that 48975de96e33SMatt Macy * is attached to a different process than its owner, 48985de96e33SMatt Macy * or a system-wide sampling PMC. Dispatch a log 48995de96e33SMatt Macy * entry to the PMC's owner process. 4900f263522aSJoseph Koshy */ 4901f263522aSJoseph Koshy if (pm->pm_flags & PMC_F_ATTACHED_TO_OWNER) { 4902d07f36b0SJoseph Koshy if (ps->ps_flags & PMC_CC_F_USERSPACE) { 4903f263522aSJoseph Koshy td = FIRST_THREAD_IN_PROC(po->po_owner); 4904d07f36b0SJoseph Koshy addupc_intr(td, ps->ps_pc[0], 1); 4905f263522aSJoseph Koshy } 49065de96e33SMatt Macy } else 4907d07f36b0SJoseph Koshy pmclog_process_callchain(pm, ps); 4908f263522aSJoseph Koshy 4909f263522aSJoseph Koshy entrydone: 4910d07f36b0SJoseph Koshy ps->ps_nsamples = 0; /* mark entry as free */ 4911d9f1b8dbSMatt Macy KASSERT(counter_u64_fetch(pm->pm_runcount) > 0, 491201c35b67SMitchell Horne ("[pmc,%d] pm=%p runcount %ju", __LINE__, pm, 491301c35b67SMitchell Horne (uintmax_t)counter_u64_fetch(pm->pm_runcount))); 4914f263522aSJoseph Koshy 4915d9f1b8dbSMatt Macy counter_u64_add(pm->pm_runcount, -1); 4916f263522aSJoseph Koshy } 4917f263522aSJoseph Koshy 4918e6b475e0SMatt Macy counter_u64_add(pmc_stats.pm_log_sweeps, 1); 4919f263522aSJoseph Koshy 4920f263522aSJoseph Koshy /* Do not re-enable stalled PMCs if we failed to process any samples */ 4921f263522aSJoseph Koshy if (n == 0) 4922ebccf1e3SJoseph Koshy return; 4923f263522aSJoseph Koshy 4924f263522aSJoseph Koshy /* 4925f263522aSJoseph Koshy * Restart any stalled sampling PMCs on this CPU. 4926f263522aSJoseph Koshy * 4927fbf1556dSJoseph Koshy * If the NMI handler sets the pm_stalled field of a PMC after 4928fbf1556dSJoseph Koshy * the check below, we'll end up processing the stalled PMC at 4929fbf1556dSJoseph Koshy * the next hardclock tick. 4930f263522aSJoseph Koshy */ 4931f263522aSJoseph Koshy for (n = 0; n < md->pmd_npmc; n++) { 4932e829eb6dSJoseph Koshy pcd = pmc_ri_to_classdep(md, n, &adjri); 4933e829eb6dSJoseph Koshy KASSERT(pcd != NULL, 4934e829eb6dSJoseph Koshy ("[pmc,%d] null pcd ri=%d", __LINE__, n)); 4935e829eb6dSJoseph Koshy (void)(*pcd->pcd_get_config)(cpu, adjri, &pm); 4936e829eb6dSJoseph Koshy 4937f263522aSJoseph Koshy if (pm == NULL || /* !cfg'ed */ 4938f263522aSJoseph Koshy pm->pm_state != PMC_STATE_RUNNING || /* !active */ 4939f263522aSJoseph Koshy !PMC_IS_SAMPLING_MODE(PMC_TO_MODE(pm)) || /* !sampling */ 4940e6b475e0SMatt Macy !pm->pm_pcpu_state[cpu].pps_cpustate || /* !desired */ 4941e6b475e0SMatt Macy !pm->pm_pcpu_state[cpu].pps_stalled) /* !stalled */ 4942f263522aSJoseph Koshy continue; 4943f263522aSJoseph Koshy 4944e6b475e0SMatt Macy pm->pm_pcpu_state[cpu].pps_stalled = 0; 494501c35b67SMitchell Horne (void)(*pcd->pcd_start_pmc)(cpu, adjri, pm); 4946f263522aSJoseph Koshy } 4947ebccf1e3SJoseph Koshy } 4948ebccf1e3SJoseph Koshy 4949ebccf1e3SJoseph Koshy /* 4950ebccf1e3SJoseph Koshy * Event handlers. 4951ebccf1e3SJoseph Koshy */ 4952ebccf1e3SJoseph Koshy 4953ebccf1e3SJoseph Koshy /* 4954ebccf1e3SJoseph Koshy * Handle a process exit. 4955ebccf1e3SJoseph Koshy * 4956f263522aSJoseph Koshy * Remove this process from all hash tables. If this process 4957f263522aSJoseph Koshy * owned any PMCs, turn off those PMCs and deallocate them, 4958f263522aSJoseph Koshy * removing any associations with target processes. 4959f263522aSJoseph Koshy * 4960f263522aSJoseph Koshy * This function will be called by the last 'thread' of a 4961f263522aSJoseph Koshy * process. 4962f263522aSJoseph Koshy * 4963ebccf1e3SJoseph Koshy * XXX This eventhandler gets called early in the exit process. 4964ebccf1e3SJoseph Koshy * Consider using a 'hook' invocation from thread_exit() or equivalent 4965ebccf1e3SJoseph Koshy * spot. Another negative is that kse_exit doesn't seem to call 4966ebccf1e3SJoseph Koshy * exit1() [??]. 4967ebccf1e3SJoseph Koshy */ 4968ebccf1e3SJoseph Koshy static void 4969ebccf1e3SJoseph Koshy pmc_process_exit(void *arg __unused, struct proc *p) 4970ebccf1e3SJoseph Koshy { 4971f263522aSJoseph Koshy struct pmc *pm; 4972f263522aSJoseph Koshy struct pmc_owner *po; 4973e829eb6dSJoseph Koshy struct pmc_process *pp; 4974e829eb6dSJoseph Koshy struct pmc_classdep *pcd; 4975f263522aSJoseph Koshy pmc_value_t newvalue, tmp; 497601c35b67SMitchell Horne int ri, adjri, cpu; 497701c35b67SMitchell Horne bool is_using_hwpmcs; 4978ebccf1e3SJoseph Koshy 4979ebccf1e3SJoseph Koshy PROC_LOCK(p); 4980d5ee4074SMitchell Horne is_using_hwpmcs = (p->p_flag & P_HWPMC) != 0; 4981ebccf1e3SJoseph Koshy PROC_UNLOCK(p); 4982ebccf1e3SJoseph Koshy 4983f263522aSJoseph Koshy /* 4984f263522aSJoseph Koshy * Log a sysexit event to all SS PMC owners. 4985f263522aSJoseph Koshy */ 49866573d758SMatt Macy PMC_EPOCH_ENTER(); 4987d5ee4074SMitchell Horne CK_LIST_FOREACH(po, &pmc_ss_owners, po_ssnext) { 4988d5ee4074SMitchell Horne if ((po->po_flags & PMC_PO_OWNS_LOGFILE) != 0) 4989f263522aSJoseph Koshy pmclog_process_sysexit(po, p->p_pid); 4990d5ee4074SMitchell Horne } 49916573d758SMatt Macy PMC_EPOCH_EXIT(); 4992f263522aSJoseph Koshy 4993f263522aSJoseph Koshy if (!is_using_hwpmcs) 4994f263522aSJoseph Koshy return; 4995f263522aSJoseph Koshy 4996f263522aSJoseph Koshy PMC_GET_SX_XLOCK(); 49974a3690dfSJohn Baldwin PMCDBG3(PRC,EXT,1,"process-exit proc=%p (%d, %s)", p, p->p_pid, 4998ebccf1e3SJoseph Koshy p->p_comm); 4999ebccf1e3SJoseph Koshy 5000f263522aSJoseph Koshy /* 5001f263522aSJoseph Koshy * Since this code is invoked by the last thread in an exiting 5002f263522aSJoseph Koshy * process, we would have context switched IN at some prior 5003f263522aSJoseph Koshy * point. However, with PREEMPTION, kernel mode context 5004f263522aSJoseph Koshy * switches may happen any time, so we want to disable a 5005b790c193SPedro F. Giffuni * context switch OUT till we get any PMCs targeting this 5006f263522aSJoseph Koshy * process off the hardware. 5007f263522aSJoseph Koshy * 5008f263522aSJoseph Koshy * We also need to atomically remove this process' 5009f263522aSJoseph Koshy * entry from our target process hash table, using 5010f263522aSJoseph Koshy * PMC_FLAG_REMOVE. 5011f263522aSJoseph Koshy */ 50124a3690dfSJohn Baldwin PMCDBG3(PRC,EXT,1, "process-exit proc=%p (%d, %s)", p, p->p_pid, 5013f263522aSJoseph Koshy p->p_comm); 5014f263522aSJoseph Koshy 5015f263522aSJoseph Koshy critical_enter(); /* no preemption */ 5016f263522aSJoseph Koshy 5017f263522aSJoseph Koshy cpu = curthread->td_oncpu; 5018d5ee4074SMitchell Horne if ((pp = pmc_find_process_descriptor(p, PMC_FLAG_REMOVE)) != NULL) { 5019f263522aSJoseph Koshy 50204a3690dfSJohn Baldwin PMCDBG2(PRC,EXT,2, 5021f263522aSJoseph Koshy "process-exit proc=%p pmc-process=%p", p, pp); 5022f263522aSJoseph Koshy 5023f263522aSJoseph Koshy /* 5024f263522aSJoseph Koshy * The exiting process could the target of 5025f263522aSJoseph Koshy * some PMCs which will be running on 5026f263522aSJoseph Koshy * currently executing CPU. 5027f263522aSJoseph Koshy * 5028f263522aSJoseph Koshy * We need to turn these PMCs off like we 5029f263522aSJoseph Koshy * would do at context switch OUT time. 5030f263522aSJoseph Koshy */ 5031f263522aSJoseph Koshy for (ri = 0; ri < md->pmd_npmc; ri++) { 5032f263522aSJoseph Koshy /* 5033f263522aSJoseph Koshy * Pick up the pmc pointer from hardware 5034f263522aSJoseph Koshy * state similar to the CSW_OUT code. 5035f263522aSJoseph Koshy */ 5036f263522aSJoseph Koshy pm = NULL; 5037e829eb6dSJoseph Koshy 5038e829eb6dSJoseph Koshy pcd = pmc_ri_to_classdep(md, ri, &adjri); 5039e829eb6dSJoseph Koshy 5040e829eb6dSJoseph Koshy (void)(*pcd->pcd_get_config)(cpu, adjri, &pm); 5041f263522aSJoseph Koshy 50424a3690dfSJohn Baldwin PMCDBG2(PRC,EXT,2, "ri=%d pm=%p", ri, pm); 5043f263522aSJoseph Koshy 5044693cd307SMitchell Horne if (pm == NULL || !PMC_IS_VIRTUAL_MODE(PMC_TO_MODE(pm))) 5045f263522aSJoseph Koshy continue; 5046f263522aSJoseph Koshy 50474a3690dfSJohn Baldwin PMCDBG4(PRC,EXT,2, "ppmcs[%d]=%p pm=%p " 5048f263522aSJoseph Koshy "state=%d", ri, pp->pp_pmcs[ri].pp_pmc, 5049f263522aSJoseph Koshy pm, pm->pm_state); 5050f263522aSJoseph Koshy 5051f263522aSJoseph Koshy KASSERT(PMC_TO_ROWINDEX(pm) == ri, 5052f263522aSJoseph Koshy ("[pmc,%d] ri mismatch pmc(%d) ri(%d)", 5053f263522aSJoseph Koshy __LINE__, PMC_TO_ROWINDEX(pm), ri)); 5054f263522aSJoseph Koshy KASSERT(pm == pp->pp_pmcs[ri].pp_pmc, 5055f263522aSJoseph Koshy ("[pmc,%d] pm %p != pp_pmcs[%d] %p", 5056f263522aSJoseph Koshy __LINE__, pm, ri, pp->pp_pmcs[ri].pp_pmc)); 5057e6b475e0SMatt Macy KASSERT(counter_u64_fetch(pm->pm_runcount) > 0, 505801c35b67SMitchell Horne ("[pmc,%d] bad runcount ri %d rc %ju", 505901c35b67SMitchell Horne __LINE__, ri, 506001c35b67SMitchell Horne (uintmax_t)counter_u64_fetch(pm->pm_runcount))); 5061f263522aSJoseph Koshy 5062a3924968SJonathan T. Looney /* 5063a3924968SJonathan T. Looney * Change desired state, and then stop if not 5064a3924968SJonathan T. Looney * stalled. This two-step dance should avoid 5065a3924968SJonathan T. Looney * race conditions where an interrupt re-enables 5066a3924968SJonathan T. Looney * the PMC after this code has already checked 5067a3924968SJonathan T. Looney * the pm_stalled flag. 5068a3924968SJonathan T. Looney */ 5069e6b475e0SMatt Macy if (pm->pm_pcpu_state[cpu].pps_cpustate) { 5070e6b475e0SMatt Macy pm->pm_pcpu_state[cpu].pps_cpustate = 0; 5071e6b475e0SMatt Macy if (!pm->pm_pcpu_state[cpu].pps_stalled) { 507239f92a76SMitchell Horne (void)pcd->pcd_stop_pmc(cpu, adjri, pm); 50736161b98cSMatt Macy 50746161b98cSMatt Macy if (PMC_TO_MODE(pm) == PMC_MODE_TC) { 5075a3924968SJonathan T. Looney pcd->pcd_read_pmc(cpu, adjri, 507639f92a76SMitchell Horne pm, &newvalue); 5077f263522aSJoseph Koshy tmp = newvalue - 5078f263522aSJoseph Koshy PMC_PCPU_SAVED(cpu, ri); 5079f263522aSJoseph Koshy 50806161b98cSMatt Macy mtx_pool_lock_spin(pmc_mtxpool, 50816161b98cSMatt Macy pm); 5082f263522aSJoseph Koshy pm->pm_gv.pm_savedvalue += tmp; 50836161b98cSMatt Macy pp->pp_pmcs[ri].pp_pmcval += 50846161b98cSMatt Macy tmp; 50856161b98cSMatt Macy mtx_pool_unlock_spin( 50866161b98cSMatt Macy pmc_mtxpool, pm); 50876161b98cSMatt Macy } 5088ebccf1e3SJoseph Koshy } 5089a3924968SJonathan T. Looney } 5090f263522aSJoseph Koshy 509101c35b67SMitchell Horne KASSERT(counter_u64_fetch(pm->pm_runcount) > 0, 5092f263522aSJoseph Koshy ("[pmc,%d] runcount is %d", __LINE__, ri)); 5093f263522aSJoseph Koshy 5094d9f1b8dbSMatt Macy counter_u64_add(pm->pm_runcount, -1); 5095e829eb6dSJoseph Koshy (void)pcd->pcd_config_pmc(cpu, adjri, NULL); 5096f263522aSJoseph Koshy } 5097f263522aSJoseph Koshy 5098f263522aSJoseph Koshy /* 5099f263522aSJoseph Koshy * Inform the MD layer of this pseudo "context switch 5100f263522aSJoseph Koshy * out" 5101f263522aSJoseph Koshy */ 5102f263522aSJoseph Koshy (void)md->pmd_switch_out(pmc_pcpu[cpu], pp); 5103f263522aSJoseph Koshy 5104f263522aSJoseph Koshy critical_exit(); /* ok to be pre-empted now */ 5105f263522aSJoseph Koshy 5106f263522aSJoseph Koshy /* 5107f263522aSJoseph Koshy * Unlink this process from the PMCs that are 5108b790c193SPedro F. Giffuni * targeting it. This will send a signal to 5109f263522aSJoseph Koshy * all PMC owner's whose PMCs are orphaned. 5110f263522aSJoseph Koshy * 5111f263522aSJoseph Koshy * Log PMC value at exit time if requested. 5112f263522aSJoseph Koshy */ 5113d5ee4074SMitchell Horne for (ri = 0; ri < md->pmd_npmc; ri++) { 5114f263522aSJoseph Koshy if ((pm = pp->pp_pmcs[ri].pp_pmc) != NULL) { 5115d5ee4074SMitchell Horne if ((pm->pm_flags & PMC_F_NEEDS_LOGFILE) != 0 && 5116d5ee4074SMitchell Horne PMC_IS_COUNTING_MODE(PMC_TO_MODE(pm))) { 5117f263522aSJoseph Koshy pmclog_process_procexit(pm, pp); 5118d5ee4074SMitchell Horne } 5119f263522aSJoseph Koshy pmc_unlink_target_process(pm, pp); 5120f263522aSJoseph Koshy } 5121d5ee4074SMitchell Horne } 51221ede983cSDag-Erling Smørgrav free(pp, M_PMC); 5123f263522aSJoseph Koshy } else 5124f263522aSJoseph Koshy critical_exit(); /* pp == NULL */ 5125f263522aSJoseph Koshy 5126f263522aSJoseph Koshy /* 5127f263522aSJoseph Koshy * If the process owned PMCs, free them up and free up 5128f263522aSJoseph Koshy * memory. 5129f263522aSJoseph Koshy */ 5130f263522aSJoseph Koshy if ((po = pmc_find_owner_descriptor(p)) != NULL) { 5131f263522aSJoseph Koshy pmc_remove_owner(po); 5132f263522aSJoseph Koshy pmc_destroy_owner_descriptor(po); 5133f263522aSJoseph Koshy } 5134f263522aSJoseph Koshy 5135f263522aSJoseph Koshy sx_xunlock(&pmc_sx); 5136ebccf1e3SJoseph Koshy } 5137ebccf1e3SJoseph Koshy 5138ebccf1e3SJoseph Koshy /* 5139ebccf1e3SJoseph Koshy * Handle a process fork. 5140ebccf1e3SJoseph Koshy * 5141ebccf1e3SJoseph Koshy * If the parent process 'p1' is under HWPMC monitoring, then copy 5142ebccf1e3SJoseph Koshy * over any attached PMCs that have 'do_descendants' semantics. 5143ebccf1e3SJoseph Koshy */ 5144ebccf1e3SJoseph Koshy static void 5145f263522aSJoseph Koshy pmc_process_fork(void *arg __unused, struct proc *p1, struct proc *newproc, 514601c35b67SMitchell Horne int flags __unused) 5147ebccf1e3SJoseph Koshy { 5148f263522aSJoseph Koshy struct pmc *pm; 5149f263522aSJoseph Koshy struct pmc_owner *po; 5150f263522aSJoseph Koshy struct pmc_process *ppnew, *ppold; 515101c35b67SMitchell Horne unsigned int ri; 515201c35b67SMitchell Horne bool is_using_hwpmcs, do_descendants; 5153ebccf1e3SJoseph Koshy 5154ebccf1e3SJoseph Koshy PROC_LOCK(p1); 5155d5ee4074SMitchell Horne is_using_hwpmcs = (p1->p_flag & P_HWPMC) != 0; 5156ebccf1e3SJoseph Koshy PROC_UNLOCK(p1); 5157ebccf1e3SJoseph Koshy 5158f263522aSJoseph Koshy /* 5159f263522aSJoseph Koshy * If there are system-wide sampling PMCs active, we need to 5160f263522aSJoseph Koshy * log all fork events to their owner's logs. 5161f263522aSJoseph Koshy */ 51626573d758SMatt Macy PMC_EPOCH_ENTER(); 5163d5ee4074SMitchell Horne CK_LIST_FOREACH(po, &pmc_ss_owners, po_ssnext) { 5164ebfaf69cSMatt Macy if (po->po_flags & PMC_PO_OWNS_LOGFILE) { 5165f263522aSJoseph Koshy pmclog_process_procfork(po, p1->p_pid, newproc->p_pid); 5166ebfaf69cSMatt Macy pmclog_process_proccreate(po, newproc, 1); 5167ebfaf69cSMatt Macy } 5168d5ee4074SMitchell Horne } 51696573d758SMatt Macy PMC_EPOCH_EXIT(); 5170f263522aSJoseph Koshy 5171f263522aSJoseph Koshy if (!is_using_hwpmcs) 5172f263522aSJoseph Koshy return; 5173f263522aSJoseph Koshy 5174ebccf1e3SJoseph Koshy PMC_GET_SX_XLOCK(); 51754a3690dfSJohn Baldwin PMCDBG4(PMC,FRK,1, "process-fork proc=%p (%d, %s) -> %p", p1, 5176f263522aSJoseph Koshy p1->p_pid, p1->p_comm, newproc); 5177f263522aSJoseph Koshy 5178f263522aSJoseph Koshy /* 5179f263522aSJoseph Koshy * If the parent process (curthread->td_proc) is a 5180f263522aSJoseph Koshy * target of any PMCs, look for PMCs that are to be 5181f263522aSJoseph Koshy * inherited, and link these into the new process 5182f263522aSJoseph Koshy * descriptor. 5183f263522aSJoseph Koshy */ 5184d5ee4074SMitchell Horne ppold = pmc_find_process_descriptor(curthread->td_proc, PMC_FLAG_NONE); 5185d5ee4074SMitchell Horne if (ppold == NULL) 5186f263522aSJoseph Koshy goto done; /* nothing to do */ 5187f263522aSJoseph Koshy 518801c35b67SMitchell Horne do_descendants = false; 5189d5ee4074SMitchell Horne for (ri = 0; ri < md->pmd_npmc; ri++) { 5190d5ee4074SMitchell Horne if ((pm = ppold->pp_pmcs[ri].pp_pmc) != NULL && 5191d5ee4074SMitchell Horne (pm->pm_flags & PMC_F_DESCENDANTS) != 0) { 5192d5ee4074SMitchell Horne do_descendants = true; 5193d5ee4074SMitchell Horne break; 5194d5ee4074SMitchell Horne } 5195d5ee4074SMitchell Horne } 519601c35b67SMitchell Horne if (!do_descendants) /* nothing to do */ 5197f263522aSJoseph Koshy goto done; 5198f263522aSJoseph Koshy 51996161b98cSMatt Macy /* 52006161b98cSMatt Macy * Now mark the new process as being tracked by this driver. 52016161b98cSMatt Macy */ 52026161b98cSMatt Macy PROC_LOCK(newproc); 52036161b98cSMatt Macy newproc->p_flag |= P_HWPMC; 52046161b98cSMatt Macy PROC_UNLOCK(newproc); 52056161b98cSMatt Macy 520601c35b67SMitchell Horne /* Allocate a descriptor for the new process. */ 5207d5ee4074SMitchell Horne ppnew = pmc_find_process_descriptor(newproc, PMC_FLAG_ALLOCATE); 5208d5ee4074SMitchell Horne if (ppnew == NULL) 5209f263522aSJoseph Koshy goto done; 5210f263522aSJoseph Koshy 5211f263522aSJoseph Koshy /* 5212f263522aSJoseph Koshy * Run through all PMCs that were targeting the old process 5213f263522aSJoseph Koshy * and which specified F_DESCENDANTS and attach them to the 5214f263522aSJoseph Koshy * new process. 5215f263522aSJoseph Koshy * 5216f263522aSJoseph Koshy * Log the fork event to all owners of PMCs attached to this 5217f263522aSJoseph Koshy * process, if not already logged. 5218f263522aSJoseph Koshy */ 5219d5ee4074SMitchell Horne for (ri = 0; ri < md->pmd_npmc; ri++) { 5220f263522aSJoseph Koshy if ((pm = ppold->pp_pmcs[ri].pp_pmc) != NULL && 5221d5ee4074SMitchell Horne (pm->pm_flags & PMC_F_DESCENDANTS) != 0) { 5222f263522aSJoseph Koshy pmc_link_target_process(pm, ppnew); 5223f263522aSJoseph Koshy po = pm->pm_owner; 5224f263522aSJoseph Koshy if (po->po_sscount == 0 && 5225d5ee4074SMitchell Horne (po->po_flags & PMC_PO_OWNS_LOGFILE) != 0) { 5226f263522aSJoseph Koshy pmclog_process_procfork(po, p1->p_pid, 5227f263522aSJoseph Koshy newproc->p_pid); 5228ebccf1e3SJoseph Koshy } 5229d5ee4074SMitchell Horne } 5230d5ee4074SMitchell Horne } 5231f263522aSJoseph Koshy 5232f263522aSJoseph Koshy done: 5233f263522aSJoseph Koshy sx_xunlock(&pmc_sx); 5234ebccf1e3SJoseph Koshy } 5235ebccf1e3SJoseph Koshy 523629f4e216SMark Johnston static void 5237ebfaf69cSMatt Macy pmc_process_threadcreate(struct thread *td) 5238ebfaf69cSMatt Macy { 5239ebfaf69cSMatt Macy struct pmc_owner *po; 5240ebfaf69cSMatt Macy 52416573d758SMatt Macy PMC_EPOCH_ENTER(); 5242d5ee4074SMitchell Horne CK_LIST_FOREACH(po, &pmc_ss_owners, po_ssnext) { 5243d5ee4074SMitchell Horne if ((po->po_flags & PMC_PO_OWNS_LOGFILE) != 0) 5244ebfaf69cSMatt Macy pmclog_process_threadcreate(po, td, 1); 5245d5ee4074SMitchell Horne } 52466573d758SMatt Macy PMC_EPOCH_EXIT(); 5247ebfaf69cSMatt Macy } 5248ebfaf69cSMatt Macy 5249ebfaf69cSMatt Macy static void 5250ebfaf69cSMatt Macy pmc_process_threadexit(struct thread *td) 5251ebfaf69cSMatt Macy { 5252ebfaf69cSMatt Macy struct pmc_owner *po; 5253ebfaf69cSMatt Macy 52546573d758SMatt Macy PMC_EPOCH_ENTER(); 5255d5ee4074SMitchell Horne CK_LIST_FOREACH(po, &pmc_ss_owners, po_ssnext) { 5256d5ee4074SMitchell Horne if ((po->po_flags & PMC_PO_OWNS_LOGFILE) != 0) 5257ebfaf69cSMatt Macy pmclog_process_threadexit(po, td); 5258d5ee4074SMitchell Horne } 52596573d758SMatt Macy PMC_EPOCH_EXIT(); 5260ebfaf69cSMatt Macy } 5261ebfaf69cSMatt Macy 5262ebfaf69cSMatt Macy static void 5263ebfaf69cSMatt Macy pmc_process_proccreate(struct proc *p) 5264ebfaf69cSMatt Macy { 5265ebfaf69cSMatt Macy struct pmc_owner *po; 5266ebfaf69cSMatt Macy 52676573d758SMatt Macy PMC_EPOCH_ENTER(); 5268d5ee4074SMitchell Horne CK_LIST_FOREACH(po, &pmc_ss_owners, po_ssnext) { 5269d5ee4074SMitchell Horne if ((po->po_flags & PMC_PO_OWNS_LOGFILE) != 0) 5270ebfaf69cSMatt Macy pmclog_process_proccreate(po, p, 1 /* sync */); 5271d5ee4074SMitchell Horne } 52726573d758SMatt Macy PMC_EPOCH_EXIT(); 5273ebfaf69cSMatt Macy } 5274ebfaf69cSMatt Macy 5275ebfaf69cSMatt Macy static void 5276ebfaf69cSMatt Macy pmc_process_allproc(struct pmc *pm) 5277ebfaf69cSMatt Macy { 5278ebfaf69cSMatt Macy struct pmc_owner *po; 5279ebfaf69cSMatt Macy struct thread *td; 5280ebfaf69cSMatt Macy struct proc *p; 5281ebfaf69cSMatt Macy 5282ebfaf69cSMatt Macy po = pm->pm_owner; 5283ebfaf69cSMatt Macy if ((po->po_flags & PMC_PO_OWNS_LOGFILE) == 0) 5284ebfaf69cSMatt Macy return; 5285693cd307SMitchell Horne 5286ebfaf69cSMatt Macy sx_slock(&allproc_lock); 5287ebfaf69cSMatt Macy FOREACH_PROC_IN_SYSTEM(p) { 5288ebfaf69cSMatt Macy pmclog_process_proccreate(po, p, 0 /* sync */); 5289ebfaf69cSMatt Macy PROC_LOCK(p); 5290ebfaf69cSMatt Macy FOREACH_THREAD_IN_PROC(p, td) 5291ebfaf69cSMatt Macy pmclog_process_threadcreate(po, td, 0 /* sync */); 5292ebfaf69cSMatt Macy PROC_UNLOCK(p); 5293ebfaf69cSMatt Macy } 5294ebfaf69cSMatt Macy sx_sunlock(&allproc_lock); 5295ebfaf69cSMatt Macy pmclog_flush(po, 0); 5296ebfaf69cSMatt Macy } 5297ebfaf69cSMatt Macy 5298ebfaf69cSMatt Macy static void 529929f4e216SMark Johnston pmc_kld_load(void *arg __unused, linker_file_t lf) 530029f4e216SMark Johnston { 530129f4e216SMark Johnston struct pmc_owner *po; 530229f4e216SMark Johnston 530329f4e216SMark Johnston /* 530429f4e216SMark Johnston * Notify owners of system sampling PMCs about KLD operations. 530529f4e216SMark Johnston */ 53066573d758SMatt Macy PMC_EPOCH_ENTER(); 5307d5ee4074SMitchell Horne CK_LIST_FOREACH(po, &pmc_ss_owners, po_ssnext) { 530829f4e216SMark Johnston if (po->po_flags & PMC_PO_OWNS_LOGFILE) 530929f4e216SMark Johnston pmclog_process_map_in(po, (pid_t) -1, 531053d0b9e4SJessica Clarke (uintfptr_t) lf->address, lf->pathname); 5311d5ee4074SMitchell Horne } 53126573d758SMatt Macy PMC_EPOCH_EXIT(); 531329f4e216SMark Johnston 531429f4e216SMark Johnston /* 531529f4e216SMark Johnston * TODO: Notify owners of (all) process-sampling PMCs too. 531629f4e216SMark Johnston */ 531729f4e216SMark Johnston } 531829f4e216SMark Johnston 531929f4e216SMark Johnston static void 532029f4e216SMark Johnston pmc_kld_unload(void *arg __unused, const char *filename __unused, 532129f4e216SMark Johnston caddr_t address, size_t size) 532229f4e216SMark Johnston { 532329f4e216SMark Johnston struct pmc_owner *po; 532429f4e216SMark Johnston 53256573d758SMatt Macy PMC_EPOCH_ENTER(); 5326d5ee4074SMitchell Horne CK_LIST_FOREACH(po, &pmc_ss_owners, po_ssnext) { 5327d5ee4074SMitchell Horne if ((po->po_flags & PMC_PO_OWNS_LOGFILE) != 0) { 532829f4e216SMark Johnston pmclog_process_map_out(po, (pid_t)-1, 532929f4e216SMark Johnston (uintfptr_t)address, (uintfptr_t)address + size); 5330d5ee4074SMitchell Horne } 5331d5ee4074SMitchell Horne } 53326573d758SMatt Macy PMC_EPOCH_EXIT(); 533329f4e216SMark Johnston 533429f4e216SMark Johnston /* 533529f4e216SMark Johnston * TODO: Notify owners of process-sampling PMCs. 533629f4e216SMark Johnston */ 533729f4e216SMark Johnston } 5338ebccf1e3SJoseph Koshy 5339ebccf1e3SJoseph Koshy /* 5340ebccf1e3SJoseph Koshy * initialization 5341ebccf1e3SJoseph Koshy */ 53420ceb54c2SJohn Baldwin static const char * 53430ceb54c2SJohn Baldwin pmc_name_of_pmcclass(enum pmc_class class) 53440ceb54c2SJohn Baldwin { 5345ebccf1e3SJoseph Koshy 53460ceb54c2SJohn Baldwin switch (class) { 5347ebccf1e3SJoseph Koshy #undef __PMC_CLASS 53480ceb54c2SJohn Baldwin #define __PMC_CLASS(S,V,D) \ 53490ceb54c2SJohn Baldwin case PMC_CLASS_##S: \ 53500ceb54c2SJohn Baldwin return #S; 53510ceb54c2SJohn Baldwin __PMC_CLASSES(); 53520ceb54c2SJohn Baldwin default: 53530ceb54c2SJohn Baldwin return ("<unknown>"); 53540ceb54c2SJohn Baldwin } 53550ceb54c2SJohn Baldwin } 5356ebccf1e3SJoseph Koshy 5357f5f9340bSFabien Thomas /* 5358f5f9340bSFabien Thomas * Base class initializer: allocate structure and set default classes. 5359f5f9340bSFabien Thomas */ 5360f5f9340bSFabien Thomas struct pmc_mdep * 5361f5f9340bSFabien Thomas pmc_mdep_alloc(int nclasses) 5362f5f9340bSFabien Thomas { 5363f5f9340bSFabien Thomas struct pmc_mdep *md; 5364f5f9340bSFabien Thomas int n; 5365f5f9340bSFabien Thomas 5366f5f9340bSFabien Thomas /* SOFT + md classes */ 5367f5f9340bSFabien Thomas n = 1 + nclasses; 5368693cd307SMitchell Horne md = malloc(sizeof(struct pmc_mdep) + n * sizeof(struct pmc_classdep), 5369693cd307SMitchell Horne M_PMC, M_WAITOK | M_ZERO); 5370f5f9340bSFabien Thomas md->pmd_nclass = n; 5371f5f9340bSFabien Thomas 5372fa88954fSMitchell Horne /* Default methods */ 5373fa88954fSMitchell Horne md->pmd_switch_in = generic_switch_in; 5374fa88954fSMitchell Horne md->pmd_switch_out = generic_switch_out; 5375fa88954fSMitchell Horne 5376f5f9340bSFabien Thomas /* Add base class. */ 5377f5f9340bSFabien Thomas pmc_soft_initialize(md); 537852ebac7fSMitchell Horne return (md); 5379f5f9340bSFabien Thomas } 5380f5f9340bSFabien Thomas 5381f5f9340bSFabien Thomas void 5382f5f9340bSFabien Thomas pmc_mdep_free(struct pmc_mdep *md) 5383f5f9340bSFabien Thomas { 5384f5f9340bSFabien Thomas pmc_soft_finalize(md); 5385f5f9340bSFabien Thomas free(md, M_PMC); 5386f5f9340bSFabien Thomas } 5387f5f9340bSFabien Thomas 5388f5f9340bSFabien Thomas static int 538901c35b67SMitchell Horne generic_switch_in(struct pmc_cpu *pc __unused, struct pmc_process *pp __unused) 5390f5f9340bSFabien Thomas { 5391f5f9340bSFabien Thomas 5392f5f9340bSFabien Thomas return (0); 5393f5f9340bSFabien Thomas } 5394f5f9340bSFabien Thomas 5395f5f9340bSFabien Thomas static int 539601c35b67SMitchell Horne generic_switch_out(struct pmc_cpu *pc __unused, struct pmc_process *pp __unused) 5397f5f9340bSFabien Thomas { 5398f5f9340bSFabien Thomas 5399f5f9340bSFabien Thomas return (0); 5400f5f9340bSFabien Thomas } 5401f5f9340bSFabien Thomas 5402f5f9340bSFabien Thomas static struct pmc_mdep * 5403f5f9340bSFabien Thomas pmc_generic_cpu_initialize(void) 5404f5f9340bSFabien Thomas { 5405f5f9340bSFabien Thomas struct pmc_mdep *md; 5406f5f9340bSFabien Thomas 5407f5f9340bSFabien Thomas md = pmc_mdep_alloc(0); 5408f5f9340bSFabien Thomas 5409f5f9340bSFabien Thomas md->pmd_cputype = PMC_CPU_GENERIC; 5410f5f9340bSFabien Thomas 5411f5f9340bSFabien Thomas return (md); 5412f5f9340bSFabien Thomas } 5413f5f9340bSFabien Thomas 5414f5f9340bSFabien Thomas static void 541501c35b67SMitchell Horne pmc_generic_cpu_finalize(struct pmc_mdep *md __unused) 5416f5f9340bSFabien Thomas { 5417f5f9340bSFabien Thomas 541801c35b67SMitchell Horne } 5419f5f9340bSFabien Thomas 5420ebccf1e3SJoseph Koshy static int 5421ebccf1e3SJoseph Koshy pmc_initialize(void) 5422ebccf1e3SJoseph Koshy { 5423e6b475e0SMatt Macy struct pcpu *pc; 5424ebccf1e3SJoseph Koshy struct pmc_binding pb; 5425e829eb6dSJoseph Koshy struct pmc_classdep *pcd; 542601c35b67SMitchell Horne struct pmc_sample *ps; 5427f263522aSJoseph Koshy struct pmc_samplebuffer *sb; 542801c35b67SMitchell Horne int c, cpu, error, n, ri; 542901c35b67SMitchell Horne u_int maxcpu, domain; 5430ebccf1e3SJoseph Koshy 5431ebccf1e3SJoseph Koshy md = NULL; 5432ebccf1e3SJoseph Koshy error = 0; 5433ebccf1e3SJoseph Koshy 5434e6b475e0SMatt Macy pmc_stats.pm_intr_ignored = counter_u64_alloc(M_WAITOK); 5435e6b475e0SMatt Macy pmc_stats.pm_intr_processed = counter_u64_alloc(M_WAITOK); 5436e6b475e0SMatt Macy pmc_stats.pm_intr_bufferfull = counter_u64_alloc(M_WAITOK); 5437e6b475e0SMatt Macy pmc_stats.pm_syscalls = counter_u64_alloc(M_WAITOK); 5438e6b475e0SMatt Macy pmc_stats.pm_syscall_errors = counter_u64_alloc(M_WAITOK); 5439e6b475e0SMatt Macy pmc_stats.pm_buffer_requests = counter_u64_alloc(M_WAITOK); 5440e6b475e0SMatt Macy pmc_stats.pm_buffer_requests_failed = counter_u64_alloc(M_WAITOK); 5441e6b475e0SMatt Macy pmc_stats.pm_log_sweeps = counter_u64_alloc(M_WAITOK); 54425de96e33SMatt Macy pmc_stats.pm_merges = counter_u64_alloc(M_WAITOK); 54435de96e33SMatt Macy pmc_stats.pm_overwrites = counter_u64_alloc(M_WAITOK); 5444e6b475e0SMatt Macy 5445680f1afdSJohn Baldwin #ifdef HWPMC_DEBUG 5446ebccf1e3SJoseph Koshy /* parse debug flags first */ 5447ebccf1e3SJoseph Koshy if (TUNABLE_STR_FETCH(PMC_SYSCTL_NAME_PREFIX "debugflags", 544801c35b67SMitchell Horne pmc_debugstr, sizeof(pmc_debugstr))) { 544901c35b67SMitchell Horne pmc_debugflags_parse(pmc_debugstr, pmc_debugstr + 545001c35b67SMitchell Horne strlen(pmc_debugstr)); 545101c35b67SMitchell Horne } 5452ebccf1e3SJoseph Koshy #endif 5453ebccf1e3SJoseph Koshy 54544a3690dfSJohn Baldwin PMCDBG1(MOD,INI,0, "PMC Initialize (version %x)", PMC_VERSION); 5455ebccf1e3SJoseph Koshy 5456fadcc6e2SJoseph Koshy /* check kernel version */ 5457fadcc6e2SJoseph Koshy if (pmc_kernel_version != PMC_VERSION) { 5458fadcc6e2SJoseph Koshy if (pmc_kernel_version == 0) 5459fadcc6e2SJoseph Koshy printf("hwpmc: this kernel has not been compiled with " 5460fadcc6e2SJoseph Koshy "'options HWPMC_HOOKS'.\n"); 5461fadcc6e2SJoseph Koshy else 5462fadcc6e2SJoseph Koshy printf("hwpmc: kernel version (0x%x) does not match " 5463fadcc6e2SJoseph Koshy "module version (0x%x).\n", pmc_kernel_version, 5464fadcc6e2SJoseph Koshy PMC_VERSION); 546552ebac7fSMitchell Horne return (EPROGMISMATCH); 5466fadcc6e2SJoseph Koshy } 5467fadcc6e2SJoseph Koshy 5468ebccf1e3SJoseph Koshy /* 5469ebccf1e3SJoseph Koshy * check sysctl parameters 5470ebccf1e3SJoseph Koshy */ 5471ebccf1e3SJoseph Koshy if (pmc_hashsize <= 0) { 547201c35b67SMitchell Horne printf("hwpmc: tunable \"hashsize\"=%d must be " 5473d07f36b0SJoseph Koshy "greater than zero.\n", pmc_hashsize); 5474ebccf1e3SJoseph Koshy pmc_hashsize = PMC_HASH_SIZE; 5475ebccf1e3SJoseph Koshy } 5476ebccf1e3SJoseph Koshy 5477f263522aSJoseph Koshy if (pmc_nsamples <= 0 || pmc_nsamples > 65535) { 547801c35b67SMitchell Horne printf("hwpmc: tunable \"nsamples\"=%d out of " 5479d07f36b0SJoseph Koshy "range.\n", pmc_nsamples); 5480f263522aSJoseph Koshy pmc_nsamples = PMC_NSAMPLES; 5481f263522aSJoseph Koshy } 5482d9f1b8dbSMatt Macy pmc_sample_mask = pmc_nsamples - 1; 5483f263522aSJoseph Koshy 5484d07f36b0SJoseph Koshy if (pmc_callchaindepth <= 0 || 5485d07f36b0SJoseph Koshy pmc_callchaindepth > PMC_CALLCHAIN_DEPTH_MAX) { 548601c35b67SMitchell Horne printf("hwpmc: tunable \"callchaindepth\"=%d out of " 5487201b654eSEd Maste "range - using %d.\n", pmc_callchaindepth, 5488201b654eSEd Maste PMC_CALLCHAIN_DEPTH_MAX); 5489201b654eSEd Maste pmc_callchaindepth = PMC_CALLCHAIN_DEPTH_MAX; 5490d07f36b0SJoseph Koshy } 5491d07f36b0SJoseph Koshy 5492f263522aSJoseph Koshy md = pmc_md_initialize(); 5493f5f9340bSFabien Thomas if (md == NULL) { 5494f5f9340bSFabien Thomas /* Default to generic CPU. */ 5495f5f9340bSFabien Thomas md = pmc_generic_cpu_initialize(); 5496e829eb6dSJoseph Koshy if (md == NULL) 5497e829eb6dSJoseph Koshy return (ENOSYS); 5498f5f9340bSFabien Thomas } 5499e829eb6dSJoseph Koshy 5500fdfeaa66SAleksandr Rybalko /* 5501fdfeaa66SAleksandr Rybalko * Refresh classes base ri. Optional classes may come in different 5502fdfeaa66SAleksandr Rybalko * order. 5503fdfeaa66SAleksandr Rybalko */ 5504fdfeaa66SAleksandr Rybalko for (ri = c = 0; c < md->pmd_nclass; c++) { 5505fdfeaa66SAleksandr Rybalko pcd = &md->pmd_classdep[c]; 5506fdfeaa66SAleksandr Rybalko pcd->pcd_ri = ri; 5507fdfeaa66SAleksandr Rybalko ri += pcd->pcd_num; 5508fdfeaa66SAleksandr Rybalko } 5509fdfeaa66SAleksandr Rybalko 5510e829eb6dSJoseph Koshy KASSERT(md->pmd_nclass >= 1 && md->pmd_npmc >= 1, 5511e829eb6dSJoseph Koshy ("[pmc,%d] no classes or pmcs", __LINE__)); 5512e829eb6dSJoseph Koshy 5513e829eb6dSJoseph Koshy /* Compute the map from row-indices to classdep pointers. */ 5514e829eb6dSJoseph Koshy pmc_rowindex_to_classdep = malloc(sizeof(struct pmc_classdep *) * 5515e829eb6dSJoseph Koshy md->pmd_npmc, M_PMC, M_WAITOK | M_ZERO); 5516e829eb6dSJoseph Koshy 5517e829eb6dSJoseph Koshy for (n = 0; n < md->pmd_npmc; n++) 5518e829eb6dSJoseph Koshy pmc_rowindex_to_classdep[n] = NULL; 5519693cd307SMitchell Horne 5520e829eb6dSJoseph Koshy for (ri = c = 0; c < md->pmd_nclass; c++) { 5521e829eb6dSJoseph Koshy pcd = &md->pmd_classdep[c]; 5522e829eb6dSJoseph Koshy for (n = 0; n < pcd->pcd_num; n++, ri++) 5523e829eb6dSJoseph Koshy pmc_rowindex_to_classdep[ri] = pcd; 5524e829eb6dSJoseph Koshy } 5525e829eb6dSJoseph Koshy 5526e829eb6dSJoseph Koshy KASSERT(ri == md->pmd_npmc, 5527e829eb6dSJoseph Koshy ("[pmc,%d] npmc miscomputed: ri=%d, md->npmc=%d", __LINE__, 5528e829eb6dSJoseph Koshy ri, md->pmd_npmc)); 5529ebccf1e3SJoseph Koshy 5530122ccdc1SJoseph Koshy maxcpu = pmc_cpu_max(); 5531122ccdc1SJoseph Koshy 5532ebccf1e3SJoseph Koshy /* allocate space for the per-cpu array */ 5533e829eb6dSJoseph Koshy pmc_pcpu = malloc(maxcpu * sizeof(struct pmc_cpu *), M_PMC, 5534e829eb6dSJoseph Koshy M_WAITOK | M_ZERO); 5535ebccf1e3SJoseph Koshy 5536ebccf1e3SJoseph Koshy /* per-cpu 'saved values' for managing process-mode PMCs */ 5537e11e3f18SDag-Erling Smørgrav pmc_pcpu_saved = malloc(sizeof(pmc_value_t) * maxcpu * md->pmd_npmc, 5538e11e3f18SDag-Erling Smørgrav M_PMC, M_WAITOK); 5539ebccf1e3SJoseph Koshy 5540122ccdc1SJoseph Koshy /* Perform CPU-dependent initialization. */ 5541ebccf1e3SJoseph Koshy pmc_save_cpu_binding(&pb); 5542e829eb6dSJoseph Koshy error = 0; 5543e829eb6dSJoseph Koshy for (cpu = 0; error == 0 && cpu < maxcpu; cpu++) { 5544122ccdc1SJoseph Koshy if (!pmc_cpu_is_active(cpu)) 5545ebccf1e3SJoseph Koshy continue; 5546ebccf1e3SJoseph Koshy pmc_select_cpu(cpu); 5547e829eb6dSJoseph Koshy pmc_pcpu[cpu] = malloc(sizeof(struct pmc_cpu) + 5548e829eb6dSJoseph Koshy md->pmd_npmc * sizeof(struct pmc_hw *), M_PMC, 5549e829eb6dSJoseph Koshy M_WAITOK | M_ZERO); 5550e829eb6dSJoseph Koshy for (n = 0; error == 0 && n < md->pmd_nclass; n++) 5551fdfeaa66SAleksandr Rybalko if (md->pmd_classdep[n].pcd_num > 0) 5552fdfeaa66SAleksandr Rybalko error = md->pmd_classdep[n].pcd_pcpu_init(md, 5553fdfeaa66SAleksandr Rybalko cpu); 5554ebccf1e3SJoseph Koshy } 5555ebccf1e3SJoseph Koshy pmc_restore_cpu_binding(&pb); 5556ebccf1e3SJoseph Koshy 5557d5ee4074SMitchell Horne if (error != 0) 5558e829eb6dSJoseph Koshy return (error); 5559ebccf1e3SJoseph Koshy 5560f263522aSJoseph Koshy /* allocate space for the sample array */ 5561122ccdc1SJoseph Koshy for (cpu = 0; cpu < maxcpu; cpu++) { 5562122ccdc1SJoseph Koshy if (!pmc_cpu_is_active(cpu)) 5563f263522aSJoseph Koshy continue; 5564e6b475e0SMatt Macy pc = pcpu_find(cpu); 5565e6b475e0SMatt Macy domain = pc->pc_domain; 55669978bd99SMark Johnston sb = malloc_domainset(sizeof(struct pmc_samplebuffer) + 55679978bd99SMark Johnston pmc_nsamples * sizeof(struct pmc_sample), M_PMC, 55689978bd99SMark Johnston DOMAINSET_PREF(domain), M_WAITOK | M_ZERO); 5569e829eb6dSJoseph Koshy 5570f263522aSJoseph Koshy KASSERT(pmc_pcpu[cpu] != NULL, 5571f263522aSJoseph Koshy ("[pmc,%d] cpu=%d Null per-cpu data", __LINE__, cpu)); 5572f263522aSJoseph Koshy 55739978bd99SMark Johnston sb->ps_callchains = malloc_domainset(pmc_callchaindepth * 55749978bd99SMark Johnston pmc_nsamples * sizeof(uintptr_t), M_PMC, 55759978bd99SMark Johnston DOMAINSET_PREF(domain), M_WAITOK | M_ZERO); 5576d07f36b0SJoseph Koshy 5577d07f36b0SJoseph Koshy for (n = 0, ps = sb->ps_samples; n < pmc_nsamples; n++, ps++) 5578d07f36b0SJoseph Koshy ps->ps_pc = sb->ps_callchains + 5579d07f36b0SJoseph Koshy (n * pmc_callchaindepth); 5580d07f36b0SJoseph Koshy 5581f5f9340bSFabien Thomas pmc_pcpu[cpu]->pc_sb[PMC_HR] = sb; 5582f5f9340bSFabien Thomas 55839978bd99SMark Johnston sb = malloc_domainset(sizeof(struct pmc_samplebuffer) + 55849978bd99SMark Johnston pmc_nsamples * sizeof(struct pmc_sample), M_PMC, 55859978bd99SMark Johnston DOMAINSET_PREF(domain), M_WAITOK | M_ZERO); 5586f5f9340bSFabien Thomas 55879978bd99SMark Johnston sb->ps_callchains = malloc_domainset(pmc_callchaindepth * 55889978bd99SMark Johnston pmc_nsamples * sizeof(uintptr_t), M_PMC, 55899978bd99SMark Johnston DOMAINSET_PREF(domain), M_WAITOK | M_ZERO); 5590f5f9340bSFabien Thomas for (n = 0, ps = sb->ps_samples; n < pmc_nsamples; n++, ps++) 5591f5f9340bSFabien Thomas ps->ps_pc = sb->ps_callchains + 5592f5f9340bSFabien Thomas (n * pmc_callchaindepth); 5593f5f9340bSFabien Thomas 5594f5f9340bSFabien Thomas pmc_pcpu[cpu]->pc_sb[PMC_SR] = sb; 55955de96e33SMatt Macy 55969978bd99SMark Johnston sb = malloc_domainset(sizeof(struct pmc_samplebuffer) + 55979978bd99SMark Johnston pmc_nsamples * sizeof(struct pmc_sample), M_PMC, 55989978bd99SMark Johnston DOMAINSET_PREF(domain), M_WAITOK | M_ZERO); 55999978bd99SMark Johnston sb->ps_callchains = malloc_domainset(pmc_callchaindepth * 56009978bd99SMark Johnston pmc_nsamples * sizeof(uintptr_t), M_PMC, 56019978bd99SMark Johnston DOMAINSET_PREF(domain), M_WAITOK | M_ZERO); 56025de96e33SMatt Macy for (n = 0, ps = sb->ps_samples; n < pmc_nsamples; n++, ps++) 56039978bd99SMark Johnston ps->ps_pc = sb->ps_callchains + n * pmc_callchaindepth; 56045de96e33SMatt Macy 56055de96e33SMatt Macy pmc_pcpu[cpu]->pc_sb[PMC_UR] = sb; 5606f263522aSJoseph Koshy } 5607f263522aSJoseph Koshy 5608ebccf1e3SJoseph Koshy /* allocate space for the row disposition array */ 5609ebccf1e3SJoseph Koshy pmc_pmcdisp = malloc(sizeof(enum pmc_mode) * md->pmd_npmc, 5610ebccf1e3SJoseph Koshy M_PMC, M_WAITOK | M_ZERO); 5611ebccf1e3SJoseph Koshy 5612ebccf1e3SJoseph Koshy /* mark all PMCs as available */ 561301c35b67SMitchell Horne for (n = 0; n < md->pmd_npmc; n++) 5614ebccf1e3SJoseph Koshy PMC_MARK_ROW_FREE(n); 5615ebccf1e3SJoseph Koshy 5616ebccf1e3SJoseph Koshy /* allocate thread hash tables */ 5617ebccf1e3SJoseph Koshy pmc_ownerhash = hashinit(pmc_hashsize, M_PMC, 5618ebccf1e3SJoseph Koshy &pmc_ownerhashmask); 5619ebccf1e3SJoseph Koshy 5620ebccf1e3SJoseph Koshy pmc_processhash = hashinit(pmc_hashsize, M_PMC, 5621ebccf1e3SJoseph Koshy &pmc_processhashmask); 5622382d30cdSJoseph Koshy mtx_init(&pmc_processhash_mtx, "pmc-process-hash", "pmc-leaf", 5623382d30cdSJoseph Koshy MTX_SPIN); 5624ebccf1e3SJoseph Koshy 56250f8d79d9SMatt Macy CK_LIST_INIT(&pmc_ss_owners); 5626f263522aSJoseph Koshy pmc_ss_count = 0; 5627f263522aSJoseph Koshy 5628ebccf1e3SJoseph Koshy /* allocate a pool of spin mutexes */ 5629382d30cdSJoseph Koshy pmc_mtxpool = mtx_pool_create("pmc-leaf", pmc_mtxpool_size, 5630382d30cdSJoseph Koshy MTX_SPIN); 5631ebccf1e3SJoseph Koshy 56324a3690dfSJohn Baldwin PMCDBG4(MOD,INI,1, "pmc_ownerhash=%p, mask=0x%lx " 5633ebccf1e3SJoseph Koshy "targethash=%p mask=0x%lx", pmc_ownerhash, pmc_ownerhashmask, 5634ebccf1e3SJoseph Koshy pmc_processhash, pmc_processhashmask); 5635ebccf1e3SJoseph Koshy 56366161b98cSMatt Macy /* Initialize a spin mutex for the thread free list. */ 56376161b98cSMatt Macy mtx_init(&pmc_threadfreelist_mtx, "pmc-threadfreelist", "pmc-leaf", 56386161b98cSMatt Macy MTX_SPIN); 56396161b98cSMatt Macy 56409b1d850bSMark Johnston /* Initialize the task to prune the thread free list. */ 56419b1d850bSMark Johnston TASK_INIT(&free_task, 0, pmc_thread_descriptor_pool_free_task, NULL); 56426161b98cSMatt Macy 5643ebccf1e3SJoseph Koshy /* register process {exit,fork,exec} handlers */ 5644ebccf1e3SJoseph Koshy pmc_exit_tag = EVENTHANDLER_REGISTER(process_exit, 5645ebccf1e3SJoseph Koshy pmc_process_exit, NULL, EVENTHANDLER_PRI_ANY); 5646ebccf1e3SJoseph Koshy pmc_fork_tag = EVENTHANDLER_REGISTER(process_fork, 5647ebccf1e3SJoseph Koshy pmc_process_fork, NULL, EVENTHANDLER_PRI_ANY); 5648ebccf1e3SJoseph Koshy 564929f4e216SMark Johnston /* register kld event handlers */ 565029f4e216SMark Johnston pmc_kld_load_tag = EVENTHANDLER_REGISTER(kld_load, pmc_kld_load, 565129f4e216SMark Johnston NULL, EVENTHANDLER_PRI_ANY); 565229f4e216SMark Johnston pmc_kld_unload_tag = EVENTHANDLER_REGISTER(kld_unload, pmc_kld_unload, 565329f4e216SMark Johnston NULL, EVENTHANDLER_PRI_ANY); 565429f4e216SMark Johnston 5655f263522aSJoseph Koshy /* initialize logging */ 5656f263522aSJoseph Koshy pmclog_initialize(); 5657f263522aSJoseph Koshy 5658ebccf1e3SJoseph Koshy /* set hook functions */ 5659ebccf1e3SJoseph Koshy pmc_intr = md->pmd_intr; 56600f00315cSMatt Macy wmb(); 5661ebccf1e3SJoseph Koshy pmc_hook = pmc_hook_handler; 5662ebccf1e3SJoseph Koshy 5663ebccf1e3SJoseph Koshy if (error == 0) { 5664ebccf1e3SJoseph Koshy printf(PMC_MODULE_NAME ":"); 566501c35b67SMitchell Horne for (n = 0; n < md->pmd_nclass; n++) { 5666fdfeaa66SAleksandr Rybalko if (md->pmd_classdep[n].pcd_num == 0) 5667fdfeaa66SAleksandr Rybalko continue; 5668e829eb6dSJoseph Koshy pcd = &md->pmd_classdep[n]; 56697dada264SJoseph Koshy printf(" %s/%d/%d/0x%b", 56700ceb54c2SJohn Baldwin pmc_name_of_pmcclass(pcd->pcd_class), 5671e829eb6dSJoseph Koshy pcd->pcd_num, 56727dada264SJoseph Koshy pcd->pcd_width, 5673e829eb6dSJoseph Koshy pcd->pcd_caps, 5674a8eb16c5SJoseph Koshy "\20" 5675a8eb16c5SJoseph Koshy "\1INT\2USR\3SYS\4EDG\5THR" 5676a8eb16c5SJoseph Koshy "\6REA\7WRI\10INV\11QUA\12PRC" 5677a8eb16c5SJoseph Koshy "\13TAG\14CSC"); 5678a8eb16c5SJoseph Koshy } 5679ebccf1e3SJoseph Koshy printf("\n"); 5680ebccf1e3SJoseph Koshy } 5681ebccf1e3SJoseph Koshy 5682e829eb6dSJoseph Koshy return (error); 5683ebccf1e3SJoseph Koshy } 5684ebccf1e3SJoseph Koshy 5685ebccf1e3SJoseph Koshy /* prepare to be unloaded */ 5686ebccf1e3SJoseph Koshy static void 5687ebccf1e3SJoseph Koshy pmc_cleanup(void) 5688ebccf1e3SJoseph Koshy { 5689ebccf1e3SJoseph Koshy struct pmc_binding pb; 569001c35b67SMitchell Horne struct pmc_owner *po, *tmp; 569101c35b67SMitchell Horne struct pmc_ownerhash *ph; 569201c35b67SMitchell Horne struct pmc_processhash *prh __pmcdbg_used; 569301c35b67SMitchell Horne u_int maxcpu; 569401c35b67SMitchell Horne int cpu, c; 5695ebccf1e3SJoseph Koshy 56964a3690dfSJohn Baldwin PMCDBG0(MOD,INI,0, "cleanup"); 5697ebccf1e3SJoseph Koshy 5698f263522aSJoseph Koshy /* switch off sampling */ 5699e6b475e0SMatt Macy CPU_FOREACH(cpu) 5700e6b475e0SMatt Macy DPCPU_ID_SET(cpu, pmc_sampled, 0); 5701f263522aSJoseph Koshy pmc_intr = NULL; 5702ebccf1e3SJoseph Koshy 5703ebccf1e3SJoseph Koshy sx_xlock(&pmc_sx); 5704ebccf1e3SJoseph Koshy if (pmc_hook == NULL) { /* being unloaded already */ 5705ebccf1e3SJoseph Koshy sx_xunlock(&pmc_sx); 5706ebccf1e3SJoseph Koshy return; 5707ebccf1e3SJoseph Koshy } 5708ebccf1e3SJoseph Koshy 5709ebccf1e3SJoseph Koshy pmc_hook = NULL; /* prevent new threads from entering module */ 5710ebccf1e3SJoseph Koshy 5711ebccf1e3SJoseph Koshy /* deregister event handlers */ 5712ebccf1e3SJoseph Koshy EVENTHANDLER_DEREGISTER(process_fork, pmc_fork_tag); 5713ebccf1e3SJoseph Koshy EVENTHANDLER_DEREGISTER(process_exit, pmc_exit_tag); 571429f4e216SMark Johnston EVENTHANDLER_DEREGISTER(kld_load, pmc_kld_load_tag); 571529f4e216SMark Johnston EVENTHANDLER_DEREGISTER(kld_unload, pmc_kld_unload_tag); 5716ebccf1e3SJoseph Koshy 5717ebccf1e3SJoseph Koshy /* send SIGBUS to all owner threads, free up allocations */ 5718d5ee4074SMitchell Horne if (pmc_ownerhash != NULL) { 5719ebccf1e3SJoseph Koshy for (ph = pmc_ownerhash; 5720ebccf1e3SJoseph Koshy ph <= &pmc_ownerhash[pmc_ownerhashmask]; 5721ebccf1e3SJoseph Koshy ph++) { 5722ebccf1e3SJoseph Koshy LIST_FOREACH_SAFE(po, ph, po_next, tmp) { 5723ebccf1e3SJoseph Koshy pmc_remove_owner(po); 5724ebccf1e3SJoseph Koshy 572501c35b67SMitchell Horne PMCDBG3(MOD,INI,2, 572601c35b67SMitchell Horne "cleanup signal proc=%p (%d, %s)", 572701c35b67SMitchell Horne po->po_owner, po->po_owner->p_pid, 5728ebccf1e3SJoseph Koshy po->po_owner->p_comm); 5729ebccf1e3SJoseph Koshy 5730ebccf1e3SJoseph Koshy PROC_LOCK(po->po_owner); 57318451d0ddSKip Macy kern_psignal(po->po_owner, SIGBUS); 5732ebccf1e3SJoseph Koshy PROC_UNLOCK(po->po_owner); 5733f263522aSJoseph Koshy 5734f263522aSJoseph Koshy pmc_destroy_owner_descriptor(po); 5735ebccf1e3SJoseph Koshy } 5736ebccf1e3SJoseph Koshy } 5737d5ee4074SMitchell Horne } 5738ebccf1e3SJoseph Koshy 5739ebccf1e3SJoseph Koshy /* reclaim allocated data structures */ 57409b1d850bSMark Johnston taskqueue_drain(taskqueue_fast, &free_task); 57416161b98cSMatt Macy mtx_destroy(&pmc_threadfreelist_mtx); 57426161b98cSMatt Macy pmc_thread_descriptor_pool_drain(); 57436161b98cSMatt Macy 5744d5ee4074SMitchell Horne if (pmc_mtxpool != NULL) 5745ebccf1e3SJoseph Koshy mtx_pool_destroy(&pmc_mtxpool); 5746ebccf1e3SJoseph Koshy 5747ebccf1e3SJoseph Koshy mtx_destroy(&pmc_processhash_mtx); 5748d5ee4074SMitchell Horne if (pmc_processhash != NULL) { 5749680f1afdSJohn Baldwin #ifdef HWPMC_DEBUG 5750ebccf1e3SJoseph Koshy struct pmc_process *pp; 5751ebccf1e3SJoseph Koshy 57524a3690dfSJohn Baldwin PMCDBG0(MOD,INI,3, "destroy process hash"); 5753ebccf1e3SJoseph Koshy for (prh = pmc_processhash; 5754ebccf1e3SJoseph Koshy prh <= &pmc_processhash[pmc_processhashmask]; 5755ebccf1e3SJoseph Koshy prh++) 5756ebccf1e3SJoseph Koshy LIST_FOREACH(pp, prh, pp_next) 57574a3690dfSJohn Baldwin PMCDBG1(MOD,INI,3, "pid=%d", pp->pp_proc->p_pid); 5758ebccf1e3SJoseph Koshy #endif 5759ebccf1e3SJoseph Koshy 5760ebccf1e3SJoseph Koshy hashdestroy(pmc_processhash, M_PMC, pmc_processhashmask); 5761ebccf1e3SJoseph Koshy pmc_processhash = NULL; 5762ebccf1e3SJoseph Koshy } 5763ebccf1e3SJoseph Koshy 5764d5ee4074SMitchell Horne if (pmc_ownerhash != NULL) { 57654a3690dfSJohn Baldwin PMCDBG0(MOD,INI,3, "destroy owner hash"); 5766ebccf1e3SJoseph Koshy hashdestroy(pmc_ownerhash, M_PMC, pmc_ownerhashmask); 5767ebccf1e3SJoseph Koshy pmc_ownerhash = NULL; 5768ebccf1e3SJoseph Koshy } 5769ebccf1e3SJoseph Koshy 57700f8d79d9SMatt Macy KASSERT(CK_LIST_EMPTY(&pmc_ss_owners), 5771f263522aSJoseph Koshy ("[pmc,%d] Global SS owner list not empty", __LINE__)); 5772f263522aSJoseph Koshy KASSERT(pmc_ss_count == 0, 5773f263522aSJoseph Koshy ("[pmc,%d] Global SS count not empty", __LINE__)); 5774f263522aSJoseph Koshy 5775e829eb6dSJoseph Koshy /* do processor and pmc-class dependent cleanup */ 5776122ccdc1SJoseph Koshy maxcpu = pmc_cpu_max(); 5777ba8ae2deSJoseph Koshy 57784a3690dfSJohn Baldwin PMCDBG0(MOD,INI,3, "md cleanup"); 5779ebccf1e3SJoseph Koshy if (md) { 5780ebccf1e3SJoseph Koshy pmc_save_cpu_binding(&pb); 5781122ccdc1SJoseph Koshy for (cpu = 0; cpu < maxcpu; cpu++) { 57824a3690dfSJohn Baldwin PMCDBG2(MOD,INI,1,"pmc-cleanup cpu=%d pcs=%p", 5783ebccf1e3SJoseph Koshy cpu, pmc_pcpu[cpu]); 5784122ccdc1SJoseph Koshy if (!pmc_cpu_is_active(cpu) || pmc_pcpu[cpu] == NULL) 5785ebccf1e3SJoseph Koshy continue; 5786693cd307SMitchell Horne 5787ebccf1e3SJoseph Koshy pmc_select_cpu(cpu); 5788d5ee4074SMitchell Horne for (c = 0; c < md->pmd_nclass; c++) { 5789d5ee4074SMitchell Horne if (md->pmd_classdep[c].pcd_num > 0) { 5790fdfeaa66SAleksandr Rybalko md->pmd_classdep[c].pcd_pcpu_fini(md, 5791fdfeaa66SAleksandr Rybalko cpu); 5792ebccf1e3SJoseph Koshy } 5793d5ee4074SMitchell Horne } 5794d5ee4074SMitchell Horne } 5795bc4f0adeSJoseph Koshy 5796f5f9340bSFabien Thomas if (md->pmd_cputype == PMC_CPU_GENERIC) 5797f5f9340bSFabien Thomas pmc_generic_cpu_finalize(md); 5798f5f9340bSFabien Thomas else 5799bc4f0adeSJoseph Koshy pmc_md_finalize(md); 5800bc4f0adeSJoseph Koshy 5801f5f9340bSFabien Thomas pmc_mdep_free(md); 5802ebccf1e3SJoseph Koshy md = NULL; 5803ebccf1e3SJoseph Koshy pmc_restore_cpu_binding(&pb); 5804ebccf1e3SJoseph Koshy } 5805ebccf1e3SJoseph Koshy 5806e829eb6dSJoseph Koshy /* Free per-cpu descriptors. */ 5807e829eb6dSJoseph Koshy for (cpu = 0; cpu < maxcpu; cpu++) { 5808e829eb6dSJoseph Koshy if (!pmc_cpu_is_active(cpu)) 5809e829eb6dSJoseph Koshy continue; 5810f5f9340bSFabien Thomas KASSERT(pmc_pcpu[cpu]->pc_sb[PMC_HR] != NULL, 5811f5f9340bSFabien Thomas ("[pmc,%d] Null hw cpu sample buffer cpu=%d", __LINE__, 5812e829eb6dSJoseph Koshy cpu)); 5813f5f9340bSFabien Thomas KASSERT(pmc_pcpu[cpu]->pc_sb[PMC_SR] != NULL, 5814f5f9340bSFabien Thomas ("[pmc,%d] Null sw cpu sample buffer cpu=%d", __LINE__, 5815f5f9340bSFabien Thomas cpu)); 58165de96e33SMatt Macy KASSERT(pmc_pcpu[cpu]->pc_sb[PMC_UR] != NULL, 58175de96e33SMatt Macy ("[pmc,%d] Null userret cpu sample buffer cpu=%d", __LINE__, 58185de96e33SMatt Macy cpu)); 581996ad26eeSMark Johnston free(pmc_pcpu[cpu]->pc_sb[PMC_HR]->ps_callchains, M_PMC); 582096ad26eeSMark Johnston free(pmc_pcpu[cpu]->pc_sb[PMC_HR], M_PMC); 582196ad26eeSMark Johnston free(pmc_pcpu[cpu]->pc_sb[PMC_SR]->ps_callchains, M_PMC); 582296ad26eeSMark Johnston free(pmc_pcpu[cpu]->pc_sb[PMC_SR], M_PMC); 582396ad26eeSMark Johnston free(pmc_pcpu[cpu]->pc_sb[PMC_UR]->ps_callchains, M_PMC); 582496ad26eeSMark Johnston free(pmc_pcpu[cpu]->pc_sb[PMC_UR], M_PMC); 582596ad26eeSMark Johnston free(pmc_pcpu[cpu], M_PMC); 5826e829eb6dSJoseph Koshy } 5827e829eb6dSJoseph Koshy 58281ede983cSDag-Erling Smørgrav free(pmc_pcpu, M_PMC); 5829ebccf1e3SJoseph Koshy pmc_pcpu = NULL; 5830ebccf1e3SJoseph Koshy 58311ede983cSDag-Erling Smørgrav free(pmc_pcpu_saved, M_PMC); 5832ebccf1e3SJoseph Koshy pmc_pcpu_saved = NULL; 5833ebccf1e3SJoseph Koshy 5834d5ee4074SMitchell Horne if (pmc_pmcdisp != NULL) { 58351ede983cSDag-Erling Smørgrav free(pmc_pmcdisp, M_PMC); 5836ebccf1e3SJoseph Koshy pmc_pmcdisp = NULL; 5837ebccf1e3SJoseph Koshy } 5838ebccf1e3SJoseph Koshy 5839d5ee4074SMitchell Horne if (pmc_rowindex_to_classdep != NULL) { 5840e829eb6dSJoseph Koshy free(pmc_rowindex_to_classdep, M_PMC); 5841e829eb6dSJoseph Koshy pmc_rowindex_to_classdep = NULL; 5842e829eb6dSJoseph Koshy } 5843e829eb6dSJoseph Koshy 5844f263522aSJoseph Koshy pmclog_shutdown(); 5845e6b475e0SMatt Macy counter_u64_free(pmc_stats.pm_intr_ignored); 5846e6b475e0SMatt Macy counter_u64_free(pmc_stats.pm_intr_processed); 5847e6b475e0SMatt Macy counter_u64_free(pmc_stats.pm_intr_bufferfull); 5848e6b475e0SMatt Macy counter_u64_free(pmc_stats.pm_syscalls); 5849e6b475e0SMatt Macy counter_u64_free(pmc_stats.pm_syscall_errors); 5850e6b475e0SMatt Macy counter_u64_free(pmc_stats.pm_buffer_requests); 5851e6b475e0SMatt Macy counter_u64_free(pmc_stats.pm_buffer_requests_failed); 5852e6b475e0SMatt Macy counter_u64_free(pmc_stats.pm_log_sweeps); 58535de96e33SMatt Macy counter_u64_free(pmc_stats.pm_merges); 58545de96e33SMatt Macy counter_u64_free(pmc_stats.pm_overwrites); 5855ebccf1e3SJoseph Koshy sx_xunlock(&pmc_sx); /* we are done */ 5856ebccf1e3SJoseph Koshy } 5857ebccf1e3SJoseph Koshy 5858ebccf1e3SJoseph Koshy /* 5859ebccf1e3SJoseph Koshy * The function called at load/unload. 5860ebccf1e3SJoseph Koshy */ 5861ebccf1e3SJoseph Koshy static int 5862ebccf1e3SJoseph Koshy load(struct module *module __unused, int cmd, void *arg __unused) 5863ebccf1e3SJoseph Koshy { 5864ebccf1e3SJoseph Koshy int error; 5865ebccf1e3SJoseph Koshy 5866ebccf1e3SJoseph Koshy error = 0; 5867ebccf1e3SJoseph Koshy 5868ebccf1e3SJoseph Koshy switch (cmd) { 5869ebccf1e3SJoseph Koshy case MOD_LOAD: 5870ebccf1e3SJoseph Koshy /* initialize the subsystem */ 5871ebccf1e3SJoseph Koshy error = pmc_initialize(); 5872ebccf1e3SJoseph Koshy if (error != 0) 5873ebccf1e3SJoseph Koshy break; 5874693cd307SMitchell Horne PMCDBG2(MOD,INI,1, "syscall=%d maxcpu=%d", pmc_syscall_num, 5875693cd307SMitchell Horne pmc_cpu_max()); 5876ebccf1e3SJoseph Koshy break; 5877ebccf1e3SJoseph Koshy case MOD_UNLOAD: 5878ebccf1e3SJoseph Koshy case MOD_SHUTDOWN: 5879ebccf1e3SJoseph Koshy pmc_cleanup(); 58804a3690dfSJohn Baldwin PMCDBG0(MOD,INI,1, "unloaded"); 5881ebccf1e3SJoseph Koshy break; 5882ebccf1e3SJoseph Koshy default: 5883693cd307SMitchell Horne error = EINVAL; 5884ebccf1e3SJoseph Koshy break; 5885ebccf1e3SJoseph Koshy } 5886ebccf1e3SJoseph Koshy 588752ebac7fSMitchell Horne return (error); 5888ebccf1e3SJoseph Koshy } 5889