0409ad53fa
time, especially for SMP. If configured, it turns itself on at boot time for calibration, so is fragile even if never otherwise used. Both types of kernel profiling were supposed to use a global spinlock in the SMP case. If hi-res profiling is configured (but not necessarily used), this was supposed to be optimized by only using it when necessary, and slightly more efficiently, in asm. But it was not done at all for mcount entry where it is necessary. This caused crashes in the SMP case when either type of profiling was enabled. For mcount exit, it only caused wrong times. The times were wrongest with an i8254 timer since using that requires exclusive access to the hardware. The i8254 timer was too slow to use here 20 years ago and is much less usable now, but it is the default for the SMP case since TSCs weren't invariant when SMP was new. Do the locking in all hi-res SMP cases for simplicity. Calibration uses special asms, and the clobber lists in these were sort of inverted. They contained the arg and return registers which are not clobbered, but on amd64 they didn't contain the residue of the call-used registers which may be clobbered (%r10 and %r11). This usually caused hangs at boot time. This usually affected even the UP case.
200 lines
5.7 KiB
C
200 lines
5.7 KiB
C
/*-
|
|
* SPDX-License-Identifier: BSD-3-Clause
|
|
*
|
|
* Copyright (c) 1992, 1993
|
|
* The Regents of the University of California. All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions
|
|
* are met:
|
|
* 1. Redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer.
|
|
* 2. Redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution.
|
|
* 3. Neither the name of the University nor the names of its contributors
|
|
* may be used to endorse or promote products derived from this software
|
|
* without specific prior written permission.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
|
|
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
* ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
|
|
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
|
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
|
|
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
|
|
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
|
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
|
|
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
|
|
* SUCH DAMAGE.
|
|
*
|
|
* @(#)profile.h 8.1 (Berkeley) 6/11/93
|
|
* $FreeBSD$
|
|
*/
|
|
|
|
#ifndef _MACHINE_PROFILE_H_
|
|
#define _MACHINE_PROFILE_H_
|
|
|
|
#ifndef _SYS_CDEFS_H_
|
|
#error this file needs sys/cdefs.h as a prerequisite
|
|
#endif
|
|
|
|
#ifdef _KERNEL
|
|
|
|
/*
|
|
* Config generates something to tell the compiler to align functions on 16
|
|
* byte boundaries. A strict alignment is good for keeping the tables small.
|
|
*/
|
|
#define FUNCTION_ALIGNMENT 16
|
|
|
|
/*
|
|
* The kernel uses assembler stubs instead of unportable inlines.
|
|
* This is mainly to save a little time when profiling is not enabled,
|
|
* which is the usual case for the kernel.
|
|
*/
|
|
#define _MCOUNT_DECL void mcount
|
|
#define MCOUNT
|
|
|
|
#ifdef GUPROF
|
|
#define MCOUNT_DECL(s)
|
|
#define MCOUNT_ENTER(s)
|
|
#define MCOUNT_EXIT(s)
|
|
#ifdef __GNUCLIKE_ASM
|
|
#define MCOUNT_OVERHEAD(label) \
|
|
__asm __volatile("pushq %0; call __mcount; popq %%rcx" \
|
|
: \
|
|
: "i" (label) \
|
|
: "cx", "r10", "r11", "memory")
|
|
#define MEXITCOUNT_OVERHEAD() \
|
|
__asm __volatile("call .mexitcount; 1:" \
|
|
: : \
|
|
: "r10", "r11", "memory")
|
|
#define MEXITCOUNT_OVERHEAD_GETLABEL(labelp) \
|
|
__asm __volatile("movq $1b,%0" : "=rm" (labelp))
|
|
#else
|
|
#error this file needs to be ported to your compiler
|
|
#endif /* !__GNUCLIKE_ASM */
|
|
#else /* !GUPROF */
|
|
#define MCOUNT_DECL(s) register_t s;
|
|
#ifdef SMP
|
|
extern int mcount_lock;
|
|
#define MCOUNT_ENTER(s) { s = intr_disable(); \
|
|
while (!atomic_cmpset_acq_int(&mcount_lock, 0, 1)) \
|
|
/* nothing */ ; }
|
|
#define MCOUNT_EXIT(s) { atomic_store_rel_int(&mcount_lock, 0); \
|
|
intr_restore(s); }
|
|
#else
|
|
#define MCOUNT_ENTER(s) { s = intr_disable(); }
|
|
#define MCOUNT_EXIT(s) (intr_restore(s))
|
|
#endif
|
|
#endif /* GUPROF */
|
|
|
|
void bintr(void);
|
|
void btrap(void);
|
|
void eintr(void);
|
|
void user(void);
|
|
|
|
#define MCOUNT_FROMPC_USER(pc) \
|
|
((pc < (uintfptr_t)VM_MAXUSER_ADDRESS) ? (uintfptr_t)user : pc)
|
|
|
|
#define MCOUNT_FROMPC_INTR(pc) \
|
|
((pc >= (uintfptr_t)btrap && pc < (uintfptr_t)eintr) ? \
|
|
((pc >= (uintfptr_t)bintr) ? (uintfptr_t)bintr : \
|
|
(uintfptr_t)btrap) : ~0UL)
|
|
|
|
#else /* !_KERNEL */
|
|
|
|
#define FUNCTION_ALIGNMENT 4
|
|
|
|
#define _MCOUNT_DECL \
|
|
static void _mcount(uintfptr_t frompc, uintfptr_t selfpc) __used; \
|
|
static void _mcount
|
|
|
|
#ifdef __GNUCLIKE_ASM
|
|
#define MCOUNT __asm(" \n\
|
|
.text \n\
|
|
.p2align 4,0x90 \n\
|
|
.globl .mcount \n\
|
|
.type .mcount,@function \n\
|
|
.mcount: \n\
|
|
pushq %rdi \n\
|
|
pushq %rsi \n\
|
|
pushq %rdx \n\
|
|
pushq %rcx \n\
|
|
pushq %r8 \n\
|
|
pushq %r9 \n\
|
|
pushq %rax \n\
|
|
movq 8(%rbp),%rdi \n\
|
|
movq 7*8(%rsp),%rsi \n\
|
|
call _mcount \n\
|
|
popq %rax \n\
|
|
popq %r9 \n\
|
|
popq %r8 \n\
|
|
popq %rcx \n\
|
|
popq %rdx \n\
|
|
popq %rsi \n\
|
|
popq %rdi \n\
|
|
ret \n\
|
|
.size .mcount, . - .mcount");
|
|
#if 0
|
|
/*
|
|
* We could use this, except it doesn't preserve the registers that were
|
|
* being passed with arguments to the function that we were inserted
|
|
* into. I've left it here as documentation of what the code above is
|
|
* supposed to do.
|
|
*/
|
|
#define MCOUNT \
|
|
void \
|
|
mcount() \
|
|
{ \
|
|
uintfptr_t selfpc, frompc; \
|
|
/* \
|
|
* Find the return address for mcount, \
|
|
* and the return address for mcount's caller. \
|
|
* \
|
|
* selfpc = pc pushed by call to mcount \
|
|
*/ \
|
|
__asm("movq 8(%%rbp),%0" : "=r" (selfpc)); \
|
|
/* \
|
|
* frompc = pc pushed by call to mcount's caller. \
|
|
* The caller's stack frame has already been built, so %rbp is \
|
|
* the caller's frame pointer. The caller's raddr is in the \
|
|
* caller's frame following the caller's caller's frame pointer.\
|
|
*/ \
|
|
__asm("movq (%%rbp),%0" : "=r" (frompc)); \
|
|
frompc = ((uintfptr_t *)frompc)[1]; \
|
|
_mcount(frompc, selfpc); \
|
|
}
|
|
#endif
|
|
#else /* !__GNUCLIKE_ASM */
|
|
#define MCOUNT
|
|
#endif /* __GNUCLIKE_ASM */
|
|
|
|
typedef u_long uintfptr_t;
|
|
|
|
#endif /* _KERNEL */
|
|
|
|
/*
|
|
* An unsigned integral type that can hold non-negative difference between
|
|
* function pointers.
|
|
*/
|
|
typedef u_long fptrdiff_t;
|
|
|
|
#ifdef _KERNEL
|
|
|
|
void mcount(uintfptr_t frompc, uintfptr_t selfpc);
|
|
|
|
#else /* !_KERNEL */
|
|
|
|
#include <sys/cdefs.h>
|
|
|
|
__BEGIN_DECLS
|
|
#ifdef __GNUCLIKE_ASM
|
|
void mcount(void) __asm(".mcount");
|
|
#endif
|
|
__END_DECLS
|
|
|
|
#endif /* _KERNEL */
|
|
|
|
#endif /* !_MACHINE_PROFILE_H_ */
|