mirror of
https://github.com/apache/nuttx.git
synced 2026-05-27 19:36:35 +08:00
libc/perf: userspace PMU access
Add the ARCH_HAVE_PERF_EVENTS_USER_ACCESS capability so that applications can read the hardware perf counters directly from userspace via perf_gettime(), enabling performance monitoring and profiling without syscalls.
Signed-off-by: Yanfeng Liu <p-liuyanfeng9@xiaomi.com>
This commit is contained in:
@@ -605,6 +605,13 @@ config ARCH_HAVE_PERF_EVENTS
|
|||||||
---help---
|
---help---
|
||||||
The architecture supports hardware performance counting.
|
The architecture supports hardware performance counting.
|
||||||
|
|
||||||
|
config ARCH_HAVE_PERF_EVENTS_USER_ACCESS
|
||||||
|
bool
|
||||||
|
default n
|
||||||
|
select ARCH_HAVE_PERF_EVENTS
|
||||||
|
---help---
|
||||||
|
Select if hardware allows userspace perf counter access.
|
||||||
|
|
||||||
config ARCH_PERF_EVENTS
|
config ARCH_PERF_EVENTS
|
||||||
bool "Configure hardware performance counting"
|
bool "Configure hardware performance counting"
|
||||||
default y if SCHED_CRITMONITOR || SCHED_IRQMONITOR || RPMSG_PING || SEGGER_SYSVIEW
|
default y if SCHED_CRITMONITOR || SCHED_IRQMONITOR || RPMSG_PING || SEGGER_SYSVIEW
|
||||||
|
|||||||
@@ -43,4 +43,8 @@ if(NOT CONFIG_BUILD_KERNEL)
|
|||||||
list(APPEND SRCS task_startup.c)
|
list(APPEND SRCS task_startup.c)
|
||||||
endif()
|
endif()
|
||||||
|
|
||||||
|
if(CONFIG_ARCH_HAVE_PERF_EVENTS_USER_ACCESS)
|
||||||
|
list(APPEND SRCS clock_perf.c)
|
||||||
|
endif()
|
||||||
|
|
||||||
target_sources(c PRIVATE ${SRCS})
|
target_sources(c PRIVATE ${SRCS})
|
||||||
|
|||||||
@@ -39,6 +39,10 @@ ifneq ($(CONFIG_BUILD_KERNEL),y)
|
|||||||
CSRCS += task_startup.c
|
CSRCS += task_startup.c
|
||||||
endif # CONFIG_BUILD_KERNEL
|
endif # CONFIG_BUILD_KERNEL
|
||||||
|
|
||||||
|
ifeq ($(CONFIG_ARCH_HAVE_PERF_EVENTS_USER_ACCESS),y)
|
||||||
|
CSRCS += clock_perf.c
|
||||||
|
endif
|
||||||
|
|
||||||
# Add the sched directory to the build
|
# Add the sched directory to the build
|
||||||
|
|
||||||
DEPPATH += --dep-path sched
|
DEPPATH += --dep-path sched
|
||||||
|
|||||||
@@ -0,0 +1,91 @@
|
|||||||
|
/****************************************************************************
|
||||||
|
* libs/libc/sched/clock_perf.c
|
||||||
|
*
|
||||||
|
* SPDX-License-Identifier: Apache-2.0
|
||||||
|
*
|
||||||
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
||||||
|
* contributor license agreements. See the NOTICE file distributed with
|
||||||
|
* this work for additional information regarding copyright ownership. The
|
||||||
|
* ASF licenses this file to you under the Apache License, Version 2.0 (the
|
||||||
|
* "License"); you may not use this file except in compliance with the
|
||||||
|
* License. You may obtain a copy of the License at
|
||||||
|
*
|
||||||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
*
|
||||||
|
* Unless required by applicable law or agreed to in writing, software
|
||||||
|
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
|
||||||
|
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
|
||||||
|
* License for the specific language governing permissions and limitations
|
||||||
|
* under the License.
|
||||||
|
*
|
||||||
|
****************************************************************************/
|
||||||
|
|
||||||
|
/****************************************************************************
|
||||||
|
* Included Files
|
||||||
|
****************************************************************************/
|
||||||
|
|
||||||
|
#include <stdint.h>
|
||||||
|
|
||||||
|
#include <nuttx/arch.h>
|
||||||
|
#include <nuttx/bits.h>
|
||||||
|
#include <nuttx/clock.h>
|
||||||
|
|
||||||
|
#if defined(CONFIG_PERF_OVERFLOW_CORRECTION) && ULONG_MAX != UINT64_MAX
|
||||||
|
|
||||||
|
/****************************************************************************
|
||||||
|
* Preprocessors
|
||||||
|
****************************************************************************/
|
||||||
|
|
||||||
|
/* Masks for the two 32-bit halves of the packed 64-bit perf state.
 * GENMASK_ULL() is provided by <nuttx/bits.h>; it is presumably the usual
 * "bits h..l set" helper (TODO confirm against that header).
 */

#define MASK_LO           GENMASK_ULL(31, 0)
#define MASK_HI           GENMASK_ULL(63, 32)

/* Extract the low / high half of a 64-bit value as a uint32_t.  The whole
 * replacement list is parenthesized so that the cast cannot be split from
 * its operand by a neighbouring operator at the expansion site.
 */

#define LO(x)             ((uint32_t)((x) & MASK_LO))
#define HI(x)             ((uint32_t)(((x) & MASK_HI) >> 32))

/* Build a 64-bit value with 'hi' in bits 63..32 and 'lo' in bits 31..0 */

#define PACK64(hi,lo)     ((MASK_LO & (lo)) | (((uint64_t)(hi)) << 32))

/* Convert a packed 64-bit state into a clock_t: the low half is used as
 * is and the high half is shifted up by the configured counter width.
 * NOTE(review): this assumes clock_t is wider than
 * CONFIG_ARCH_PERF_COUNT_BITWIDTH bits; otherwise the shift is undefined.
 */

#define CLOCK_T(p)        (LO(p) | ((clock_t)HI(p) << \
                           CONFIG_ARCH_PERF_COUNT_BITWIDTH))
|
||||||
|
|
||||||
|
/****************************************************************************
|
||||||
|
* Private Data
|
||||||
|
****************************************************************************/
|
||||||
|
|
||||||
|
/* Packed perf state, updated atomically by perf_gettime(): the high 32-bit
 * word holds the overflow count and the low 32-bit word holds the last
 * counter value that was stored.
 */

static atomic64_t g_perf;
|
||||||
|
|
||||||
|
/****************************************************************************
|
||||||
|
* Public Functions
|
||||||
|
****************************************************************************/
|
||||||
|
|
||||||
|
/****************************************************************************
|
||||||
|
* perf_gettime
|
||||||
|
****************************************************************************/
|
||||||
|
|
||||||
|
clock_t perf_gettime(void)
|
||||||
|
{
|
||||||
|
uint64_t snap;
|
||||||
|
uint64_t result;
|
||||||
|
clock_t now;
|
||||||
|
|
||||||
|
do
|
||||||
|
{
|
||||||
|
snap = atomic64_read(&g_perf);
|
||||||
|
now = up_perf_gettime();
|
||||||
|
result = PACK64(now < LO(snap) ? HI(snap) + 1 : HI(snap), now);
|
||||||
|
}
|
||||||
|
while (!atomic64_try_cmpxchg(&g_perf, &snap, result));
|
||||||
|
|
||||||
|
return CLOCK_T(result);
|
||||||
|
}
|
||||||
|
|
||||||
|
#else
|
||||||
|
|
||||||
|
/****************************************************************************
|
||||||
|
* perf_gettime
|
||||||
|
****************************************************************************/
|
||||||
|
|
||||||
|
clock_t perf_gettime(void)
{
  /* This variant is built when the overflow-correction condition of the
   * preceding #if does not hold, so the value reported by
   * up_perf_gettime() is handed back without any adjustment.
   */

  clock_t now = up_perf_gettime();

  return now;
}
|
||||||
|
|
||||||
|
#endif
|
||||||
@@ -31,7 +31,13 @@
|
|||||||
#include <nuttx/spinlock.h>
|
#include <nuttx/spinlock.h>
|
||||||
#include <nuttx/wdog.h>
|
#include <nuttx/wdog.h>
|
||||||
|
|
||||||
#if defined(CONFIG_PERF_OVERFLOW_CORRECTION) && ULONG_MAX != UINT64_MAX
|
#ifndef CONFIG_ARCH_HAVE_PERF_EVENTS_USER_ACCESS
|
||||||
|
|
||||||
|
/****************************************************************************
|
||||||
|
* Preprocessors
|
||||||
|
****************************************************************************/
|
||||||
|
|
||||||
|
# if defined(CONFIG_PERF_OVERFLOW_CORRECTION) && ULONG_MAX != UINT64_MAX
|
||||||
|
|
||||||
/****************************************************************************
|
/****************************************************************************
|
||||||
* Private Types
|
* Private Types
|
||||||
@@ -104,8 +110,8 @@ clock_t perf_gettime(void)
|
|||||||
return result;
|
return result;
|
||||||
}
|
}
|
||||||
|
|
||||||
#elif defined(CONFIG_ALARM_ARCH) || defined (CONFIG_TIMER_ARCH) || \
|
# elif defined(CONFIG_ALARM_ARCH) || defined (CONFIG_TIMER_ARCH) || \
|
||||||
defined(CONFIG_ARCH_PERF_EVENTS)
|
defined(CONFIG_ARCH_PERF_EVENTS)
|
||||||
|
|
||||||
/****************************************************************************
|
/****************************************************************************
|
||||||
* perf_gettime
|
* perf_gettime
|
||||||
@@ -116,7 +122,7 @@ clock_t perf_gettime(void)
|
|||||||
return up_perf_gettime();
|
return up_perf_gettime();
|
||||||
}
|
}
|
||||||
|
|
||||||
#else
|
# else
|
||||||
|
|
||||||
/****************************************************************************
|
/****************************************************************************
|
||||||
* perf_gettime
|
* perf_gettime
|
||||||
@@ -127,7 +133,8 @@ clock_t perf_gettime(void)
|
|||||||
return clock_systime_ticks();
|
return clock_systime_ticks();
|
||||||
}
|
}
|
||||||
|
|
||||||
#endif
|
# endif
|
||||||
|
#endif /* !CONFIG_ARCH_HAVE_PERF_EVENTS_USER_ACCESS */
|
||||||
|
|
||||||
#if defined(CONFIG_ALARM_ARCH) || defined (CONFIG_TIMER_ARCH) || \
|
#if defined(CONFIG_ALARM_ARCH) || defined (CONFIG_TIMER_ARCH) || \
|
||||||
defined(CONFIG_ARCH_PERF_EVENTS)
|
defined(CONFIG_ARCH_PERF_EVENTS)
|
||||||
|
|||||||
Reference in New Issue
Block a user