1.【需求描述】:
L0-L1 支持Perf,提供2种模式的配置, 及3大类型的事件配置:
2种模式:计数模式(仅统计事件发生次数)、采样模式(收集上下文如任务ID、pc、backtrace等)。
3种事件类型:CPU硬件事件(cycle、branch、icache、dcache等)、OS软件事件(task switch、mux pend、irq等)、高精度周期事件(cpu clock)。
2.【方案描述】:
L0:
基于事件采样原理,以性能事件为基础,当事件发生时,相应的事件计数器溢出发生中断,在中断处理函数中记录事件信息,包括当前的pc、当前运行的任务ID以及调用栈等信息。
L1:
新增perf字符设备,位于“/dev/perf”,通过对设备节点的read/ioctl操作,实现用户态perf。
BREAKING CHANGE:
1.新增一系列perf的对外API,位于los_perf.h中.
LOS_PerfInit配置采样数据缓冲区
LOS_PerfStart开启Perf采样
LOS_PerfStop停止Perf采样
LOS_PerfConfig配置Perf采样事件
LOS_PerfDataRead读取采样数据
LOS_PerfNotifyHookReg 注册采样数据缓冲区的钩子函数
LOS_PerfFlushHookReg 注册缓冲区刷cache的钩子
2. 用户态新增perf命令
【Usage】:
./perf [start] /[start id] Start perf.
./perf [stop] Stop perf.
./perf [read nBytes] Read nBytes raw data from perf buffer and print out.
./perf [list] List events to be used in -e.
./perf [stat] or [record] <option> <command>
-e, event selector. use './perf list' to list available events.
-p, event period.
-o, perf data output filename.
-t, taskId filter (whitelist); if not set, perf will sample all tasks.
-s, type of data to sample defined in PerfSampleType los_perf.h.
-P, processId filter (whitelist); if not set, perf will sample all processes.
-d, whether to enable the prescaler (count once every 64 counts), which only takes effect on the cpu cycle hardware event.
Close #I47I9A
Signed-off-by: LiteOS2021 <dinglu@huawei.com>
Change-Id: Ieb9b7483c85d1495df7c55bc0027f4309dff9814
184 lines
5.3 KiB
C
184 lines
5.3 KiB
C
/*
|
|
* Copyright (c) 2013-2019 Huawei Technologies Co., Ltd. All rights reserved.
|
|
* Copyright (c) 2020-2021 Huawei Device Co., Ltd. All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without modification,
|
|
* are permitted provided that the following conditions are met:
|
|
*
|
|
* 1. Redistributions of source code must retain the above copyright notice, this list of
|
|
* conditions and the following disclaimer.
|
|
*
|
|
* 2. Redistributions in binary form must reproduce the above copyright notice, this list
|
|
* of conditions and the following disclaimer in the documentation and/or other materials
|
|
* provided with the distribution.
|
|
*
|
|
* 3. Neither the name of the copyright holder nor the names of its contributors may be used
|
|
* to endorse or promote products derived from this software without specific prior written
|
|
* permission.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
|
|
* THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
|
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR
|
|
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
|
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
|
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
|
|
* OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
|
|
* WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
|
|
* OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
|
|
* ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
*/
|
|
|
|
#include "los_mp.h"
|
|
#include "los_init.h"
|
|
#include "los_percpu_pri.h"
|
|
#include "los_sched_pri.h"
|
|
#include "los_swtmr.h"
|
|
#include "los_task_pri.h"
|
|
|
|
#ifdef LOSCFG_KERNEL_SMP
|
|
|
|
#ifdef LOSCFG_KERNEL_SMP_CALL
/* Spinlock taken around every access to the per-core funcLink lists in this file. */
LITE_OS_SEC_BSS SPIN_LOCK_INIT(g_mpCallSpin);

/* Acquire g_mpCallSpin through LOS_SpinLockSave(), handing it the address of intSave. */
#define MP_CALL_LOCK(intSave)   LOS_SpinLockSave(&g_mpCallSpin, &(intSave))

/* Release g_mpCallSpin through LOS_SpinUnlockRestore(), handing it the value of intSave. */
#define MP_CALL_UNLOCK(intSave) LOS_SpinUnlockRestore(&g_mpCallSpin, (intSave))
#endif /* LOSCFG_KERNEL_SMP_CALL */
|
|
|
|
/*
 * Send the schedule IPI (LOS_MP_IPI_SCHEDULE) to the cores selected by target.
 *
 * target: bit mask of destination cores, one bit per core id. The bit of the
 *         calling core is always cleared before the IPI is sent.
 */
VOID LOS_MpSchedule(UINT32 target)
{
    /* mask with only the bit of the core executing this function */
    UINT32 selfMask = 1U << ArchCurrCpuid();

    HalIrqSendIpi(target & ~selfMask, LOS_MP_IPI_SCHEDULE);
}
|
|
|
|
/*
 * Handler for the generic wakeup IPI.
 * The body is intentionally empty: no work is done here.
 */
VOID OsMpWakeHandler(VOID)
{
    /* nothing to do for a plain wakeup */
}
|
|
|
|
VOID OsMpScheduleHandler(VOID)
|
|
{
|
|
/*
|
|
* set schedule flag to differ from wake function,
|
|
* so that the scheduler can be triggered at the end of irq.
|
|
*/
|
|
OsPercpuGet()->schedFlag |= INT_PEND_RESCH;
|
|
}
|
|
|
|
VOID OsMpHaltHandler(VOID)
|
|
{
|
|
(VOID)LOS_IntLock();
|
|
OsPercpuGet()->excFlag = CPU_HALT;
|
|
|
|
while (1) {}
|
|
}
|
|
|
|
VOID OsMpCollectTasks(VOID)
|
|
{
|
|
LosTaskCB *taskCB = NULL;
|
|
UINT32 taskID = 0;
|
|
UINT32 ret;
|
|
|
|
/* recursive checking all the available task */
|
|
for (; taskID <= g_taskMaxNum; taskID++) {
|
|
taskCB = &g_taskCBArray[taskID];
|
|
|
|
if (OsTaskIsUnused(taskCB) || OsTaskIsRunning(taskCB)) {
|
|
continue;
|
|
}
|
|
|
|
/*
|
|
* though task status is not atomic, this check may success but not accomplish
|
|
* the deletion; this deletion will be handled until the next run.
|
|
*/
|
|
if (taskCB->signal & SIGNAL_KILL) {
|
|
ret = LOS_TaskDelete(taskID);
|
|
if (ret != LOS_OK) {
|
|
PRINT_WARN("GC collect task failed err:0x%x\n", ret);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
#ifdef LOSCFG_KERNEL_SMP_CALL
|
|
/*
 * Ask other cores to run func(args).
 *
 * For every core id below LOSCFG_KERNEL_CORE_NUM whose bit is set in target,
 * a MpCallFunc request is allocated from m_aucSysMem0 and linked into that
 * core's funcLink list under the MP call spinlock. Afterwards the
 * LOS_MP_IPI_FUNC_CALL IPI is sent so the cores process their lists.
 *
 * target: bit mask of destination cores; nothing happens when it selects no
 *         core of OS_MP_CPU_ALL.
 * func:   function to run on the selected cores; NULL is ignored.
 * args:   opaque argument handed to func.
 *
 * If an allocation fails part-way through, the error is reported and the
 * cores that already had a request queued are still sent the IPI, so their
 * requests do not sit in the list until some unrelated function-call IPI
 * arrives. Cores after the failing one get no request.
 */
VOID OsMpFuncCall(UINT32 target, SMP_FUNC_CALL func, VOID *args)
{
    UINT32 index;
    UINT32 intSave;
    UINT32 queued = 0; /* mask of cores that already hold a request from this call */
    MpCallFunc *mpCallFunc = NULL;

    if (func == NULL) {
        return;
    }

    if (!(target & OS_MP_CPU_ALL)) {
        return;
    }

    for (index = 0; index < LOSCFG_KERNEL_CORE_NUM; index++) {
        if (!(CPUID_TO_AFFI_MASK(index) & target)) {
            continue;
        }

        mpCallFunc = (MpCallFunc *)LOS_MemAlloc(m_aucSysMem0, sizeof(MpCallFunc));
        if (mpCallFunc == NULL) {
            PRINT_ERR("smp func call malloc failed\n");
            /* do not strand the requests that were queued before the failure */
            if (queued != 0) {
                HalIrqSendIpi(queued, LOS_MP_IPI_FUNC_CALL);
            }
            return;
        }
        mpCallFunc->func = func;
        mpCallFunc->args = args;

        MP_CALL_LOCK(intSave);
        LOS_ListAdd(&g_percpu[index].funcLink, &(mpCallFunc->node));
        MP_CALL_UNLOCK(intSave);

        queued |= CPUID_TO_AFFI_MASK(index);
    }

    HalIrqSendIpi(target, LOS_MP_IPI_FUNC_CALL);
}
|
|
|
|
VOID OsMpFuncCallHandler(VOID)
|
|
{
|
|
UINT32 intSave;
|
|
UINT32 cpuid = ArchCurrCpuid();
|
|
LOS_DL_LIST *list = NULL;
|
|
MpCallFunc *mpCallFunc = NULL;
|
|
|
|
MP_CALL_LOCK(intSave);
|
|
while (!LOS_ListEmpty(&g_percpu[cpuid].funcLink)) {
|
|
list = LOS_DL_LIST_FIRST(&g_percpu[cpuid].funcLink);
|
|
LOS_ListDelete(list);
|
|
MP_CALL_UNLOCK(intSave);
|
|
|
|
mpCallFunc = LOS_DL_LIST_ENTRY(list, MpCallFunc, node);
|
|
mpCallFunc->func(mpCallFunc->args);
|
|
(VOID)LOS_MemFree(m_aucSysMem0, mpCallFunc);
|
|
|
|
MP_CALL_LOCK(intSave);
|
|
}
|
|
MP_CALL_UNLOCK(intSave);
|
|
}
|
|
|
|
VOID OsMpFuncCallInit(VOID)
|
|
{
|
|
UINT32 index;
|
|
/* init funclink for each core */
|
|
for (index = 0; index < LOSCFG_KERNEL_CORE_NUM; index++) {
|
|
LOS_ListInit(&g_percpu[index].funcLink);
|
|
}
|
|
}
|
|
#endif /* LOSCFG_KERNEL_SMP_CALL */
|
|
|
|
UINT32 OsMpInit(VOID)
|
|
{
|
|
UINT16 swtmrId;
|
|
|
|
(VOID)LOS_SwtmrCreate(OS_MP_GC_PERIOD, LOS_SWTMR_MODE_PERIOD,
|
|
(SWTMR_PROC_FUNC)OsMpCollectTasks, &swtmrId, 0);
|
|
(VOID)LOS_SwtmrStart(swtmrId);
|
|
#ifdef LOSCFG_KERNEL_SMP_CALL
|
|
OsMpFuncCallInit();
|
|
#endif
|
|
return LOS_OK;
|
|
}
|
|
|
|
LOS_MODULE_INIT(OsMpInit, LOS_INIT_LEVEL_KMOD_TASK);
|
|
|
|
#endif
|
|
|