Johny Mattsson 526d21dab4 Major cleanup - c_whatever is finally history. (#2838)
The PR removed the bulk of non-newlib headers from the NodeMCU source base.  
app/libc has now been cut down to the bare minimum overrides to shadow the 
corresponding functions in the SDK's libc. The old c_xyz.h headerfiles have been 
nuked in favour of the standard <xyz.h> headers, with a few exceptions over in 
sdk-overrides. Again, shipping a libc.a without headers is a terrible thing to do. We're 
still living on a prayer that libc was configured the same was as a default-configured
xtensa gcc toolchain assumes it is. That part I cannot do anything about, unfortunately, 
but it's no worse than it has been before.

This enables our source files to compile successfully using the standard header files, 
and use the typical malloc()/calloc()/realloc()/free(), the strwhatever()s and 
memwhatever()s. These end up, through macro and linker magic, mapped to the 
appropriate SDK or ROM functions.
2019-07-22 00:58:21 +03:00

145 lines
3.0 KiB
C

//
// This module allows performance monitoring by looking at
// the PC at regular intervals and building a histogram
//
// perf.start(start, end, nbins[, pc offset on stack])
// perf.stop() -> total sample, samples outside range, table { addr -> count , .. }
#include "ets_sys.h"
#include "os_type.h"
#include "osapi.h"
#include <stdlib.h>
#include "module.h"
#include "lauxlib.h"
#include "platform.h"
#include "hw_timer.h"
#include "cpu_esp8266.h"
typedef struct {
int ref;
uint32_t start;
uint32_t bucket_shift;
uint32_t bucket_count;
uint32_t total_samples;
uint32_t outside_samples;
uint32_t bucket[1];
} DATA;
static DATA *data;
extern char _flash_used_end[];
#define TIMER_OWNER ((os_param_t) 'p')
static void ICACHE_RAM_ATTR hw_timer_cb(os_param_t p)
{
(void) p;
uint32_t stackaddr;
if (data) {
uint32_t pc;
asm (
"rsr %0, EPC1;" /* read out the EPC */
:"=r"(pc)
);
uint32_t bucket_number = (pc - data->start) >> data->bucket_shift;
if (bucket_number < data->bucket_count) {
data->bucket[bucket_number]++;
} else {
data->outside_samples++;
}
data->total_samples++;
}
}
static int perf_start(lua_State *L)
{
uint32_t start = luaL_optinteger(L, 1, 0x40000000);
uint32_t end = luaL_optinteger(L, 2, (uint32_t) _flash_used_end);
uint32_t bins = luaL_optinteger(L, 3, 1024);
if (end <= start) {
luaL_error(L, "end must be larger than start");
}
uint32_t binsize = (end - start + bins - 1) / bins;
// Round up to a power of two
int shift;
binsize = binsize - 1;
for (shift = 0; binsize > 0; shift++) {
binsize >>= 1;
}
bins = (end - start + (1 << shift) - 1) / (1 << shift);
size_t data_size = sizeof(DATA) + bins * sizeof(uint32_t);
DATA *d = (DATA *) lua_newuserdata(L, data_size);
memset(d, 0, data_size);
d->ref = luaL_ref(L, LUA_REGISTRYINDEX);
d->start = start;
d->bucket_shift = shift;
d->bucket_count = bins;
if (data) {
lua_unref(L, data->ref);
}
data = d;
// Start the timer
if (!platform_hw_timer_init(TIMER_OWNER, FRC1_SOURCE, TRUE)) {
// Failed to init the timer
data = NULL;
lua_unref(L, d->ref);
luaL_error(L, "Unable to initialize timer");
}
platform_hw_timer_set_func(TIMER_OWNER, hw_timer_cb, 0);
platform_hw_timer_arm_us(TIMER_OWNER, 50);
return 0;
}
static int perf_stop(lua_State *L)
{
if (!data) {
return 0;
}
// stop the timer
platform_hw_timer_close(TIMER_OWNER);
DATA *d = data;
data = NULL;
lua_pushnumber(L, d->total_samples);
lua_pushnumber(L, d->outside_samples);
lua_newtable(L);
int i;
uint32_t addr = d->start;
for (i = 0; i < d->bucket_count; i++, addr += (1 << d->bucket_shift)) {
if (d->bucket[i]) {
lua_pushnumber(L, addr);
lua_pushnumber(L, d->bucket[i]);
lua_settable(L, -3);
}
}
lua_pushnumber(L, 1 << d->bucket_shift);
lua_unref(L, d->ref);
return 4;
}
LROT_BEGIN(perf)
LROT_FUNCENTRY( start, perf_start )
LROT_FUNCENTRY( stop, perf_stop )
LROT_END( perf, NULL, 0 )
NODEMCU_MODULE(PERF, "perf", perf, NULL);