From 196dfbc06a7b9be296d6794ce4d71074ee4e9e35 Mon Sep 17 00:00:00 2001 From: timholy Date: Mon, 30 Jun 2014 06:25:58 -0500 Subject: [PATCH] More instrumentation (memory allocation, also fixes #7259) --- base/exports.jl | 1 + base/util.jl | 3 ++ src/codegen.cpp | 37 ++++++++++++++++-- src/debuginfo.cpp | 96 +++++++++++++++++++++++++++++++++++++++-------- src/gc.c | 10 +++++ src/init.c | 4 ++ src/julia.h | 13 +++++++ ui/repl.c | 35 +++++++++++++++-- 8 files changed, 176 insertions(+), 23 deletions(-) diff --git a/base/exports.jl b/base/exports.jl index b972eb93dc407..c3a55f55ed8c1 100644 --- a/base/exports.jl +++ b/base/exports.jl @@ -1072,6 +1072,7 @@ export gc_disable, gc_enable, precompile, + clear_malloc_data, # misc atexit, diff --git a/base/util.jl b/base/util.jl index 76f02c82a0833..49751991e0a76 100644 --- a/base/util.jl +++ b/base/util.jl @@ -12,6 +12,9 @@ gc_time_ns() = ccall(:jl_gc_total_hrtime, Uint64, ()) # total number of bytes allocated so far gc_bytes() = ccall(:jl_gc_total_bytes, Int64, ()) +# reset the malloc log. Used to avoid counting memory allocated during compilation. +clear_malloc_data() = ccall(:jl_clear_malloc_data, Void, ()) + function tic() t0 = time_ns() task_local_storage(:TIMERS, (t0, get(task_local_storage(), :TIMERS, ()))) diff --git a/src/codegen.cpp b/src/codegen.cpp index 7f4c791ac15ff..91cebab5c5124 100644 --- a/src/codegen.cpp +++ b/src/codegen.cpp @@ -322,6 +322,8 @@ static Function *jlgetnthfieldchecked_func; #ifdef _OS_WINDOWS_ static Function *resetstkoflw_func; #endif +static Function *diff_gc_total_bytes_func; +static Function *show_execution_point_func; // --- code generation --- @@ -3367,8 +3369,9 @@ static Function *emit_function(jl_lambda_info_t *lam, bool cstyle) ctx.f = f; // step 5. set up debug info context and create first basic block - bool do_coverage = - jl_compileropts.code_coverage && lam->module != jl_base_module && lam->module != jl_core_module; + bool in_user_code = lam->module != jl_base_module && lam->module != jl_core_module; + bool do_coverage = jl_compileropts.code_coverage == JL_LOG_ALL || (jl_compileropts.code_coverage == JL_LOG_USER && in_user_code); + bool do_malloc_log = jl_compileropts.malloc_log == JL_LOG_ALL || (jl_compileropts.malloc_log == JL_LOG_USER && in_user_code); jl_value_t *stmt = jl_cellref(stmts,0); std::string filename = "no file"; char *dbgFuncName = lam->name->name; @@ -3414,6 +3417,7 @@ static Function *emit_function(jl_lambda_info_t *lam, bool cstyle) builder.SetCurrentDebugLocation(noDbg); debug_enabled = false; do_coverage = false; + do_malloc_log = false; } else { // TODO: Fix when moving to new LLVM version @@ -3716,10 +3720,12 @@ static Function *emit_function(jl_lambda_info_t *lam, bool cstyle) // step 15. compile body statements bool prevlabel = false; + lno = -1; + int prevlno = -1; for(i=0; i < stmtslen; i++) { jl_value_t *stmt = jl_cellref(stmts,i); if (jl_is_linenode(stmt)) { - int lno = jl_linenode_line(stmt); + lno = jl_linenode_line(stmt); if (debug_enabled) builder.SetCurrentDebugLocation(DebugLoc::get(lno, 1, (MDNode*)SP, NULL)); if (do_coverage) @@ -3727,7 +3733,7 @@ static Function *emit_function(jl_lambda_info_t *lam, bool cstyle) ctx.lineno = lno; } else if (jl_is_expr(stmt) && ((jl_expr_t*)stmt)->head == line_sym) { - int lno = jl_unbox_long(jl_exprarg(stmt, 0)); + lno = jl_unbox_long(jl_exprarg(stmt, 0)); if (debug_enabled) builder.SetCurrentDebugLocation(DebugLoc::get(lno, 1, (MDNode*)SP, NULL)); if (do_coverage) @@ -3741,6 +3747,12 @@ static Function *emit_function(jl_lambda_info_t *lam, bool cstyle) else { prevlabel = false; } + if (do_malloc_log && lno != prevlno) { + // Check memory allocation only after finishing a line + if (prevlno != -1) + mallocVisitLine(filename, prevlno); + prevlno = lno; + } if (jl_is_expr(stmt) && ((jl_expr_t*)stmt)->head == return_sym) { jl_expr_t *ex = (jl_expr_t*)stmt; Value *retval; @@ -3761,6 +3773,8 @@ static Function *emit_function(jl_lambda_info_t *lam, bool cstyle) builder.CreateStore(builder.CreateBitCast(builder.CreateLoad(gcpop, false), jl_ppvalue_llvmt), prepare_global(jlpgcstack_var)); #endif + if (do_malloc_log && lno != -1) + mallocVisitLine(filename, lno); if (builder.GetInsertBlock()->getTerminator() == NULL) { if (retty == T_void) builder.CreateRetVoid(); @@ -4254,6 +4268,21 @@ static void init_julia_llvm_env(Module *m) "jl_get_nth_field_checked", m); add_named_global(jlgetnthfieldchecked_func, (void*)*jl_get_nth_field_checked); + diff_gc_total_bytes_func = + Function::Create(FunctionType::get(T_int64, false), + Function::ExternalLinkage, + "diff_gc_total_bytes", m); + add_named_global(diff_gc_total_bytes_func, (void*)*diff_gc_total_bytes); + + std::vector execpoint_args(0); + execpoint_args.push_back(T_pint8); + execpoint_args.push_back(T_int32); + show_execution_point_func = + Function::Create(FunctionType::get(T_void, execpoint_args, false), + Function::ExternalLinkage, + "show_execution_point", m); + add_named_global(show_execution_point_func, (void*)*show_execution_point); + // set up optimization passes FPM = new FunctionPassManager(m); diff --git a/src/debuginfo.cpp b/src/debuginfo.cpp index a055adf504718..b7197486c2a59 100644 --- a/src/debuginfo.cpp +++ b/src/debuginfo.cpp @@ -541,14 +541,14 @@ void* CALLBACK jl_getUnwindInfo(HANDLE hProcess, ULONG64 AddrBase, ULONG64 UserC // Code coverage -typedef std::map > coveragedata_t; -static coveragedata_t coverageData; +typedef std::map > logdata_t; +static logdata_t coverageData; static void coverageVisitLine(std::string filename, int line) { if (filename == "" || filename == "none" || filename == "no file") return; - coveragedata_t::iterator it = coverageData.find(filename); + logdata_t::iterator it = coverageData.find(filename); if (it == coverageData.end()) { coverageData[filename] = std::vector(0); } @@ -564,39 +564,43 @@ static void coverageVisitLine(std::string filename, int line) v); } -extern "C" void jl_write_coverage_data(void) +void write_log_data(logdata_t logData, const char* extension) { - coveragedata_t::iterator it = coverageData.begin(); - for (; it != coverageData.end(); it++) { + std::string base = std::string(julia_home); + base = base + "/../share/julia/base/"; + logdata_t::iterator it = logData.begin(); + for (; it != logData.end(); it++) { std::string filename = (*it).first; - std::string outfile = filename + ".cov"; - std::vector &counts = (*it).second; - if (counts.size() > 1) { + std::vector &values = (*it).second; + if (values.size() > 1) { + if (filename[0] != '/') + filename = base + filename; std::ifstream inf(filename.c_str()); if (inf.is_open()) { + std::string outfile = filename + extension; std::ofstream outf(outfile.c_str(), std::ofstream::trunc | std::ofstream::out); char line[1024]; int l = 1; while (!inf.eof()) { inf.getline(line, sizeof(line)); if (inf.fail() && !inf.bad()) { - // Read through lines longer than 1024 + // Read through lines longer than sizeof(line) inf.clear(); inf.ignore(std::numeric_limits::max(), '\n'); } - int count = -1; - if ((size_t)l < counts.size()) { - GlobalVariable *gv = counts[l]; + int value = -1; + if ((size_t)l < values.size()) { + GlobalVariable *gv = values[l]; if (gv) { int *p = (int*)jl_ExecutionEngine->getPointerToGlobal(gv); - count = *p; + value = *p; } } outf.width(9); - if (count == -1) + if (value == -1) outf<<'-'; else - outf<(0); + } + std::vector &vec = mallocData[filename]; + if (vec.size() <= (size_t)line) + vec.resize(line+1, NULL); + if (vec[line] == NULL) + vec[line] = new GlobalVariable(*jl_Module, T_int64, false, + GlobalVariable::InternalLinkage, + ConstantInt::get(T_int64,0), "bytecnt"); + GlobalVariable *v = vec[line]; + builder.CreateStore(builder.CreateAdd(builder.CreateLoad(v, true), + builder.CreateCall(prepare_call(diff_gc_total_bytes_func))), + v, true); +} + +// Resets the malloc counts. Needed to avoid including memory usage +// from JITting. +extern "C" DLLEXPORT void jl_clear_malloc_data(void) +{ + logdata_t::iterator it = mallocData.begin(); + for (; it != mallocData.end(); it++) { + std::vector &bytes = (*it).second; + std::vector::iterator itb; + for (itb = bytes.begin(); itb != bytes.end(); itb++) { + if (*itb) { + int64_t *p = (int64_t*) jl_ExecutionEngine->getPointerToGlobal(*itb); + *p = 0; + } + } + } + sync_gc_total_bytes(); +} + +extern "C" void jl_write_malloc_log(void) +{ + write_log_data(mallocData, ".mlc"); +} + +void show_execution_point(char *filename, int lno) +{ + jl_printf(JL_STDOUT, "executing file %s, line %d\n", filename, lno); +} diff --git a/src/gc.c b/src/gc.c index 610303564e3af..5661e39f674b5 100644 --- a/src/gc.c +++ b/src/gc.c @@ -80,6 +80,7 @@ typedef struct _bigval_t { // GC knobs and self-measurement variables static size_t allocd_bytes = 0; static int64_t total_allocd_bytes = 0; +static int64_t last_gc_total_bytes = 0; static size_t freed_bytes = 0; static uint64_t total_gc_time=0; #ifdef _P64 @@ -917,6 +918,15 @@ DLLEXPORT int jl_gc_is_enabled(void) { return is_gc_enabled; } DLLEXPORT int64_t jl_gc_total_bytes(void) { return total_allocd_bytes + allocd_bytes; } DLLEXPORT uint64_t jl_gc_total_hrtime(void) { return total_gc_time; } +int64_t diff_gc_total_bytes(void) +{ + int64_t oldtb = last_gc_total_bytes; + int64_t newtb = jl_gc_total_bytes(); + last_gc_total_bytes = newtb; + return newtb - oldtb; +} +void sync_gc_total_bytes(void) {last_gc_total_bytes = jl_gc_total_bytes();} + void jl_gc_ephemeral_on(void) { pools = &ephe_pools[0]; } void jl_gc_ephemeral_off(void) { pools = &norm_pools[0]; } diff --git a/src/init.c b/src/init.c index bb13ce6648155..a726793d2c1ee 100644 --- a/src/init.c +++ b/src/init.c @@ -67,6 +67,7 @@ extern BOOL (WINAPI *hSymRefreshModuleList)(HANDLE); char *julia_home = NULL; jl_compileropts_t jl_compileropts = { NULL, // build_path 0, // code_coverage + 0, // malloc_log JL_COMPILEROPT_CHECK_BOUNDS_DEFAULT, 0 // int32_literals }; @@ -378,6 +379,7 @@ static void jl_uv_exitcleanup_walk(uv_handle_t* handle, void *arg) } void jl_write_coverage_data(void); +void jl_write_malloc_log(void); DLLEXPORT void uv_atexit_hook() { @@ -386,6 +388,8 @@ DLLEXPORT void uv_atexit_hook() #endif if (jl_compileropts.code_coverage) jl_write_coverage_data(); + if (jl_compileropts.malloc_log) + jl_write_malloc_log(); if (jl_base_module) { jl_value_t *f = jl_get_global(jl_base_module, jl_symbol("_atexit")); if (f!=NULL && jl_is_function(f)) { diff --git a/src/julia.h b/src/julia.h index 09a0bd00be0de..6076a9021ff2e 100644 --- a/src/julia.h +++ b/src/julia.h @@ -1054,6 +1054,8 @@ DLLEXPORT void jl_gc_disable(void); DLLEXPORT int jl_gc_is_enabled(void); DLLEXPORT int64_t jl_gc_total_bytes(void); DLLEXPORT uint64_t jl_gc_total_hrtime(void); +int64_t diff_gc_total_bytes(void); +void sync_gc_total_bytes(void); void jl_gc_ephemeral_on(void); void jl_gc_ephemeral_off(void); DLLEXPORT void jl_gc_collect(void); @@ -1073,6 +1075,8 @@ DLLEXPORT void *alloc_4w(void); void *allocb(size_t sz); DLLEXPORT void *allocobj(size_t sz); +DLLEXPORT void jl_clear_malloc_data(void); + #else #define JL_GC_PUSH(...) ; @@ -1308,17 +1312,26 @@ DLLEXPORT size_t jl_static_show(JL_STREAM *out, jl_value_t *v); void jl_print_gc_stats(JL_STREAM *s); #endif +// debugging +void show_execution_point(char *filename, int lno); + // compiler options ----------------------------------------------------------- typedef struct { char *build_path; int8_t code_coverage; + int8_t malloc_log; int8_t check_bounds; int int_literals; } jl_compileropts_t; extern DLLEXPORT jl_compileropts_t jl_compileropts; +// Settings for code_coverage and mallog_log +#define JL_LOG_NONE 0 +#define JL_LOG_USER 1 +#define JL_LOG_ALL 2 + #define JL_COMPILEROPT_CHECK_BOUNDS_DEFAULT 0 #define JL_COMPILEROPT_CHECK_BOUNDS_ON 1 #define JL_COMPILEROPT_CHECK_BOUNDS_OFF 2 diff --git a/ui/repl.c b/ui/repl.c index 3b773c013a32d..c894b3d18ca55 100644 --- a/ui/repl.c +++ b/ui/repl.c @@ -48,7 +48,8 @@ extern DLLEXPORT char *julia_home; char system_image[256] = JL_SYSTEM_IMAGE_PATH; static int lisp_prompt = 0; -static int codecov=0; +static int codecov = JL_LOG_NONE; +static int malloclog= JL_LOG_NONE; static char *program = NULL; char *image_file = NULL; @@ -74,7 +75,10 @@ static const char *opts = " -F Load ~/.juliarc.jl, then handle remaining inputs\n" " --color={yes|no} Enable or disable color text\n\n" - " --code-coverage Count executions of source lines\n" + " --code-coverage={none|user|all}, --code-coverage\n" + " Count executions of source lines (omitting setting is equivalent to 'user')\n" + " --track-allocation={none|user|all}\n" + " Count bytes allocated by each source line\n" " --check-bounds={yes|no} Emit bounds checks always or never (ignoring declarations)\n" " --int-literals={32|64} Select integer literal size independent of platform\n"; @@ -88,7 +92,8 @@ void parse_opts(int *argcp, char ***argvp) { "lisp", no_argument, &lisp_prompt, 1 }, { "help", no_argument, 0, 'h' }, { "sysimage", required_argument, 0, 'J' }, - { "code-coverage", no_argument, &codecov, 1 }, + { "code-coverage", optional_argument, 0, 'c' }, + { "track-allocation",required_argument, 0, 'm' }, { "check-bounds", required_argument, 0, 300 }, { "int-literals", required_argument, 0, 301 }, { 0, 0, 0, 0 } @@ -122,6 +127,29 @@ void parse_opts(int *argcp, char ***argvp) case 'h': printf("%s%s", usage, opts); exit(0); + case 'c': + if (optarg != NULL) { + if (!strcmp(optarg,"user")) + codecov = JL_LOG_USER; + else if (!strcmp(optarg,"all")) + codecov = JL_LOG_ALL; + else if (!strcmp(optarg,"none")) + codecov = JL_LOG_NONE; + break; + } + else + codecov = JL_LOG_USER; + break; + case 'm': + if (optarg != NULL) { + if (!strcmp(optarg,"user")) + malloclog = JL_LOG_USER; + else if (!strcmp(optarg,"all")) + malloclog = JL_LOG_ALL; + else if (!strcmp(optarg,"none")) + malloclog = JL_LOG_NONE; + break; + } case 300: if (!strcmp(optarg,"yes")) jl_compileropts.check_bounds = JL_COMPILEROPT_CHECK_BOUNDS_ON; @@ -145,6 +173,7 @@ void parse_opts(int *argcp, char ***argvp) } } jl_compileropts.code_coverage = codecov; + jl_compileropts.malloc_log = malloclog; if (!julia_home) { julia_home = getenv("JULIA_HOME"); if (julia_home) {