erlang各种有用的函数包括一些有用nif封装,还有一些性能测试case。
Non puoi selezionare più di 25 argomenti Gli argomenti devono iniziare con una lettera o un numero, possono includere trattini ('-') e possono essere lunghi fino a 35 caratteri.
 
 
 
 
 
 

476 righe
16 KiB

-module(utVMInfo).
-compile([export_all, nowarn_export_all]).
%% Print a header line, then return one {Table, Memory, Size} tuple per ETS
%% table (values as reported by ets:info/2), ordered by Memory, largest first.
show_cache() ->
    io:format("table name | memory | size~n", []),
    Describe = fun(Tab) -> {Tab, ets:info(Tab, memory), ets:info(Tab, size)} end,
    Ascending = lists:keysort(2, lists:map(Describe, ets:all())),
    lists:reverse(Ascending).
%% Return {RegisteredNameInfo, HeapSizeInfo} for every process, exactly as
%% produced by erlang:process_info/2, ordered by the heap-size element,
%% largest first.
show_process() ->
    Describe = fun(Pid) ->
        {erlang:process_info(Pid, registered_name), erlang:process_info(Pid, heap_size)}
    end,
    Ascending = lists:keysort(2, lists:map(Describe, erlang:processes())),
    lists:reverse(Ascending).
%% Return the number of processes currently present on this node.
show_process_count() ->
    Pids = erlang:processes(),
    length(Pids).
%% Decompile a loaded module and print the reconstructed source.
%% Original author's note: used to confirm that the code running in production
%% is the expected one, because release upgrades occasionally went wrong.
%% Crashes with badmatch when the beam file has no abstract code chunk.
decompile(Mod) ->
    BeamPath = code:which(Mod),
    {ok, {_, [{abstract_code, {_, Forms}}]}} = beam_lib:chunks(BeamPath, [abstract_code]),
    Source = erl_prettypr:format(erl_syntax:form_list(Forms)),
    io:format("~s~n", [Source]).
%% Print the backtrace of a process (similar to jstack).
%% Original author's note: useful when many processes are suspended, the
%% process count is too high, or the node is slow or hanging.
%%
%% Accepts a registered name or a pid. Returns `undefined` when the name is
%% not registered or the process is no longer alive; otherwise returns the
%% result of io:format/2.
pstack(Reg) when is_atom(Reg) ->
    case whereis(Reg) of
        undefined -> undefined;
        Pid -> pstack(Pid)
    end;
pstack(Pid) ->
    %% process_info/2 returns `undefined` for a dead process; previously that
    %% value was passed to element/2 and raised badarg.
    case process_info(Pid, backtrace) of
        {backtrace, Trace} -> io:format("~s~n", [Trace]);
        undefined -> undefined
    end.
%% ====================================================================
%% etop
%% Finds the processes using the most memory / CPU. Original author's note:
%% remains usable even on nodes with hundreds of thousands of processes.
%% Process ranking by CPU usage (sorted by reductions)
%% --------------------------------------------------------------------
%% Starts etop in text mode in a separate process and returns that pid.
etop() ->
    Options = [{output, text}, {interval, 10}, {lines, 20}, {sort, reductions}],
    spawn(fun() -> etop:start(Options) end).
%% Process ranking by memory usage: starts etop in text mode, sorted by
%% memory, in a separate process and returns that pid.
etop_mem() ->
    Options = [{output, text}, {interval, 10}, {lines, 20}, {sort, memory}],
    spawn(fun() -> etop:start(Options) end).
%% Stop a running etop session; returns whatever etop:stop/0 returns.
etop_stop() ->
    etop:stop().
%% ====================================================================
%% Force a garbage collection on every process.
%% Original author's note: run this when process memory is too high, to tell
%% a real memory leak apart from garbage collection that has not caught up.
gc_all() ->
    lists:foreach(fun(Pid) -> erlang:garbage_collect(Pid) end, processes()),
    ok.
%% Profile a single M:F(A) call with fprof. Original author's note: this slows
%% execution down considerably, so only use it on small workloads.
%% Result: fprof output is fairly detailed and can show the hot call paths.
%% Returns the result of fprof:stop/0.
fprof(M, F, A) ->
    _Server = fprof:start(),
    _CallResult = fprof:apply(M, F, A),
    _Profiled = fprof:profile(),
    _Analysed = fprof:analyse(),
    fprof:stop().
%% Run eprof over every process on the node (the registered `eprof` process
%% itself is excluded). Original author's warnings: eprof has a noticeable
%% impact on live traffic, use with care; keep TimeoutSec below 10 s and the
%% process count below 1000, otherwise the node may crash.
%% Result (per the original notes): time actually spent in each function,
%% excluding time spent in calls to other modules; only call counts and
%% execution time per Mod:Fun are available.
eprof_all(TimeoutSec) ->
    Targets = lists:delete(whereis(eprof), processes()),
    eprof(Targets, TimeoutSec).
%% Profile the given processes with eprof for TimeoutSec seconds, print the
%% total analysis and stop eprof. Returns the result of eprof:stop/0.
%%
%% Pids       - list of pids to profile.
%% TimeoutSec - profiling duration in seconds (integer or float).
eprof(Pids, TimeoutSec) ->
    eprof:start(),
    eprof:start_profiling(Pids),
    %% timer:sleep/1 expects milliseconds; the argument is in seconds, so it
    %% must be converted (previously the value was passed through unchanged and
    %% profiling lasted only TimeoutSec milliseconds).
    timer:sleep(round(TimeoutSec * 1000)),
    eprof:stop_profiling(),
    eprof:analyze(total),
    eprof:stop().
%% Scheduler usage.
%% Measures, over a 1000 ms window, how busy each scheduler really was.
%% Original author's note: because of spin-waiting and scheduling overhead the
%% reported usage can be much lower than what `top` shows.
scheduler_usage() ->
    DefaultWindowMs = 1000,
    scheduler_usage(DefaultWindowMs).
%% Sample scheduler_wall_time statistics before and after sleeping RunMs
%% milliseconds, then print [{total, Ratio}, {SchedulerId, Ratio}, ...] where
%% each ratio is (active time delta) / (total time delta).
%% The scheduler_wall_time flag is switched on for the measurement and
%% switched off again afterwards.
scheduler_usage(RunMs) ->
    erlang:system_flag(scheduler_wall_time, true),
    Before = lists:sort(erlang:statistics(scheduler_wall_time)),
    timer:sleep(RunMs),
    After = lists:sort(erlang:statistics(scheduler_wall_time)),
    erlang:system_flag(scheduler_wall_time, false),
    Samples = lists:zip(Before, After),
    PerScheduler = [
        {Id, (Active1 - Active0) / (Total1 - Total0)}
     || {{_, Active0, Total0}, {Id, Active1, Total1}} <- Samples
    ],
    {ActiveSum, TotalSum} = lists:foldl(
        fun({{_, Active0, Total0}, {_, Active1, Total1}}, {ActiveAcc, TotalAcc}) ->
            {ActiveAcc + (Active1 - Active0), TotalAcc + (Total1 - Total0)}
        end,
        {0, 0},
        Samples
    ),
    Overall = ActiveSum / TotalSum,
    io:format("~p~n", [[{total, Overall} | PerScheduler]]).
%% Process scheduling.
%% Counts scheduling activity over a 1000 ms window. Per the original author's
%% note, the first number is the count of executed processes and the second
%% the count of migrated processes.
scheduler_stat() ->
    DefaultWindowMs = 1000,
    scheduler_stat(DefaultWindowMs).
%% Enable scheduling statistics, read total_scheduling_statistics before and
%% after sleeping RunMs milliseconds, disable the statistics again and return
%% [{Key, Delta1, Delta2}], the per-key difference between the two readings.
scheduler_stat(RunMs) ->
    erlang:system_flag(scheduling_statistics, enable),
    Before = erlang:system_info(total_scheduling_statistics),
    timer:sleep(RunMs),
    After = erlang:system_info(total_scheduling_statistics),
    erlang:system_flag(scheduling_statistics, disable),
    Delta = fun({{_, In0, Out0}, {Key, In1, Out1}}) ->
        {Key, In1 - In0, Out1 - Out0}
    end,
    [Delta(Pair) || Pair <- lists:zip(Before, After)].
%% ====================================================================
%% Trace logging
%% Logs the full MFA of every call into the module. Original author's note:
%% the output becomes hard to read when the arguments are large.
%% Trace calls to all functions of Mod
%% --------------------------------------------------------------------
trace(Mod) ->
    dbg:tracer(),
    %% Equivalent to dbg:tpl(Mod, '_', []): every function, any arity.
    dbg:tpl({Mod, '_', '_'}, []),
    dbg:p(all, c).
%% Trace calls to all functions of Mod on the given Node; per the original
%% author's note the output is printed in the local shell.
trace(Node, Mod) ->
    dbg:tracer(),
    dbg:n(Node),
    %% Equivalent to dbg:tpl(Mod, '_', []): every function, any arity.
    dbg:tpl({Mod, '_', '_'}, []),
    dbg:p(all, c).
%% Stop tracing; returns whatever dbg:stop_clear/0 returns.
trace_stop() ->
    dbg:stop_clear().
%% ====================================================================
%% High-memory / OOM troubleshooting tools.
%% Original author's note: etop cannot cope with nodes running 100k+
%% processes, the code below can; once a suspicious process is found, use
%% pstack and message_queue_len to find the cause.
%%
%% Runs proc_mem/2 over every process on the node; each process is paired with
%% the placeholder name `undefined`.
proc_mem_all(SizeLimitKb) ->
    Unnamed = lists:map(fun(Pid) -> {undefined, Pid} end, erlang:processes()),
    proc_mem(Unnamed, SizeLimitKb).
%% Runs proc_mem/2 over the processes returned by
%% release_handler_1:get_supervised_procs/0 that are still alive.
proc_mem(SizeLimitKb) ->
    Supervised = release_handler_1:get_supervised_procs(),
    Alive = [{Name, Pid} || {_, Name, Pid, _} <- Supervised, is_process_alive(Pid)],
    proc_mem(Alive, SizeLimitKb).
%% Report the processes whose total heap exceeds SizeLimitKb kilobytes.
%%
%% Procs       - list of {Name, Pid}.
%% SizeLimitKb - threshold in KiB; only processes strictly above it are kept.
%%
%% Returns {TotalBytes, [{Name, Pid, Bytes}]}, where the list is sorted by
%% Bytes, largest first, and TotalBytes is the sum over the reported
%% processes. Processes that no longer exist are skipped.
proc_mem(Procs, SizeLimitKb) ->
    SizeLimit = SizeLimitKb * 1024,
    %% total_heap_size is reported in words; convert with the emulator's real
    %% word size instead of assuming 8 bytes per word.
    WordSize = erlang:system_info(wordsize),
    {Selected, Total} = lists:foldl(
        fun({Name, Pid}, {Acc, TotalSize}) ->
            case erlang:process_info(Pid, total_heap_size) of
                {_, Words} ->
                    Size = Words * WordSize,
                    case Size > SizeLimit of
                        true -> {[{Name, Pid, Size} | Acc], TotalSize + Size};
                        false -> {Acc, TotalSize}
                    end;
                _ ->
                    %% process_info/2 returned undefined: the process is gone.
                    {Acc, TotalSize}
            end
        end,
        {[], 0},
        Procs
    ),
    {Total, lists:reverse(lists:keysort(3, Selected))}.
%% Print the N processes using the most memory, one "Label : Memory" line
%% each. The label is the '$initial_call' entry of the process dictionary as
%% looked up by util:prop_get_value/3 (default null); processes whose label is
%% null, or whose info cannot be read, are left out. Returns ok.
show(N) ->
    Describe = fun(Pid) ->
        try process_info(Pid, [memory, dictionary]) of
            [{_, Bytes}, {_, Dict}] ->
                {util:prop_get_value('$initial_call', Dict, null), Bytes};
            _ ->
                {null, 0}
        catch
            _:_ -> {null, 0}
        end
    end,
    Labelled = [Entry || {Label, _} = Entry <- lists:map(Describe, processes()), Label =/= null],
    Ranked = lists:sort(fun({_, A}, {_, B}) -> A > B end, Labelled),
    Top = lists:sublist(Ranked, N),
    lists:foreach(fun({Label, Bytes}) -> io:format("~p : ~p ~n", [Label, Bytes]) end, Top),
    ok.
%% Same report as show/1, but a process is also left out when its
%% '$initial_call' value is not a non-empty tuple, or when the first element
%% of that tuple is a member of SkipNames. Returns ok.
show(N, SkipNames) ->
    IsSkipped = fun
        (Call) when is_tuple(Call), tuple_size(Call) > 0 ->
            lists:member(element(1, Call), SkipNames);
        (_) ->
            true
    end,
    Describe = fun(Pid) ->
        try process_info(Pid, [memory, dictionary]) of
            [{_, Bytes}, {_, Dict}] ->
                InitCall = util:prop_get_value('$initial_call', Dict, null),
                case IsSkipped(InitCall) of
                    true -> {null, 0};
                    false -> {InitCall, Bytes}
                end;
            _ ->
                {null, 0}
        catch
            _:_ -> {null, 0}
        end
    end,
    Labelled = [Entry || {Label, _} = Entry <- lists:map(Describe, processes()), Label =/= null],
    Ranked = lists:sort(fun({_, A}, {_, B}) -> A > B end, Labelled),
    Top = lists:sublist(Ranked, N),
    lists:foreach(fun({Label, Bytes}) -> io:format("~p : ~p ~n", [Label, Bytes]) end, Top),
    ok.
%% Group processes by their '$initial_call' value (looked up through
%% util:prop_get_value/3, default null), sum the memory per group, and print
%% the N groups with the largest total as average memory per process plus
%% process count. The null group is left out. Returns ok.
show1(N) ->
    Tally = fun(Pid, Groups) ->
        try process_info(Pid, [memory, dictionary]) of
            [{_, Bytes}, {_, Dict}] ->
                InitCall = util:prop_get_value('$initial_call', Dict, null),
                case lists:keyfind(InitCall, 1, Groups) of
                    {InitCall, SoFar, Count} ->
                        Updated = {InitCall, Bytes + SoFar, Count + 1},
                        lists:keystore(InitCall, 1, Groups, Updated);
                    false ->
                        [{InitCall, Bytes, 1} | Groups]
                end;
            _ ->
                Groups
        catch
            _:_ -> Groups
        end
    end,
    AllGroups = lists:foldl(Tally, [], processes()),
    Labelled = [Group || {Label, _, _} = Group <- AllGroups, Label =/= null],
    Ranked = lists:sort(fun({_, A, _}, {_, B, _}) -> A > B end, Labelled),
    Top = lists:sublist(Ranked, N),
    lists:foreach(
        fun({Label, Bytes, Count}) ->
            io:format("~p : per_memory=~p process_num=~p ~n", [Label, (Bytes div Count), Count])
        end,
        Top
    ),
    ok.
%% Original author's label: "number of CPU cores". The value returned is
%% erlang:system_info(schedulers).
coreCnt() ->
    Schedulers = erlang:system_info(schedulers),
    Schedulers.
%% Original author's label: "id of the core the current process runs on".
%% The value returned is erlang:system_info(scheduler_id).
coreIndex() ->
    SchedulerId = erlang:system_info(scheduler_id),
    SchedulerId.
%% @doc Append erlang:process_info/1 of every process on the node to
%% ./logs/processes_infos.log, pausing 20 ms after each process.
%%
%% If the log file disappears while the dump is running it is reopened, and
%% the new descriptor is used for all following writes. The descriptor in use
%% is closed before returning. (Previously the reopened descriptor was dropped
%% after one write, later writes went to the already closed one, and nothing
%% was closed at the end.)
%%
%% Returns a list with one `ok` per process, as before.
process_infos() ->
    filelib:ensure_dir("./logs/"),
    File = "./logs/processes_infos.log",
    Modes = [write, raw, binary, append],
    {ok, Fd0} = file:open(File, Modes),
    WriteOne = fun(Pid, Fd) ->
        Info = io_lib:format("=>~p \n\n", [erlang:process_info(Pid)]),
        CurrentFd =
            case filelib:is_file(File) of
                true ->
                    Fd;
                false ->
                    %% The file was removed underneath us; reopen it.
                    file:close(Fd),
                    {ok, NewFd} = file:open(File, Modes),
                    NewFd
            end,
        file:write(CurrentFd, Info),
        %% Throttle the dump; thread the live descriptor to the next step.
        {timer:sleep(20), CurrentFd}
    end,
    {Results, LastFd} = lists:mapfoldl(WriteOne, Fd0, erlang:processes()),
    file:close(LastFd),
    Results.
%% Format the current time as an RFC 1123 style date string.
rfc1123_local_date() ->
    Now = os:timestamp(),
    rfc1123_local_date(Now).

%% Format a point in time as "Day, DD Mon YYYY HH:MM:SS GMT". Accepts:
%%   - an integer Unix epoch in seconds,
%%   - an os:timestamp()-style 3-tuple (converted with now_to_local_time/1),
%%   - a {{Year, Month, Day}, {Hour, Minute, Second}} datetime, used as given.
%% NOTE(review): the literal "GMT" suffix is always appended, even though the
%% 3-tuple form is converted to local time - confirm this is intended.
rfc1123_local_date(Epoch) when erlang:is_integer(Epoch) ->
    %% 62167219200 is added to shift Unix seconds to gregorian seconds.
    rfc1123_local_date(calendar:gregorian_seconds_to_datetime(Epoch + 62167219200));
rfc1123_local_date({_, _, _} = Timestamp) ->
    rfc1123_local_date(calendar:now_to_local_time(Timestamp));
rfc1123_local_date({{Year, Month, Day} = Date, {Hour, Min, Sec}}) ->
    Weekday = httpd_util:day(calendar:day_of_the_week(Date)),
    MonthName = httpd_util:month(Month),
    Formatted = io_lib:format(
        "~s, ~2.2.0w ~3.s ~4.4.0w ~2.2.0w:~2.2.0w:~2.2.0w GMT",
        [Weekday, Day, MonthName, Year, Hour, Min, Sec]
    ),
    lists:flatten(Formatted).
%% @doc Write a crash-dump style report of the running node to the file
%% "erl_crash.dump" in the current directory. The report is assembled from a
%% dated header, the system version, erlang:system_info/1 sections (info,
%% procs, dist, loaded) and the ETS summary from ets_info/0.
%% Returns the result of file:write_file/2.
crash_dump() ->
    Timestamp = erlang:list_to_binary(rfc1123_local_date()),
    Header = erlang:list_to_binary(
        [<<"=erl_crash_dump:0.2\n">>, Timestamp, <<"\nSystem version: ">>]
    ),
    EtsSection = ets_info(),
    Version = erlang:list_to_binary(erlang:system_info(system_version)),
    General = erlang:system_info(info),
    Procs = erlang:system_info(procs),
    Dist = erlang:system_info(dist),
    %% Every newline in the loaded-modules listing gets a "=mod:" prefix on
    %% the line that follows it.
    Modules = binary:replace(erlang:system_info(loaded), <<"\n">>, <<"\n=mod:">>, [global]),
    Report = erlang:list_to_binary(
        [Header, Version, General, Procs, EtsSection, Dist, <<"=loaded_modules\n">>, Modules]
    ),
    file:write_file("erl_crash.dump", Report).
%% Concatenate the ets_table_info/1 section of every ETS table into one binary.
ets_info() ->
    Sections = lists:map(fun(Table) -> ets_table_info(Table) end, ets:all()),
    erlang:list_to_binary(Sections).
%% Build the "=ets:" section for one table:
%%   =ets:<owner pid>\nTable: <table id>\nName: <table name>\nObjects: <size>\n
%%
%% "Table:" now carries the identifier that was passed in (an atom for named
%% tables, a reference or integer otherwise); previously it repeated the
%% table name, so unnamed tables could not be told apart.
%% Returns an empty binary when the table no longer exists (ets:info/1
%% returned `undefined`), so one vanished table does not abort the whole dump.
ets_table_info(Table) ->
    case ets:info(Table) of
        undefined ->
            <<>>;
        Info ->
            Owner = erlang:pid_to_list(proplists:get_value(owner, Info)),
            Name = erlang:atom_to_list(proplists:get_value(name, Info)),
            Objects = erlang:integer_to_list(proplists:get_value(size, Info)),
            TableId =
                if
                    is_atom(Table) -> erlang:atom_to_list(Table);
                    is_reference(Table) -> erlang:ref_to_list(Table);
                    is_integer(Table) -> erlang:integer_to_list(Table);
                    true -> io_lib:format("~p", [Table])
                end,
            erlang:iolist_to_binary(
                [<<"=ets:">>, Owner, <<"\nTable: ">>, TableId, <<"\nName: ">>, Name,
                 <<"\nObjects: ">>, Objects, <<"\n">>]
            )
    end.
%% Force a garbage collection on every process whose `memory` figure (from
%% erlang:process_info/2) is greater than MemLim. Returns ok.
%% NOTE(review): the original comment also mentions writing a log for
%% analysis; no logging is done here.
check_mem(MemLim) ->
    lists:foreach(
        fun(Pid) ->
            %% Match the process_info/2 result directly: a process can exit
            %% between a liveness check and the info call, in which case
            %% `undefined` is returned and the process is simply skipped.
            case erlang:process_info(Pid, memory) of
                {memory, Mem} when Mem > MemLim ->
                    erlang:garbage_collect(Pid);
                _ ->
                    ok
            end
        end,
        erlang:processes()
    ).
%% @spec top() -> ok
%% @doc Print an overview of the node: node name, OTP release, scheduler count
%% (printed under the label "Free Threads"), memory used by processes, by ETS
%% and in total (each divided by 1024 twice), and the process limit and count.
top() ->
    ToMb = fun(Bytes) -> Bytes / 1024 / 1024 end,
    Release = erlang:system_info(otp_release),
    Schedulers = erlang:system_info(schedulers),
    ProcCount = erlang:system_info(process_count),
    ProcLimit = erlang:system_info(process_limit),
    ProcMb = ToMb(erlang:memory(processes_used)),
    EtsMb = ToMb(erlang:memory(ets)),
    TotalMb = ToMb(erlang:memory(total)),
    Values = [node(), Release, Schedulers, ProcMb, EtsMb, TotalMb, ProcLimit, ProcCount],
    io:format(
        "++++++++++++++++++++++++++++++++++++++++++~n"
        " Node: ~p~n"
        " Erlang Ver: ~p~n"
        " Free Threads: ~p~n"
        " Process Used Memory: ~pMb~n"
        " Ets Used Memory: ~pMb~n"
        " Erlang VM Used Memory: ~pMb~n"
        " Process Limit: ~p~n"
        " Process Used: ~p~n"
        "++++++++++++++++++++++++++++++++++++++++++~n",
        Values
    ),
    ok.
%% @doc Same overview as top/0 (without the node name), returned as a flat
%% list of UTF-8 bytes instead of being printed. Original author's note:
%% needed by operations.
%%
%% The labels contain characters above code point 255, so the formatted text
%% must be encoded with unicode:characters_to_binary/1; list_to_binary/1
%% raises badarg on such a list.
top_back() ->
    Release = erlang:system_info(otp_release),
    SchedNum = erlang:system_info(schedulers),
    ProcCount = erlang:system_info(process_count),
    ProcLimit = erlang:system_info(process_limit),
    ProcMemUsed = erlang:memory(processes_used),
    EtsMemAlc = erlang:memory(ets),
    MemTot = erlang:memory(total),
    Str = io_lib:format(
        " Erlang 版本: ~p~n"
        " 可使用的调度线程: ~p~n"
        " 所有进程使用的内存: ~pMb~n"
        " 所有ets使用的内存: ~pMb~n"
        " Erlang系统占用内存: ~pMb~n"
        " 可创建进程数量上限: ~p~n"
        " 当前进程数: ~p~n",
        [Release, SchedNum, ProcMemUsed / 1024 / 1024, EtsMemAlc / 1024 / 1024,
         MemTot / 1024 / 1024, ProcLimit, ProcCount]
    ),
    binary_to_list(unicode:characters_to_binary(Str)).
%% @spec ets_mem() -> term()
%% @doc Print the 30 ETS tables that use the most memory, largest first.
%%
%% ets:info/2 reports memory in words, so the value is multiplied by the
%% emulator word size before being printed as Kb (previously the raw word
%% count was divided by 1024 and labelled Kb). A table deleted while the
%% report is being built is listed with 0 instead of crashing the report.
%% Returns ok.
ets_mem() ->
    WordSize = erlang:system_info(wordsize),
    Mems = lists:map(
        fun(Tab) ->
            case ets:info(Tab, memory) of
                Words when is_integer(Words) -> {Tab, Words * WordSize};
                _ -> {Tab, 0}
            end
        end,
        ets:all()
    ),
    Top = lists:sublist(lists:reverse(lists:keysort(2, Mems)), 30),
    io:format(
        "~n--------------------------------------------------~n"
        "~-30w ~w~n--------------------------------------------------~n",
        [table, used_memory]
    ),
    lists:foreach(
        fun({Tab, Bytes}) ->
            io:format("~-30w ~wKb~n", [Tab, Bytes / 1024])
        end,
        Top
    ).
%% @spec tcp_links() -> Info
%% @doc Count the ports whose name is "tcp_inet" and print the total.
%% Original author's note: the count includes sockets connected to the
%% database.
%%
%% erlang:port_info/2 returns `undefined` for a port that was closed after
%% erlang:ports/0 was called; such ports are simply not counted (previously
%% the `undefined` result was passed to lists:keyfind/3, which raised badarg).
tcp_links() ->
    IsTcp = fun(Port) -> erlang:port_info(Port, name) =:= {name, "tcp_inet"} end,
    TcpPorts = lists:filter(IsTcp, erlang:ports()),
    io:format("~n当前socket数量(包括链接数据库的socket): ~w~n", [length(TcpPorts)]).
%% @doc Dump erlang:process_info/1 of Pid to a file whose name is built from
%% "../logs/pid_info.dump" plus the date and time from util:local_time/0
%% (formatted through util:fbin/2).
%%
%% Each info item is written on its own line with ~w. A non-empty `messages`
%% or `dictionary` item is written as a block with one element per line.
%% When no info is available a notice is printed to standard output instead.
%% Returns the result of file:close/1.
dump_process_info(Pid) ->
    {{Year, Month, Day}, {Hour, Minutes, Second}} = util:local_time(),
    FileName = util:fbin(
        "~s-~w-~w-~w-~w-~w-~w",
        [<<"../logs/pid_info.dump">>, Year, Month, Day, Hour, Minutes, Second]
    ),
    {ok, FileHandle} = file:open(FileName, write),
    %% Writes "<Header>", then every element on its own line, then "}".
    WriteBlock = fun(Header, Elements) ->
        io:format(FileHandle, Header, []),
        lists:foreach(
            fun(Element) -> io:format(FileHandle, " ~w~n", [Element]) end,
            Elements
        ),
        io:format(FileHandle, "}~n", [])
    end,
    WriteItem = fun
        ({messages, [_ | _] = Messages}) ->
            WriteBlock("{messages,~n", Messages);
        ({dictionary, [_ | _] = Dics}) ->
            WriteBlock("{dictionary,~n", Dics);
        (Item) ->
            %% Also covers empty `messages` / `dictionary` items.
            io:format(FileHandle, "~w~n", [Item])
    end,
    case erlang:process_info(Pid) of
        Info when is_list(Info) ->
            lists:foreach(WriteItem, Info);
        _ ->
            io:format("not find pid info")
    end,
    file:close(FileHandle).
%% Collect the processes whose process_info item InfoName is anything other
%% than {InfoName, 0} (this includes processes for which process_info/2
%% returns `undefined`).
%%
%% Returns [ProcessCount, InfoName, SelectedCount, Selected], where Selected
%% is a list of {Pid, InfoNameInfo, RegisteredNameInfo}; the two info values
%% are read again after the selection, exactly as process_info/2 returns them.
get_process_info_and_zero_value(InfoName) ->
    Pids = erlang:processes(),
    Selected = [Pid || Pid <- Pids, erlang:process_info(Pid, InfoName) =/= {InfoName, 0}],
    Details = [
        {Pid, erlang:process_info(Pid, InfoName), erlang:process_info(Pid, registered_name)}
     || Pid <- Selected
    ],
    [length(Pids), InfoName, length(Details), Details].
%% Collect the processes whose process_info item InfoName is greater than
%% Value. A process for which process_info/2 does not return
%% {InfoName, _} (for example `undefined`) is selected as well.
%%
%% Returns [ProcessCount, InfoName, Value, SelectedCount, Selected], where
%% Selected is a list of {Pid, InfoNameInfo, RegisteredNameInfo}; the two info
%% values are read again after the selection.
get_process_info_and_large_than_value(InfoName, Value) ->
    Pids = erlang:processes(),
    Exceeds = fun(Pid) ->
        case erlang:process_info(Pid, InfoName) of
            {InfoName, Current} -> Current > Value;
            _ -> true
        end
    end,
    Selected = lists:filter(Exceeds, Pids),
    Details = [
        {Pid, erlang:process_info(Pid, InfoName), erlang:process_info(Pid, registered_name)}
     || Pid <- Selected
    ],
    [length(Pids), InfoName, Value, length(Details), Details].
%% Print the processes whose message_queue_len is not 0.
get_msg_queue() ->
    Report = get_process_info_and_zero_value(message_queue_len),
    io:fwrite("process count:~p~n~p value is not 0 count:~p~nLists:~p~n", Report).
%% Print the processes whose `memory` value is above 1048576.
get_memory() ->
    Report = get_process_info_and_large_than_value(memory, 1048576),
    io:fwrite("process count:~p~n~p value is large than ~p count:~p~nLists:~p~n", Report).
%% Print the processes whose `memory` value is above Value.
get_memory(Value) ->
    Report = get_process_info_and_large_than_value(memory, Value),
    io:fwrite("process count:~p~n~p value is large than ~p count:~p~nLists:~p~n", Report).
%% Print the processes whose `heap_size` value is above 1048576.
get_heap() ->
    Report = get_process_info_and_large_than_value(heap_size, 1048576),
    io:fwrite("process count:~p~n~p value is large than ~p count:~p~nLists:~p~n", Report).
%% Print the processes whose `heap_size` value is above Value.
get_heap(Value) ->
    Report = get_process_info_and_large_than_value(heap_size, Value),
    io:fwrite("process count:~p~n~p value is large than ~p count:~p~nLists:~p~n", Report).
%% Print the processes whose `memory` value is above 0.
get_processes() ->
    Report = get_process_info_and_large_than_value(memory, 0),
    io:fwrite("process count:~p~n~p value is large than ~p count:~p~nLists:~p~n", Report).