|
|
- -module(utVMInfo).
-
- -compile([export_all, nowarn_export_all]).
-
%% @doc Print a header line, then return one `{Table, Memory, Size}' tuple per
%% ETS table, sorted by memory with the largest first. `Memory' is the value
%% of `ets:info(Table, memory)', which ETS reports in machine words.
%%
%% Tables that disappear between `ets:all/0' and the `ets:info/2' calls are
%% skipped: `ets:info/2' returns `undefined' for them, and that atom would
%% otherwise compare greater than every integer and end up first in the list.
-spec show_cache() -> [{ets:tab(), non_neg_integer(), non_neg_integer()}].
show_cache() ->
    io:format("table name | memory | size~n", []),
    Rows = [
        {Tab, Memory, Size}
     || Tab <- ets:all(),
        Memory <- [ets:info(Tab, memory)],
        Size <- [ets:info(Tab, size)],
        is_integer(Memory),
        is_integer(Size)
    ],
    lists:reverse(lists:keysort(2, Rows)).
-
%% @doc Return `{RegisteredNameInfo, HeapSizeInfo}' for every process on the
%% node, ordered by the heap-size element, largest first. Both elements are
%% the unmodified results of `erlang:process_info/2'.
-spec show_process() -> [{term(), term()}].
show_process() ->
    Describe = fun(Pid) ->
        NameInfo = erlang:process_info(Pid, registered_name),
        HeapInfo = erlang:process_info(Pid, heap_size),
        {NameInfo, HeapInfo}
    end,
    Ascending = lists:keysort(2, lists:map(Describe, erlang:processes())),
    lists:reverse(Ascending).
-
%% @doc Return the number of processes currently existing on the local node.
%%
%% Uses `erlang:system_info(process_count)', which is documented to return the
%% same value as `length(erlang:processes())' without building the pid list.
-spec show_process_count() -> pos_integer().
show_process_count() ->
    erlang:system_info(process_count).
-
%% @doc Pretty-print the source of `Mod' reconstructed from the abstract code
%% stored in its beam file (the file reported by `code:which/1').
%%
%% Original author's note: used to confirm that the code running in production
%% is the expected version, because upgrades occasionally went wrong.
%%
%% Crashes with `badmatch' when the beam file cannot be read or carries no
%% abstract code (e.g. it was compiled without `debug_info').
-spec decompile(module()) -> ok.
decompile(Mod) ->
    {ok, {_, [{abstract_code, {_, Forms}}]}} =
        beam_lib:chunks(code:which(Mod), [abstract_code]),
    Source = erl_prettypr:format(erl_syntax:form_list(Forms)),
    %% `~ts' rather than `~s': the formatted source may contain characters
    %% above 255 (non-Latin-1 string literals), which `~s' rejects with badarg.
    io:format("~ts~n", [Source]).
-
%% @doc Print the backtrace of a process, given its pid or registered name.
%%
%% Original author's note: similar to jstack; useful when many processes are
%% suspended, the process count is too high, or the node is slow or hung.
%%
%% Returns `ok' after printing, or `undefined' when the name is not registered
%% or the process no longer exists.
-spec pstack(atom() | pid()) -> ok | undefined.
pstack(Reg) when is_atom(Reg) ->
    case whereis(Reg) of
        undefined -> undefined;
        Pid -> pstack(Pid)
    end;
pstack(Pid) ->
    %% process_info/2 returns `undefined' for a dead process; calling
    %% element/2 on that would raise badarg, so match the result explicitly.
    case process_info(Pid, backtrace) of
        {backtrace, Backtrace} -> io:format("~s~n", [Backtrace]);
        undefined -> undefined
    end.
-
%% ====================================================================
%% etop
%% Original author's note: analyses the processes using the most memory
%% or CPU, and stays usable on nodes with hundreds of thousands of
%% processes.
%% --------------------------------------------------------------------
%% @doc Start etop in a new process with text output, an interval of 10,
%% 20 lines, sorted by reductions (CPU ranking). Returns the pid of the
%% spawned process.
-spec etop() -> pid().
etop() ->
    Options = [{output, text}, {interval, 10}, {lines, 20}, {sort, reductions}],
    erlang:spawn(fun() -> etop:start(Options) end).
-
%% @doc Start etop in a new process with text output, an interval of 10,
%% 20 lines, sorted by memory (memory ranking). Returns the pid of the
%% spawned process.
-spec etop_mem() -> pid().
etop_mem() ->
    Options = [{output, text}, {interval, 10}, {lines, 20}, {sort, memory}],
    erlang:spawn(fun() -> etop:start(Options) end).
-
%% @doc Stop etop by delegating to `etop:stop/0'; its result is returned as is.
-spec etop_stop() -> term().
etop_stop() ->
    etop:stop().
%% ====================================================================
-
%% @doc Force a garbage collection of every process on the node.
%%
%% Original author's note: run this when process memory is too high, to tell a
%% real leak apart from garbage collection simply not keeping up.
-spec gc_all() -> ok.
gc_all() ->
    lists:foreach(fun erlang:garbage_collect/1, processes()).
-
%% @doc Profile a single `M:F(A)' call with fprof and print the analysis.
%%
%% Original author's note: this slows execution down severely, so use it only
%% on small workloads; fprof output is detailed and shows hot call paths.
%%
%% The fprof server is stopped in an `after' section, so it is not left running
%% when the profiled call (or a later step) raises. Any such exception is still
%% propagated to the caller. Returns `ok'.
-spec fprof(module(), atom(), [term()]) -> ok.
fprof(M, F, A) ->
    fprof:start(),
    try
        fprof:apply(M, F, A),
        fprof:profile(),
        fprof:analyse(),
        ok
    after
        fprof:stop()
    end.
-
%% @doc Run eprof over every process on the node, excluding the process
%% registered as `eprof' if there is one. `TimeoutSec' is passed unchanged to
%% `eprof/2'.
%%
%% Original author's notes: eprof affects live traffic, use with care. Keep the
%% timeout under 10s and the process count under 1000, otherwise the node may
%% crash. The output gives, per module/function, the call count and the time
%% spent in the function itself (time in callees of other modules is not
%% accumulated).
-spec eprof_all(non_neg_integer()) -> term().
eprof_all(TimeoutSec) ->
    Targets = lists:subtract(processes(), [whereis(eprof)]),
    eprof(Targets, TimeoutSec).
-
%% @doc Profile `Pids' with eprof for `TimeoutSec' seconds, print the total
%% analysis, then stop eprof. Returns the result of `eprof:stop/0'.
%%
%% `timer:sleep/1' takes milliseconds, so the seconds value is converted with
%% `timer:seconds/1'; passing it straight through made the profiling window a
%% thousand times shorter than the parameter name and usage notes imply.
-spec eprof([pid()], non_neg_integer()) -> stopped.
eprof(Pids, TimeoutSec) ->
    eprof:start(),
    eprof:start_profiling(Pids),
    timer:sleep(timer:seconds(TimeoutSec)),
    eprof:stop_profiling(),
    eprof:analyze(total),
    eprof:stop().
-
%% @doc Print scheduler utilisation measured over one second.
%%
%% Original author's note: this is the real per-scheduler utilisation; because
%% of spin-waiting and scheduling overhead it may be much lower than what `top'
%% shows.
-spec scheduler_usage() -> ok.
scheduler_usage() ->
    scheduler_usage(1000).

%% @doc Enable `scheduler_wall_time', take two samples `RunMs' milliseconds
%% apart, disable the flag again, and print `[{total, Ratio} | PerScheduler]'
%% where each ratio is (active time delta) / (total time delta).
-spec scheduler_usage(non_neg_integer()) -> ok.
scheduler_usage(RunMs) ->
    erlang:system_flag(scheduler_wall_time, true),
    Before = lists:sort(erlang:statistics(scheduler_wall_time)),
    timer:sleep(RunMs),
    After = lists:sort(erlang:statistics(scheduler_wall_time)),
    erlang:system_flag(scheduler_wall_time, false),
    %% Both samples are sorted, so zipping pairs entries in the same order.
    Samples = lists:zip(Before, After),
    PerScheduler = [
        {Id, (Active1 - Active0) / (Total1 - Total0)}
     || {{_, Active0, Total0}, {Id, Active1, Total1}} <- Samples
    ],
    Sum = fun({{_, Active0, Total0}, {_, Active1, Total1}}, {ActiveAcc, TotalAcc}) ->
        {ActiveAcc + (Active1 - Active0), TotalAcc + (Total1 - Total0)}
    end,
    {ActiveSum, TotalSum} = lists:foldl(Sum, {0, 0}, Samples),
    io:format("~p~n", [[{total, ActiveSum / TotalSum} | PerScheduler]]).
-
%% @doc Return scheduling statistics collected over one second.
%%
%% Original author's note: for each entry the first number is the count of
%% processes executed and the second the count of processes migrated.
-spec scheduler_stat() -> [{term(), integer(), integer()}].
scheduler_stat() ->
    scheduler_stat(1000).

%% @doc Enable `scheduling_statistics', read `total_scheduling_statistics'
%% twice, `RunMs' milliseconds apart, disable the flag, and return the
%% per-key differences as `{Key, Delta1, Delta2}' tuples.
-spec scheduler_stat(non_neg_integer()) -> [{term(), integer(), integer()}].
scheduler_stat(RunMs) ->
    erlang:system_flag(scheduling_statistics, enable),
    Before = erlang:system_info(total_scheduling_statistics),
    timer:sleep(RunMs),
    After = erlang:system_info(total_scheduling_statistics),
    erlang:system_flag(scheduling_statistics, disable),
    Delta = fun({{_Key, In0, Out0}, {Key, In1, Out1}}) ->
        {Key, In1 - In0, Out1 - Out0}
    end,
    [Delta(Pair) || Pair <- lists:zip(Before, After)].
-
%% ====================================================================
%% Trace logging
%% Original author's note: every call into the module is logged with its
%% full MFA; the output becomes hard to read when arguments are large.
%% --------------------------------------------------------------------
%% @doc Start the dbg tracer and trace calls to all functions (local and
%% exported) of `Mod' in all processes.
-spec trace(module()) -> term().
trace(Mod) ->
    dbg:tracer(),
    dbg:tpl({Mod, '_', '_'}, []),
    dbg:p(all, [c]).
-
%% @doc Like `trace/1', but first adds `Node' to the traced nodes with
%% `dbg:n/1'. Original author's note: the output is printed in the local shell.
-spec trace(node(), module()) -> term().
trace(Node, Mod) ->
    dbg:tracer(),
    dbg:n(Node),
    dbg:tpl({Mod, '_', '_'}, []),
    dbg:p(all, [c]).
-
%% @doc Stop tracing by delegating to `dbg:stop_clear/0'; its result is
%% returned as is.
-spec trace_stop() -> term().
trace_stop() ->
    dbg:stop_clear().
%% ====================================================================
-
%% @doc Memory / OOM troubleshooting: run `proc_mem/2' over every process on
%% the node, each tagged with the name `undefined'.
%%
%% Original author's note: etop cannot cope with nodes running 100k+
%% processes, while this can; once a suspicious process is found, investigate
%% it with `pstack/1' and its message queue length.
-spec proc_mem_all(number()) -> term().
proc_mem_all(SizeLimitKb) ->
    Tagged = lists:map(fun(Pid) -> {undefined, Pid} end, erlang:processes()),
    proc_mem(Tagged, SizeLimitKb).
-
%% @doc Run `proc_mem/2' over the live processes returned by
%% `release_handler_1:get_supervised_procs/0', keeping each entry's name.
-spec proc_mem(number()) -> term().
proc_mem(SizeLimitKb) ->
    Supervised = release_handler_1:get_supervised_procs(),
    Alive = [
        {Name, Pid}
     || {_Sup, Name, Pid, _Mods} <- Supervised,
        is_process_alive(Pid)
    ],
    proc_mem(Alive, SizeLimitKb).
-
%% @doc Report the processes in `Procs' whose total heap exceeds `SizeLimitKb'
%% kilobytes.
%%
%% `Procs' is a list of `{Name, Pid}'. Returns `{Total, Rows}' where `Rows' is
%% a list of `{Name, Pid, Bytes}' sorted by size, largest first, and `Total' is
%% the sum of the reported sizes. Processes for which `process_info/2' returns
%% no value (e.g. already dead) are ignored.
%%
%% `total_heap_size' is measured in words; it is converted to bytes with the
%% emulator's actual word size instead of assuming 8 bytes per word.
-spec proc_mem([{term(), pid()}], number()) ->
    {non_neg_integer(), [{term(), pid(), non_neg_integer()}]}.
proc_mem(Procs, SizeLimitKb) ->
    SizeLimit = SizeLimitKb * 1024,
    WordSize = erlang:system_info(wordsize),
    Collect = fun({Name, Pid}, {Acc, TotalSize} = Unchanged) ->
        case erlang:process_info(Pid, total_heap_size) of
            {total_heap_size, Words} when Words * WordSize > SizeLimit ->
                Size = Words * WordSize,
                {[{Name, Pid, Size} | Acc], TotalSize + Size};
            _ ->
                Unchanged
        end
    end,
    {Over, Total} = lists:foldl(Collect, {[], 0}, Procs),
    {Total, lists:reverse(lists:keysort(3, Over))}.
-
%% @doc Print the `N' processes using the most memory, one per line, as
%% `InitialCall : Memory'. The initial call is looked up under the
%% `$initial_call' key of the process dictionary via `util:prop_get_value/3';
%% processes without it (or whose info cannot be read) are left out.
-spec show(non_neg_integer()) -> ok.
show(N) ->
    Describe = fun(Pid) ->
        case catch process_info(Pid, [memory, dictionary]) of
            [{_, Memory}, {_, Dict}] ->
                {util:prop_get_value('$initial_call', Dict, null), Memory};
            _ ->
                {null, 0}
        end
    end,
    Known = [
        Row
     || {Name, _} = Row <- [Describe(Pid) || Pid <- processes()],
        Name =/= null
    ],
    Ranked = lists:sort(fun({_, M1}, {_, M2}) -> M1 > M2 end, Known),
    lists:foreach(
        fun({Name, Memory}) -> io:format("~p : ~p ~n", [Name, Memory]) end,
        lists:sublist(Ranked, N)
    ).
-
%% @doc Like `show/1', but also leaves out every process whose initial call is
%% a tuple whose first element is a member of `SkipNames'. Processes whose
%% initial call is not a non-empty tuple are left out as well.
-spec show(non_neg_integer(), [term()]) -> ok.
show(N, SkipNames) ->
    Describe = fun(Pid) ->
        case catch process_info(Pid, [memory, dictionary]) of
            [{_, Memory}, {_, Dict}] ->
                case util:prop_get_value('$initial_call', Dict, null) of
                    InitStart when is_tuple(InitStart), tuple_size(InitStart) > 0 ->
                        Skipped = lists:member(element(1, InitStart), SkipNames),
                        if
                            Skipped -> {null, 0};
                            true -> {InitStart, Memory}
                        end;
                    _ ->
                        {null, 0}
                end;
            _ ->
                {null, 0}
        end
    end,
    Known = [
        Row
     || {Name, _} = Row <- [Describe(Pid) || Pid <- processes()],
        Name =/= null
    ],
    Ranked = lists:sort(fun({_, M1}, {_, M2}) -> M1 > M2 end, Known),
    lists:foreach(
        fun({Name, Memory}) -> io:format("~p : ~p ~n", [Name, Memory]) end,
        lists:sublist(Ranked, N)
    ).
-
%% @doc Group processes by their `$initial_call' dictionary entry, sum the
%% memory of each group, and print the `N' groups with the largest total as
%% `InitialCall : per_memory=Average process_num=Count'. The average is an
%% integer division of the group total by the group size.
-spec show1(non_neg_integer()) -> ok.
show1(N) ->
    Accumulate = fun(Pid, Groups) ->
        case catch process_info(Pid, [memory, dictionary]) of
            [{_, Memory}, {_, Dict}] ->
                Key = util:prop_get_value('$initial_call', Dict, null),
                case lists:keyfind(Key, 1, Groups) of
                    {Key, Sum, Count} ->
                        %% Replace in place so the group keeps its position.
                        lists:keyreplace(Key, 1, Groups, {Key, Memory + Sum, Count + 1});
                    false ->
                        [{Key, Memory, 1} | Groups]
                end;
            _ ->
                Groups
        end
    end,
    Groups0 = lists:foldl(Accumulate, [], processes()),
    Named = lists:filter(fun({Name, _, _}) -> Name =/= null end, Groups0),
    Ranked = lists:sort(fun({_, M1, _}, {_, M2, _}) -> M1 > M2 end, Named),
    lists:foreach(
        fun({Name, Total, Count}) ->
            io:format("~p : per_memory=~p process_num=~p ~n", [Name, (Total div Count), Count])
        end,
        lists:sublist(Ranked, N)
    ).
-
%% @doc Return `erlang:system_info(schedulers)', i.e. the number of scheduler
%% threads of the emulator (the original comment calls this the CPU core count).
-spec coreCnt() -> pos_integer().
coreCnt() ->
    erlang:system_info(schedulers).
-
%% @doc Return `erlang:system_info(scheduler_id)', the id of the scheduler the
%% calling process is currently running on.
-spec coreIndex() -> pos_integer().
coreIndex() ->
    erlang:system_info(scheduler_id).
-
-
%% @doc Append the `erlang:process_info/1' of every process on the node to
%% `./logs/processes_infos.log', sleeping 20 ms after each entry.
%%
%% If the log file disappears while the dump is running it is reopened, and the
%% new descriptor is used for all following writes (previously the reopened
%% descriptor was dropped and later writes went to the closed one). The
%% descriptor is closed once all entries are written.
%%
%% Returns one `ok' per process, as before.
-spec process_infos() -> [ok].
process_infos() ->
    File = "./logs/processes_infos.log",
    OpenModes = [write, raw, binary, append],
    filelib:ensure_dir("./logs/"),
    {ok, Fd0} = file:open(File, OpenModes),
    Pids = erlang:processes(),
    WriteOne = fun(Pid, Fd) ->
        Info = io_lib:format("=>~p \n\n", [erlang:process_info(Pid)]),
        CurrentFd =
            case filelib:is_file(File) of
                true ->
                    Fd;
                false ->
                    file:close(Fd),
                    {ok, NewFd} = file:open(File, OpenModes),
                    NewFd
            end,
        file:write(CurrentFd, Info),
        timer:sleep(20),
        CurrentFd
    end,
    LastFd = lists:foldl(WriteOne, Fd0, Pids),
    file:close(LastFd),
    [ok || _ <- Pids].
-
%% @doc Format the current time (`os:timestamp/0') as an RFC 1123 style date
%% string. See `rfc1123_local_date/1'.
-spec rfc1123_local_date() -> string().
rfc1123_local_date() ->
    rfc1123_local_date(os:timestamp()).

%% @doc Format a point in time as `"Day, DD Mon YYYY HH:MM:SS GMT"'.
%%
%% Accepts:
%% - an integer, treated as seconds to which 62167219200 is added before
%%   `calendar:gregorian_seconds_to_datetime/1';
%% - a `{Mega, Sec, Micro}' timestamp, converted with
%%   `calendar:now_to_local_time/1';
%% - a `{{Y, M, D}, {H, Mi, S}}' datetime, formatted as given.
%%
%% NOTE(review): the suffix is always the literal "GMT", although timestamps
%% are converted to local time -- confirm this is intended.
-spec rfc1123_local_date(integer() | erlang:timestamp() | calendar:datetime()) -> string().
rfc1123_local_date(Epoch) when erlang:is_integer(Epoch) ->
    GregorianOffset = 62167219200,
    rfc1123_local_date(calendar:gregorian_seconds_to_datetime(Epoch + GregorianOffset));
rfc1123_local_date({_Mega, _Sec, _Micro} = Timestamp) ->
    rfc1123_local_date(calendar:now_to_local_time(Timestamp));
rfc1123_local_date({{YYYY, MM, DD} = Date, {Hour, Min, Sec}}) ->
    DayName = httpd_util:day(calendar:day_of_the_week(Date)),
    MonthName = httpd_util:month(MM),
    Text = io_lib:format(
        "~s, ~2.2.0w ~3.s ~4.4.0w ~2.2.0w:~2.2.0w:~2.2.0w GMT",
        [DayName, DD, MonthName, YYYY, Hour, Min, Sec]
    ),
    lists:flatten(Text).
-
%% @doc Write a crash-dump style report of the running node to
%% `erl_crash.dump' in the current directory.
%%
%% The report is the concatenation of: a header with the current date, the
%% system version, `erlang:system_info/1' for `info', `procs' and `dist', the
%% output of `ets_info/0', and the loaded-module listing in which every
%% newline is followed by `=mod:'. Returns the result of `file:write_file/2'.
-spec crash_dump() -> ok | {error, term()}.
crash_dump() ->
    Date = rfc1123_local_date(),
    Ets = ets_info(),
    Version = erlang:system_info(system_version),
    Info = erlang:system_info(info),
    Procs = erlang:system_info(procs),
    Dist = erlang:system_info(dist),
    Loaded = binary:replace(erlang:system_info(loaded), <<"\n">>, <<"\n=mod:">>, [global]),
    Report = erlang:iolist_to_binary([
        <<"=erl_crash_dump:0.2\n">>, Date, <<"\nSystem version: ">>,
        Version, Info, Procs, Ets, Dist,
        <<"=loaded_modules\n">>, Loaded
    ]),
    file:write_file("erl_crash.dump", Report).
-
%% @doc Concatenate the `ets_table_info/1' section of every ETS table into a
%% single binary.
-spec ets_info() -> binary().
ets_info() ->
    Sections = lists:map(fun ets_table_info/1, ets:all()),
    erlang:iolist_to_binary(Sections).
-
%% @doc Render one ETS table as a crash-dump style section:
%% `=ets:Owner', `Table:', `Name:' and `Objects:' lines. Both the `Table' and
%% the `Name' line carry the table's `name' property.
-spec ets_table_info(ets:tab()) -> binary().
ets_table_info(Table) ->
    Info = ets:info(Table),
    Field = fun(Key) -> proplists:get_value(Key, Info) end,
    Owner = erlang:pid_to_list(Field(owner)),
    Name = erlang:atom_to_list(Field(name)),
    Objects = erlang:integer_to_list(Field(size)),
    erlang:iolist_to_binary([
        <<"=ets:">>, Owner,
        <<"\nTable: ">>, Name,
        <<"\nName: ">>, Name,
        <<"\nObjects: ">>, Objects,
        <<"\n">>
    ]).
-
%% @doc Force a garbage collection of every process whose `memory' (as
%% reported by `erlang:process_info/2') exceeds `MemLim'. Returns `ok'.
%%
%% The process_info result is matched directly instead of checking
%% `is_process_alive/1' first: a process could die between the two calls, and
%% the former `{memory, Mem} = ...' match then crashed with badmatch.
-spec check_mem(number()) -> ok.
check_mem(MemLim) ->
    lists:foreach(
        fun(Pid) ->
            case erlang:process_info(Pid, memory) of
                {memory, Mem} when Mem > MemLim ->
                    erlang:garbage_collect(Pid);
                _ ->
                    %% Below the limit, or the process is already gone.
                    ok
            end
        end,
        erlang:processes()
    ).
-
%% @doc Print a summary of the node: node name, OTP release, scheduler count
%% (printed under the label "Free Threads"), memory used by processes, by ETS
%% and in total (each divided by 1024 twice), the process limit and the
%% current process count.
-spec top() -> ok.
top() ->
    ToMb = fun(Bytes) -> Bytes / 1024 / 1024 end,
    Release = erlang:system_info(otp_release),
    SchedNum = erlang:system_info(schedulers),
    ProcCount = erlang:system_info(process_count),
    ProcLimit = erlang:system_info(process_limit),
    ProcMemUsed = erlang:memory(processes_used),
    EtsMemAlc = erlang:memory(ets),
    MemTot = erlang:memory(total),
    Format =
        "++++++++++++++++++++++++++++++++++++++++++~n"
        " Node: ~p~n"
        " Erlang Ver: ~p~n"
        " Free Threads: ~p~n"
        " Process Used Memory: ~pMb~n"
        " Ets Used Memory: ~pMb~n"
        " Erlang VM Used Memory: ~pMb~n"
        " Process Limit: ~p~n"
        " Process Used: ~p~n"
        "++++++++++++++++++++++++++++++++++++++++++~n",
    Args = [
        node(), Release, SchedNum,
        ToMb(ProcMemUsed), ToMb(EtsMemAlc), ToMb(MemTot),
        ProcLimit, ProcCount
    ],
    io:format(Format, Args),
    ok.
-
%% @doc Build the same kind of node summary as `top/0' (without the node name)
%% and return it as a flat list of UTF-8 bytes instead of printing it.
%% Original author's note: needed by operations.
%%
%% The labels contain non-Latin-1 characters. Assuming this file is compiled
%% as UTF-8 (TODO confirm; it is the compiler default since OTP 17), the
%% formatted text holds code points above 255, which `list_to_binary/1'
%% rejects with badarg. `unicode:characters_to_binary/1' encodes them as UTF-8.
-spec top_back() -> [byte()].
top_back() ->
    Release = erlang:system_info(otp_release),
    SchedNum = erlang:system_info(schedulers),
    ProcCount = erlang:system_info(process_count),
    ProcLimit = erlang:system_info(process_limit),
    ProcMemUsed = erlang:memory(processes_used),
    EtsMemAlc = erlang:memory(ets),
    MemTot = erlang:memory(total),
    Str = io_lib:format(
        " Erlang 版本: ~p~n"
        " 可使用的调度线程: ~p~n"
        " 所有进程使用的内存: ~pMb~n"
        " 所有ets使用的内存: ~pMb~n"
        " Erlang系统占用内存: ~pMb~n"
        " 可创建进程数量上限: ~p~n"
        " 当前进程数: ~p~n",
        [Release, SchedNum, ProcMemUsed / 1024 / 1024, EtsMemAlc / 1024 / 1024,
         MemTot / 1024 / 1024, ProcLimit, ProcCount]
    ),
    binary_to_list(unicode:characters_to_binary(Str)).
-
%% @doc Print the 30 ETS tables using the most memory, largest first, with
%% their size in kilobytes. Returns `ok'.
%%
%% `ets:info(Tab, memory)' reports words, so the value is multiplied by the
%% emulator word size before being shown as Kb. Tables deleted after
%% `ets:all/0' (for which `ets:info/2' returns `undefined') are skipped rather
%% than crashing the listing.
-spec ets_mem() -> ok.
ets_mem() ->
    WordSize = erlang:system_info(wordsize),
    Mems = [
        {Tab, Words * WordSize}
     || Tab <- ets:all(),
        Words <- [ets:info(Tab, memory)],
        is_integer(Words)
    ],
    Top = lists:sublist(lists:reverse(lists:keysort(2, Mems)), 30),
    io:format("~n--------------------------------------------------~n"
              "~-30w ~w~n--------------------------------------------------~n",
              [table, used_memory]),
    lists:foreach(
        fun({Tab, Bytes}) ->
            io:format("~-30w ~wKb~n", [Tab, Bytes / 1024])
        end,
        Top
    ).
-
%% @doc Count the open ports whose name is "tcp_inet" (TCP sockets) and print
%% the count. Returns `ok'.
%%
%% Uses `erlang:port_info(Port, name)', which returns `undefined' for a port
%% that was closed after `erlang:ports/0'; such ports are simply not counted
%% (the previous `lists:keyfind/3' on `undefined' raised badarg).
-spec tcp_links() -> ok.
tcp_links() ->
    IsTcp = fun(Port) -> erlang:port_info(Port, name) =:= {name, "tcp_inet"} end,
    Sockets = lists:filter(IsTcp, erlang:ports()),
    io:format("~n当前socket数量(包括链接数据库的socket): ~w~n", [length(Sockets)]).
-
-
%% @doc Dump `erlang:process_info(Pid)' to a timestamped file named
%% `../logs/pid_info.dump-Y-M-D-H-Mi-S' (name built with `util:fbin/2' from
%% `util:local_time/0').
%%
%% Every info item is written on its own line; non-empty `messages' and
%% `dictionary' items are expanded to one entry per line. When no info is
%% available a notice is printed to standard output instead.
%%
%% The file is closed in an `after' section so the handle is released even if
%% writing raises. Returns `ok'.
-spec dump_process_info(pid()) -> ok.
dump_process_info(Pid) ->
    {{Year, Month, Day}, {Hour, Minutes, Second}} = util:local_time(),
    FileName = util:fbin(
        "~s-~w-~w-~w-~w-~w-~w",
        [<<"../logs/pid_info.dump">>, Year, Month, Day, Hour, Minutes, Second]
    ),
    {ok, FileHandle} = file:open(FileName, write),
    try
        case erlang:process_info(Pid) of
            Info when is_list(Info) ->
                lists:foreach(fun(Item) -> dump_info_item(FileHandle, Item) end, Info);
            _ ->
                io:format("not find pid info")
        end
    after
        file:close(FileHandle)
    end.

%% Write one process_info item: non-empty messages/dictionary lists are spread
%% over several lines, everything else is written as a single term.
dump_info_item(FileHandle, {Tag, [_ | _] = Entries}) when Tag =:= messages; Tag =:= dictionary ->
    io:format(FileHandle, "{~w,~n", [Tag]),
    lists:foreach(fun(Entry) -> io:format(FileHandle, " ~w~n", [Entry]) end, Entries),
    io:format(FileHandle, "}~n", []);
dump_info_item(FileHandle, Item) ->
    io:format(FileHandle, "~w~n", [Item]).
-
%% @doc Collect the processes whose `InfoName' process_info item is not 0.
%%
%% Returns `[ProcessCount, InfoName, MatchCount, Matches]', where `Matches' is
%% a list of `{Pid, InfoItem, RegisteredNameInfo}'.
%%
%% The item is read once per process and that same value is both tested and
%% reported. Processes that no longer exist (`process_info/2' returns
%% `undefined') are left out instead of being counted as non-zero. The
%% registered-name lookup is a separate call and can still yield `undefined'
%% if the process exits in between.
-spec get_process_info_and_zero_value(atom()) -> [term()].
get_process_info_and_zero_value(InfoName) ->
    PList = erlang:processes(),
    Matches = lists:filtermap(
        fun(Pid) ->
            case erlang:process_info(Pid, InfoName) of
                undefined ->
                    false;
                {InfoName, 0} ->
                    false;
                Info ->
                    {true, {Pid, Info, erlang:process_info(Pid, registered_name)}}
            end
        end,
        PList
    ),
    [length(PList), InfoName, length(Matches), Matches].
-
%% @doc Collect the processes whose `InfoName' process_info item is greater
%% than `Value'.
%%
%% Returns `[ProcessCount, InfoName, Value, MatchCount, Matches]', where
%% `Matches' is a list of `{Pid, InfoItem, RegisteredNameInfo}'.
%%
%% The item is read once per process and that same value is both tested and
%% reported. Processes that no longer exist (`process_info/2' returns
%% `undefined') are left out instead of being counted as matches. Results that
%% are not an `{InfoName, V}' pair are kept, as before.
-spec get_process_info_and_large_than_value(atom(), term()) -> [term()].
get_process_info_and_large_than_value(InfoName, Value) ->
    PList = erlang:processes(),
    Matches = lists:filtermap(
        fun(Pid) ->
            case erlang:process_info(Pid, InfoName) of
                undefined ->
                    false;
                {InfoName, V} when not (V > Value) ->
                    false;
                Info ->
                    {true, {Pid, Info, erlang:process_info(Pid, registered_name)}}
            end
        end,
        PList
    ),
    [length(PList), InfoName, Value, length(Matches), Matches].
-
%% @doc Print the process count and the processes with a non-empty message
%% queue, as collected by `get_process_info_and_zero_value/1'.
-spec get_msg_queue() -> ok.
get_msg_queue() ->
    Report = get_process_info_and_zero_value(message_queue_len),
    io:format("process count:~p~n~p value is not 0 count:~p~nLists:~p~n", Report).
-
%% @doc Print the processes whose `memory' exceeds 1048576.
-spec get_memory() -> ok.
get_memory() ->
    get_memory(1048576).

%% @doc Print the process count and the processes whose `memory' exceeds
%% `Value', as collected by `get_process_info_and_large_than_value/2'.
-spec get_memory(term()) -> ok.
get_memory(Value) ->
    Report = get_process_info_and_large_than_value(memory, Value),
    io:format("process count:~p~n~p value is large than ~p count:~p~nLists:~p~n", Report).
-
%% @doc Print the processes whose `heap_size' exceeds 1048576.
-spec get_heap() -> ok.
get_heap() ->
    get_heap(1048576).

%% @doc Print the process count and the processes whose `heap_size' exceeds
%% `Value', as collected by `get_process_info_and_large_than_value/2'.
-spec get_heap(term()) -> ok.
get_heap(Value) ->
    Report = get_process_info_and_large_than_value(heap_size, Value),
    io:format("process count:~p~n~p value is large than ~p count:~p~nLists:~p~n", Report).
-
%% @doc Print the process count and every process whose `memory' is greater
%% than 0, as collected by `get_process_info_and_large_than_value/2'.
-spec get_processes() -> ok.
get_processes() ->
    Report = get_process_info_and_large_than_value(memory, 0),
    io:format("process count:~p~n~p value is large than ~p count:~p~nLists:~p~n", Report).
-
-
|