session.c 60 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250
  1. // SPDX-License-Identifier: GPL-2.0
  2. #include <errno.h>
  3. #include <inttypes.h>
  4. #include <linux/kernel.h>
  5. #include <traceevent/event-parse.h>
  6. #include <api/fs/fs.h>
  7. #include <byteswap.h>
  8. #include <unistd.h>
  9. #include <sys/types.h>
  10. #include <sys/mman.h>
  11. #include "evlist.h"
  12. #include "evsel.h"
  13. #include "memswap.h"
  14. #include "session.h"
  15. #include "tool.h"
  16. #include "sort.h"
  17. #include "util.h"
  18. #include "cpumap.h"
  19. #include "perf_regs.h"
  20. #include "asm/bug.h"
  21. #include "auxtrace.h"
  22. #include "thread.h"
  23. #include "thread-stack.h"
  24. #include "stat.h"
  25. #include "arch/common.h"
  26. static int perf_session__deliver_event(struct perf_session *session,
  27. union perf_event *event,
  28. struct perf_tool *tool,
  29. u64 file_offset);
  30. static int perf_session__open(struct perf_session *session)
  31. {
  32. struct perf_data *data = session->data;
  33. if (perf_session__read_header(session) < 0) {
  34. pr_err("incompatible file format (rerun with -v to learn more)\n");
  35. return -1;
  36. }
  37. if (perf_data__is_pipe(data))
  38. return 0;
  39. if (perf_header__has_feat(&session->header, HEADER_STAT))
  40. return 0;
  41. if (!perf_evlist__valid_sample_type(session->evlist)) {
  42. pr_err("non matching sample_type\n");
  43. return -1;
  44. }
  45. if (!perf_evlist__valid_sample_id_all(session->evlist)) {
  46. pr_err("non matching sample_id_all\n");
  47. return -1;
  48. }
  49. if (!perf_evlist__valid_read_format(session->evlist)) {
  50. pr_err("non matching read_format\n");
  51. return -1;
  52. }
  53. return 0;
  54. }
  55. void perf_session__set_id_hdr_size(struct perf_session *session)
  56. {
  57. u16 id_hdr_size = perf_evlist__id_hdr_size(session->evlist);
  58. machines__set_id_hdr_size(&session->machines, id_hdr_size);
  59. }
  60. int perf_session__create_kernel_maps(struct perf_session *session)
  61. {
  62. int ret = machine__create_kernel_maps(&session->machines.host);
  63. if (ret >= 0)
  64. ret = machines__create_guest_kernel_maps(&session->machines);
  65. return ret;
  66. }
  67. static void perf_session__destroy_kernel_maps(struct perf_session *session)
  68. {
  69. machines__destroy_kernel_maps(&session->machines);
  70. }
  71. static bool perf_session__has_comm_exec(struct perf_session *session)
  72. {
  73. struct perf_evsel *evsel;
  74. evlist__for_each_entry(session->evlist, evsel) {
  75. if (evsel->attr.comm_exec)
  76. return true;
  77. }
  78. return false;
  79. }
  80. static void perf_session__set_comm_exec(struct perf_session *session)
  81. {
  82. bool comm_exec = perf_session__has_comm_exec(session);
  83. machines__set_comm_exec(&session->machines, comm_exec);
  84. }
  85. static int ordered_events__deliver_event(struct ordered_events *oe,
  86. struct ordered_event *event)
  87. {
  88. struct perf_session *session = container_of(oe, struct perf_session,
  89. ordered_events);
  90. return perf_session__deliver_event(session, event->event,
  91. session->tool, event->file_offset);
  92. }
  93. struct perf_session *perf_session__new(struct perf_data *data,
  94. bool repipe, struct perf_tool *tool)
  95. {
  96. struct perf_session *session = zalloc(sizeof(*session));
  97. if (!session)
  98. goto out;
  99. session->repipe = repipe;
  100. session->tool = tool;
  101. INIT_LIST_HEAD(&session->auxtrace_index);
  102. machines__init(&session->machines);
  103. ordered_events__init(&session->ordered_events, ordered_events__deliver_event);
  104. if (data) {
  105. if (perf_data__open(data))
  106. goto out_delete;
  107. session->data = data;
  108. if (perf_data__is_read(data)) {
  109. if (perf_session__open(session) < 0)
  110. goto out_close;
  111. /*
  112. * set session attributes that are present in perf.data
  113. * but not in pipe-mode.
  114. */
  115. if (!data->is_pipe) {
  116. perf_session__set_id_hdr_size(session);
  117. perf_session__set_comm_exec(session);
  118. }
  119. }
  120. } else {
  121. session->machines.host.env = &perf_env;
  122. }
  123. session->machines.host.single_address_space =
  124. perf_env__single_address_space(session->machines.host.env);
  125. if (!data || perf_data__is_write(data)) {
  126. /*
  127. * In O_RDONLY mode this will be performed when reading the
  128. * kernel MMAP event, in perf_event__process_mmap().
  129. */
  130. if (perf_session__create_kernel_maps(session) < 0)
  131. pr_warning("Cannot read kernel map\n");
  132. }
  133. /*
  134. * In pipe-mode, evlist is empty until PERF_RECORD_HEADER_ATTR is
  135. * processed, so perf_evlist__sample_id_all is not meaningful here.
  136. */
  137. if ((!data || !data->is_pipe) && tool && tool->ordering_requires_timestamps &&
  138. tool->ordered_events && !perf_evlist__sample_id_all(session->evlist)) {
  139. dump_printf("WARNING: No sample_id_all support, falling back to unordered processing\n");
  140. tool->ordered_events = false;
  141. }
  142. return session;
  143. out_close:
  144. perf_data__close(data);
  145. out_delete:
  146. perf_session__delete(session);
  147. out:
  148. return NULL;
  149. }
  150. static void perf_session__delete_threads(struct perf_session *session)
  151. {
  152. machine__delete_threads(&session->machines.host);
  153. }
  154. void perf_session__delete(struct perf_session *session)
  155. {
  156. if (session == NULL)
  157. return;
  158. auxtrace__free(session);
  159. auxtrace_index__free(&session->auxtrace_index);
  160. perf_session__destroy_kernel_maps(session);
  161. perf_session__delete_threads(session);
  162. perf_env__exit(&session->header.env);
  163. machines__exit(&session->machines);
  164. if (session->data)
  165. perf_data__close(session->data);
  166. free(session);
  167. }
  168. static int process_event_synth_tracing_data_stub(struct perf_tool *tool
  169. __maybe_unused,
  170. union perf_event *event
  171. __maybe_unused,
  172. struct perf_session *session
  173. __maybe_unused)
  174. {
  175. dump_printf(": unhandled!\n");
  176. return 0;
  177. }
  178. static int process_event_synth_attr_stub(struct perf_tool *tool __maybe_unused,
  179. union perf_event *event __maybe_unused,
  180. struct perf_evlist **pevlist
  181. __maybe_unused)
  182. {
  183. dump_printf(": unhandled!\n");
  184. return 0;
  185. }
  186. static int process_event_synth_event_update_stub(struct perf_tool *tool __maybe_unused,
  187. union perf_event *event __maybe_unused,
  188. struct perf_evlist **pevlist
  189. __maybe_unused)
  190. {
  191. if (dump_trace)
  192. perf_event__fprintf_event_update(event, stdout);
  193. dump_printf(": unhandled!\n");
  194. return 0;
  195. }
  196. static int process_event_sample_stub(struct perf_tool *tool __maybe_unused,
  197. union perf_event *event __maybe_unused,
  198. struct perf_sample *sample __maybe_unused,
  199. struct perf_evsel *evsel __maybe_unused,
  200. struct machine *machine __maybe_unused)
  201. {
  202. dump_printf(": unhandled!\n");
  203. return 0;
  204. }
  205. static int process_event_stub(struct perf_tool *tool __maybe_unused,
  206. union perf_event *event __maybe_unused,
  207. struct perf_sample *sample __maybe_unused,
  208. struct machine *machine __maybe_unused)
  209. {
  210. dump_printf(": unhandled!\n");
  211. return 0;
  212. }
  213. static int process_finished_round_stub(struct perf_tool *tool __maybe_unused,
  214. union perf_event *event __maybe_unused,
  215. struct ordered_events *oe __maybe_unused)
  216. {
  217. dump_printf(": unhandled!\n");
  218. return 0;
  219. }
  220. static int process_finished_round(struct perf_tool *tool,
  221. union perf_event *event,
  222. struct ordered_events *oe);
  223. static int skipn(int fd, off_t n)
  224. {
  225. char buf[4096];
  226. ssize_t ret;
  227. while (n > 0) {
  228. ret = read(fd, buf, min(n, (off_t)sizeof(buf)));
  229. if (ret <= 0)
  230. return ret;
  231. n -= ret;
  232. }
  233. return 0;
  234. }
  235. static s64 process_event_auxtrace_stub(struct perf_tool *tool __maybe_unused,
  236. union perf_event *event,
  237. struct perf_session *session
  238. __maybe_unused)
  239. {
  240. dump_printf(": unhandled!\n");
  241. if (perf_data__is_pipe(session->data))
  242. skipn(perf_data__fd(session->data), event->auxtrace.size);
  243. return event->auxtrace.size;
  244. }
  245. static int process_event_op2_stub(struct perf_tool *tool __maybe_unused,
  246. union perf_event *event __maybe_unused,
  247. struct perf_session *session __maybe_unused)
  248. {
  249. dump_printf(": unhandled!\n");
  250. return 0;
  251. }
  252. static
  253. int process_event_thread_map_stub(struct perf_tool *tool __maybe_unused,
  254. union perf_event *event __maybe_unused,
  255. struct perf_session *session __maybe_unused)
  256. {
  257. if (dump_trace)
  258. perf_event__fprintf_thread_map(event, stdout);
  259. dump_printf(": unhandled!\n");
  260. return 0;
  261. }
  262. static
  263. int process_event_cpu_map_stub(struct perf_tool *tool __maybe_unused,
  264. union perf_event *event __maybe_unused,
  265. struct perf_session *session __maybe_unused)
  266. {
  267. if (dump_trace)
  268. perf_event__fprintf_cpu_map(event, stdout);
  269. dump_printf(": unhandled!\n");
  270. return 0;
  271. }
  272. static
  273. int process_event_stat_config_stub(struct perf_tool *tool __maybe_unused,
  274. union perf_event *event __maybe_unused,
  275. struct perf_session *session __maybe_unused)
  276. {
  277. if (dump_trace)
  278. perf_event__fprintf_stat_config(event, stdout);
  279. dump_printf(": unhandled!\n");
  280. return 0;
  281. }
  282. static int process_stat_stub(struct perf_tool *tool __maybe_unused,
  283. union perf_event *event __maybe_unused,
  284. struct perf_session *perf_session
  285. __maybe_unused)
  286. {
  287. if (dump_trace)
  288. perf_event__fprintf_stat(event, stdout);
  289. dump_printf(": unhandled!\n");
  290. return 0;
  291. }
  292. static int process_stat_round_stub(struct perf_tool *tool __maybe_unused,
  293. union perf_event *event __maybe_unused,
  294. struct perf_session *perf_session
  295. __maybe_unused)
  296. {
  297. if (dump_trace)
  298. perf_event__fprintf_stat_round(event, stdout);
  299. dump_printf(": unhandled!\n");
  300. return 0;
  301. }
  302. void perf_tool__fill_defaults(struct perf_tool *tool)
  303. {
  304. if (tool->sample == NULL)
  305. tool->sample = process_event_sample_stub;
  306. if (tool->mmap == NULL)
  307. tool->mmap = process_event_stub;
  308. if (tool->mmap2 == NULL)
  309. tool->mmap2 = process_event_stub;
  310. if (tool->comm == NULL)
  311. tool->comm = process_event_stub;
  312. if (tool->namespaces == NULL)
  313. tool->namespaces = process_event_stub;
  314. if (tool->fork == NULL)
  315. tool->fork = process_event_stub;
  316. if (tool->exit == NULL)
  317. tool->exit = process_event_stub;
  318. if (tool->lost == NULL)
  319. tool->lost = perf_event__process_lost;
  320. if (tool->lost_samples == NULL)
  321. tool->lost_samples = perf_event__process_lost_samples;
  322. if (tool->aux == NULL)
  323. tool->aux = perf_event__process_aux;
  324. if (tool->itrace_start == NULL)
  325. tool->itrace_start = perf_event__process_itrace_start;
  326. if (tool->context_switch == NULL)
  327. tool->context_switch = perf_event__process_switch;
  328. if (tool->read == NULL)
  329. tool->read = process_event_sample_stub;
  330. if (tool->throttle == NULL)
  331. tool->throttle = process_event_stub;
  332. if (tool->unthrottle == NULL)
  333. tool->unthrottle = process_event_stub;
  334. if (tool->attr == NULL)
  335. tool->attr = process_event_synth_attr_stub;
  336. if (tool->event_update == NULL)
  337. tool->event_update = process_event_synth_event_update_stub;
  338. if (tool->tracing_data == NULL)
  339. tool->tracing_data = process_event_synth_tracing_data_stub;
  340. if (tool->build_id == NULL)
  341. tool->build_id = process_event_op2_stub;
  342. if (tool->finished_round == NULL) {
  343. if (tool->ordered_events)
  344. tool->finished_round = process_finished_round;
  345. else
  346. tool->finished_round = process_finished_round_stub;
  347. }
  348. if (tool->id_index == NULL)
  349. tool->id_index = process_event_op2_stub;
  350. if (tool->auxtrace_info == NULL)
  351. tool->auxtrace_info = process_event_op2_stub;
  352. if (tool->auxtrace == NULL)
  353. tool->auxtrace = process_event_auxtrace_stub;
  354. if (tool->auxtrace_error == NULL)
  355. tool->auxtrace_error = process_event_op2_stub;
  356. if (tool->thread_map == NULL)
  357. tool->thread_map = process_event_thread_map_stub;
  358. if (tool->cpu_map == NULL)
  359. tool->cpu_map = process_event_cpu_map_stub;
  360. if (tool->stat_config == NULL)
  361. tool->stat_config = process_event_stat_config_stub;
  362. if (tool->stat == NULL)
  363. tool->stat = process_stat_stub;
  364. if (tool->stat_round == NULL)
  365. tool->stat_round = process_stat_round_stub;
  366. if (tool->time_conv == NULL)
  367. tool->time_conv = process_event_op2_stub;
  368. if (tool->feature == NULL)
  369. tool->feature = process_event_op2_stub;
  370. }
  371. static void swap_sample_id_all(union perf_event *event, void *data)
  372. {
  373. void *end = (void *) event + event->header.size;
  374. int size = end - data;
  375. BUG_ON(size % sizeof(u64));
  376. mem_bswap_64(data, size);
  377. }
  378. static void perf_event__all64_swap(union perf_event *event,
  379. bool sample_id_all __maybe_unused)
  380. {
  381. struct perf_event_header *hdr = &event->header;
  382. mem_bswap_64(hdr + 1, event->header.size - sizeof(*hdr));
  383. }
  384. static void perf_event__comm_swap(union perf_event *event, bool sample_id_all)
  385. {
  386. event->comm.pid = bswap_32(event->comm.pid);
  387. event->comm.tid = bswap_32(event->comm.tid);
  388. if (sample_id_all) {
  389. void *data = &event->comm.comm;
  390. data += PERF_ALIGN(strlen(data) + 1, sizeof(u64));
  391. swap_sample_id_all(event, data);
  392. }
  393. }
  394. static void perf_event__mmap_swap(union perf_event *event,
  395. bool sample_id_all)
  396. {
  397. event->mmap.pid = bswap_32(event->mmap.pid);
  398. event->mmap.tid = bswap_32(event->mmap.tid);
  399. event->mmap.start = bswap_64(event->mmap.start);
  400. event->mmap.len = bswap_64(event->mmap.len);
  401. event->mmap.pgoff = bswap_64(event->mmap.pgoff);
  402. if (sample_id_all) {
  403. void *data = &event->mmap.filename;
  404. data += PERF_ALIGN(strlen(data) + 1, sizeof(u64));
  405. swap_sample_id_all(event, data);
  406. }
  407. }
  408. static void perf_event__mmap2_swap(union perf_event *event,
  409. bool sample_id_all)
  410. {
  411. event->mmap2.pid = bswap_32(event->mmap2.pid);
  412. event->mmap2.tid = bswap_32(event->mmap2.tid);
  413. event->mmap2.start = bswap_64(event->mmap2.start);
  414. event->mmap2.len = bswap_64(event->mmap2.len);
  415. event->mmap2.pgoff = bswap_64(event->mmap2.pgoff);
  416. event->mmap2.maj = bswap_32(event->mmap2.maj);
  417. event->mmap2.min = bswap_32(event->mmap2.min);
  418. event->mmap2.ino = bswap_64(event->mmap2.ino);
  419. event->mmap2.ino_generation = bswap_64(event->mmap2.ino_generation);
  420. if (sample_id_all) {
  421. void *data = &event->mmap2.filename;
  422. data += PERF_ALIGN(strlen(data) + 1, sizeof(u64));
  423. swap_sample_id_all(event, data);
  424. }
  425. }
  426. static void perf_event__task_swap(union perf_event *event, bool sample_id_all)
  427. {
  428. event->fork.pid = bswap_32(event->fork.pid);
  429. event->fork.tid = bswap_32(event->fork.tid);
  430. event->fork.ppid = bswap_32(event->fork.ppid);
  431. event->fork.ptid = bswap_32(event->fork.ptid);
  432. event->fork.time = bswap_64(event->fork.time);
  433. if (sample_id_all)
  434. swap_sample_id_all(event, &event->fork + 1);
  435. }
  436. static void perf_event__read_swap(union perf_event *event, bool sample_id_all)
  437. {
  438. event->read.pid = bswap_32(event->read.pid);
  439. event->read.tid = bswap_32(event->read.tid);
  440. event->read.value = bswap_64(event->read.value);
  441. event->read.time_enabled = bswap_64(event->read.time_enabled);
  442. event->read.time_running = bswap_64(event->read.time_running);
  443. event->read.id = bswap_64(event->read.id);
  444. if (sample_id_all)
  445. swap_sample_id_all(event, &event->read + 1);
  446. }
  447. static void perf_event__aux_swap(union perf_event *event, bool sample_id_all)
  448. {
  449. event->aux.aux_offset = bswap_64(event->aux.aux_offset);
  450. event->aux.aux_size = bswap_64(event->aux.aux_size);
  451. event->aux.flags = bswap_64(event->aux.flags);
  452. if (sample_id_all)
  453. swap_sample_id_all(event, &event->aux + 1);
  454. }
  455. static void perf_event__itrace_start_swap(union perf_event *event,
  456. bool sample_id_all)
  457. {
  458. event->itrace_start.pid = bswap_32(event->itrace_start.pid);
  459. event->itrace_start.tid = bswap_32(event->itrace_start.tid);
  460. if (sample_id_all)
  461. swap_sample_id_all(event, &event->itrace_start + 1);
  462. }
  463. static void perf_event__switch_swap(union perf_event *event, bool sample_id_all)
  464. {
  465. if (event->header.type == PERF_RECORD_SWITCH_CPU_WIDE) {
  466. event->context_switch.next_prev_pid =
  467. bswap_32(event->context_switch.next_prev_pid);
  468. event->context_switch.next_prev_tid =
  469. bswap_32(event->context_switch.next_prev_tid);
  470. }
  471. if (sample_id_all)
  472. swap_sample_id_all(event, &event->context_switch + 1);
  473. }
  474. static void perf_event__throttle_swap(union perf_event *event,
  475. bool sample_id_all)
  476. {
  477. event->throttle.time = bswap_64(event->throttle.time);
  478. event->throttle.id = bswap_64(event->throttle.id);
  479. event->throttle.stream_id = bswap_64(event->throttle.stream_id);
  480. if (sample_id_all)
  481. swap_sample_id_all(event, &event->throttle + 1);
  482. }
  483. static u8 revbyte(u8 b)
  484. {
  485. int rev = (b >> 4) | ((b & 0xf) << 4);
  486. rev = ((rev & 0xcc) >> 2) | ((rev & 0x33) << 2);
  487. rev = ((rev & 0xaa) >> 1) | ((rev & 0x55) << 1);
  488. return (u8) rev;
  489. }
  490. /*
  491. * XXX this is hack in attempt to carry flags bitfield
  492. * through endian village. ABI says:
  493. *
  494. * Bit-fields are allocated from right to left (least to most significant)
  495. * on little-endian implementations and from left to right (most to least
  496. * significant) on big-endian implementations.
  497. *
  498. * The above seems to be byte specific, so we need to reverse each
  499. * byte of the bitfield. 'Internet' also says this might be implementation
  500. * specific and we probably need proper fix and carry perf_event_attr
  501. * bitfield flags in separate data file FEAT_ section. Thought this seems
  502. * to work for now.
  503. */
  504. static void swap_bitfield(u8 *p, unsigned len)
  505. {
  506. unsigned i;
  507. for (i = 0; i < len; i++) {
  508. *p = revbyte(*p);
  509. p++;
  510. }
  511. }
  512. /* exported for swapping attributes in file header */
  513. void perf_event__attr_swap(struct perf_event_attr *attr)
  514. {
  515. attr->type = bswap_32(attr->type);
  516. attr->size = bswap_32(attr->size);
  517. #define bswap_safe(f, n) \
  518. (attr->size > (offsetof(struct perf_event_attr, f) + \
  519. sizeof(attr->f) * (n)))
  520. #define bswap_field(f, sz) \
  521. do { \
  522. if (bswap_safe(f, 0)) \
  523. attr->f = bswap_##sz(attr->f); \
  524. } while(0)
  525. #define bswap_field_16(f) bswap_field(f, 16)
  526. #define bswap_field_32(f) bswap_field(f, 32)
  527. #define bswap_field_64(f) bswap_field(f, 64)
  528. bswap_field_64(config);
  529. bswap_field_64(sample_period);
  530. bswap_field_64(sample_type);
  531. bswap_field_64(read_format);
  532. bswap_field_32(wakeup_events);
  533. bswap_field_32(bp_type);
  534. bswap_field_64(bp_addr);
  535. bswap_field_64(bp_len);
  536. bswap_field_64(branch_sample_type);
  537. bswap_field_64(sample_regs_user);
  538. bswap_field_32(sample_stack_user);
  539. bswap_field_32(aux_watermark);
  540. bswap_field_16(sample_max_stack);
  541. /*
  542. * After read_format are bitfields. Check read_format because
  543. * we are unable to use offsetof on bitfield.
  544. */
  545. if (bswap_safe(read_format, 1))
  546. swap_bitfield((u8 *) (&attr->read_format + 1),
  547. sizeof(u64));
  548. #undef bswap_field_64
  549. #undef bswap_field_32
  550. #undef bswap_field
  551. #undef bswap_safe
  552. }
  553. static void perf_event__hdr_attr_swap(union perf_event *event,
  554. bool sample_id_all __maybe_unused)
  555. {
  556. size_t size;
  557. perf_event__attr_swap(&event->attr.attr);
  558. size = event->header.size;
  559. size -= (void *)&event->attr.id - (void *)event;
  560. mem_bswap_64(event->attr.id, size);
  561. }
  562. static void perf_event__event_update_swap(union perf_event *event,
  563. bool sample_id_all __maybe_unused)
  564. {
  565. event->event_update.type = bswap_64(event->event_update.type);
  566. event->event_update.id = bswap_64(event->event_update.id);
  567. }
  568. static void perf_event__event_type_swap(union perf_event *event,
  569. bool sample_id_all __maybe_unused)
  570. {
  571. event->event_type.event_type.event_id =
  572. bswap_64(event->event_type.event_type.event_id);
  573. }
  574. static void perf_event__tracing_data_swap(union perf_event *event,
  575. bool sample_id_all __maybe_unused)
  576. {
  577. event->tracing_data.size = bswap_32(event->tracing_data.size);
  578. }
  579. static void perf_event__auxtrace_info_swap(union perf_event *event,
  580. bool sample_id_all __maybe_unused)
  581. {
  582. size_t size;
  583. event->auxtrace_info.type = bswap_32(event->auxtrace_info.type);
  584. size = event->header.size;
  585. size -= (void *)&event->auxtrace_info.priv - (void *)event;
  586. mem_bswap_64(event->auxtrace_info.priv, size);
  587. }
  588. static void perf_event__auxtrace_swap(union perf_event *event,
  589. bool sample_id_all __maybe_unused)
  590. {
  591. event->auxtrace.size = bswap_64(event->auxtrace.size);
  592. event->auxtrace.offset = bswap_64(event->auxtrace.offset);
  593. event->auxtrace.reference = bswap_64(event->auxtrace.reference);
  594. event->auxtrace.idx = bswap_32(event->auxtrace.idx);
  595. event->auxtrace.tid = bswap_32(event->auxtrace.tid);
  596. event->auxtrace.cpu = bswap_32(event->auxtrace.cpu);
  597. }
  598. static void perf_event__auxtrace_error_swap(union perf_event *event,
  599. bool sample_id_all __maybe_unused)
  600. {
  601. event->auxtrace_error.type = bswap_32(event->auxtrace_error.type);
  602. event->auxtrace_error.code = bswap_32(event->auxtrace_error.code);
  603. event->auxtrace_error.cpu = bswap_32(event->auxtrace_error.cpu);
  604. event->auxtrace_error.pid = bswap_32(event->auxtrace_error.pid);
  605. event->auxtrace_error.tid = bswap_32(event->auxtrace_error.tid);
  606. event->auxtrace_error.ip = bswap_64(event->auxtrace_error.ip);
  607. }
  608. static void perf_event__thread_map_swap(union perf_event *event,
  609. bool sample_id_all __maybe_unused)
  610. {
  611. unsigned i;
  612. event->thread_map.nr = bswap_64(event->thread_map.nr);
  613. for (i = 0; i < event->thread_map.nr; i++)
  614. event->thread_map.entries[i].pid = bswap_64(event->thread_map.entries[i].pid);
  615. }
  616. static void perf_event__cpu_map_swap(union perf_event *event,
  617. bool sample_id_all __maybe_unused)
  618. {
  619. struct cpu_map_data *data = &event->cpu_map.data;
  620. struct cpu_map_entries *cpus;
  621. struct cpu_map_mask *mask;
  622. unsigned i;
  623. data->type = bswap_64(data->type);
  624. switch (data->type) {
  625. case PERF_CPU_MAP__CPUS:
  626. cpus = (struct cpu_map_entries *)data->data;
  627. cpus->nr = bswap_16(cpus->nr);
  628. for (i = 0; i < cpus->nr; i++)
  629. cpus->cpu[i] = bswap_16(cpus->cpu[i]);
  630. break;
  631. case PERF_CPU_MAP__MASK:
  632. mask = (struct cpu_map_mask *) data->data;
  633. mask->nr = bswap_16(mask->nr);
  634. mask->long_size = bswap_16(mask->long_size);
  635. switch (mask->long_size) {
  636. case 4: mem_bswap_32(&mask->mask, mask->nr); break;
  637. case 8: mem_bswap_64(&mask->mask, mask->nr); break;
  638. default:
  639. pr_err("cpu_map swap: unsupported long size\n");
  640. }
  641. default:
  642. break;
  643. }
  644. }
  645. static void perf_event__stat_config_swap(union perf_event *event,
  646. bool sample_id_all __maybe_unused)
  647. {
  648. u64 size;
  649. size = event->stat_config.nr * sizeof(event->stat_config.data[0]);
  650. size += 1; /* nr item itself */
  651. mem_bswap_64(&event->stat_config.nr, size);
  652. }
  653. static void perf_event__stat_swap(union perf_event *event,
  654. bool sample_id_all __maybe_unused)
  655. {
  656. event->stat.id = bswap_64(event->stat.id);
  657. event->stat.thread = bswap_32(event->stat.thread);
  658. event->stat.cpu = bswap_32(event->stat.cpu);
  659. event->stat.val = bswap_64(event->stat.val);
  660. event->stat.ena = bswap_64(event->stat.ena);
  661. event->stat.run = bswap_64(event->stat.run);
  662. }
  663. static void perf_event__stat_round_swap(union perf_event *event,
  664. bool sample_id_all __maybe_unused)
  665. {
  666. event->stat_round.type = bswap_64(event->stat_round.type);
  667. event->stat_round.time = bswap_64(event->stat_round.time);
  668. }
  669. typedef void (*perf_event__swap_op)(union perf_event *event,
  670. bool sample_id_all);
  671. static perf_event__swap_op perf_event__swap_ops[] = {
  672. [PERF_RECORD_MMAP] = perf_event__mmap_swap,
  673. [PERF_RECORD_MMAP2] = perf_event__mmap2_swap,
  674. [PERF_RECORD_COMM] = perf_event__comm_swap,
  675. [PERF_RECORD_FORK] = perf_event__task_swap,
  676. [PERF_RECORD_EXIT] = perf_event__task_swap,
  677. [PERF_RECORD_LOST] = perf_event__all64_swap,
  678. [PERF_RECORD_READ] = perf_event__read_swap,
  679. [PERF_RECORD_THROTTLE] = perf_event__throttle_swap,
  680. [PERF_RECORD_UNTHROTTLE] = perf_event__throttle_swap,
  681. [PERF_RECORD_SAMPLE] = perf_event__all64_swap,
  682. [PERF_RECORD_AUX] = perf_event__aux_swap,
  683. [PERF_RECORD_ITRACE_START] = perf_event__itrace_start_swap,
  684. [PERF_RECORD_LOST_SAMPLES] = perf_event__all64_swap,
  685. [PERF_RECORD_SWITCH] = perf_event__switch_swap,
  686. [PERF_RECORD_SWITCH_CPU_WIDE] = perf_event__switch_swap,
  687. [PERF_RECORD_HEADER_ATTR] = perf_event__hdr_attr_swap,
  688. [PERF_RECORD_HEADER_EVENT_TYPE] = perf_event__event_type_swap,
  689. [PERF_RECORD_HEADER_TRACING_DATA] = perf_event__tracing_data_swap,
  690. [PERF_RECORD_HEADER_BUILD_ID] = NULL,
  691. [PERF_RECORD_ID_INDEX] = perf_event__all64_swap,
  692. [PERF_RECORD_AUXTRACE_INFO] = perf_event__auxtrace_info_swap,
  693. [PERF_RECORD_AUXTRACE] = perf_event__auxtrace_swap,
  694. [PERF_RECORD_AUXTRACE_ERROR] = perf_event__auxtrace_error_swap,
  695. [PERF_RECORD_THREAD_MAP] = perf_event__thread_map_swap,
  696. [PERF_RECORD_CPU_MAP] = perf_event__cpu_map_swap,
  697. [PERF_RECORD_STAT_CONFIG] = perf_event__stat_config_swap,
  698. [PERF_RECORD_STAT] = perf_event__stat_swap,
  699. [PERF_RECORD_STAT_ROUND] = perf_event__stat_round_swap,
  700. [PERF_RECORD_EVENT_UPDATE] = perf_event__event_update_swap,
  701. [PERF_RECORD_TIME_CONV] = perf_event__all64_swap,
  702. [PERF_RECORD_HEADER_MAX] = NULL,
  703. };
  704. /*
  705. * When perf record finishes a pass on every buffers, it records this pseudo
  706. * event.
  707. * We record the max timestamp t found in the pass n.
  708. * Assuming these timestamps are monotonic across cpus, we know that if
  709. * a buffer still has events with timestamps below t, they will be all
  710. * available and then read in the pass n + 1.
  711. * Hence when we start to read the pass n + 2, we can safely flush every
  712. * events with timestamps below t.
  713. *
  714. * ============ PASS n =================
  715. * CPU 0 | CPU 1
  716. * |
  717. * cnt1 timestamps | cnt2 timestamps
  718. * 1 | 2
  719. * 2 | 3
  720. * - | 4 <--- max recorded
  721. *
  722. * ============ PASS n + 1 ==============
  723. * CPU 0 | CPU 1
  724. * |
  725. * cnt1 timestamps | cnt2 timestamps
  726. * 3 | 5
  727. * 4 | 6
  728. * 5 | 7 <---- max recorded
  729. *
  730. * Flush every events below timestamp 4
  731. *
  732. * ============ PASS n + 2 ==============
  733. * CPU 0 | CPU 1
  734. * |
  735. * cnt1 timestamps | cnt2 timestamps
  736. * 6 | 8
  737. * 7 | 9
  738. * - | 10
  739. *
  740. * Flush every events below timestamp 7
  741. * etc...
  742. */
  743. static int process_finished_round(struct perf_tool *tool __maybe_unused,
  744. union perf_event *event __maybe_unused,
  745. struct ordered_events *oe)
  746. {
  747. if (dump_trace)
  748. fprintf(stdout, "\n");
  749. return ordered_events__flush(oe, OE_FLUSH__ROUND);
  750. }
  751. int perf_session__queue_event(struct perf_session *s, union perf_event *event,
  752. u64 timestamp, u64 file_offset)
  753. {
  754. return ordered_events__queue(&s->ordered_events, event, timestamp, file_offset);
  755. }
  756. static void callchain__lbr_callstack_printf(struct perf_sample *sample)
  757. {
  758. struct ip_callchain *callchain = sample->callchain;
  759. struct branch_stack *lbr_stack = sample->branch_stack;
  760. u64 kernel_callchain_nr = callchain->nr;
  761. unsigned int i;
  762. for (i = 0; i < kernel_callchain_nr; i++) {
  763. if (callchain->ips[i] == PERF_CONTEXT_USER)
  764. break;
  765. }
  766. if ((i != kernel_callchain_nr) && lbr_stack->nr) {
  767. u64 total_nr;
  768. /*
  769. * LBR callstack can only get user call chain,
  770. * i is kernel call chain number,
  771. * 1 is PERF_CONTEXT_USER.
  772. *
  773. * The user call chain is stored in LBR registers.
  774. * LBR are pair registers. The caller is stored
  775. * in "from" register, while the callee is stored
  776. * in "to" register.
  777. * For example, there is a call stack
  778. * "A"->"B"->"C"->"D".
  779. * The LBR registers will recorde like
  780. * "C"->"D", "B"->"C", "A"->"B".
  781. * So only the first "to" register and all "from"
  782. * registers are needed to construct the whole stack.
  783. */
  784. total_nr = i + 1 + lbr_stack->nr + 1;
  785. kernel_callchain_nr = i + 1;
  786. printf("... LBR call chain: nr:%" PRIu64 "\n", total_nr);
  787. for (i = 0; i < kernel_callchain_nr; i++)
  788. printf("..... %2d: %016" PRIx64 "\n",
  789. i, callchain->ips[i]);
  790. printf("..... %2d: %016" PRIx64 "\n",
  791. (int)(kernel_callchain_nr), lbr_stack->entries[0].to);
  792. for (i = 0; i < lbr_stack->nr; i++)
  793. printf("..... %2d: %016" PRIx64 "\n",
  794. (int)(i + kernel_callchain_nr + 1), lbr_stack->entries[i].from);
  795. }
  796. }
  797. static void callchain__printf(struct perf_evsel *evsel,
  798. struct perf_sample *sample)
  799. {
  800. unsigned int i;
  801. struct ip_callchain *callchain = sample->callchain;
  802. if (perf_evsel__has_branch_callstack(evsel))
  803. callchain__lbr_callstack_printf(sample);
  804. printf("... FP chain: nr:%" PRIu64 "\n", callchain->nr);
  805. for (i = 0; i < callchain->nr; i++)
  806. printf("..... %2d: %016" PRIx64 "\n",
  807. i, callchain->ips[i]);
  808. }
  809. static void branch_stack__printf(struct perf_sample *sample)
  810. {
  811. uint64_t i;
  812. printf("... branch stack: nr:%" PRIu64 "\n", sample->branch_stack->nr);
  813. for (i = 0; i < sample->branch_stack->nr; i++) {
  814. struct branch_entry *e = &sample->branch_stack->entries[i];
  815. printf("..... %2"PRIu64": %016" PRIx64 " -> %016" PRIx64 " %hu cycles %s%s%s%s %x\n",
  816. i, e->from, e->to,
  817. (unsigned short)e->flags.cycles,
  818. e->flags.mispred ? "M" : " ",
  819. e->flags.predicted ? "P" : " ",
  820. e->flags.abort ? "A" : " ",
  821. e->flags.in_tx ? "T" : " ",
  822. (unsigned)e->flags.reserved);
  823. }
  824. }
  825. static void regs_dump__printf(u64 mask, u64 *regs)
  826. {
  827. unsigned rid, i = 0;
  828. for_each_set_bit(rid, (unsigned long *) &mask, sizeof(mask) * 8) {
  829. u64 val = regs[i++];
  830. printf(".... %-5s 0x%" PRIx64 "\n",
  831. perf_reg_name(rid), val);
  832. }
  833. }
  834. static const char *regs_abi[] = {
  835. [PERF_SAMPLE_REGS_ABI_NONE] = "none",
  836. [PERF_SAMPLE_REGS_ABI_32] = "32-bit",
  837. [PERF_SAMPLE_REGS_ABI_64] = "64-bit",
  838. };
  839. static inline const char *regs_dump_abi(struct regs_dump *d)
  840. {
  841. if (d->abi > PERF_SAMPLE_REGS_ABI_64)
  842. return "unknown";
  843. return regs_abi[d->abi];
  844. }
  845. static void regs__printf(const char *type, struct regs_dump *regs)
  846. {
  847. u64 mask = regs->mask;
  848. printf("... %s regs: mask 0x%" PRIx64 " ABI %s\n",
  849. type,
  850. mask,
  851. regs_dump_abi(regs));
  852. regs_dump__printf(mask, regs->regs);
  853. }
  854. static void regs_user__printf(struct perf_sample *sample)
  855. {
  856. struct regs_dump *user_regs = &sample->user_regs;
  857. if (user_regs->regs)
  858. regs__printf("user", user_regs);
  859. }
  860. static void regs_intr__printf(struct perf_sample *sample)
  861. {
  862. struct regs_dump *intr_regs = &sample->intr_regs;
  863. if (intr_regs->regs)
  864. regs__printf("intr", intr_regs);
  865. }
  866. static void stack_user__printf(struct stack_dump *dump)
  867. {
  868. printf("... ustack: size %" PRIu64 ", offset 0x%x\n",
  869. dump->size, dump->offset);
  870. }
  871. static void perf_evlist__print_tstamp(struct perf_evlist *evlist,
  872. union perf_event *event,
  873. struct perf_sample *sample)
  874. {
  875. u64 sample_type = __perf_evlist__combined_sample_type(evlist);
  876. if (event->header.type != PERF_RECORD_SAMPLE &&
  877. !perf_evlist__sample_id_all(evlist)) {
  878. fputs("-1 -1 ", stdout);
  879. return;
  880. }
  881. if ((sample_type & PERF_SAMPLE_CPU))
  882. printf("%u ", sample->cpu);
  883. if (sample_type & PERF_SAMPLE_TIME)
  884. printf("%" PRIu64 " ", sample->time);
  885. }
  886. static void sample_read__printf(struct perf_sample *sample, u64 read_format)
  887. {
  888. printf("... sample_read:\n");
  889. if (read_format & PERF_FORMAT_TOTAL_TIME_ENABLED)
  890. printf("...... time enabled %016" PRIx64 "\n",
  891. sample->read.time_enabled);
  892. if (read_format & PERF_FORMAT_TOTAL_TIME_RUNNING)
  893. printf("...... time running %016" PRIx64 "\n",
  894. sample->read.time_running);
  895. if (read_format & PERF_FORMAT_GROUP) {
  896. u64 i;
  897. printf(".... group nr %" PRIu64 "\n", sample->read.group.nr);
  898. for (i = 0; i < sample->read.group.nr; i++) {
  899. struct sample_read_value *value;
  900. value = &sample->read.group.values[i];
  901. printf("..... id %016" PRIx64
  902. ", value %016" PRIx64 "\n",
  903. value->id, value->value);
  904. }
  905. } else
  906. printf("..... id %016" PRIx64 ", value %016" PRIx64 "\n",
  907. sample->read.one.id, sample->read.one.value);
  908. }
  909. static void dump_event(struct perf_evlist *evlist, union perf_event *event,
  910. u64 file_offset, struct perf_sample *sample)
  911. {
  912. if (!dump_trace)
  913. return;
  914. printf("\n%#" PRIx64 " [%#x]: event: %d\n",
  915. file_offset, event->header.size, event->header.type);
  916. trace_event(event);
  917. if (sample)
  918. perf_evlist__print_tstamp(evlist, event, sample);
  919. printf("%#" PRIx64 " [%#x]: PERF_RECORD_%s", file_offset,
  920. event->header.size, perf_event__name(event->header.type));
  921. }
  922. static void dump_sample(struct perf_evsel *evsel, union perf_event *event,
  923. struct perf_sample *sample)
  924. {
  925. u64 sample_type;
  926. if (!dump_trace)
  927. return;
  928. printf("(IP, 0x%x): %d/%d: %#" PRIx64 " period: %" PRIu64 " addr: %#" PRIx64 "\n",
  929. event->header.misc, sample->pid, sample->tid, sample->ip,
  930. sample->period, sample->addr);
  931. sample_type = evsel->attr.sample_type;
  932. if (evsel__has_callchain(evsel))
  933. callchain__printf(evsel, sample);
  934. if ((sample_type & PERF_SAMPLE_BRANCH_STACK) && !perf_evsel__has_branch_callstack(evsel))
  935. branch_stack__printf(sample);
  936. if (sample_type & PERF_SAMPLE_REGS_USER)
  937. regs_user__printf(sample);
  938. if (sample_type & PERF_SAMPLE_REGS_INTR)
  939. regs_intr__printf(sample);
  940. if (sample_type & PERF_SAMPLE_STACK_USER)
  941. stack_user__printf(&sample->user_stack);
  942. if (sample_type & PERF_SAMPLE_WEIGHT)
  943. printf("... weight: %" PRIu64 "\n", sample->weight);
  944. if (sample_type & PERF_SAMPLE_DATA_SRC)
  945. printf(" . data_src: 0x%"PRIx64"\n", sample->data_src);
  946. if (sample_type & PERF_SAMPLE_PHYS_ADDR)
  947. printf(" .. phys_addr: 0x%"PRIx64"\n", sample->phys_addr);
  948. if (sample_type & PERF_SAMPLE_TRANSACTION)
  949. printf("... transaction: %" PRIx64 "\n", sample->transaction);
  950. if (sample_type & PERF_SAMPLE_READ)
  951. sample_read__printf(sample, evsel->attr.read_format);
  952. }
  953. static void dump_read(struct perf_evsel *evsel, union perf_event *event)
  954. {
  955. struct read_event *read_event = &event->read;
  956. u64 read_format;
  957. if (!dump_trace)
  958. return;
  959. printf(": %d %d %s %" PRIu64 "\n", event->read.pid, event->read.tid,
  960. evsel ? perf_evsel__name(evsel) : "FAIL",
  961. event->read.value);
  962. if (!evsel)
  963. return;
  964. read_format = evsel->attr.read_format;
  965. if (read_format & PERF_FORMAT_TOTAL_TIME_ENABLED)
  966. printf("... time enabled : %" PRIu64 "\n", read_event->time_enabled);
  967. if (read_format & PERF_FORMAT_TOTAL_TIME_RUNNING)
  968. printf("... time running : %" PRIu64 "\n", read_event->time_running);
  969. if (read_format & PERF_FORMAT_ID)
  970. printf("... id : %" PRIu64 "\n", read_event->id);
  971. }
  972. static struct machine *machines__find_for_cpumode(struct machines *machines,
  973. union perf_event *event,
  974. struct perf_sample *sample)
  975. {
  976. struct machine *machine;
  977. if (perf_guest &&
  978. ((sample->cpumode == PERF_RECORD_MISC_GUEST_KERNEL) ||
  979. (sample->cpumode == PERF_RECORD_MISC_GUEST_USER))) {
  980. u32 pid;
  981. if (event->header.type == PERF_RECORD_MMAP
  982. || event->header.type == PERF_RECORD_MMAP2)
  983. pid = event->mmap.pid;
  984. else
  985. pid = sample->pid;
  986. machine = machines__find(machines, pid);
  987. if (!machine)
  988. machine = machines__findnew(machines, DEFAULT_GUEST_KERNEL_ID);
  989. return machine;
  990. }
  991. return &machines->host;
  992. }
  993. static int deliver_sample_value(struct perf_evlist *evlist,
  994. struct perf_tool *tool,
  995. union perf_event *event,
  996. struct perf_sample *sample,
  997. struct sample_read_value *v,
  998. struct machine *machine)
  999. {
  1000. struct perf_sample_id *sid = perf_evlist__id2sid(evlist, v->id);
  1001. if (sid) {
  1002. sample->id = v->id;
  1003. sample->period = v->value - sid->period;
  1004. sid->period = v->value;
  1005. }
  1006. if (!sid || sid->evsel == NULL) {
  1007. ++evlist->stats.nr_unknown_id;
  1008. return 0;
  1009. }
  1010. return tool->sample(tool, event, sample, sid->evsel, machine);
  1011. }
  1012. static int deliver_sample_group(struct perf_evlist *evlist,
  1013. struct perf_tool *tool,
  1014. union perf_event *event,
  1015. struct perf_sample *sample,
  1016. struct machine *machine)
  1017. {
  1018. int ret = -EINVAL;
  1019. u64 i;
  1020. for (i = 0; i < sample->read.group.nr; i++) {
  1021. ret = deliver_sample_value(evlist, tool, event, sample,
  1022. &sample->read.group.values[i],
  1023. machine);
  1024. if (ret)
  1025. break;
  1026. }
  1027. return ret;
  1028. }
  1029. static int
  1030. perf_evlist__deliver_sample(struct perf_evlist *evlist,
  1031. struct perf_tool *tool,
  1032. union perf_event *event,
  1033. struct perf_sample *sample,
  1034. struct perf_evsel *evsel,
  1035. struct machine *machine)
  1036. {
  1037. /* We know evsel != NULL. */
  1038. u64 sample_type = evsel->attr.sample_type;
  1039. u64 read_format = evsel->attr.read_format;
  1040. /* Standard sample delivery. */
  1041. if (!(sample_type & PERF_SAMPLE_READ))
  1042. return tool->sample(tool, event, sample, evsel, machine);
  1043. /* For PERF_SAMPLE_READ we have either single or group mode. */
  1044. if (read_format & PERF_FORMAT_GROUP)
  1045. return deliver_sample_group(evlist, tool, event, sample,
  1046. machine);
  1047. else
  1048. return deliver_sample_value(evlist, tool, event, sample,
  1049. &sample->read.one, machine);
  1050. }
  1051. static int machines__deliver_event(struct machines *machines,
  1052. struct perf_evlist *evlist,
  1053. union perf_event *event,
  1054. struct perf_sample *sample,
  1055. struct perf_tool *tool, u64 file_offset)
  1056. {
  1057. struct perf_evsel *evsel;
  1058. struct machine *machine;
  1059. dump_event(evlist, event, file_offset, sample);
  1060. evsel = perf_evlist__id2evsel(evlist, sample->id);
  1061. machine = machines__find_for_cpumode(machines, event, sample);
  1062. switch (event->header.type) {
  1063. case PERF_RECORD_SAMPLE:
  1064. if (evsel == NULL) {
  1065. ++evlist->stats.nr_unknown_id;
  1066. return 0;
  1067. }
  1068. dump_sample(evsel, event, sample);
  1069. if (machine == NULL) {
  1070. ++evlist->stats.nr_unprocessable_samples;
  1071. return 0;
  1072. }
  1073. return perf_evlist__deliver_sample(evlist, tool, event, sample, evsel, machine);
  1074. case PERF_RECORD_MMAP:
  1075. return tool->mmap(tool, event, sample, machine);
  1076. case PERF_RECORD_MMAP2:
  1077. if (event->header.misc & PERF_RECORD_MISC_PROC_MAP_PARSE_TIMEOUT)
  1078. ++evlist->stats.nr_proc_map_timeout;
  1079. return tool->mmap2(tool, event, sample, machine);
  1080. case PERF_RECORD_COMM:
  1081. return tool->comm(tool, event, sample, machine);
  1082. case PERF_RECORD_NAMESPACES:
  1083. return tool->namespaces(tool, event, sample, machine);
  1084. case PERF_RECORD_FORK:
  1085. return tool->fork(tool, event, sample, machine);
  1086. case PERF_RECORD_EXIT:
  1087. return tool->exit(tool, event, sample, machine);
  1088. case PERF_RECORD_LOST:
  1089. if (tool->lost == perf_event__process_lost)
  1090. evlist->stats.total_lost += event->lost.lost;
  1091. return tool->lost(tool, event, sample, machine);
  1092. case PERF_RECORD_LOST_SAMPLES:
  1093. if (tool->lost_samples == perf_event__process_lost_samples)
  1094. evlist->stats.total_lost_samples += event->lost_samples.lost;
  1095. return tool->lost_samples(tool, event, sample, machine);
  1096. case PERF_RECORD_READ:
  1097. dump_read(evsel, event);
  1098. return tool->read(tool, event, sample, evsel, machine);
  1099. case PERF_RECORD_THROTTLE:
  1100. return tool->throttle(tool, event, sample, machine);
  1101. case PERF_RECORD_UNTHROTTLE:
  1102. return tool->unthrottle(tool, event, sample, machine);
  1103. case PERF_RECORD_AUX:
  1104. if (tool->aux == perf_event__process_aux) {
  1105. if (event->aux.flags & PERF_AUX_FLAG_TRUNCATED)
  1106. evlist->stats.total_aux_lost += 1;
  1107. if (event->aux.flags & PERF_AUX_FLAG_PARTIAL)
  1108. evlist->stats.total_aux_partial += 1;
  1109. }
  1110. return tool->aux(tool, event, sample, machine);
  1111. case PERF_RECORD_ITRACE_START:
  1112. return tool->itrace_start(tool, event, sample, machine);
  1113. case PERF_RECORD_SWITCH:
  1114. case PERF_RECORD_SWITCH_CPU_WIDE:
  1115. return tool->context_switch(tool, event, sample, machine);
  1116. default:
  1117. ++evlist->stats.nr_unknown_events;
  1118. return -1;
  1119. }
  1120. }
  1121. static int perf_session__deliver_event(struct perf_session *session,
  1122. union perf_event *event,
  1123. struct perf_tool *tool,
  1124. u64 file_offset)
  1125. {
  1126. struct perf_sample sample;
  1127. int ret;
  1128. ret = perf_evlist__parse_sample(session->evlist, event, &sample);
  1129. if (ret) {
  1130. pr_err("Can't parse sample, err = %d\n", ret);
  1131. return ret;
  1132. }
  1133. ret = auxtrace__process_event(session, event, &sample, tool);
  1134. if (ret < 0)
  1135. return ret;
  1136. if (ret > 0)
  1137. return 0;
  1138. return machines__deliver_event(&session->machines, session->evlist,
  1139. event, &sample, tool, file_offset);
  1140. }
  1141. static s64 perf_session__process_user_event(struct perf_session *session,
  1142. union perf_event *event,
  1143. u64 file_offset)
  1144. {
  1145. struct ordered_events *oe = &session->ordered_events;
  1146. struct perf_tool *tool = session->tool;
  1147. struct perf_sample sample = { .time = 0, };
  1148. int fd = perf_data__fd(session->data);
  1149. int err;
  1150. dump_event(session->evlist, event, file_offset, &sample);
  1151. /* These events are processed right away */
  1152. switch (event->header.type) {
  1153. case PERF_RECORD_HEADER_ATTR:
  1154. err = tool->attr(tool, event, &session->evlist);
  1155. if (err == 0) {
  1156. perf_session__set_id_hdr_size(session);
  1157. perf_session__set_comm_exec(session);
  1158. }
  1159. return err;
  1160. case PERF_RECORD_EVENT_UPDATE:
  1161. return tool->event_update(tool, event, &session->evlist);
  1162. case PERF_RECORD_HEADER_EVENT_TYPE:
  1163. /*
  1164. * Depreceated, but we need to handle it for sake
  1165. * of old data files create in pipe mode.
  1166. */
  1167. return 0;
  1168. case PERF_RECORD_HEADER_TRACING_DATA:
  1169. /* setup for reading amidst mmap */
  1170. lseek(fd, file_offset, SEEK_SET);
  1171. return tool->tracing_data(tool, event, session);
  1172. case PERF_RECORD_HEADER_BUILD_ID:
  1173. return tool->build_id(tool, event, session);
  1174. case PERF_RECORD_FINISHED_ROUND:
  1175. return tool->finished_round(tool, event, oe);
  1176. case PERF_RECORD_ID_INDEX:
  1177. return tool->id_index(tool, event, session);
  1178. case PERF_RECORD_AUXTRACE_INFO:
  1179. return tool->auxtrace_info(tool, event, session);
  1180. case PERF_RECORD_AUXTRACE:
  1181. /* setup for reading amidst mmap */
  1182. lseek(fd, file_offset + event->header.size, SEEK_SET);
  1183. return tool->auxtrace(tool, event, session);
  1184. case PERF_RECORD_AUXTRACE_ERROR:
  1185. perf_session__auxtrace_error_inc(session, event);
  1186. return tool->auxtrace_error(tool, event, session);
  1187. case PERF_RECORD_THREAD_MAP:
  1188. return tool->thread_map(tool, event, session);
  1189. case PERF_RECORD_CPU_MAP:
  1190. return tool->cpu_map(tool, event, session);
  1191. case PERF_RECORD_STAT_CONFIG:
  1192. return tool->stat_config(tool, event, session);
  1193. case PERF_RECORD_STAT:
  1194. return tool->stat(tool, event, session);
  1195. case PERF_RECORD_STAT_ROUND:
  1196. return tool->stat_round(tool, event, session);
  1197. case PERF_RECORD_TIME_CONV:
  1198. session->time_conv = event->time_conv;
  1199. return tool->time_conv(tool, event, session);
  1200. case PERF_RECORD_HEADER_FEATURE:
  1201. return tool->feature(tool, event, session);
  1202. default:
  1203. return -EINVAL;
  1204. }
  1205. }
  1206. int perf_session__deliver_synth_event(struct perf_session *session,
  1207. union perf_event *event,
  1208. struct perf_sample *sample)
  1209. {
  1210. struct perf_evlist *evlist = session->evlist;
  1211. struct perf_tool *tool = session->tool;
  1212. events_stats__inc(&evlist->stats, event->header.type);
  1213. if (event->header.type >= PERF_RECORD_USER_TYPE_START)
  1214. return perf_session__process_user_event(session, event, 0);
  1215. return machines__deliver_event(&session->machines, evlist, event, sample, tool, 0);
  1216. }
  1217. static void event_swap(union perf_event *event, bool sample_id_all)
  1218. {
  1219. perf_event__swap_op swap;
  1220. swap = perf_event__swap_ops[event->header.type];
  1221. if (swap)
  1222. swap(event, sample_id_all);
  1223. }
  1224. int perf_session__peek_event(struct perf_session *session, off_t file_offset,
  1225. void *buf, size_t buf_sz,
  1226. union perf_event **event_ptr,
  1227. struct perf_sample *sample)
  1228. {
  1229. union perf_event *event;
  1230. size_t hdr_sz, rest;
  1231. int fd;
  1232. if (session->one_mmap && !session->header.needs_swap) {
  1233. event = file_offset - session->one_mmap_offset +
  1234. session->one_mmap_addr;
  1235. goto out_parse_sample;
  1236. }
  1237. if (perf_data__is_pipe(session->data))
  1238. return -1;
  1239. fd = perf_data__fd(session->data);
  1240. hdr_sz = sizeof(struct perf_event_header);
  1241. if (buf_sz < hdr_sz)
  1242. return -1;
  1243. if (lseek(fd, file_offset, SEEK_SET) == (off_t)-1 ||
  1244. readn(fd, buf, hdr_sz) != (ssize_t)hdr_sz)
  1245. return -1;
  1246. event = (union perf_event *)buf;
  1247. if (session->header.needs_swap)
  1248. perf_event_header__bswap(&event->header);
  1249. if (event->header.size < hdr_sz || event->header.size > buf_sz)
  1250. return -1;
  1251. rest = event->header.size - hdr_sz;
  1252. if (readn(fd, buf, rest) != (ssize_t)rest)
  1253. return -1;
  1254. if (session->header.needs_swap)
  1255. event_swap(event, perf_evlist__sample_id_all(session->evlist));
  1256. out_parse_sample:
  1257. if (sample && event->header.type < PERF_RECORD_USER_TYPE_START &&
  1258. perf_evlist__parse_sample(session->evlist, event, sample))
  1259. return -1;
  1260. *event_ptr = event;
  1261. return 0;
  1262. }
  1263. static s64 perf_session__process_event(struct perf_session *session,
  1264. union perf_event *event, u64 file_offset)
  1265. {
  1266. struct perf_evlist *evlist = session->evlist;
  1267. struct perf_tool *tool = session->tool;
  1268. int ret;
  1269. if (session->header.needs_swap)
  1270. event_swap(event, perf_evlist__sample_id_all(evlist));
  1271. if (event->header.type >= PERF_RECORD_HEADER_MAX)
  1272. return -EINVAL;
  1273. events_stats__inc(&evlist->stats, event->header.type);
  1274. if (event->header.type >= PERF_RECORD_USER_TYPE_START)
  1275. return perf_session__process_user_event(session, event, file_offset);
  1276. if (tool->ordered_events) {
  1277. u64 timestamp = -1ULL;
  1278. ret = perf_evlist__parse_sample_timestamp(evlist, event, &timestamp);
  1279. if (ret && ret != -1)
  1280. return ret;
  1281. ret = perf_session__queue_event(session, event, timestamp, file_offset);
  1282. if (ret != -ETIME)
  1283. return ret;
  1284. }
  1285. return perf_session__deliver_event(session, event, tool, file_offset);
  1286. }
  1287. void perf_event_header__bswap(struct perf_event_header *hdr)
  1288. {
  1289. hdr->type = bswap_32(hdr->type);
  1290. hdr->misc = bswap_16(hdr->misc);
  1291. hdr->size = bswap_16(hdr->size);
  1292. }
  1293. struct thread *perf_session__findnew(struct perf_session *session, pid_t pid)
  1294. {
  1295. return machine__findnew_thread(&session->machines.host, -1, pid);
  1296. }
  1297. int perf_session__register_idle_thread(struct perf_session *session)
  1298. {
  1299. struct thread *thread;
  1300. int err = 0;
  1301. thread = machine__findnew_thread(&session->machines.host, 0, 0);
  1302. if (thread == NULL || thread__set_comm(thread, "swapper", 0)) {
  1303. pr_err("problem inserting idle task.\n");
  1304. err = -1;
  1305. }
  1306. if (thread == NULL || thread__set_namespaces(thread, 0, NULL)) {
  1307. pr_err("problem inserting idle task.\n");
  1308. err = -1;
  1309. }
  1310. /* machine__findnew_thread() got the thread, so put it */
  1311. thread__put(thread);
  1312. return err;
  1313. }
  1314. static void
  1315. perf_session__warn_order(const struct perf_session *session)
  1316. {
  1317. const struct ordered_events *oe = &session->ordered_events;
  1318. struct perf_evsel *evsel;
  1319. bool should_warn = true;
  1320. evlist__for_each_entry(session->evlist, evsel) {
  1321. if (evsel->attr.write_backward)
  1322. should_warn = false;
  1323. }
  1324. if (!should_warn)
  1325. return;
  1326. if (oe->nr_unordered_events != 0)
  1327. ui__warning("%u out of order events recorded.\n", oe->nr_unordered_events);
  1328. }
  1329. static void perf_session__warn_about_errors(const struct perf_session *session)
  1330. {
  1331. const struct events_stats *stats = &session->evlist->stats;
  1332. if (session->tool->lost == perf_event__process_lost &&
  1333. stats->nr_events[PERF_RECORD_LOST] != 0) {
  1334. ui__warning("Processed %d events and lost %d chunks!\n\n"
  1335. "Check IO/CPU overload!\n\n",
  1336. stats->nr_events[0],
  1337. stats->nr_events[PERF_RECORD_LOST]);
  1338. }
  1339. if (session->tool->lost_samples == perf_event__process_lost_samples) {
  1340. double drop_rate;
  1341. drop_rate = (double)stats->total_lost_samples /
  1342. (double) (stats->nr_events[PERF_RECORD_SAMPLE] + stats->total_lost_samples);
  1343. if (drop_rate > 0.05) {
  1344. ui__warning("Processed %" PRIu64 " samples and lost %3.2f%%!\n\n",
  1345. stats->nr_events[PERF_RECORD_SAMPLE] + stats->total_lost_samples,
  1346. drop_rate * 100.0);
  1347. }
  1348. }
  1349. if (session->tool->aux == perf_event__process_aux &&
  1350. stats->total_aux_lost != 0) {
  1351. ui__warning("AUX data lost %" PRIu64 " times out of %u!\n\n",
  1352. stats->total_aux_lost,
  1353. stats->nr_events[PERF_RECORD_AUX]);
  1354. }
  1355. if (session->tool->aux == perf_event__process_aux &&
  1356. stats->total_aux_partial != 0) {
  1357. bool vmm_exclusive = false;
  1358. (void)sysfs__read_bool("module/kvm_intel/parameters/vmm_exclusive",
  1359. &vmm_exclusive);
  1360. ui__warning("AUX data had gaps in it %" PRIu64 " times out of %u!\n\n"
  1361. "Are you running a KVM guest in the background?%s\n\n",
  1362. stats->total_aux_partial,
  1363. stats->nr_events[PERF_RECORD_AUX],
  1364. vmm_exclusive ?
  1365. "\nReloading kvm_intel module with vmm_exclusive=0\n"
  1366. "will reduce the gaps to only guest's timeslices." :
  1367. "");
  1368. }
  1369. if (stats->nr_unknown_events != 0) {
  1370. ui__warning("Found %u unknown events!\n\n"
  1371. "Is this an older tool processing a perf.data "
  1372. "file generated by a more recent tool?\n\n"
  1373. "If that is not the case, consider "
  1374. "reporting to linux-kernel@vger.kernel.org.\n\n",
  1375. stats->nr_unknown_events);
  1376. }
  1377. if (stats->nr_unknown_id != 0) {
  1378. ui__warning("%u samples with id not present in the header\n",
  1379. stats->nr_unknown_id);
  1380. }
  1381. if (stats->nr_invalid_chains != 0) {
  1382. ui__warning("Found invalid callchains!\n\n"
  1383. "%u out of %u events were discarded for this reason.\n\n"
  1384. "Consider reporting to linux-kernel@vger.kernel.org.\n\n",
  1385. stats->nr_invalid_chains,
  1386. stats->nr_events[PERF_RECORD_SAMPLE]);
  1387. }
  1388. if (stats->nr_unprocessable_samples != 0) {
  1389. ui__warning("%u unprocessable samples recorded.\n"
  1390. "Do you have a KVM guest running and not using 'perf kvm'?\n",
  1391. stats->nr_unprocessable_samples);
  1392. }
  1393. perf_session__warn_order(session);
  1394. events_stats__auxtrace_error_warn(stats);
  1395. if (stats->nr_proc_map_timeout != 0) {
  1396. ui__warning("%d map information files for pre-existing threads were\n"
  1397. "not processed, if there are samples for addresses they\n"
  1398. "will not be resolved, you may find out which are these\n"
  1399. "threads by running with -v and redirecting the output\n"
  1400. "to a file.\n"
  1401. "The time limit to process proc map is too short?\n"
  1402. "Increase it by --proc-map-timeout\n",
  1403. stats->nr_proc_map_timeout);
  1404. }
  1405. }
  1406. static int perf_session__flush_thread_stack(struct thread *thread,
  1407. void *p __maybe_unused)
  1408. {
  1409. return thread_stack__flush(thread);
  1410. }
  1411. static int perf_session__flush_thread_stacks(struct perf_session *session)
  1412. {
  1413. return machines__for_each_thread(&session->machines,
  1414. perf_session__flush_thread_stack,
  1415. NULL);
  1416. }
  1417. volatile int session_done;
  1418. static int __perf_session__process_pipe_events(struct perf_session *session)
  1419. {
  1420. struct ordered_events *oe = &session->ordered_events;
  1421. struct perf_tool *tool = session->tool;
  1422. int fd = perf_data__fd(session->data);
  1423. union perf_event *event;
  1424. uint32_t size, cur_size = 0;
  1425. void *buf = NULL;
  1426. s64 skip = 0;
  1427. u64 head;
  1428. ssize_t err;
  1429. void *p;
  1430. perf_tool__fill_defaults(tool);
  1431. head = 0;
  1432. cur_size = sizeof(union perf_event);
  1433. buf = malloc(cur_size);
  1434. if (!buf)
  1435. return -errno;
  1436. ordered_events__set_copy_on_queue(oe, true);
  1437. more:
  1438. event = buf;
  1439. err = readn(fd, event, sizeof(struct perf_event_header));
  1440. if (err <= 0) {
  1441. if (err == 0)
  1442. goto done;
  1443. pr_err("failed to read event header\n");
  1444. goto out_err;
  1445. }
  1446. if (session->header.needs_swap)
  1447. perf_event_header__bswap(&event->header);
  1448. size = event->header.size;
  1449. if (size < sizeof(struct perf_event_header)) {
  1450. pr_err("bad event header size\n");
  1451. goto out_err;
  1452. }
  1453. if (size > cur_size) {
  1454. void *new = realloc(buf, size);
  1455. if (!new) {
  1456. pr_err("failed to allocate memory to read event\n");
  1457. goto out_err;
  1458. }
  1459. buf = new;
  1460. cur_size = size;
  1461. event = buf;
  1462. }
  1463. p = event;
  1464. p += sizeof(struct perf_event_header);
  1465. if (size - sizeof(struct perf_event_header)) {
  1466. err = readn(fd, p, size - sizeof(struct perf_event_header));
  1467. if (err <= 0) {
  1468. if (err == 0) {
  1469. pr_err("unexpected end of event stream\n");
  1470. goto done;
  1471. }
  1472. pr_err("failed to read event data\n");
  1473. goto out_err;
  1474. }
  1475. }
  1476. if ((skip = perf_session__process_event(session, event, head)) < 0) {
  1477. pr_err("%#" PRIx64 " [%#x]: failed to process type: %d\n",
  1478. head, event->header.size, event->header.type);
  1479. err = -EINVAL;
  1480. goto out_err;
  1481. }
  1482. head += size;
  1483. if (skip > 0)
  1484. head += skip;
  1485. if (!session_done())
  1486. goto more;
  1487. done:
  1488. /* do the final flush for ordered samples */
  1489. err = ordered_events__flush(oe, OE_FLUSH__FINAL);
  1490. if (err)
  1491. goto out_err;
  1492. err = auxtrace__flush_events(session, tool);
  1493. if (err)
  1494. goto out_err;
  1495. err = perf_session__flush_thread_stacks(session);
  1496. out_err:
  1497. free(buf);
  1498. if (!tool->no_warn)
  1499. perf_session__warn_about_errors(session);
  1500. ordered_events__free(&session->ordered_events);
  1501. auxtrace__free_events(session);
  1502. return err;
  1503. }
  1504. static union perf_event *
  1505. fetch_mmaped_event(struct perf_session *session,
  1506. u64 head, size_t mmap_size, char *buf)
  1507. {
  1508. union perf_event *event;
  1509. /*
  1510. * Ensure we have enough space remaining to read
  1511. * the size of the event in the headers.
  1512. */
  1513. if (head + sizeof(event->header) > mmap_size)
  1514. return NULL;
  1515. event = (union perf_event *)(buf + head);
  1516. if (session->header.needs_swap)
  1517. perf_event_header__bswap(&event->header);
  1518. if (head + event->header.size > mmap_size) {
  1519. /* We're not fetching the event so swap back again */
  1520. if (session->header.needs_swap)
  1521. perf_event_header__bswap(&event->header);
  1522. return NULL;
  1523. }
  1524. return event;
  1525. }
  1526. /*
  1527. * On 64bit we can mmap the data file in one go. No need for tiny mmap
  1528. * slices. On 32bit we use 32MB.
  1529. */
  1530. #if BITS_PER_LONG == 64
  1531. #define MMAP_SIZE ULLONG_MAX
  1532. #define NUM_MMAPS 1
  1533. #else
  1534. #define MMAP_SIZE (32 * 1024 * 1024ULL)
  1535. #define NUM_MMAPS 128
  1536. #endif
  1537. static int __perf_session__process_events(struct perf_session *session,
  1538. u64 data_offset, u64 data_size,
  1539. u64 file_size)
  1540. {
  1541. struct ordered_events *oe = &session->ordered_events;
  1542. struct perf_tool *tool = session->tool;
  1543. int fd = perf_data__fd(session->data);
  1544. u64 head, page_offset, file_offset, file_pos, size;
  1545. int err, mmap_prot, mmap_flags, map_idx = 0;
  1546. size_t mmap_size;
  1547. char *buf, *mmaps[NUM_MMAPS];
  1548. union perf_event *event;
  1549. struct ui_progress prog;
  1550. s64 skip;
  1551. perf_tool__fill_defaults(tool);
  1552. page_offset = page_size * (data_offset / page_size);
  1553. file_offset = page_offset;
  1554. head = data_offset - page_offset;
  1555. if (data_size == 0)
  1556. goto out;
  1557. if (data_offset + data_size < file_size)
  1558. file_size = data_offset + data_size;
  1559. ui_progress__init_size(&prog, file_size, "Processing events...");
  1560. mmap_size = MMAP_SIZE;
  1561. if (mmap_size > file_size) {
  1562. mmap_size = file_size;
  1563. session->one_mmap = true;
  1564. }
  1565. memset(mmaps, 0, sizeof(mmaps));
  1566. mmap_prot = PROT_READ;
  1567. mmap_flags = MAP_SHARED;
  1568. if (session->header.needs_swap) {
  1569. mmap_prot |= PROT_WRITE;
  1570. mmap_flags = MAP_PRIVATE;
  1571. }
  1572. remap:
  1573. buf = mmap(NULL, mmap_size, mmap_prot, mmap_flags, fd,
  1574. file_offset);
  1575. if (buf == MAP_FAILED) {
  1576. pr_err("failed to mmap file\n");
  1577. err = -errno;
  1578. goto out_err;
  1579. }
  1580. mmaps[map_idx] = buf;
  1581. map_idx = (map_idx + 1) & (ARRAY_SIZE(mmaps) - 1);
  1582. file_pos = file_offset + head;
  1583. if (session->one_mmap) {
  1584. session->one_mmap_addr = buf;
  1585. session->one_mmap_offset = file_offset;
  1586. }
  1587. more:
  1588. event = fetch_mmaped_event(session, head, mmap_size, buf);
  1589. if (!event) {
  1590. if (mmaps[map_idx]) {
  1591. munmap(mmaps[map_idx], mmap_size);
  1592. mmaps[map_idx] = NULL;
  1593. }
  1594. page_offset = page_size * (head / page_size);
  1595. file_offset += page_offset;
  1596. head -= page_offset;
  1597. goto remap;
  1598. }
  1599. size = event->header.size;
  1600. if (size < sizeof(struct perf_event_header) ||
  1601. (skip = perf_session__process_event(session, event, file_pos)) < 0) {
  1602. pr_err("%#" PRIx64 " [%#x]: failed to process type: %d\n",
  1603. file_offset + head, event->header.size,
  1604. event->header.type);
  1605. err = -EINVAL;
  1606. goto out_err;
  1607. }
  1608. if (skip)
  1609. size += skip;
  1610. head += size;
  1611. file_pos += size;
  1612. ui_progress__update(&prog, size);
  1613. if (session_done())
  1614. goto out;
  1615. if (file_pos < file_size)
  1616. goto more;
  1617. out:
  1618. /* do the final flush for ordered samples */
  1619. err = ordered_events__flush(oe, OE_FLUSH__FINAL);
  1620. if (err)
  1621. goto out_err;
  1622. err = auxtrace__flush_events(session, tool);
  1623. if (err)
  1624. goto out_err;
  1625. err = perf_session__flush_thread_stacks(session);
  1626. out_err:
  1627. ui_progress__finish();
  1628. if (!tool->no_warn)
  1629. perf_session__warn_about_errors(session);
  1630. /*
  1631. * We may switching perf.data output, make ordered_events
  1632. * reusable.
  1633. */
  1634. ordered_events__reinit(&session->ordered_events);
  1635. auxtrace__free_events(session);
  1636. session->one_mmap = false;
  1637. return err;
  1638. }
  1639. int perf_session__process_events(struct perf_session *session)
  1640. {
  1641. u64 size = perf_data__size(session->data);
  1642. int err;
  1643. if (perf_session__register_idle_thread(session) < 0)
  1644. return -ENOMEM;
  1645. if (!perf_data__is_pipe(session->data))
  1646. err = __perf_session__process_events(session,
  1647. session->header.data_offset,
  1648. session->header.data_size, size);
  1649. else
  1650. err = __perf_session__process_pipe_events(session);
  1651. return err;
  1652. }
  1653. bool perf_session__has_traces(struct perf_session *session, const char *msg)
  1654. {
  1655. struct perf_evsel *evsel;
  1656. evlist__for_each_entry(session->evlist, evsel) {
  1657. if (evsel->attr.type == PERF_TYPE_TRACEPOINT)
  1658. return true;
  1659. }
  1660. pr_err("No trace sample to read. Did you call 'perf %s'?\n", msg);
  1661. return false;
  1662. }
  1663. int map__set_kallsyms_ref_reloc_sym(struct map *map, const char *symbol_name, u64 addr)
  1664. {
  1665. char *bracket;
  1666. struct ref_reloc_sym *ref;
  1667. struct kmap *kmap;
  1668. ref = zalloc(sizeof(struct ref_reloc_sym));
  1669. if (ref == NULL)
  1670. return -ENOMEM;
  1671. ref->name = strdup(symbol_name);
  1672. if (ref->name == NULL) {
  1673. free(ref);
  1674. return -ENOMEM;
  1675. }
  1676. bracket = strchr(ref->name, ']');
  1677. if (bracket)
  1678. *bracket = '\0';
  1679. ref->addr = addr;
  1680. kmap = map__kmap(map);
  1681. if (kmap)
  1682. kmap->ref_reloc_sym = ref;
  1683. return 0;
  1684. }
  1685. size_t perf_session__fprintf_dsos(struct perf_session *session, FILE *fp)
  1686. {
  1687. return machines__fprintf_dsos(&session->machines, fp);
  1688. }
  1689. size_t perf_session__fprintf_dsos_buildid(struct perf_session *session, FILE *fp,
  1690. bool (skip)(struct dso *dso, int parm), int parm)
  1691. {
  1692. return machines__fprintf_dsos_buildid(&session->machines, fp, skip, parm);
  1693. }
  1694. size_t perf_session__fprintf_nr_events(struct perf_session *session, FILE *fp)
  1695. {
  1696. size_t ret;
  1697. const char *msg = "";
  1698. if (perf_header__has_feat(&session->header, HEADER_AUXTRACE))
  1699. msg = " (excludes AUX area (e.g. instruction trace) decoded / synthesized events)";
  1700. ret = fprintf(fp, "\nAggregated stats:%s\n", msg);
  1701. ret += events_stats__fprintf(&session->evlist->stats, fp);
  1702. return ret;
  1703. }
  1704. size_t perf_session__fprintf(struct perf_session *session, FILE *fp)
  1705. {
  1706. /*
  1707. * FIXME: Here we have to actually print all the machines in this
  1708. * session, not just the host...
  1709. */
  1710. return machine__fprintf(&session->machines.host, fp);
  1711. }
  1712. struct perf_evsel *perf_session__find_first_evtype(struct perf_session *session,
  1713. unsigned int type)
  1714. {
  1715. struct perf_evsel *pos;
  1716. evlist__for_each_entry(session->evlist, pos) {
  1717. if (pos->attr.type == type)
  1718. return pos;
  1719. }
  1720. return NULL;
  1721. }
  1722. int perf_session__cpu_bitmap(struct perf_session *session,
  1723. const char *cpu_list, unsigned long *cpu_bitmap)
  1724. {
  1725. int i, err = -1;
  1726. struct cpu_map *map;
  1727. for (i = 0; i < PERF_TYPE_MAX; ++i) {
  1728. struct perf_evsel *evsel;
  1729. evsel = perf_session__find_first_evtype(session, i);
  1730. if (!evsel)
  1731. continue;
  1732. if (!(evsel->attr.sample_type & PERF_SAMPLE_CPU)) {
  1733. pr_err("File does not contain CPU events. "
  1734. "Remove -C option to proceed.\n");
  1735. return -1;
  1736. }
  1737. }
  1738. map = cpu_map__new(cpu_list);
  1739. if (map == NULL) {
  1740. pr_err("Invalid cpu_list\n");
  1741. return -1;
  1742. }
  1743. for (i = 0; i < map->nr; i++) {
  1744. int cpu = map->map[i];
  1745. if (cpu >= MAX_NR_CPUS) {
  1746. pr_err("Requested CPU %d too large. "
  1747. "Consider raising MAX_NR_CPUS\n", cpu);
  1748. goto out_delete_map;
  1749. }
  1750. set_bit(cpu, cpu_bitmap);
  1751. }
  1752. err = 0;
  1753. out_delete_map:
  1754. cpu_map__put(map);
  1755. return err;
  1756. }
  1757. void perf_session__fprintf_info(struct perf_session *session, FILE *fp,
  1758. bool full)
  1759. {
  1760. if (session == NULL || fp == NULL)
  1761. return;
  1762. fprintf(fp, "# ========\n");
  1763. perf_header__fprintf_info(session, fp, full);
  1764. fprintf(fp, "# ========\n#\n");
  1765. }
  1766. int __perf_session__set_tracepoints_handlers(struct perf_session *session,
  1767. const struct perf_evsel_str_handler *assocs,
  1768. size_t nr_assocs)
  1769. {
  1770. struct perf_evsel *evsel;
  1771. size_t i;
  1772. int err;
  1773. for (i = 0; i < nr_assocs; i++) {
  1774. /*
  1775. * Adding a handler for an event not in the session,
  1776. * just ignore it.
  1777. */
  1778. evsel = perf_evlist__find_tracepoint_by_name(session->evlist, assocs[i].name);
  1779. if (evsel == NULL)
  1780. continue;
  1781. err = -EEXIST;
  1782. if (evsel->handler != NULL)
  1783. goto out;
  1784. evsel->handler = assocs[i].handler;
  1785. }
  1786. err = 0;
  1787. out:
  1788. return err;
  1789. }
  1790. int perf_event__process_id_index(struct perf_tool *tool __maybe_unused,
  1791. union perf_event *event,
  1792. struct perf_session *session)
  1793. {
  1794. struct perf_evlist *evlist = session->evlist;
  1795. struct id_index_event *ie = &event->id_index;
  1796. size_t i, nr, max_nr;
  1797. max_nr = (ie->header.size - sizeof(struct id_index_event)) /
  1798. sizeof(struct id_index_entry);
  1799. nr = ie->nr;
  1800. if (nr > max_nr)
  1801. return -EINVAL;
  1802. if (dump_trace)
  1803. fprintf(stdout, " nr: %zu\n", nr);
  1804. for (i = 0; i < nr; i++) {
  1805. struct id_index_entry *e = &ie->entries[i];
  1806. struct perf_sample_id *sid;
  1807. if (dump_trace) {
  1808. fprintf(stdout, " ... id: %"PRIu64, e->id);
  1809. fprintf(stdout, " idx: %"PRIu64, e->idx);
  1810. fprintf(stdout, " cpu: %"PRId64, e->cpu);
  1811. fprintf(stdout, " tid: %"PRId64"\n", e->tid);
  1812. }
  1813. sid = perf_evlist__id2sid(evlist, e->id);
  1814. if (!sid)
  1815. return -ENOENT;
  1816. sid->idx = e->idx;
  1817. sid->cpu = e->cpu;
  1818. sid->tid = e->tid;
  1819. }
  1820. return 0;
  1821. }
  1822. int perf_event__synthesize_id_index(struct perf_tool *tool,
  1823. perf_event__handler_t process,
  1824. struct perf_evlist *evlist,
  1825. struct machine *machine)
  1826. {
  1827. union perf_event *ev;
  1828. struct perf_evsel *evsel;
  1829. size_t nr = 0, i = 0, sz, max_nr, n;
  1830. int err;
  1831. pr_debug2("Synthesizing id index\n");
  1832. max_nr = (UINT16_MAX - sizeof(struct id_index_event)) /
  1833. sizeof(struct id_index_entry);
  1834. evlist__for_each_entry(evlist, evsel)
  1835. nr += evsel->ids;
  1836. n = nr > max_nr ? max_nr : nr;
  1837. sz = sizeof(struct id_index_event) + n * sizeof(struct id_index_entry);
  1838. ev = zalloc(sz);
  1839. if (!ev)
  1840. return -ENOMEM;
  1841. ev->id_index.header.type = PERF_RECORD_ID_INDEX;
  1842. ev->id_index.header.size = sz;
  1843. ev->id_index.nr = n;
  1844. evlist__for_each_entry(evlist, evsel) {
  1845. u32 j;
  1846. for (j = 0; j < evsel->ids; j++) {
  1847. struct id_index_entry *e;
  1848. struct perf_sample_id *sid;
  1849. if (i >= n) {
  1850. err = process(tool, ev, NULL, machine);
  1851. if (err)
  1852. goto out_err;
  1853. nr -= n;
  1854. i = 0;
  1855. }
  1856. e = &ev->id_index.entries[i++];
  1857. e->id = evsel->id[j];
  1858. sid = perf_evlist__id2sid(evlist, e->id);
  1859. if (!sid) {
  1860. free(ev);
  1861. return -ENOENT;
  1862. }
  1863. e->idx = sid->idx;
  1864. e->cpu = sid->cpu;
  1865. e->tid = sid->tid;
  1866. }
  1867. }
  1868. sz = sizeof(struct id_index_event) + nr * sizeof(struct id_index_entry);
  1869. ev->id_index.header.size = sz;
  1870. ev->id_index.nr = nr;
  1871. err = process(tool, ev, NULL, machine);
  1872. out_err:
  1873. free(ev);
  1874. return err;
  1875. }