123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461 |
- # export-to-sqlite.py: export perf data to a sqlite3 database
- # Copyright (c) 2017, Intel Corporation.
- #
- # This program is free software; you can redistribute it and/or modify it
- # under the terms and conditions of the GNU General Public License,
- # version 2, as published by the Free Software Foundation.
- #
- # This program is distributed in the hope it will be useful, but WITHOUT
- # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
- # FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
- # more details.
- from __future__ import print_function
- import os
- import sys
- import struct
- import datetime
- # To use this script you will need to have installed package python-pyside which
- # provides LGPL-licensed Python bindings for Qt. You will also need the package
- # libqt4-sql-sqlite for Qt sqlite3 support.
- #
- # An example of using this script with Intel PT:
- #
- # $ perf record -e intel_pt//u ls
- # $ perf script -s ~/libexec/perf-core/scripts/python/export-to-sqlite.py pt_example branches calls
- # 2017-07-31 14:26:07.326913 Creating database...
- # 2017-07-31 14:26:07.538097 Writing records...
- # 2017-07-31 14:26:09.889292 Adding indexes
- # 2017-07-31 14:26:09.958746 Done
- #
- # To browse the database, sqlite3 can be used e.g.
- #
- # $ sqlite3 pt_example
- # sqlite> .header on
- # sqlite> select * from samples_view where id < 10;
- # sqlite> .mode column
- # sqlite> select * from samples_view where id < 10;
- # sqlite> .tables
- # sqlite> .schema samples_view
- # sqlite> .quit
- #
- # An example of using the database is provided by the script
- # call-graph-from-sql.py. Refer to that script for details.
- #
- # The database structure is practically the same as created by the script
- # export-to-postgresql.py. Refer to that script for details. A notable
- # difference is the 'transaction' column of the 'samples' table which is
- # renamed 'transaction_' in sqlite because 'transaction' is a reserved word.
- from PySide.QtSql import *
- sys.path.append(os.environ['PERF_EXEC_PATH'] + \
- '/scripts/python/Perf-Trace-Util/lib/Perf/Trace')
- # These perf imports are not used at present
- #from perf_trace_context import *
- #from Core import *
- perf_db_export_mode = True
- perf_db_export_calls = False
- perf_db_export_callchains = False
- def printerr(*args, **keyword_args):
- print(*args, file=sys.stderr, **keyword_args)
- def usage():
- printerr("Usage is: export-to-sqlite.py <database name> [<columns>] [<calls>] [<callchains>]");
- printerr("where: columns 'all' or 'branches'");
- printerr(" calls 'calls' => create calls and call_paths table");
- printerr(" callchains 'callchains' => create call_paths table");
- raise Exception("Too few arguments")
- if (len(sys.argv) < 2):
- usage()
- dbname = sys.argv[1]
- if (len(sys.argv) >= 3):
- columns = sys.argv[2]
- else:
- columns = "all"
- if columns not in ("all", "branches"):
- usage()
- branches = (columns == "branches")
- for i in range(3,len(sys.argv)):
- if (sys.argv[i] == "calls"):
- perf_db_export_calls = True
- elif (sys.argv[i] == "callchains"):
- perf_db_export_callchains = True
- else:
- usage()
- def do_query(q, s):
- if (q.exec_(s)):
- return
- raise Exception("Query failed: " + q.lastError().text())
- def do_query_(q):
- if (q.exec_()):
- return
- raise Exception("Query failed: " + q.lastError().text())
- print(datetime.datetime.today(), "Creating database ...")
- db_exists = False
- try:
- f = open(dbname)
- f.close()
- db_exists = True
- except:
- pass
- if db_exists:
- raise Exception(dbname + " already exists")
- db = QSqlDatabase.addDatabase('QSQLITE')
- db.setDatabaseName(dbname)
- db.open()
- query = QSqlQuery(db)
- do_query(query, 'PRAGMA journal_mode = OFF')
- do_query(query, 'BEGIN TRANSACTION')
- do_query(query, 'CREATE TABLE selected_events ('
- 'id integer NOT NULL PRIMARY KEY,'
- 'name varchar(80))')
- do_query(query, 'CREATE TABLE machines ('
- 'id integer NOT NULL PRIMARY KEY,'
- 'pid integer,'
- 'root_dir varchar(4096))')
- do_query(query, 'CREATE TABLE threads ('
- 'id integer NOT NULL PRIMARY KEY,'
- 'machine_id bigint,'
- 'process_id bigint,'
- 'pid integer,'
- 'tid integer)')
- do_query(query, 'CREATE TABLE comms ('
- 'id integer NOT NULL PRIMARY KEY,'
- 'comm varchar(16))')
- do_query(query, 'CREATE TABLE comm_threads ('
- 'id integer NOT NULL PRIMARY KEY,'
- 'comm_id bigint,'
- 'thread_id bigint)')
- do_query(query, 'CREATE TABLE dsos ('
- 'id integer NOT NULL PRIMARY KEY,'
- 'machine_id bigint,'
- 'short_name varchar(256),'
- 'long_name varchar(4096),'
- 'build_id varchar(64))')
- do_query(query, 'CREATE TABLE symbols ('
- 'id integer NOT NULL PRIMARY KEY,'
- 'dso_id bigint,'
- 'sym_start bigint,'
- 'sym_end bigint,'
- 'binding integer,'
- 'name varchar(2048))')
- do_query(query, 'CREATE TABLE branch_types ('
- 'id integer NOT NULL PRIMARY KEY,'
- 'name varchar(80))')
- if branches:
- do_query(query, 'CREATE TABLE samples ('
- 'id integer NOT NULL PRIMARY KEY,'
- 'evsel_id bigint,'
- 'machine_id bigint,'
- 'thread_id bigint,'
- 'comm_id bigint,'
- 'dso_id bigint,'
- 'symbol_id bigint,'
- 'sym_offset bigint,'
- 'ip bigint,'
- 'time bigint,'
- 'cpu integer,'
- 'to_dso_id bigint,'
- 'to_symbol_id bigint,'
- 'to_sym_offset bigint,'
- 'to_ip bigint,'
- 'branch_type integer,'
- 'in_tx boolean,'
- 'call_path_id bigint)')
- else:
- do_query(query, 'CREATE TABLE samples ('
- 'id integer NOT NULL PRIMARY KEY,'
- 'evsel_id bigint,'
- 'machine_id bigint,'
- 'thread_id bigint,'
- 'comm_id bigint,'
- 'dso_id bigint,'
- 'symbol_id bigint,'
- 'sym_offset bigint,'
- 'ip bigint,'
- 'time bigint,'
- 'cpu integer,'
- 'to_dso_id bigint,'
- 'to_symbol_id bigint,'
- 'to_sym_offset bigint,'
- 'to_ip bigint,'
- 'period bigint,'
- 'weight bigint,'
- 'transaction_ bigint,'
- 'data_src bigint,'
- 'branch_type integer,'
- 'in_tx boolean,'
- 'call_path_id bigint)')
- if perf_db_export_calls or perf_db_export_callchains:
- do_query(query, 'CREATE TABLE call_paths ('
- 'id integer NOT NULL PRIMARY KEY,'
- 'parent_id bigint,'
- 'symbol_id bigint,'
- 'ip bigint)')
- if perf_db_export_calls:
- do_query(query, 'CREATE TABLE calls ('
- 'id integer NOT NULL PRIMARY KEY,'
- 'thread_id bigint,'
- 'comm_id bigint,'
- 'call_path_id bigint,'
- 'call_time bigint,'
- 'return_time bigint,'
- 'branch_count bigint,'
- 'call_id bigint,'
- 'return_id bigint,'
- 'parent_call_path_id bigint,'
- 'flags integer)')
- # printf was added to sqlite in version 3.8.3
- sqlite_has_printf = False
- try:
- do_query(query, 'SELECT printf("") FROM machines')
- sqlite_has_printf = True
- except:
- pass
- def emit_to_hex(x):
- if sqlite_has_printf:
- return 'printf("%x", ' + x + ')'
- else:
- return x
- do_query(query, 'CREATE VIEW machines_view AS '
- 'SELECT '
- 'id,'
- 'pid,'
- 'root_dir,'
- 'CASE WHEN id=0 THEN \'unknown\' WHEN pid=-1 THEN \'host\' ELSE \'guest\' END AS host_or_guest'
- ' FROM machines')
- do_query(query, 'CREATE VIEW dsos_view AS '
- 'SELECT '
- 'id,'
- 'machine_id,'
- '(SELECT host_or_guest FROM machines_view WHERE id = machine_id) AS host_or_guest,'
- 'short_name,'
- 'long_name,'
- 'build_id'
- ' FROM dsos')
- do_query(query, 'CREATE VIEW symbols_view AS '
- 'SELECT '
- 'id,'
- 'name,'
- '(SELECT short_name FROM dsos WHERE id=dso_id) AS dso,'
- 'dso_id,'
- 'sym_start,'
- 'sym_end,'
- 'CASE WHEN binding=0 THEN \'local\' WHEN binding=1 THEN \'global\' ELSE \'weak\' END AS binding'
- ' FROM symbols')
- do_query(query, 'CREATE VIEW threads_view AS '
- 'SELECT '
- 'id,'
- 'machine_id,'
- '(SELECT host_or_guest FROM machines_view WHERE id = machine_id) AS host_or_guest,'
- 'process_id,'
- 'pid,'
- 'tid'
- ' FROM threads')
- do_query(query, 'CREATE VIEW comm_threads_view AS '
- 'SELECT '
- 'comm_id,'
- '(SELECT comm FROM comms WHERE id = comm_id) AS command,'
- 'thread_id,'
- '(SELECT pid FROM threads WHERE id = thread_id) AS pid,'
- '(SELECT tid FROM threads WHERE id = thread_id) AS tid'
- ' FROM comm_threads')
- if perf_db_export_calls or perf_db_export_callchains:
- do_query(query, 'CREATE VIEW call_paths_view AS '
- 'SELECT '
- 'c.id,'
- + emit_to_hex('c.ip') + ' AS ip,'
- 'c.symbol_id,'
- '(SELECT name FROM symbols WHERE id = c.symbol_id) AS symbol,'
- '(SELECT dso_id FROM symbols WHERE id = c.symbol_id) AS dso_id,'
- '(SELECT dso FROM symbols_view WHERE id = c.symbol_id) AS dso_short_name,'
- 'c.parent_id,'
- + emit_to_hex('p.ip') + ' AS parent_ip,'
- 'p.symbol_id AS parent_symbol_id,'
- '(SELECT name FROM symbols WHERE id = p.symbol_id) AS parent_symbol,'
- '(SELECT dso_id FROM symbols WHERE id = p.symbol_id) AS parent_dso_id,'
- '(SELECT dso FROM symbols_view WHERE id = p.symbol_id) AS parent_dso_short_name'
- ' FROM call_paths c INNER JOIN call_paths p ON p.id = c.parent_id')
- if perf_db_export_calls:
- do_query(query, 'CREATE VIEW calls_view AS '
- 'SELECT '
- 'calls.id,'
- 'thread_id,'
- '(SELECT pid FROM threads WHERE id = thread_id) AS pid,'
- '(SELECT tid FROM threads WHERE id = thread_id) AS tid,'
- '(SELECT comm FROM comms WHERE id = comm_id) AS command,'
- 'call_path_id,'
- + emit_to_hex('ip') + ' AS ip,'
- 'symbol_id,'
- '(SELECT name FROM symbols WHERE id = symbol_id) AS symbol,'
- 'call_time,'
- 'return_time,'
- 'return_time - call_time AS elapsed_time,'
- 'branch_count,'
- 'call_id,'
- 'return_id,'
- 'CASE WHEN flags=1 THEN \'no call\' WHEN flags=2 THEN \'no return\' WHEN flags=3 THEN \'no call/return\' ELSE \'\' END AS flags,'
- 'parent_call_path_id'
- ' FROM calls INNER JOIN call_paths ON call_paths.id = call_path_id')
- do_query(query, 'CREATE VIEW samples_view AS '
- 'SELECT '
- 'id,'
- 'time,'
- 'cpu,'
- '(SELECT pid FROM threads WHERE id = thread_id) AS pid,'
- '(SELECT tid FROM threads WHERE id = thread_id) AS tid,'
- '(SELECT comm FROM comms WHERE id = comm_id) AS command,'
- '(SELECT name FROM selected_events WHERE id = evsel_id) AS event,'
- + emit_to_hex('ip') + ' AS ip_hex,'
- '(SELECT name FROM symbols WHERE id = symbol_id) AS symbol,'
- 'sym_offset,'
- '(SELECT short_name FROM dsos WHERE id = dso_id) AS dso_short_name,'
- + emit_to_hex('to_ip') + ' AS to_ip_hex,'
- '(SELECT name FROM symbols WHERE id = to_symbol_id) AS to_symbol,'
- 'to_sym_offset,'
- '(SELECT short_name FROM dsos WHERE id = to_dso_id) AS to_dso_short_name,'
- '(SELECT name FROM branch_types WHERE id = branch_type) AS branch_type_name,'
- 'in_tx'
- ' FROM samples')
- do_query(query, 'END TRANSACTION')
- evsel_query = QSqlQuery(db)
- evsel_query.prepare("INSERT INTO selected_events VALUES (?, ?)")
- machine_query = QSqlQuery(db)
- machine_query.prepare("INSERT INTO machines VALUES (?, ?, ?)")
- thread_query = QSqlQuery(db)
- thread_query.prepare("INSERT INTO threads VALUES (?, ?, ?, ?, ?)")
- comm_query = QSqlQuery(db)
- comm_query.prepare("INSERT INTO comms VALUES (?, ?)")
- comm_thread_query = QSqlQuery(db)
- comm_thread_query.prepare("INSERT INTO comm_threads VALUES (?, ?, ?)")
- dso_query = QSqlQuery(db)
- dso_query.prepare("INSERT INTO dsos VALUES (?, ?, ?, ?, ?)")
- symbol_query = QSqlQuery(db)
- symbol_query.prepare("INSERT INTO symbols VALUES (?, ?, ?, ?, ?, ?)")
- branch_type_query = QSqlQuery(db)
- branch_type_query.prepare("INSERT INTO branch_types VALUES (?, ?)")
- sample_query = QSqlQuery(db)
- if branches:
- sample_query.prepare("INSERT INTO samples VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)")
- else:
- sample_query.prepare("INSERT INTO samples VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)")
- if perf_db_export_calls or perf_db_export_callchains:
- call_path_query = QSqlQuery(db)
- call_path_query.prepare("INSERT INTO call_paths VALUES (?, ?, ?, ?)")
- if perf_db_export_calls:
- call_query = QSqlQuery(db)
- call_query.prepare("INSERT INTO calls VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)")
- def trace_begin():
- print(datetime.datetime.today(), "Writing records...")
- do_query(query, 'BEGIN TRANSACTION')
- # id == 0 means unknown. It is easier to create records for them than replace the zeroes with NULLs
- evsel_table(0, "unknown")
- machine_table(0, 0, "unknown")
- thread_table(0, 0, 0, -1, -1)
- comm_table(0, "unknown")
- dso_table(0, 0, "unknown", "unknown", "")
- symbol_table(0, 0, 0, 0, 0, "unknown")
- sample_table(0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0)
- if perf_db_export_calls or perf_db_export_callchains:
- call_path_table(0, 0, 0, 0)
- unhandled_count = 0
- def trace_end():
- do_query(query, 'END TRANSACTION')
- print(datetime.datetime.today(), "Adding indexes")
- if perf_db_export_calls:
- do_query(query, 'CREATE INDEX pcpid_idx ON calls (parent_call_path_id)')
- if (unhandled_count):
- print(datetime.datetime.today(), "Warning: ", unhandled_count, " unhandled events")
- print(datetime.datetime.today(), "Done")
- def trace_unhandled(event_name, context, event_fields_dict):
- global unhandled_count
- unhandled_count += 1
- def sched__sched_switch(*x):
- pass
- def bind_exec(q, n, x):
- for xx in x[0:n]:
- q.addBindValue(str(xx))
- do_query_(q)
- def evsel_table(*x):
- bind_exec(evsel_query, 2, x)
- def machine_table(*x):
- bind_exec(machine_query, 3, x)
- def thread_table(*x):
- bind_exec(thread_query, 5, x)
- def comm_table(*x):
- bind_exec(comm_query, 2, x)
- def comm_thread_table(*x):
- bind_exec(comm_thread_query, 3, x)
- def dso_table(*x):
- bind_exec(dso_query, 5, x)
- def symbol_table(*x):
- bind_exec(symbol_query, 6, x)
- def branch_type_table(*x):
- bind_exec(branch_type_query, 2, x)
- def sample_table(*x):
- if branches:
- for xx in x[0:15]:
- sample_query.addBindValue(str(xx))
- for xx in x[19:22]:
- sample_query.addBindValue(str(xx))
- do_query_(sample_query)
- else:
- bind_exec(sample_query, 22, x)
- def call_path_table(*x):
- bind_exec(call_path_query, 4, x)
- def call_return_table(*x):
- bind_exec(call_query, 11, x)
|