1# export-to-postgresql.py: export perf data to a postgresql database 2# Copyright (c) 2014, Intel Corporation. 3# 4# This program is free software; you can redistribute it and/or modify it 5# under the terms and conditions of the GNU General Public License, 6# version 2, as published by the Free Software Foundation. 7# 8# This program is distributed in the hope it will be useful, but WITHOUT 9# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or 10# FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for 11# more details. 12 13import os 14import sys 15import struct 16import datetime 17 18from PySide.QtSql import * 19 20# Need to access PostgreSQL C library directly to use COPY FROM STDIN 21from ctypes import * 22libpq = CDLL("libpq.so.5") 23PQconnectdb = libpq.PQconnectdb 24PQconnectdb.restype = c_void_p 25PQfinish = libpq.PQfinish 26PQstatus = libpq.PQstatus 27PQexec = libpq.PQexec 28PQexec.restype = c_void_p 29PQresultStatus = libpq.PQresultStatus 30PQputCopyData = libpq.PQputCopyData 31PQputCopyData.argtypes = [ c_void_p, c_void_p, c_int ] 32PQputCopyEnd = libpq.PQputCopyEnd 33PQputCopyEnd.argtypes = [ c_void_p, c_void_p ] 34 35sys.path.append(os.environ['PERF_EXEC_PATH'] + \ 36 '/scripts/python/Perf-Trace-Util/lib/Perf/Trace') 37 38# These perf imports are not used at present 39#from perf_trace_context import * 40#from Core import * 41 42perf_db_export_mode = True 43 44def usage(): 45 print >> sys.stderr, "Usage is: export-to-postgresql.py <database name> [<columns>]" 46 print >> sys.stderr, "where: columns 'all' or 'branches'" 47 raise Exception("Too few arguments") 48 49if (len(sys.argv) < 2): 50 usage() 51 52dbname = sys.argv[1] 53 54if (len(sys.argv) >= 3): 55 columns = sys.argv[2] 56else: 57 columns = "all" 58 59if columns not in ("all", "branches"): 60 usage() 61 62branches = (columns == "branches") 63 64output_dir_name = os.getcwd() + "/" + dbname + "-perf-data" 65os.mkdir(output_dir_name) 66 67def do_query(q, s): 68 if (q.exec_(s)): 69 return 70 raise Exception("Query failed: " + q.lastError().text()) 71 72print datetime.datetime.today(), "Creating database..." 73 74db = QSqlDatabase.addDatabase('QPSQL') 75query = QSqlQuery(db) 76db.setDatabaseName('postgres') 77db.open() 78try: 79 do_query(query, 'CREATE DATABASE ' + dbname) 80except: 81 os.rmdir(output_dir_name) 82 raise 83query.finish() 84query.clear() 85db.close() 86 87db.setDatabaseName(dbname) 88db.open() 89 90query = QSqlQuery(db) 91do_query(query, 'SET client_min_messages TO WARNING') 92 93do_query(query, 'CREATE TABLE selected_events (' 94 'id bigint NOT NULL,' 95 'name varchar(80))') 96do_query(query, 'CREATE TABLE machines (' 97 'id bigint NOT NULL,' 98 'pid integer,' 99 'root_dir varchar(4096))') 100do_query(query, 'CREATE TABLE threads (' 101 'id bigint NOT NULL,' 102 'machine_id bigint,' 103 'process_id bigint,' 104 'pid integer,' 105 'tid integer)') 106do_query(query, 'CREATE TABLE comms (' 107 'id bigint NOT NULL,' 108 'comm varchar(16))') 109do_query(query, 'CREATE TABLE comm_threads (' 110 'id bigint NOT NULL,' 111 'comm_id bigint,' 112 'thread_id bigint)') 113do_query(query, 'CREATE TABLE dsos (' 114 'id bigint NOT NULL,' 115 'machine_id bigint,' 116 'short_name varchar(256),' 117 'long_name varchar(4096),' 118 'build_id varchar(64))') 119do_query(query, 'CREATE TABLE symbols (' 120 'id bigint NOT NULL,' 121 'dso_id bigint,' 122 'sym_start bigint,' 123 'sym_end bigint,' 124 'binding integer,' 125 'name varchar(2048))') 126do_query(query, 'CREATE TABLE branch_types (' 127 'id integer NOT NULL,' 128 'name varchar(80))') 129 130if branches: 131 do_query(query, 'CREATE TABLE samples (' 132 'id bigint NOT NULL,' 133 'evsel_id bigint,' 134 'machine_id bigint,' 135 'thread_id bigint,' 136 'comm_id bigint,' 137 'dso_id bigint,' 138 'symbol_id bigint,' 139 'sym_offset bigint,' 140 'ip bigint,' 141 'time bigint,' 142 'cpu integer,' 143 'to_dso_id bigint,' 144 'to_symbol_id bigint,' 145 'to_sym_offset bigint,' 146 'to_ip bigint,' 147 'branch_type integer,' 148 'in_tx boolean)') 149else: 150 do_query(query, 'CREATE TABLE samples (' 151 'id bigint NOT NULL,' 152 'evsel_id bigint,' 153 'machine_id bigint,' 154 'thread_id bigint,' 155 'comm_id bigint,' 156 'dso_id bigint,' 157 'symbol_id bigint,' 158 'sym_offset bigint,' 159 'ip bigint,' 160 'time bigint,' 161 'cpu integer,' 162 'to_dso_id bigint,' 163 'to_symbol_id bigint,' 164 'to_sym_offset bigint,' 165 'to_ip bigint,' 166 'period bigint,' 167 'weight bigint,' 168 'transaction bigint,' 169 'data_src bigint,' 170 'branch_type integer,' 171 'in_tx boolean)') 172 173do_query(query, 'CREATE VIEW samples_view AS ' 174 'SELECT ' 175 'id,' 176 'time,' 177 'cpu,' 178 '(SELECT pid FROM threads WHERE id = thread_id) AS pid,' 179 '(SELECT tid FROM threads WHERE id = thread_id) AS tid,' 180 '(SELECT comm FROM comms WHERE id = comm_id) AS command,' 181 '(SELECT name FROM selected_events WHERE id = evsel_id) AS event,' 182 'to_hex(ip) AS ip_hex,' 183 '(SELECT name FROM symbols WHERE id = symbol_id) AS symbol,' 184 'sym_offset,' 185 '(SELECT short_name FROM dsos WHERE id = dso_id) AS dso_short_name,' 186 'to_hex(to_ip) AS to_ip_hex,' 187 '(SELECT name FROM symbols WHERE id = to_symbol_id) AS to_symbol,' 188 'to_sym_offset,' 189 '(SELECT short_name FROM dsos WHERE id = to_dso_id) AS to_dso_short_name,' 190 '(SELECT name FROM branch_types WHERE id = branch_type) AS branch_type_name,' 191 'in_tx' 192 ' FROM samples') 193 194 195file_header = struct.pack("!11sii", "PGCOPY\n\377\r\n\0", 0, 0) 196file_trailer = "\377\377" 197 198def open_output_file(file_name): 199 path_name = output_dir_name + "/" + file_name 200 file = open(path_name, "w+") 201 file.write(file_header) 202 return file 203 204def close_output_file(file): 205 file.write(file_trailer) 206 file.close() 207 208def copy_output_file_direct(file, table_name): 209 close_output_file(file) 210 sql = "COPY " + table_name + " FROM '" + file.name + "' (FORMAT 'binary')" 211 do_query(query, sql) 212 213# Use COPY FROM STDIN because security may prevent postgres from accessing the files directly 214def copy_output_file(file, table_name): 215 conn = PQconnectdb("dbname = " + dbname) 216 if (PQstatus(conn)): 217 raise Exception("COPY FROM STDIN PQconnectdb failed") 218 file.write(file_trailer) 219 file.seek(0) 220 sql = "COPY " + table_name + " FROM STDIN (FORMAT 'binary')" 221 res = PQexec(conn, sql) 222 if (PQresultStatus(res) != 4): 223 raise Exception("COPY FROM STDIN PQexec failed") 224 data = file.read(65536) 225 while (len(data)): 226 ret = PQputCopyData(conn, data, len(data)) 227 if (ret != 1): 228 raise Exception("COPY FROM STDIN PQputCopyData failed, error " + str(ret)) 229 data = file.read(65536) 230 ret = PQputCopyEnd(conn, None) 231 if (ret != 1): 232 raise Exception("COPY FROM STDIN PQputCopyEnd failed, error " + str(ret)) 233 PQfinish(conn) 234 235def remove_output_file(file): 236 name = file.name 237 file.close() 238 os.unlink(name) 239 240evsel_file = open_output_file("evsel_table.bin") 241machine_file = open_output_file("machine_table.bin") 242thread_file = open_output_file("thread_table.bin") 243comm_file = open_output_file("comm_table.bin") 244comm_thread_file = open_output_file("comm_thread_table.bin") 245dso_file = open_output_file("dso_table.bin") 246symbol_file = open_output_file("symbol_table.bin") 247branch_type_file = open_output_file("branch_type_table.bin") 248sample_file = open_output_file("sample_table.bin") 249 250def trace_begin(): 251 print datetime.datetime.today(), "Writing to intermediate files..." 252 # id == 0 means unknown. It is easier to create records for them than replace the zeroes with NULLs 253 evsel_table(0, "unknown") 254 machine_table(0, 0, "unknown") 255 thread_table(0, 0, 0, -1, -1) 256 comm_table(0, "unknown") 257 dso_table(0, 0, "unknown", "unknown", "") 258 symbol_table(0, 0, 0, 0, 0, "unknown") 259 260unhandled_count = 0 261 262def trace_end(): 263 print datetime.datetime.today(), "Copying to database..." 264 copy_output_file(evsel_file, "selected_events") 265 copy_output_file(machine_file, "machines") 266 copy_output_file(thread_file, "threads") 267 copy_output_file(comm_file, "comms") 268 copy_output_file(comm_thread_file, "comm_threads") 269 copy_output_file(dso_file, "dsos") 270 copy_output_file(symbol_file, "symbols") 271 copy_output_file(branch_type_file, "branch_types") 272 copy_output_file(sample_file, "samples") 273 274 print datetime.datetime.today(), "Removing intermediate files..." 275 remove_output_file(evsel_file) 276 remove_output_file(machine_file) 277 remove_output_file(thread_file) 278 remove_output_file(comm_file) 279 remove_output_file(comm_thread_file) 280 remove_output_file(dso_file) 281 remove_output_file(symbol_file) 282 remove_output_file(branch_type_file) 283 remove_output_file(sample_file) 284 os.rmdir(output_dir_name) 285 print datetime.datetime.today(), "Adding primary keys" 286 do_query(query, 'ALTER TABLE selected_events ADD PRIMARY KEY (id)') 287 do_query(query, 'ALTER TABLE machines ADD PRIMARY KEY (id)') 288 do_query(query, 'ALTER TABLE threads ADD PRIMARY KEY (id)') 289 do_query(query, 'ALTER TABLE comms ADD PRIMARY KEY (id)') 290 do_query(query, 'ALTER TABLE comm_threads ADD PRIMARY KEY (id)') 291 do_query(query, 'ALTER TABLE dsos ADD PRIMARY KEY (id)') 292 do_query(query, 'ALTER TABLE symbols ADD PRIMARY KEY (id)') 293 do_query(query, 'ALTER TABLE branch_types ADD PRIMARY KEY (id)') 294 do_query(query, 'ALTER TABLE samples ADD PRIMARY KEY (id)') 295 296 print datetime.datetime.today(), "Adding foreign keys" 297 do_query(query, 'ALTER TABLE threads ' 298 'ADD CONSTRAINT machinefk FOREIGN KEY (machine_id) REFERENCES machines (id),' 299 'ADD CONSTRAINT processfk FOREIGN KEY (process_id) REFERENCES threads (id)') 300 do_query(query, 'ALTER TABLE comm_threads ' 301 'ADD CONSTRAINT commfk FOREIGN KEY (comm_id) REFERENCES comms (id),' 302 'ADD CONSTRAINT threadfk FOREIGN KEY (thread_id) REFERENCES threads (id)') 303 do_query(query, 'ALTER TABLE dsos ' 304 'ADD CONSTRAINT machinefk FOREIGN KEY (machine_id) REFERENCES machines (id)') 305 do_query(query, 'ALTER TABLE symbols ' 306 'ADD CONSTRAINT dsofk FOREIGN KEY (dso_id) REFERENCES dsos (id)') 307 do_query(query, 'ALTER TABLE samples ' 308 'ADD CONSTRAINT evselfk FOREIGN KEY (evsel_id) REFERENCES selected_events (id),' 309 'ADD CONSTRAINT machinefk FOREIGN KEY (machine_id) REFERENCES machines (id),' 310 'ADD CONSTRAINT threadfk FOREIGN KEY (thread_id) REFERENCES threads (id),' 311 'ADD CONSTRAINT commfk FOREIGN KEY (comm_id) REFERENCES comms (id),' 312 'ADD CONSTRAINT dsofk FOREIGN KEY (dso_id) REFERENCES dsos (id),' 313 'ADD CONSTRAINT symbolfk FOREIGN KEY (symbol_id) REFERENCES symbols (id),' 314 'ADD CONSTRAINT todsofk FOREIGN KEY (to_dso_id) REFERENCES dsos (id),' 315 'ADD CONSTRAINT tosymbolfk FOREIGN KEY (to_symbol_id) REFERENCES symbols (id)') 316 317 if (unhandled_count): 318 print datetime.datetime.today(), "Warning: ", unhandled_count, " unhandled events" 319 print datetime.datetime.today(), "Done" 320 321def trace_unhandled(event_name, context, event_fields_dict): 322 global unhandled_count 323 unhandled_count += 1 324 325def sched__sched_switch(*x): 326 pass 327 328def evsel_table(evsel_id, evsel_name, *x): 329 n = len(evsel_name) 330 fmt = "!hiqi" + str(n) + "s" 331 value = struct.pack(fmt, 2, 8, evsel_id, n, evsel_name) 332 evsel_file.write(value) 333 334def machine_table(machine_id, pid, root_dir, *x): 335 n = len(root_dir) 336 fmt = "!hiqiii" + str(n) + "s" 337 value = struct.pack(fmt, 3, 8, machine_id, 4, pid, n, root_dir) 338 machine_file.write(value) 339 340def thread_table(thread_id, machine_id, process_id, pid, tid, *x): 341 value = struct.pack("!hiqiqiqiiii", 5, 8, thread_id, 8, machine_id, 8, process_id, 4, pid, 4, tid) 342 thread_file.write(value) 343 344def comm_table(comm_id, comm_str, *x): 345 n = len(comm_str) 346 fmt = "!hiqi" + str(n) + "s" 347 value = struct.pack(fmt, 2, 8, comm_id, n, comm_str) 348 comm_file.write(value) 349 350def comm_thread_table(comm_thread_id, comm_id, thread_id, *x): 351 fmt = "!hiqiqiq" 352 value = struct.pack(fmt, 3, 8, comm_thread_id, 8, comm_id, 8, thread_id) 353 comm_thread_file.write(value) 354 355def dso_table(dso_id, machine_id, short_name, long_name, build_id, *x): 356 n1 = len(short_name) 357 n2 = len(long_name) 358 n3 = len(build_id) 359 fmt = "!hiqiqi" + str(n1) + "si" + str(n2) + "si" + str(n3) + "s" 360 value = struct.pack(fmt, 5, 8, dso_id, 8, machine_id, n1, short_name, n2, long_name, n3, build_id) 361 dso_file.write(value) 362 363def symbol_table(symbol_id, dso_id, sym_start, sym_end, binding, symbol_name, *x): 364 n = len(symbol_name) 365 fmt = "!hiqiqiqiqiii" + str(n) + "s" 366 value = struct.pack(fmt, 6, 8, symbol_id, 8, dso_id, 8, sym_start, 8, sym_end, 4, binding, n, symbol_name) 367 symbol_file.write(value) 368 369def branch_type_table(branch_type, name, *x): 370 n = len(name) 371 fmt = "!hiii" + str(n) + "s" 372 value = struct.pack(fmt, 2, 4, branch_type, n, name) 373 branch_type_file.write(value) 374 375def sample_table(sample_id, evsel_id, machine_id, thread_id, comm_id, dso_id, symbol_id, sym_offset, ip, time, cpu, to_dso_id, to_symbol_id, to_sym_offset, to_ip, period, weight, transaction, data_src, branch_type, in_tx, *x): 376 if branches: 377 value = struct.pack("!hiqiqiqiqiqiqiqiqiqiqiiiqiqiqiqiiiB", 17, 8, sample_id, 8, evsel_id, 8, machine_id, 8, thread_id, 8, comm_id, 8, dso_id, 8, symbol_id, 8, sym_offset, 8, ip, 8, time, 4, cpu, 8, to_dso_id, 8, to_symbol_id, 8, to_sym_offset, 8, to_ip, 4, branch_type, 1, in_tx) 378 else: 379 value = struct.pack("!hiqiqiqiqiqiqiqiqiqiqiiiqiqiqiqiqiqiqiqiiiB", 21, 8, sample_id, 8, evsel_id, 8, machine_id, 8, thread_id, 8, comm_id, 8, dso_id, 8, symbol_id, 8, sym_offset, 8, ip, 8, time, 4, cpu, 8, to_dso_id, 8, to_symbol_id, 8, to_sym_offset, 8, to_ip, 8, period, 8, weight, 8, transaction, 8, data_src, 4, branch_type, 1, in_tx) 380 sample_file.write(value) 381