Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 1 | /* Copyright (c) 2010-2011, Code Aurora Forum. All rights reserved. |
| 2 | * |
| 3 | * This program is free software; you can redistribute it and/or modify |
| 4 | * it under the terms of the GNU General Public License version 2 and |
| 5 | * only version 2 as published by the Free Software Foundation. |
| 6 | * |
| 7 | * This program is distributed in the hope that it will be useful, |
| 8 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 9 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| 10 | * GNU General Public License for more details. |
| 11 | * |
| 12 | */ |
| 13 | |
| 14 | /* #define DEBUG */ |
| 15 | #define ALIGN_CPU |
| 16 | |
| 17 | #include <linux/spinlock.h> |
| 18 | #include <linux/debugfs.h> |
| 19 | #include <linux/relay.h> |
| 20 | #include <linux/slab.h> |
| 21 | #include <linux/time.h> |
| 22 | #include <linux/sched.h> |
Jeremy Gebben | 6061bc7 | 2011-04-18 15:23:16 -0600 | [diff] [blame] | 23 | #include <mach/socinfo.h> |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 24 | |
| 25 | #include "kgsl.h" |
| 26 | #include "kgsl_cffdump.h" |
| 27 | #include "kgsl_debugfs.h" |
Sushmita Susheelendra | 22d8717 | 2011-05-09 16:40:02 -0600 | [diff] [blame] | 28 | #include "kgsl_log.h" |
| 29 | #include "kgsl_sharedmem.h" |
| 30 | #include "adreno_pm4types.h" |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 31 | |
| 32 | static struct rchan *chan; |
| 33 | static struct dentry *dir; |
| 34 | static int suspended; |
| 35 | static size_t dropped; |
| 36 | static size_t subbuf_size = 256*1024; |
| 37 | static size_t n_subbufs = 64; |
| 38 | |
| 39 | /* forward declarations */ |
| 40 | static void destroy_channel(void); |
| 41 | static struct rchan *create_channel(unsigned subbuf_size, unsigned n_subbufs); |
| 42 | |
| 43 | static spinlock_t cffdump_lock; |
| 44 | static ulong serial_nr; |
| 45 | static ulong total_bytes; |
| 46 | static ulong total_syncmem; |
| 47 | static long last_sec; |
| 48 | |
| 49 | #define MEMBUF_SIZE 64 |
| 50 | |
| 51 | #define CFF_OP_WRITE_REG 0x00000002 |
| 52 | struct cff_op_write_reg { |
| 53 | unsigned char op; |
| 54 | uint addr; |
| 55 | uint value; |
Sushmita Susheelendra | 22d8717 | 2011-05-09 16:40:02 -0600 | [diff] [blame] | 56 | } __packed; |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 57 | |
| 58 | #define CFF_OP_POLL_REG 0x00000004 |
| 59 | struct cff_op_poll_reg { |
| 60 | unsigned char op; |
| 61 | uint addr; |
| 62 | uint value; |
| 63 | uint mask; |
Sushmita Susheelendra | 22d8717 | 2011-05-09 16:40:02 -0600 | [diff] [blame] | 64 | } __packed; |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 65 | |
| 66 | #define CFF_OP_WAIT_IRQ 0x00000005 |
| 67 | struct cff_op_wait_irq { |
| 68 | unsigned char op; |
Sushmita Susheelendra | 22d8717 | 2011-05-09 16:40:02 -0600 | [diff] [blame] | 69 | } __packed; |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 70 | |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 71 | #define CFF_OP_RMW 0x0000000a |
| 72 | |
| 73 | #define CFF_OP_WRITE_MEM 0x0000000b |
| 74 | struct cff_op_write_mem { |
| 75 | unsigned char op; |
| 76 | uint addr; |
| 77 | uint value; |
Sushmita Susheelendra | 22d8717 | 2011-05-09 16:40:02 -0600 | [diff] [blame] | 78 | } __packed; |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 79 | |
| 80 | #define CFF_OP_WRITE_MEMBUF 0x0000000c |
| 81 | struct cff_op_write_membuf { |
| 82 | unsigned char op; |
| 83 | uint addr; |
| 84 | ushort count; |
| 85 | uint buffer[MEMBUF_SIZE]; |
Sushmita Susheelendra | 22d8717 | 2011-05-09 16:40:02 -0600 | [diff] [blame] | 86 | } __packed; |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 87 | |
Jeremy Gebben | 6061bc7 | 2011-04-18 15:23:16 -0600 | [diff] [blame] | 88 | #define CFF_OP_MEMORY_BASE 0x0000000d |
| 89 | struct cff_op_memory_base { |
| 90 | unsigned char op; |
| 91 | uint base; |
| 92 | uint size; |
| 93 | uint gmemsize; |
| 94 | } __packed; |
| 95 | |
| 96 | #define CFF_OP_HANG 0x0000000e |
| 97 | struct cff_op_hang { |
| 98 | unsigned char op; |
| 99 | } __packed; |
| 100 | |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 101 | #define CFF_OP_EOF 0xffffffff |
| 102 | struct cff_op_eof { |
| 103 | unsigned char op; |
Sushmita Susheelendra | 22d8717 | 2011-05-09 16:40:02 -0600 | [diff] [blame] | 104 | } __packed; |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 105 | |
Sushmita Susheelendra | 41f8fa3 | 2011-05-11 17:15:58 -0600 | [diff] [blame^] | 106 | #define CFF_OP_VERIFY_MEM_FILE 0x00000007 |
| 107 | #define CFF_OP_WRITE_SURFACE_PARAMS 0x00000011 |
| 108 | struct cff_op_user_event { |
| 109 | unsigned char op; |
| 110 | unsigned int op1; |
| 111 | unsigned int op2; |
| 112 | unsigned int op3; |
| 113 | unsigned int op4; |
| 114 | unsigned int op5; |
| 115 | } __packed; |
| 116 | |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 117 | |
| 118 | static void b64_encodeblock(unsigned char in[3], unsigned char out[4], int len) |
| 119 | { |
| 120 | static const char tob64[] = "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmno" |
| 121 | "pqrstuvwxyz0123456789+/"; |
| 122 | |
| 123 | out[0] = tob64[in[0] >> 2]; |
| 124 | out[1] = tob64[((in[0] & 0x03) << 4) | ((in[1] & 0xf0) >> 4)]; |
| 125 | out[2] = (unsigned char) (len > 1 ? tob64[((in[1] & 0x0f) << 2) |
| 126 | | ((in[2] & 0xc0) >> 6)] : '='); |
| 127 | out[3] = (unsigned char) (len > 2 ? tob64[in[2] & 0x3f] : '='); |
| 128 | } |
| 129 | |
| 130 | static void b64_encode(const unsigned char *in_buf, int in_size, |
| 131 | unsigned char *out_buf, int out_bufsize, int *out_size) |
| 132 | { |
| 133 | unsigned char in[3], out[4]; |
| 134 | int i, len; |
| 135 | |
| 136 | *out_size = 0; |
| 137 | while (in_size > 0) { |
| 138 | len = 0; |
| 139 | for (i = 0; i < 3; ++i) { |
| 140 | if (in_size-- > 0) { |
| 141 | in[i] = *in_buf++; |
| 142 | ++len; |
| 143 | } else |
| 144 | in[i] = 0; |
| 145 | } |
| 146 | if (len) { |
| 147 | b64_encodeblock(in, out, len); |
| 148 | if (out_bufsize < 4) { |
| 149 | pr_warn("kgsl: cffdump: %s: out of buffer\n", |
| 150 | __func__); |
| 151 | return; |
| 152 | } |
| 153 | for (i = 0; i < 4; ++i) |
| 154 | *out_buf++ = out[i]; |
| 155 | *out_size += 4; |
| 156 | out_bufsize -= 4; |
| 157 | } |
| 158 | } |
| 159 | } |
| 160 | |
| 161 | #define KLOG_TMPBUF_SIZE (1024) |
| 162 | static void klog_printk(const char *fmt, ...) |
| 163 | { |
| 164 | /* per-cpu klog formatting temporary buffer */ |
| 165 | static char klog_buf[NR_CPUS][KLOG_TMPBUF_SIZE]; |
| 166 | |
| 167 | va_list args; |
| 168 | int len; |
| 169 | char *cbuf; |
| 170 | unsigned long flags; |
| 171 | |
| 172 | local_irq_save(flags); |
| 173 | cbuf = klog_buf[smp_processor_id()]; |
| 174 | va_start(args, fmt); |
| 175 | len = vsnprintf(cbuf, KLOG_TMPBUF_SIZE, fmt, args); |
| 176 | total_bytes += len; |
| 177 | va_end(args); |
| 178 | relay_write(chan, cbuf, len); |
| 179 | local_irq_restore(flags); |
| 180 | } |
| 181 | |
| 182 | static struct cff_op_write_membuf cff_op_write_membuf; |
| 183 | static void cffdump_membuf(int id, unsigned char *out_buf, int out_bufsize) |
| 184 | { |
| 185 | void *data; |
| 186 | int len, out_size; |
| 187 | struct cff_op_write_mem cff_op_write_mem; |
| 188 | |
| 189 | uint addr = cff_op_write_membuf.addr |
| 190 | - sizeof(uint)*cff_op_write_membuf.count; |
| 191 | |
| 192 | if (!cff_op_write_membuf.count) { |
| 193 | pr_warn("kgsl: cffdump: membuf: count == 0, skipping"); |
| 194 | return; |
| 195 | } |
| 196 | |
| 197 | if (cff_op_write_membuf.count != 1) { |
| 198 | cff_op_write_membuf.op = CFF_OP_WRITE_MEMBUF; |
| 199 | cff_op_write_membuf.addr = addr; |
| 200 | len = sizeof(cff_op_write_membuf) - |
| 201 | sizeof(uint)*(MEMBUF_SIZE - cff_op_write_membuf.count); |
| 202 | data = &cff_op_write_membuf; |
| 203 | } else { |
| 204 | cff_op_write_mem.op = CFF_OP_WRITE_MEM; |
| 205 | cff_op_write_mem.addr = addr; |
| 206 | cff_op_write_mem.value = cff_op_write_membuf.buffer[0]; |
| 207 | data = &cff_op_write_mem; |
| 208 | len = sizeof(cff_op_write_mem); |
| 209 | } |
| 210 | b64_encode(data, len, out_buf, out_bufsize, &out_size); |
| 211 | out_buf[out_size] = 0; |
| 212 | klog_printk("%ld:%d;%s\n", ++serial_nr, id, out_buf); |
| 213 | cff_op_write_membuf.count = 0; |
| 214 | cff_op_write_membuf.addr = 0; |
| 215 | } |
| 216 | |
| 217 | static void cffdump_printline(int id, uint opcode, uint op1, uint op2, |
Sushmita Susheelendra | 41f8fa3 | 2011-05-11 17:15:58 -0600 | [diff] [blame^] | 218 | uint op3, uint op4, uint op5) |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 219 | { |
| 220 | struct cff_op_write_reg cff_op_write_reg; |
| 221 | struct cff_op_poll_reg cff_op_poll_reg; |
| 222 | struct cff_op_wait_irq cff_op_wait_irq; |
Jeremy Gebben | 6061bc7 | 2011-04-18 15:23:16 -0600 | [diff] [blame] | 223 | struct cff_op_memory_base cff_op_memory_base; |
| 224 | struct cff_op_hang cff_op_hang; |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 225 | struct cff_op_eof cff_op_eof; |
Sushmita Susheelendra | 41f8fa3 | 2011-05-11 17:15:58 -0600 | [diff] [blame^] | 226 | struct cff_op_user_event cff_op_user_event; |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 227 | unsigned char out_buf[sizeof(cff_op_write_membuf)/3*4 + 16]; |
| 228 | void *data; |
| 229 | int len = 0, out_size; |
| 230 | long cur_secs; |
| 231 | |
| 232 | spin_lock(&cffdump_lock); |
| 233 | if (opcode == CFF_OP_WRITE_MEM) { |
| 234 | if (op1 < 0x40000000 || op1 >= 0x60000000) |
| 235 | KGSL_CORE_ERR("addr out-of-range: op1=%08x", op1); |
| 236 | if ((cff_op_write_membuf.addr != op1 && |
| 237 | cff_op_write_membuf.count) |
| 238 | || (cff_op_write_membuf.count == MEMBUF_SIZE)) |
| 239 | cffdump_membuf(id, out_buf, sizeof(out_buf)); |
| 240 | |
| 241 | cff_op_write_membuf.buffer[cff_op_write_membuf.count++] = op2; |
| 242 | cff_op_write_membuf.addr = op1 + sizeof(uint); |
| 243 | spin_unlock(&cffdump_lock); |
| 244 | return; |
| 245 | } else if (cff_op_write_membuf.count) |
| 246 | cffdump_membuf(id, out_buf, sizeof(out_buf)); |
| 247 | spin_unlock(&cffdump_lock); |
| 248 | |
| 249 | switch (opcode) { |
| 250 | case CFF_OP_WRITE_REG: |
| 251 | cff_op_write_reg.op = opcode; |
| 252 | cff_op_write_reg.addr = op1; |
| 253 | cff_op_write_reg.value = op2; |
| 254 | data = &cff_op_write_reg; |
| 255 | len = sizeof(cff_op_write_reg); |
| 256 | break; |
| 257 | |
| 258 | case CFF_OP_POLL_REG: |
| 259 | cff_op_poll_reg.op = opcode; |
| 260 | cff_op_poll_reg.addr = op1; |
| 261 | cff_op_poll_reg.value = op2; |
| 262 | cff_op_poll_reg.mask = op3; |
| 263 | data = &cff_op_poll_reg; |
| 264 | len = sizeof(cff_op_poll_reg); |
| 265 | break; |
| 266 | |
| 267 | case CFF_OP_WAIT_IRQ: |
| 268 | cff_op_wait_irq.op = opcode; |
| 269 | data = &cff_op_wait_irq; |
| 270 | len = sizeof(cff_op_wait_irq); |
| 271 | break; |
| 272 | |
Jeremy Gebben | 6061bc7 | 2011-04-18 15:23:16 -0600 | [diff] [blame] | 273 | case CFF_OP_MEMORY_BASE: |
| 274 | cff_op_memory_base.op = opcode; |
| 275 | cff_op_memory_base.base = op1; |
| 276 | cff_op_memory_base.size = op2; |
| 277 | cff_op_memory_base.gmemsize = op3; |
| 278 | data = &cff_op_memory_base; |
| 279 | len = sizeof(cff_op_memory_base); |
| 280 | break; |
| 281 | |
| 282 | case CFF_OP_HANG: |
| 283 | cff_op_hang.op = opcode; |
| 284 | data = &cff_op_hang; |
| 285 | len = sizeof(cff_op_hang); |
| 286 | break; |
| 287 | |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 288 | case CFF_OP_EOF: |
| 289 | cff_op_eof.op = opcode; |
| 290 | data = &cff_op_eof; |
| 291 | len = sizeof(cff_op_eof); |
| 292 | break; |
Sushmita Susheelendra | 41f8fa3 | 2011-05-11 17:15:58 -0600 | [diff] [blame^] | 293 | |
| 294 | case CFF_OP_WRITE_SURFACE_PARAMS: |
| 295 | case CFF_OP_VERIFY_MEM_FILE: |
| 296 | cff_op_user_event.op = opcode; |
| 297 | cff_op_user_event.op1 = op1; |
| 298 | cff_op_user_event.op2 = op2; |
| 299 | cff_op_user_event.op3 = op3; |
| 300 | cff_op_user_event.op4 = op4; |
| 301 | cff_op_user_event.op5 = op5; |
| 302 | data = &cff_op_user_event; |
| 303 | len = sizeof(cff_op_user_event); |
| 304 | break; |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 305 | } |
| 306 | |
| 307 | if (len) { |
| 308 | b64_encode(data, len, out_buf, sizeof(out_buf), &out_size); |
| 309 | out_buf[out_size] = 0; |
| 310 | klog_printk("%ld:%d;%s\n", ++serial_nr, id, out_buf); |
| 311 | } else |
| 312 | pr_warn("kgsl: cffdump: unhandled opcode: %d\n", opcode); |
| 313 | |
| 314 | cur_secs = get_seconds(); |
| 315 | if ((cur_secs - last_sec) > 10 || (last_sec - cur_secs) > 10) { |
| 316 | pr_info("kgsl: cffdump: total [bytes:%lu kB, syncmem:%lu kB], " |
| 317 | "seq#: %lu\n", total_bytes/1024, total_syncmem/1024, |
| 318 | serial_nr); |
| 319 | last_sec = cur_secs; |
| 320 | } |
| 321 | } |
| 322 | |
| 323 | void kgsl_cffdump_init() |
| 324 | { |
| 325 | struct dentry *debugfs_dir = kgsl_get_debugfs_dir(); |
| 326 | |
| 327 | #ifdef ALIGN_CPU |
| 328 | cpumask_t mask; |
| 329 | |
| 330 | cpumask_clear(&mask); |
Lucille Sylvester | 57996e3 | 2011-05-26 19:12:22 -0600 | [diff] [blame] | 331 | cpumask_set_cpu(0, &mask); |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 332 | sched_setaffinity(0, &mask); |
| 333 | #endif |
| 334 | if (!debugfs_dir || IS_ERR(debugfs_dir)) { |
| 335 | KGSL_CORE_ERR("Debugfs directory is bad\n"); |
| 336 | return; |
| 337 | } |
| 338 | |
| 339 | kgsl_cff_dump_enable = 1; |
| 340 | |
| 341 | spin_lock_init(&cffdump_lock); |
| 342 | |
| 343 | dir = debugfs_create_dir("cff", debugfs_dir); |
| 344 | if (!dir) { |
| 345 | KGSL_CORE_ERR("debugfs_create_dir failed\n"); |
| 346 | return; |
| 347 | } |
| 348 | |
| 349 | chan = create_channel(subbuf_size, n_subbufs); |
| 350 | } |
| 351 | |
| 352 | void kgsl_cffdump_destroy() |
| 353 | { |
| 354 | if (chan) |
| 355 | relay_flush(chan); |
| 356 | destroy_channel(); |
| 357 | if (dir) |
| 358 | debugfs_remove(dir); |
| 359 | } |
| 360 | |
| 361 | void kgsl_cffdump_open(enum kgsl_deviceid device_id) |
| 362 | { |
Jeremy Gebben | 6061bc7 | 2011-04-18 15:23:16 -0600 | [diff] [blame] | 363 | /*TODO: move this to where we can report correct gmemsize*/ |
| 364 | unsigned int va_base; |
| 365 | |
| 366 | if (cpu_is_msm8x60() || cpu_is_msm8960()) |
| 367 | va_base = 0x40000000; |
| 368 | else |
| 369 | va_base = 0x20000000; |
| 370 | |
| 371 | kgsl_cffdump_memory_base(device_id, va_base, |
| 372 | CONFIG_MSM_KGSL_PAGE_TABLE_SIZE, SZ_256K); |
| 373 | } |
| 374 | |
| 375 | void kgsl_cffdump_memory_base(enum kgsl_deviceid device_id, unsigned int base, |
| 376 | unsigned int range, unsigned gmemsize) |
| 377 | { |
Sushmita Susheelendra | 41f8fa3 | 2011-05-11 17:15:58 -0600 | [diff] [blame^] | 378 | cffdump_printline(device_id, CFF_OP_MEMORY_BASE, base, |
| 379 | range, gmemsize, 0, 0); |
Jeremy Gebben | 6061bc7 | 2011-04-18 15:23:16 -0600 | [diff] [blame] | 380 | } |
| 381 | |
| 382 | void kgsl_cffdump_hang(enum kgsl_deviceid device_id) |
| 383 | { |
Sushmita Susheelendra | 41f8fa3 | 2011-05-11 17:15:58 -0600 | [diff] [blame^] | 384 | cffdump_printline(device_id, CFF_OP_HANG, 0, 0, 0, 0, 0); |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 385 | } |
| 386 | |
| 387 | void kgsl_cffdump_close(enum kgsl_deviceid device_id) |
| 388 | { |
Sushmita Susheelendra | 41f8fa3 | 2011-05-11 17:15:58 -0600 | [diff] [blame^] | 389 | cffdump_printline(device_id, CFF_OP_EOF, 0, 0, 0, 0, 0); |
| 390 | } |
| 391 | |
| 392 | void kgsl_cffdump_user_event(unsigned int cff_opcode, unsigned int op1, |
| 393 | unsigned int op2, unsigned int op3, |
| 394 | unsigned int op4, unsigned int op5) |
| 395 | { |
| 396 | cffdump_printline(-1, cff_opcode, op1, op2, op3, op4, op5); |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 397 | } |
| 398 | |
| 399 | void kgsl_cffdump_syncmem(struct kgsl_device_private *dev_priv, |
| 400 | const struct kgsl_memdesc *memdesc, uint gpuaddr, uint sizebytes, |
| 401 | bool clean_cache) |
| 402 | { |
| 403 | const void *src; |
| 404 | uint host_size; |
| 405 | uint physaddr; |
| 406 | |
| 407 | if (!kgsl_cff_dump_enable) |
| 408 | return; |
| 409 | |
| 410 | total_syncmem += sizebytes; |
| 411 | |
| 412 | if (memdesc == NULL) { |
| 413 | struct kgsl_mem_entry *entry; |
| 414 | spin_lock(&dev_priv->process_priv->mem_lock); |
| 415 | entry = kgsl_sharedmem_find_region(dev_priv->process_priv, |
| 416 | gpuaddr, sizebytes); |
| 417 | spin_unlock(&dev_priv->process_priv->mem_lock); |
| 418 | if (entry == NULL) { |
| 419 | KGSL_CORE_ERR("did not find mapping " |
| 420 | "for gpuaddr: 0x%08x\n", gpuaddr); |
| 421 | return; |
| 422 | } |
| 423 | memdesc = &entry->memdesc; |
| 424 | } |
| 425 | BUG_ON(memdesc->gpuaddr == 0); |
| 426 | BUG_ON(gpuaddr == 0); |
| 427 | physaddr = kgsl_get_realaddr(memdesc) + (gpuaddr - memdesc->gpuaddr); |
| 428 | |
| 429 | src = kgsl_gpuaddr_to_vaddr(memdesc, gpuaddr, &host_size); |
| 430 | if (src == NULL || host_size < sizebytes) { |
Sushmita Susheelendra | 22d8717 | 2011-05-09 16:40:02 -0600 | [diff] [blame] | 431 | KGSL_CORE_ERR("did not find mapping for " |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 432 | "gpuaddr: 0x%08x, m->host: 0x%p, phys: 0x%08x\n", |
| 433 | gpuaddr, memdesc->hostptr, memdesc->physaddr); |
| 434 | return; |
| 435 | } |
| 436 | |
| 437 | if (clean_cache) { |
| 438 | /* Ensure that this memory region is not read from the |
| 439 | * cache but fetched fresh */ |
| 440 | |
| 441 | mb(); |
| 442 | |
Sushmita Susheelendra | 22d8717 | 2011-05-09 16:40:02 -0600 | [diff] [blame] | 443 | kgsl_cache_range_op((struct kgsl_memdesc *)memdesc, |
| 444 | KGSL_CACHE_OP_INV); |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 445 | } |
| 446 | |
| 447 | BUG_ON(physaddr > 0x66000000 && physaddr < 0x66ffffff); |
| 448 | while (sizebytes > 3) { |
Sushmita Susheelendra | 41f8fa3 | 2011-05-11 17:15:58 -0600 | [diff] [blame^] | 449 | cffdump_printline(-1, CFF_OP_WRITE_MEM, gpuaddr, *(uint *)src, |
| 450 | 0, 0, 0); |
| 451 | gpuaddr += 4; |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 452 | src += 4; |
| 453 | sizebytes -= 4; |
| 454 | } |
| 455 | if (sizebytes > 0) |
Sushmita Susheelendra | 41f8fa3 | 2011-05-11 17:15:58 -0600 | [diff] [blame^] | 456 | cffdump_printline(-1, CFF_OP_WRITE_MEM, gpuaddr, *(uint *)src, |
| 457 | 0, 0, 0); |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 458 | } |
| 459 | |
| 460 | void kgsl_cffdump_setmem(uint addr, uint value, uint sizebytes) |
| 461 | { |
| 462 | if (!kgsl_cff_dump_enable) |
| 463 | return; |
| 464 | |
| 465 | BUG_ON(addr > 0x66000000 && addr < 0x66ffffff); |
| 466 | while (sizebytes > 3) { |
| 467 | /* Use 32bit memory writes as long as there's at least |
| 468 | * 4 bytes left */ |
Sushmita Susheelendra | 41f8fa3 | 2011-05-11 17:15:58 -0600 | [diff] [blame^] | 469 | cffdump_printline(-1, CFF_OP_WRITE_MEM, addr, value, |
| 470 | 0, 0, 0); |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 471 | addr += 4; |
| 472 | sizebytes -= 4; |
| 473 | } |
| 474 | if (sizebytes > 0) |
Sushmita Susheelendra | 41f8fa3 | 2011-05-11 17:15:58 -0600 | [diff] [blame^] | 475 | cffdump_printline(-1, CFF_OP_WRITE_MEM, addr, value, |
| 476 | 0, 0, 0); |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 477 | } |
| 478 | |
| 479 | void kgsl_cffdump_regwrite(enum kgsl_deviceid device_id, uint addr, |
| 480 | uint value) |
| 481 | { |
| 482 | if (!kgsl_cff_dump_enable) |
| 483 | return; |
| 484 | |
Sushmita Susheelendra | 41f8fa3 | 2011-05-11 17:15:58 -0600 | [diff] [blame^] | 485 | cffdump_printline(device_id, CFF_OP_WRITE_REG, addr, value, |
| 486 | 0, 0, 0); |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 487 | } |
| 488 | |
| 489 | void kgsl_cffdump_regpoll(enum kgsl_deviceid device_id, uint addr, |
| 490 | uint value, uint mask) |
| 491 | { |
| 492 | if (!kgsl_cff_dump_enable) |
| 493 | return; |
| 494 | |
Sushmita Susheelendra | 41f8fa3 | 2011-05-11 17:15:58 -0600 | [diff] [blame^] | 495 | cffdump_printline(device_id, CFF_OP_POLL_REG, addr, value, |
| 496 | mask, 0, 0); |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 497 | } |
| 498 | |
| 499 | void kgsl_cffdump_slavewrite(uint addr, uint value) |
| 500 | { |
| 501 | if (!kgsl_cff_dump_enable) |
| 502 | return; |
| 503 | |
Sushmita Susheelendra | 41f8fa3 | 2011-05-11 17:15:58 -0600 | [diff] [blame^] | 504 | cffdump_printline(-1, CFF_OP_WRITE_REG, addr, value, 0, 0, 0); |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 505 | } |
| 506 | |
| 507 | int kgsl_cffdump_waitirq(void) |
| 508 | { |
| 509 | if (!kgsl_cff_dump_enable) |
| 510 | return 0; |
| 511 | |
Sushmita Susheelendra | 41f8fa3 | 2011-05-11 17:15:58 -0600 | [diff] [blame^] | 512 | cffdump_printline(-1, CFF_OP_WAIT_IRQ, 0, 0, 0, 0, 0); |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 513 | |
| 514 | return 1; |
| 515 | } |
| 516 | EXPORT_SYMBOL(kgsl_cffdump_waitirq); |
| 517 | |
| 518 | #define ADDRESS_STACK_SIZE 256 |
| 519 | #define GET_PM4_TYPE3_OPCODE(x) ((*(x) >> 8) & 0xFF) |
| 520 | static unsigned int kgsl_cffdump_addr_count; |
| 521 | |
| 522 | static bool kgsl_cffdump_handle_type3(struct kgsl_device_private *dev_priv, |
| 523 | uint *hostaddr, bool check_only) |
| 524 | { |
| 525 | static uint addr_stack[ADDRESS_STACK_SIZE]; |
| 526 | static uint size_stack[ADDRESS_STACK_SIZE]; |
| 527 | |
| 528 | switch (GET_PM4_TYPE3_OPCODE(hostaddr)) { |
Sushmita Susheelendra | fbb46aa | 2011-08-25 18:05:08 -0600 | [diff] [blame] | 529 | case CP_INDIRECT_BUFFER_PFD: |
| 530 | case CP_INDIRECT_BUFFER: |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 531 | { |
| 532 | /* traverse indirect buffers */ |
| 533 | int i; |
| 534 | uint ibaddr = hostaddr[1]; |
| 535 | uint ibsize = hostaddr[2]; |
| 536 | |
| 537 | /* is this address already in encountered? */ |
| 538 | for (i = 0; |
| 539 | i < kgsl_cffdump_addr_count && addr_stack[i] != ibaddr; |
| 540 | ++i) |
| 541 | ; |
| 542 | |
| 543 | if (kgsl_cffdump_addr_count == i) { |
| 544 | addr_stack[kgsl_cffdump_addr_count] = ibaddr; |
| 545 | size_stack[kgsl_cffdump_addr_count++] = ibsize; |
| 546 | |
| 547 | if (kgsl_cffdump_addr_count >= ADDRESS_STACK_SIZE) { |
| 548 | KGSL_CORE_ERR("stack overflow\n"); |
| 549 | return false; |
| 550 | } |
| 551 | |
| 552 | return kgsl_cffdump_parse_ibs(dev_priv, NULL, |
| 553 | ibaddr, ibsize, check_only); |
| 554 | } else if (size_stack[i] != ibsize) { |
| 555 | KGSL_CORE_ERR("gpuaddr: 0x%08x, " |
| 556 | "wc: %u, with size wc: %u already on the " |
| 557 | "stack\n", ibaddr, ibsize, size_stack[i]); |
| 558 | return false; |
| 559 | } |
| 560 | } |
| 561 | break; |
| 562 | } |
| 563 | |
| 564 | return true; |
| 565 | } |
| 566 | |
| 567 | /* |
| 568 | * Traverse IBs and dump them to test vector. Detect swap by inspecting |
| 569 | * register writes, keeping note of the current state, and dump |
| 570 | * framebuffer config to test vector |
| 571 | */ |
| 572 | bool kgsl_cffdump_parse_ibs(struct kgsl_device_private *dev_priv, |
| 573 | const struct kgsl_memdesc *memdesc, uint gpuaddr, int sizedwords, |
| 574 | bool check_only) |
| 575 | { |
| 576 | static uint level; /* recursion level */ |
| 577 | bool ret = true; |
| 578 | uint host_size; |
| 579 | uint *hostaddr, *hoststart; |
| 580 | int dwords_left = sizedwords; /* dwords left in the current command |
| 581 | buffer */ |
| 582 | |
| 583 | if (level == 0) |
| 584 | kgsl_cffdump_addr_count = 0; |
| 585 | |
| 586 | if (memdesc == NULL) { |
| 587 | struct kgsl_mem_entry *entry; |
| 588 | spin_lock(&dev_priv->process_priv->mem_lock); |
| 589 | entry = kgsl_sharedmem_find_region(dev_priv->process_priv, |
| 590 | gpuaddr, sizedwords * sizeof(uint)); |
| 591 | spin_unlock(&dev_priv->process_priv->mem_lock); |
| 592 | if (entry == NULL) { |
| 593 | KGSL_CORE_ERR("did not find mapping " |
| 594 | "for gpuaddr: 0x%08x\n", gpuaddr); |
| 595 | return true; |
| 596 | } |
| 597 | memdesc = &entry->memdesc; |
| 598 | } |
| 599 | |
| 600 | hostaddr = (uint *)kgsl_gpuaddr_to_vaddr(memdesc, gpuaddr, &host_size); |
| 601 | if (hostaddr == NULL) { |
| 602 | KGSL_CORE_ERR("did not find mapping for " |
| 603 | "gpuaddr: 0x%08x\n", gpuaddr); |
| 604 | return true; |
| 605 | } |
| 606 | |
| 607 | hoststart = hostaddr; |
| 608 | |
| 609 | level++; |
| 610 | |
| 611 | if (!memdesc->physaddr) { |
| 612 | KGSL_CORE_ERR("no physaddr"); |
| 613 | return true; |
| 614 | } else { |
| 615 | mb(); |
Sushmita Susheelendra | 22d8717 | 2011-05-09 16:40:02 -0600 | [diff] [blame] | 616 | kgsl_cache_range_op((struct kgsl_memdesc *)memdesc, |
| 617 | KGSL_CACHE_OP_INV); |
Bryan Huntsman | 3f2bc4d | 2011-08-16 17:27:22 -0700 | [diff] [blame] | 618 | } |
| 619 | |
| 620 | #ifdef DEBUG |
| 621 | pr_info("kgsl: cffdump: ib: gpuaddr:0x%08x, wc:%d, hptr:%p\n", |
| 622 | gpuaddr, sizedwords, hostaddr); |
| 623 | #endif |
| 624 | |
| 625 | while (dwords_left > 0) { |
| 626 | int count = 0; /* dword count including packet header */ |
| 627 | bool cur_ret = true; |
| 628 | |
| 629 | switch (*hostaddr >> 30) { |
| 630 | case 0x0: /* type-0 */ |
| 631 | count = (*hostaddr >> 16)+2; |
| 632 | break; |
| 633 | case 0x1: /* type-1 */ |
| 634 | count = 2; |
| 635 | break; |
| 636 | case 0x3: /* type-3 */ |
| 637 | count = ((*hostaddr >> 16) & 0x3fff) + 2; |
| 638 | cur_ret = kgsl_cffdump_handle_type3(dev_priv, |
| 639 | hostaddr, check_only); |
| 640 | break; |
| 641 | default: |
| 642 | pr_warn("kgsl: cffdump: parse-ib: unexpected type: " |
| 643 | "type:%d, word:0x%08x @ 0x%p, gpu:0x%08x\n", |
| 644 | *hostaddr >> 30, *hostaddr, hostaddr, |
| 645 | gpuaddr+4*(sizedwords-dwords_left)); |
| 646 | cur_ret = false; |
| 647 | count = dwords_left; |
| 648 | break; |
| 649 | } |
| 650 | |
| 651 | #ifdef DEBUG |
| 652 | if (!cur_ret) { |
| 653 | pr_info("kgsl: cffdump: bad sub-type: #:%d/%d, v:0x%08x" |
| 654 | " @ 0x%p[gb:0x%08x], level:%d\n", |
| 655 | sizedwords-dwords_left, sizedwords, *hostaddr, |
| 656 | hostaddr, gpuaddr+4*(sizedwords-dwords_left), |
| 657 | level); |
| 658 | |
| 659 | print_hex_dump(KERN_ERR, level == 1 ? "IB1:" : "IB2:", |
| 660 | DUMP_PREFIX_OFFSET, 32, 4, hoststart, |
| 661 | sizedwords*4, 0); |
| 662 | } |
| 663 | #endif |
| 664 | ret = ret && cur_ret; |
| 665 | |
| 666 | /* jump to next packet */ |
| 667 | dwords_left -= count; |
| 668 | hostaddr += count; |
| 669 | cur_ret = dwords_left >= 0; |
| 670 | |
| 671 | #ifdef DEBUG |
| 672 | if (!cur_ret) { |
| 673 | pr_info("kgsl: cffdump: bad count: c:%d, #:%d/%d, " |
| 674 | "v:0x%08x @ 0x%p[gb:0x%08x], level:%d\n", |
| 675 | count, sizedwords-(dwords_left+count), |
| 676 | sizedwords, *(hostaddr-count), hostaddr-count, |
| 677 | gpuaddr+4*(sizedwords-(dwords_left+count)), |
| 678 | level); |
| 679 | |
| 680 | print_hex_dump(KERN_ERR, level == 1 ? "IB1:" : "IB2:", |
| 681 | DUMP_PREFIX_OFFSET, 32, 4, hoststart, |
| 682 | sizedwords*4, 0); |
| 683 | } |
| 684 | #endif |
| 685 | |
| 686 | ret = ret && cur_ret; |
| 687 | } |
| 688 | |
| 689 | if (!ret) |
| 690 | pr_info("kgsl: cffdump: parsing failed: gpuaddr:0x%08x, " |
| 691 | "host:0x%p, wc:%d\n", gpuaddr, hoststart, sizedwords); |
| 692 | |
| 693 | if (!check_only) { |
| 694 | #ifdef DEBUG |
| 695 | uint offset = gpuaddr - memdesc->gpuaddr; |
| 696 | pr_info("kgsl: cffdump: ib-dump: hostptr:%p, gpuaddr:%08x, " |
| 697 | "physaddr:%08x, offset:%d, size:%d", hoststart, |
| 698 | gpuaddr, memdesc->physaddr + offset, offset, |
| 699 | sizedwords*4); |
| 700 | #endif |
| 701 | kgsl_cffdump_syncmem(dev_priv, memdesc, gpuaddr, sizedwords*4, |
| 702 | false); |
| 703 | } |
| 704 | |
| 705 | level--; |
| 706 | |
| 707 | return ret; |
| 708 | } |
| 709 | |
| 710 | static int subbuf_start_handler(struct rchan_buf *buf, |
| 711 | void *subbuf, void *prev_subbuf, uint prev_padding) |
| 712 | { |
| 713 | pr_debug("kgsl: cffdump: subbuf_start_handler(subbuf=%p, prev_subbuf" |
| 714 | "=%p, prev_padding=%08x)\n", subbuf, prev_subbuf, prev_padding); |
| 715 | |
| 716 | if (relay_buf_full(buf)) { |
| 717 | if (!suspended) { |
| 718 | suspended = 1; |
| 719 | pr_warn("kgsl: cffdump: relay: cpu %d buffer full!!!\n", |
| 720 | smp_processor_id()); |
| 721 | } |
| 722 | dropped++; |
| 723 | return 0; |
| 724 | } else if (suspended) { |
| 725 | suspended = 0; |
| 726 | pr_warn("kgsl: cffdump: relay: cpu %d buffer no longer full.\n", |
| 727 | smp_processor_id()); |
| 728 | } |
| 729 | |
| 730 | subbuf_start_reserve(buf, 0); |
| 731 | return 1; |
| 732 | } |
| 733 | |
| 734 | static struct dentry *create_buf_file_handler(const char *filename, |
| 735 | struct dentry *parent, int mode, struct rchan_buf *buf, |
| 736 | int *is_global) |
| 737 | { |
| 738 | return debugfs_create_file(filename, mode, parent, buf, |
| 739 | &relay_file_operations); |
| 740 | } |
| 741 | |
| 742 | /* |
| 743 | * file_remove() default callback. Removes relay file in debugfs. |
| 744 | */ |
| 745 | static int remove_buf_file_handler(struct dentry *dentry) |
| 746 | { |
| 747 | pr_info("kgsl: cffdump: %s()\n", __func__); |
| 748 | debugfs_remove(dentry); |
| 749 | return 0; |
| 750 | } |
| 751 | |
| 752 | /* |
| 753 | * relay callbacks |
| 754 | */ |
| 755 | static struct rchan_callbacks relay_callbacks = { |
| 756 | .subbuf_start = subbuf_start_handler, |
| 757 | .create_buf_file = create_buf_file_handler, |
| 758 | .remove_buf_file = remove_buf_file_handler, |
| 759 | }; |
| 760 | |
| 761 | /** |
| 762 | * create_channel - creates channel /debug/klog/cpuXXX |
| 763 | * |
| 764 | * Creates channel along with associated produced/consumed control files |
| 765 | * |
| 766 | * Returns channel on success, NULL otherwise |
| 767 | */ |
| 768 | static struct rchan *create_channel(unsigned subbuf_size, unsigned n_subbufs) |
| 769 | { |
| 770 | struct rchan *chan; |
| 771 | |
| 772 | pr_info("kgsl: cffdump: relay: create_channel: subbuf_size %u, " |
| 773 | "n_subbufs %u, dir 0x%p\n", subbuf_size, n_subbufs, dir); |
| 774 | |
| 775 | chan = relay_open("cpu", dir, subbuf_size, |
| 776 | n_subbufs, &relay_callbacks, NULL); |
| 777 | if (!chan) { |
| 778 | KGSL_CORE_ERR("relay_open failed\n"); |
| 779 | return NULL; |
| 780 | } |
| 781 | |
| 782 | suspended = 0; |
| 783 | dropped = 0; |
| 784 | |
| 785 | return chan; |
| 786 | } |
| 787 | |
| 788 | /** |
| 789 | * destroy_channel - destroys channel /debug/kgsl/cff/cpuXXX |
| 790 | * |
| 791 | * Destroys channel along with associated produced/consumed control files |
| 792 | */ |
| 793 | static void destroy_channel(void) |
| 794 | { |
| 795 | pr_info("kgsl: cffdump: relay: destroy_channel\n"); |
| 796 | if (chan) { |
| 797 | relay_close(chan); |
| 798 | chan = NULL; |
| 799 | } |
| 800 | } |
| 801 | |