383 lines
11 KiB
C
383 lines
11 KiB
C
/* Copyright (c) 2012, The Linux Foundation. All rights reserved.
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License version 2 and
|
|
* only version 2 as published by the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
*/
|
|
|
|
#include "kgsl.h"
|
|
#include "adreno.h"
|
|
#include "kgsl_snapshot.h"
|
|
|
|
#define DEBUG_SECTION_SZ(_dwords) (((_dwords) * sizeof(unsigned int)) \
|
|
+ sizeof(struct kgsl_snapshot_debug))
|
|
|
|
/* Dump the SX debug registers into a GPU snapshot debug section */
|
|
|
|
#define SXDEBUG_COUNT 0x1B
|
|
|
|
static int a2xx_snapshot_sxdebug(struct kgsl_device *device, void *snapshot,
|
|
int remain, void *priv)
|
|
{
|
|
struct kgsl_snapshot_debug *header = snapshot;
|
|
unsigned int *data = snapshot + sizeof(*header);
|
|
int i;
|
|
|
|
if (remain < DEBUG_SECTION_SZ(SXDEBUG_COUNT)) {
|
|
SNAPSHOT_ERR_NOMEM(device, "SX DEBUG");
|
|
return 0;
|
|
}
|
|
|
|
header->type = SNAPSHOT_DEBUG_SX;
|
|
header->size = SXDEBUG_COUNT;
|
|
|
|
for (i = 0; i < SXDEBUG_COUNT; i++) {
|
|
adreno_regwrite(device, REG_RBBM_DEBUG_CNTL, 0x1B00 | i);
|
|
adreno_regread(device, REG_RBBM_DEBUG_OUT, &data[i]);
|
|
}
|
|
|
|
adreno_regwrite(device, REG_RBBM_DEBUG_CNTL, 0);
|
|
|
|
return DEBUG_SECTION_SZ(SXDEBUG_COUNT);
|
|
}
|
|
|
|
#define CPDEBUG_COUNT 0x20
|
|
|
|
static int a2xx_snapshot_cpdebug(struct kgsl_device *device, void *snapshot,
|
|
int remain, void *priv)
|
|
{
|
|
struct kgsl_snapshot_debug *header = snapshot;
|
|
unsigned int *data = snapshot + sizeof(*header);
|
|
int i;
|
|
|
|
if (remain < DEBUG_SECTION_SZ(CPDEBUG_COUNT)) {
|
|
SNAPSHOT_ERR_NOMEM(device, "CP DEBUG");
|
|
return 0;
|
|
}
|
|
|
|
header->type = SNAPSHOT_DEBUG_CP;
|
|
header->size = CPDEBUG_COUNT;
|
|
|
|
for (i = 0; i < CPDEBUG_COUNT; i++) {
|
|
adreno_regwrite(device, REG_RBBM_DEBUG_CNTL, 0x1628);
|
|
adreno_regread(device, REG_RBBM_DEBUG_OUT, &data[i]);
|
|
}
|
|
|
|
adreno_regwrite(device, REG_RBBM_DEBUG_CNTL, 0);
|
|
|
|
return DEBUG_SECTION_SZ(CPDEBUG_COUNT);
|
|
}
|
|
|
|
/*
|
|
* The contents of the SQ debug sections are dword pairs:
|
|
* [register offset]:[value]
|
|
* This macro writes both dwords for the given register
|
|
*/
|
|
|
|
#define SQ_DEBUG_WRITE(_device, _reg, _data, _offset) \
|
|
do { _data[(_offset)++] = (_reg); \
|
|
adreno_regread(_device, (_reg), &_data[(_offset)++]); } while (0)
|
|
|
|
#define SQ_DEBUG_BANK_SIZE 23
|
|
|
|
static int a2xx_snapshot_sqdebug(struct kgsl_device *device, void *snapshot,
|
|
int remain, void *priv)
|
|
{
|
|
struct kgsl_snapshot_debug *header = snapshot;
|
|
unsigned int *data = snapshot + sizeof(*header);
|
|
int i, offset = 0;
|
|
int size = SQ_DEBUG_BANK_SIZE * 2 * 2;
|
|
|
|
if (remain < DEBUG_SECTION_SZ(size)) {
|
|
SNAPSHOT_ERR_NOMEM(device, "SQ Debug");
|
|
return 0;
|
|
}
|
|
|
|
header->type = SNAPSHOT_DEBUG_SQ;
|
|
header->size = size;
|
|
|
|
for (i = 0; i < 2; i++) {
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_CONST_MGR_FSM+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_EXP_ALLOC+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_FSM_ALU_0+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_FSM_ALU_1+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_GPR_PIX+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_GPR_VTX+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_INPUT_FSM+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_MISC+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_MISC_0+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_MISC_1+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_PIX_TB_0+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_PIX_TB_STATE_MEM+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device,
|
|
REG_SQ_DEBUG_PIX_TB_STATUS_REG_0+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device,
|
|
REG_SQ_DEBUG_PIX_TB_STATUS_REG_1+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device,
|
|
REG_SQ_DEBUG_PIX_TB_STATUS_REG_2+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device,
|
|
REG_SQ_DEBUG_PIX_TB_STATUS_REG_3+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_PTR_BUFF+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_TB_STATUS_SEL+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_TP_FSM+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_VTX_TB_0+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_VTX_TB_1+i*0x1000,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_VTX_TB_STATE_MEM+i*0x1000,
|
|
data, offset);
|
|
}
|
|
|
|
return DEBUG_SECTION_SZ(size);
|
|
}
|
|
|
|
#define SQ_DEBUG_THREAD_SIZE 7
|
|
|
|
static int a2xx_snapshot_sqthreaddebug(struct kgsl_device *device,
|
|
void *snapshot, int remain, void *priv)
|
|
{
|
|
struct kgsl_snapshot_debug *header = snapshot;
|
|
unsigned int *data = snapshot + sizeof(*header);
|
|
int i, offset = 0;
|
|
int size = SQ_DEBUG_THREAD_SIZE * 2 * 16;
|
|
|
|
if (remain < DEBUG_SECTION_SZ(size)) {
|
|
SNAPSHOT_ERR_NOMEM(device, "SQ THREAD DEBUG");
|
|
return 0;
|
|
}
|
|
|
|
header->type = SNAPSHOT_DEBUG_SQTHREAD;
|
|
header->size = size;
|
|
|
|
for (i = 0; i < 16; i++) {
|
|
adreno_regwrite(device, REG_SQ_DEBUG_TB_STATUS_SEL,
|
|
i | (6<<4) | (i<<7) | (1<<11) | (1<<12)
|
|
| (i<<16) | (6<<20) | (i<<23));
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_VTX_TB_STATE_MEM,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_VTX_TB_STATUS_REG,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_PIX_TB_STATE_MEM,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_PIX_TB_STATUS_REG_0,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_PIX_TB_STATUS_REG_1,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_PIX_TB_STATUS_REG_2,
|
|
data, offset);
|
|
SQ_DEBUG_WRITE(device, REG_SQ_DEBUG_PIX_TB_STATUS_REG_3,
|
|
data, offset);
|
|
}
|
|
|
|
return DEBUG_SECTION_SZ(size);
|
|
}
|
|
|
|
#define MIUDEBUG_COUNT 0x10
|
|
|
|
static int a2xx_snapshot_miudebug(struct kgsl_device *device, void *snapshot,
|
|
int remain, void *priv)
|
|
{
|
|
struct kgsl_snapshot_debug *header = snapshot;
|
|
unsigned int *data = snapshot + sizeof(*header);
|
|
int i;
|
|
|
|
if (remain < DEBUG_SECTION_SZ(MIUDEBUG_COUNT)) {
|
|
SNAPSHOT_ERR_NOMEM(device, "MIU DEBUG");
|
|
return 0;
|
|
}
|
|
|
|
header->type = SNAPSHOT_DEBUG_MIU;
|
|
header->size = MIUDEBUG_COUNT;
|
|
|
|
for (i = 0; i < MIUDEBUG_COUNT; i++) {
|
|
adreno_regwrite(device, REG_RBBM_DEBUG_CNTL, 0x1600 | i);
|
|
adreno_regread(device, REG_RBBM_DEBUG_OUT, &data[i]);
|
|
}
|
|
|
|
adreno_regwrite(device, REG_RBBM_DEBUG_CNTL, 0);
|
|
|
|
return DEBUG_SECTION_SZ(MIUDEBUG_COUNT);
|
|
}
|
|
|
|
/* Snapshot the istore memory */
|
|
static int a2xx_snapshot_istore(struct kgsl_device *device, void *snapshot,
|
|
int remain, void *priv)
|
|
{
|
|
struct kgsl_snapshot_istore *header = snapshot;
|
|
unsigned int *data = snapshot + sizeof(*header);
|
|
struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
|
|
int count, i;
|
|
|
|
count = adreno_dev->istore_size * adreno_dev->instruction_size;
|
|
|
|
if (remain < (count * 4) + sizeof(*header)) {
|
|
KGSL_DRV_ERR(device,
|
|
"snapshot: Not enough memory for the istore section");
|
|
return 0;
|
|
}
|
|
|
|
header->count = adreno_dev->istore_size;
|
|
|
|
for (i = 0; i < count; i++)
|
|
kgsl_regread(device, ADRENO_ISTORE_START + i, &data[i]);
|
|
|
|
return (count * 4) + sizeof(*header);
|
|
}
|
|
|
|
/* A2XX GPU snapshot function - this is where all of the A2XX specific
|
|
* bits and pieces are grabbed into the snapshot memory
|
|
*/
|
|
|
|
void *a2xx_snapshot(struct adreno_device *adreno_dev, void *snapshot,
|
|
int *remain, int hang)
|
|
{
|
|
struct kgsl_device *device = &adreno_dev->dev;
|
|
struct kgsl_snapshot_registers_list list;
|
|
struct kgsl_snapshot_registers regs;
|
|
unsigned int pmoverride;
|
|
|
|
/* Choose the register set to dump */
|
|
|
|
if (adreno_is_a20x(adreno_dev)) {
|
|
regs.regs = (unsigned int *) a200_registers;
|
|
regs.count = a200_registers_count;
|
|
} else if (adreno_is_a220(adreno_dev)) {
|
|
regs.regs = (unsigned int *) a220_registers;
|
|
regs.count = a220_registers_count;
|
|
} else if (adreno_is_a225(adreno_dev)) {
|
|
regs.regs = (unsigned int *) a225_registers;
|
|
regs.count = a225_registers_count;
|
|
}
|
|
|
|
list.registers = ®s;
|
|
list.count = 1;
|
|
|
|
/* Master set of (non debug) registers */
|
|
snapshot = kgsl_snapshot_add_section(device,
|
|
KGSL_SNAPSHOT_SECTION_REGS, snapshot, remain,
|
|
kgsl_snapshot_dump_regs, &list);
|
|
|
|
/* CP_STATE_DEBUG indexed registers */
|
|
snapshot = kgsl_snapshot_indexed_registers(device, snapshot,
|
|
remain, REG_CP_STATE_DEBUG_INDEX,
|
|
REG_CP_STATE_DEBUG_DATA, 0x0, 0x14);
|
|
|
|
/* CP_ME indexed registers */
|
|
snapshot = kgsl_snapshot_indexed_registers(device, snapshot,
|
|
remain, REG_CP_ME_CNTL, REG_CP_ME_STATUS,
|
|
64, 44);
|
|
|
|
/*
|
|
* Need to temporarily turn off clock gating for the debug bus to
|
|
* work
|
|
*/
|
|
|
|
adreno_regread(device, REG_RBBM_PM_OVERRIDE2, &pmoverride);
|
|
adreno_regwrite(device, REG_RBBM_PM_OVERRIDE2, 0xFF);
|
|
|
|
/* SX debug registers */
|
|
snapshot = kgsl_snapshot_add_section(device,
|
|
KGSL_SNAPSHOT_SECTION_DEBUG, snapshot, remain,
|
|
a2xx_snapshot_sxdebug, NULL);
|
|
|
|
/* SU debug indexed registers (only for < 470) */
|
|
if (!adreno_is_a22x(adreno_dev))
|
|
snapshot = kgsl_snapshot_indexed_registers(device, snapshot,
|
|
remain, REG_PA_SU_DEBUG_CNTL,
|
|
REG_PA_SU_DEBUG_DATA,
|
|
0, 0x1B);
|
|
|
|
/* CP debug registers */
|
|
snapshot = kgsl_snapshot_add_section(device,
|
|
KGSL_SNAPSHOT_SECTION_DEBUG, snapshot, remain,
|
|
a2xx_snapshot_cpdebug, NULL);
|
|
|
|
/* MH debug indexed registers */
|
|
snapshot = kgsl_snapshot_indexed_registers(device, snapshot,
|
|
remain, MH_DEBUG_CTRL, MH_DEBUG_DATA, 0x0, 0x40);
|
|
|
|
/* Leia only register sets */
|
|
if (adreno_is_a22x(adreno_dev)) {
|
|
/* RB DEBUG indexed regisers */
|
|
snapshot = kgsl_snapshot_indexed_registers(device, snapshot,
|
|
remain, REG_RB_DEBUG_CNTL, REG_RB_DEBUG_DATA, 0, 8);
|
|
|
|
/* RB DEBUG indexed registers bank 2 */
|
|
snapshot = kgsl_snapshot_indexed_registers(device, snapshot,
|
|
remain, REG_RB_DEBUG_CNTL, REG_RB_DEBUG_DATA + 0x1000,
|
|
0, 8);
|
|
|
|
/* PC_DEBUG indexed registers */
|
|
snapshot = kgsl_snapshot_indexed_registers(device, snapshot,
|
|
remain, REG_PC_DEBUG_CNTL, REG_PC_DEBUG_DATA, 0, 8);
|
|
|
|
/* GRAS_DEBUG indexed registers */
|
|
snapshot = kgsl_snapshot_indexed_registers(device, snapshot,
|
|
remain, REG_GRAS_DEBUG_CNTL, REG_GRAS_DEBUG_DATA, 0, 4);
|
|
|
|
/* MIU debug registers */
|
|
snapshot = kgsl_snapshot_add_section(device,
|
|
KGSL_SNAPSHOT_SECTION_DEBUG, snapshot, remain,
|
|
a2xx_snapshot_miudebug, NULL);
|
|
|
|
/* SQ DEBUG debug registers */
|
|
snapshot = kgsl_snapshot_add_section(device,
|
|
KGSL_SNAPSHOT_SECTION_DEBUG, snapshot, remain,
|
|
a2xx_snapshot_sqdebug, NULL);
|
|
|
|
/*
|
|
* Reading SQ THREAD causes bad things to happen on a running
|
|
* system, so only read it if the GPU is already hung
|
|
*/
|
|
|
|
if (hang) {
|
|
/* SQ THREAD debug registers */
|
|
snapshot = kgsl_snapshot_add_section(device,
|
|
KGSL_SNAPSHOT_SECTION_DEBUG, snapshot, remain,
|
|
a2xx_snapshot_sqthreaddebug, NULL);
|
|
}
|
|
}
|
|
|
|
/*
|
|
* Only dump the istore on a hang - reading it on a running system
|
|
* has a non zero chance of hanging the GPU.
|
|
*/
|
|
|
|
if (adreno_is_a2xx(adreno_dev) && hang) {
|
|
snapshot = kgsl_snapshot_add_section(device,
|
|
KGSL_SNAPSHOT_SECTION_ISTORE, snapshot, remain,
|
|
a2xx_snapshot_istore, NULL);
|
|
}
|
|
|
|
|
|
/* Reset the clock gating */
|
|
adreno_regwrite(device, REG_RBBM_PM_OVERRIDE2, pmoverride);
|
|
|
|
return snapshot;
|
|
}
|