880d405719
git-subtree-dir: qcom/opensource/graphics-kernel git-subtree-mainline:992813d9c1
git-subtree-split:b4fdc4c042
Change-Id: repo: https://git.codelinaro.org/clo/la/platform/vendor/qcom/opensource/graphics-kernel tag: GRAPHICS.LA.14.0.r1-07700-lanai.0
1408 lines
36 KiB
C
1408 lines
36 KiB
C
// SPDX-License-Identifier: GPL-2.0-only
|
|
/*
|
|
* Copyright (c) 2020-2021, The Linux Foundation. All rights reserved.
|
|
* Copyright (c) 2022-2024, Qualcomm Innovation Center, Inc. All rights reserved.
|
|
*/
|
|
|
|
#include <linux/clk.h>
|
|
#include <linux/component.h>
|
|
#include <linux/interconnect.h>
|
|
|
|
#include "adreno.h"
|
|
#include "adreno_a6xx.h"
|
|
#include "adreno_a6xx_hwsched.h"
|
|
#include "adreno_hfi.h"
|
|
#include "adreno_snapshot.h"
|
|
#include "kgsl_bus.h"
|
|
#include "kgsl_device.h"
|
|
#include "kgsl_trace.h"
|
|
|
|
static size_t adreno_hwsched_snapshot_rb(struct kgsl_device *device, u8 *buf,
|
|
size_t remain, void *priv)
|
|
{
|
|
struct kgsl_snapshot_rb_v2 *header = (struct kgsl_snapshot_rb_v2 *)buf;
|
|
u32 *data = (u32 *)(buf + sizeof(*header));
|
|
struct kgsl_memdesc *rb = (struct kgsl_memdesc *)priv;
|
|
|
|
if (remain < rb->size + sizeof(*header)) {
|
|
SNAPSHOT_ERR_NOMEM(device, "RB");
|
|
return 0;
|
|
}
|
|
|
|
header->start = 0;
|
|
header->end = rb->size >> 2;
|
|
header->rptr = 0;
|
|
header->rbsize = rb->size >> 2;
|
|
header->count = rb->size >> 2;
|
|
header->timestamp_queued = 0;
|
|
header->timestamp_retired = 0;
|
|
header->gpuaddr = rb->gpuaddr;
|
|
header->id = 0;
|
|
|
|
memcpy(data, rb->hostptr, rb->size);
|
|
|
|
return rb->size + sizeof(*header);
|
|
}
|
|
|
|
static void a6xx_hwsched_snapshot_preemption_record(struct kgsl_device *device,
|
|
struct kgsl_snapshot *snapshot, struct kgsl_memdesc *md, u64 offset)
|
|
{
|
|
struct kgsl_snapshot_section_header *section_header =
|
|
(struct kgsl_snapshot_section_header *)snapshot->ptr;
|
|
u8 *dest = snapshot->ptr + sizeof(*section_header);
|
|
struct kgsl_snapshot_gpu_object_v2 *header =
|
|
(struct kgsl_snapshot_gpu_object_v2 *)dest;
|
|
const struct adreno_a6xx_core *a6xx_core = to_a6xx_core(ADRENO_DEVICE(device));
|
|
u64 ctxt_record_size = A6XX_CP_CTXRECORD_SIZE_IN_BYTES;
|
|
size_t section_size;
|
|
|
|
if (a6xx_core->ctxt_record_size)
|
|
ctxt_record_size = a6xx_core->ctxt_record_size;
|
|
|
|
ctxt_record_size = min_t(u64, ctxt_record_size, device->snapshot_ctxt_record_size);
|
|
|
|
section_size = sizeof(*section_header) + sizeof(*header) + ctxt_record_size;
|
|
|
|
if (snapshot->remain < section_size) {
|
|
SNAPSHOT_ERR_NOMEM(device, "PREEMPTION RECORD");
|
|
return;
|
|
}
|
|
|
|
section_header->magic = SNAPSHOT_SECTION_MAGIC;
|
|
section_header->id = KGSL_SNAPSHOT_SECTION_GPU_OBJECT_V2;
|
|
section_header->size = section_size;
|
|
|
|
header->size = ctxt_record_size >> 2;
|
|
header->gpuaddr = md->gpuaddr + offset;
|
|
header->ptbase =
|
|
kgsl_mmu_pagetable_get_ttbr0(device->mmu.defaultpagetable);
|
|
header->type = SNAPSHOT_GPU_OBJECT_GLOBAL;
|
|
|
|
dest += sizeof(*header);
|
|
|
|
memcpy(dest, md->hostptr + offset, ctxt_record_size);
|
|
|
|
snapshot->ptr += section_header->size;
|
|
snapshot->remain -= section_header->size;
|
|
snapshot->size += section_header->size;
|
|
}
|
|
|
|
static void snapshot_preemption_records(struct kgsl_device *device,
|
|
struct kgsl_snapshot *snapshot, struct kgsl_memdesc *md)
|
|
{
|
|
const struct adreno_a6xx_core *a6xx_core =
|
|
to_a6xx_core(ADRENO_DEVICE(device));
|
|
u64 ctxt_record_size = A6XX_CP_CTXRECORD_SIZE_IN_BYTES;
|
|
u64 offset;
|
|
|
|
if (a6xx_core->ctxt_record_size)
|
|
ctxt_record_size = a6xx_core->ctxt_record_size;
|
|
|
|
/* All preemption records exist as a single mem alloc entry */
|
|
for (offset = 0; offset < md->size; offset += ctxt_record_size)
|
|
a6xx_hwsched_snapshot_preemption_record(device, snapshot, md,
|
|
offset);
|
|
}
|
|
|
|
static void *get_rb_hostptr(struct adreno_device *adreno_dev,
|
|
u64 gpuaddr, u32 size)
|
|
{
|
|
struct a6xx_hwsched_hfi *hw_hfi = to_a6xx_hwsched_hfi(adreno_dev);
|
|
u64 offset;
|
|
u32 i;
|
|
|
|
for (i = 0; i < hw_hfi->mem_alloc_entries; i++) {
|
|
struct kgsl_memdesc *md = hw_hfi->mem_alloc_table[i].md;
|
|
|
|
if (md && (gpuaddr >= md->gpuaddr) &&
|
|
((gpuaddr + size) <= (md->gpuaddr + md->size))) {
|
|
offset = gpuaddr - md->gpuaddr;
|
|
return md->hostptr + offset;
|
|
}
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
static u32 a6xx_copy_gpu_global(void *out, void *in, u32 size)
|
|
{
|
|
if (out && in) {
|
|
memcpy(out, in, size);
|
|
return size;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
|
|
static void adreno_hwsched_snapshot_rb_payload(struct adreno_device *adreno_dev,
|
|
struct kgsl_snapshot *snapshot, struct payload_section *payload)
|
|
{
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
struct kgsl_snapshot_section_header *section_header =
|
|
(struct kgsl_snapshot_section_header *)snapshot->ptr;
|
|
u8 *buf = snapshot->ptr + sizeof(*section_header);
|
|
struct kgsl_snapshot_rb_v2 *header = (struct kgsl_snapshot_rb_v2 *)buf;
|
|
u32 *data = (u32 *)(buf + sizeof(*header));
|
|
u32 size = adreno_hwsched_parse_payload(payload, KEY_RB_SIZEDWORDS) << 2;
|
|
u64 lo, hi, gpuaddr;
|
|
void *rb_hostptr;
|
|
char str[16];
|
|
|
|
lo = adreno_hwsched_parse_payload(payload, KEY_RB_GPUADDR_LO);
|
|
hi = adreno_hwsched_parse_payload(payload, KEY_RB_GPUADDR_HI);
|
|
gpuaddr = hi << 32 | lo;
|
|
|
|
/* Sanity check to make sure there is enough for the header */
|
|
if (snapshot->remain < sizeof(*section_header))
|
|
goto err;
|
|
|
|
rb_hostptr = get_rb_hostptr(adreno_dev, gpuaddr, size);
|
|
|
|
/* If the gpuaddress and size don't match any allocation, then abort */
|
|
if (((snapshot->remain - sizeof(*section_header)) <
|
|
(size + sizeof(*header))) ||
|
|
!a6xx_copy_gpu_global(data, rb_hostptr, size))
|
|
goto err;
|
|
|
|
if (device->dump_all_ibs) {
|
|
u64 rbaddr;
|
|
|
|
kgsl_regread64(device, A6XX_CP_RB_BASE,
|
|
A6XX_CP_RB_BASE_HI, &rbaddr);
|
|
|
|
/* Parse all IBs from current RB */
|
|
if (rbaddr == gpuaddr)
|
|
adreno_snapshot_dump_all_ibs(device, rb_hostptr, snapshot);
|
|
}
|
|
|
|
header->start = 0;
|
|
header->end = size >> 2;
|
|
header->rptr = adreno_hwsched_parse_payload(payload, KEY_RB_RPTR);
|
|
header->wptr = adreno_hwsched_parse_payload(payload, KEY_RB_WPTR);
|
|
header->rbsize = size >> 2;
|
|
header->count = size >> 2;
|
|
header->timestamp_queued = adreno_hwsched_parse_payload(payload,
|
|
KEY_RB_QUEUED_TS);
|
|
header->timestamp_retired = adreno_hwsched_parse_payload(payload,
|
|
KEY_RB_RETIRED_TS);
|
|
header->gpuaddr = gpuaddr;
|
|
header->id = adreno_hwsched_parse_payload(payload, KEY_RB_ID);
|
|
|
|
section_header->magic = SNAPSHOT_SECTION_MAGIC;
|
|
section_header->id = KGSL_SNAPSHOT_SECTION_RB_V2;
|
|
section_header->size = size + sizeof(*header) + sizeof(*section_header);
|
|
|
|
snapshot->ptr += section_header->size;
|
|
snapshot->remain -= section_header->size;
|
|
snapshot->size += section_header->size;
|
|
|
|
return;
|
|
err:
|
|
snprintf(str, sizeof(str), "RB addr:0x%llx", gpuaddr);
|
|
SNAPSHOT_ERR_NOMEM(device, str);
|
|
}
|
|
|
|
static bool parse_payload_rb_legacy(struct adreno_device *adreno_dev,
|
|
struct kgsl_snapshot *snapshot)
|
|
{
|
|
struct hfi_context_bad_cmd_legacy *cmd = adreno_dev->hwsched.ctxt_bad;
|
|
u32 i = 0, payload_bytes;
|
|
void *start;
|
|
bool ret = false;
|
|
|
|
/* Skip if we didn't receive a context bad HFI */
|
|
if (!cmd->hdr)
|
|
return false;
|
|
|
|
payload_bytes = (MSG_HDR_GET_SIZE(cmd->hdr) << 2) -
|
|
offsetof(struct hfi_context_bad_cmd_legacy, payload);
|
|
|
|
start = &cmd->payload[0];
|
|
|
|
while (i < payload_bytes) {
|
|
struct payload_section *payload = start + i;
|
|
|
|
if (payload->type == PAYLOAD_RB) {
|
|
adreno_hwsched_snapshot_rb_payload(adreno_dev, snapshot, payload);
|
|
ret = true;
|
|
}
|
|
|
|
i += sizeof(*payload) + (payload->dwords << 2);
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
static bool parse_payload_rb(struct adreno_device *adreno_dev,
|
|
struct kgsl_snapshot *snapshot)
|
|
{
|
|
struct hfi_context_bad_cmd *cmd = adreno_dev->hwsched.ctxt_bad;
|
|
u32 i = 0, payload_bytes;
|
|
void *start;
|
|
bool ret = false;
|
|
|
|
/* Skip if we didn't receive a context bad HFI */
|
|
if (!cmd->hdr)
|
|
return false;
|
|
|
|
payload_bytes = (MSG_HDR_GET_SIZE(cmd->hdr) << 2) -
|
|
offsetof(struct hfi_context_bad_cmd, payload);
|
|
|
|
start = &cmd->payload[0];
|
|
|
|
while (i < payload_bytes) {
|
|
struct payload_section *payload = start + i;
|
|
|
|
if (payload->type == PAYLOAD_RB) {
|
|
adreno_hwsched_snapshot_rb_payload(adreno_dev,
|
|
snapshot, payload);
|
|
ret = true;
|
|
}
|
|
|
|
i += sizeof(*payload) + (payload->dwords << 2);
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
void a6xx_hwsched_snapshot(struct adreno_device *adreno_dev,
|
|
struct kgsl_snapshot *snapshot)
|
|
{
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
struct a6xx_hwsched_hfi *hw_hfi = to_a6xx_hwsched_hfi(adreno_dev);
|
|
u32 i;
|
|
bool skip_memkind_rb = false;
|
|
bool parse_payload;
|
|
|
|
a6xx_gmu_snapshot(adreno_dev, snapshot);
|
|
|
|
adreno_hwsched_parse_fault_cmdobj(adreno_dev, snapshot);
|
|
|
|
/*
|
|
* First try to dump ringbuffers using context bad HFI payloads
|
|
* because they have all the ringbuffer parameters. If ringbuffer
|
|
* payloads are not present, fall back to dumping ringbuffers
|
|
* based on MEMKIND_RB
|
|
*/
|
|
if (GMU_VER_MINOR(gmu->ver.hfi) < 2)
|
|
parse_payload = parse_payload_rb_legacy(adreno_dev, snapshot);
|
|
else
|
|
parse_payload = parse_payload_rb(adreno_dev, snapshot);
|
|
|
|
if (parse_payload)
|
|
skip_memkind_rb = true;
|
|
|
|
for (i = 0; i < hw_hfi->mem_alloc_entries; i++) {
|
|
struct hfi_mem_alloc_entry *entry = &hw_hfi->mem_alloc_table[i];
|
|
|
|
if (entry->desc.mem_kind == HFI_MEMKIND_RB && !skip_memkind_rb)
|
|
kgsl_snapshot_add_section(device,
|
|
KGSL_SNAPSHOT_SECTION_RB_V2,
|
|
snapshot, adreno_hwsched_snapshot_rb,
|
|
entry->md);
|
|
|
|
if (entry->desc.mem_kind == HFI_MEMKIND_SCRATCH)
|
|
kgsl_snapshot_add_section(device,
|
|
KGSL_SNAPSHOT_SECTION_GPU_OBJECT_V2,
|
|
snapshot, adreno_snapshot_global,
|
|
entry->md);
|
|
|
|
if (entry->desc.mem_kind == HFI_MEMKIND_PROFILE)
|
|
kgsl_snapshot_add_section(device,
|
|
KGSL_SNAPSHOT_SECTION_GPU_OBJECT_V2,
|
|
snapshot, adreno_snapshot_global,
|
|
entry->md);
|
|
|
|
if (entry->desc.mem_kind == HFI_MEMKIND_CSW_SMMU_INFO)
|
|
kgsl_snapshot_add_section(device,
|
|
KGSL_SNAPSHOT_SECTION_GPU_OBJECT_V2,
|
|
snapshot, adreno_snapshot_global,
|
|
entry->md);
|
|
|
|
if (entry->desc.mem_kind == HFI_MEMKIND_CSW_PRIV_NON_SECURE)
|
|
snapshot_preemption_records(device, snapshot,
|
|
entry->md);
|
|
|
|
if (entry->desc.mem_kind == HFI_MEMKIND_PREEMPT_SCRATCH)
|
|
kgsl_snapshot_add_section(device,
|
|
KGSL_SNAPSHOT_SECTION_GPU_OBJECT_V2,
|
|
snapshot, adreno_snapshot_global,
|
|
entry->md);
|
|
}
|
|
}
|
|
|
|
static int a6xx_hwsched_gmu_first_boot(struct adreno_device *adreno_dev)
|
|
{
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
struct kgsl_pwrctrl *pwr = &device->pwrctrl;
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
int level, ret = 0;
|
|
|
|
kgsl_pwrctrl_request_state(device, KGSL_STATE_AWARE);
|
|
|
|
a6xx_gmu_aop_send_acd_state(gmu, adreno_dev->acd_enabled);
|
|
|
|
ret = kgsl_pwrctrl_enable_cx_gdsc(device);
|
|
if (ret)
|
|
return ret;
|
|
|
|
ret = a6xx_gmu_enable_clks(adreno_dev, GMU_MAX_PWRLEVELS - 1);
|
|
if (ret)
|
|
goto gdsc_off;
|
|
|
|
ret = a6xx_gmu_load_fw(adreno_dev);
|
|
if (ret)
|
|
goto clks_gdsc_off;
|
|
|
|
ret = a6xx_gmu_itcm_shadow(adreno_dev);
|
|
if (ret)
|
|
goto clks_gdsc_off;
|
|
|
|
if (!test_bit(GMU_PRIV_PDC_RSC_LOADED, &gmu->flags)) {
|
|
ret = a6xx_load_pdc_ucode(adreno_dev);
|
|
if (ret)
|
|
goto clks_gdsc_off;
|
|
|
|
a6xx_load_rsc_ucode(adreno_dev);
|
|
set_bit(GMU_PRIV_PDC_RSC_LOADED, &gmu->flags);
|
|
}
|
|
|
|
a6xx_gmu_register_config(adreno_dev);
|
|
|
|
a6xx_gmu_version_info(adreno_dev);
|
|
|
|
if (GMU_VER_MINOR(gmu->ver.hfi) < 2)
|
|
set_bit(ADRENO_HWSCHED_CTX_BAD_LEGACY, &adreno_dev->hwsched.flags);
|
|
|
|
a6xx_gmu_irq_enable(adreno_dev);
|
|
|
|
/* Vote for minimal DDR BW for GMU to init */
|
|
level = pwr->pwrlevels[pwr->default_pwrlevel].bus_min;
|
|
|
|
icc_set_bw(pwr->icc_path, 0, kBps_to_icc(pwr->ddr_table[level]));
|
|
|
|
/* Clear any hwsched faults that might have been left over */
|
|
adreno_hwsched_clear_fault(adreno_dev);
|
|
|
|
ret = a6xx_gmu_device_start(adreno_dev);
|
|
if (ret)
|
|
goto err;
|
|
|
|
ret = a6xx_hwsched_hfi_start(adreno_dev);
|
|
if (ret)
|
|
goto err;
|
|
|
|
icc_set_bw(pwr->icc_path, 0, 0);
|
|
|
|
device->gmu_fault = false;
|
|
|
|
kgsl_pwrctrl_set_state(device, KGSL_STATE_AWARE);
|
|
|
|
return 0;
|
|
|
|
err:
|
|
a6xx_gmu_irq_disable(adreno_dev);
|
|
|
|
if (device->gmu_fault) {
|
|
a6xx_gmu_suspend(adreno_dev);
|
|
|
|
return ret;
|
|
}
|
|
|
|
clks_gdsc_off:
|
|
clk_bulk_disable_unprepare(gmu->num_clks, gmu->clks);
|
|
|
|
gdsc_off:
|
|
a6xx_gmu_disable_gdsc(adreno_dev);
|
|
|
|
a6xx_rdpm_cx_freq_update(gmu, 0);
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int a6xx_hwsched_gmu_boot(struct adreno_device *adreno_dev)
|
|
{
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
int ret = 0;
|
|
|
|
kgsl_pwrctrl_request_state(device, KGSL_STATE_AWARE);
|
|
|
|
ret = kgsl_pwrctrl_enable_cx_gdsc(device);
|
|
if (ret)
|
|
return ret;
|
|
|
|
ret = a6xx_gmu_enable_clks(adreno_dev, GMU_MAX_PWRLEVELS - 1);
|
|
if (ret)
|
|
goto gdsc_off;
|
|
|
|
ret = a6xx_rscc_wakeup_sequence(adreno_dev);
|
|
if (ret)
|
|
goto clks_gdsc_off;
|
|
|
|
ret = a6xx_gmu_load_fw(adreno_dev);
|
|
if (ret)
|
|
goto clks_gdsc_off;
|
|
|
|
a6xx_gmu_register_config(adreno_dev);
|
|
|
|
a6xx_gmu_irq_enable(adreno_dev);
|
|
|
|
/* Clear any hwsched faults that might have been left over */
|
|
adreno_hwsched_clear_fault(adreno_dev);
|
|
|
|
ret = a6xx_gmu_device_start(adreno_dev);
|
|
if (ret)
|
|
goto err;
|
|
|
|
ret = a6xx_hwsched_hfi_start(adreno_dev);
|
|
if (ret)
|
|
goto err;
|
|
|
|
device->gmu_fault = false;
|
|
|
|
kgsl_pwrctrl_set_state(device, KGSL_STATE_AWARE);
|
|
|
|
return 0;
|
|
err:
|
|
a6xx_gmu_irq_disable(adreno_dev);
|
|
|
|
if (device->gmu_fault) {
|
|
a6xx_gmu_suspend(adreno_dev);
|
|
|
|
return ret;
|
|
}
|
|
|
|
clks_gdsc_off:
|
|
clk_bulk_disable_unprepare(gmu->num_clks, gmu->clks);
|
|
|
|
gdsc_off:
|
|
a6xx_gmu_disable_gdsc(adreno_dev);
|
|
|
|
a6xx_rdpm_cx_freq_update(gmu, 0);
|
|
|
|
return ret;
|
|
}
|
|
|
|
void a6xx_hwsched_active_count_put(struct adreno_device *adreno_dev)
|
|
{
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
|
|
if (WARN_ON(!mutex_is_locked(&device->mutex)))
|
|
return;
|
|
|
|
if (WARN(atomic_read(&device->active_cnt) == 0,
|
|
"Unbalanced get/put calls to KGSL active count\n"))
|
|
return;
|
|
|
|
if (atomic_dec_and_test(&device->active_cnt)) {
|
|
kgsl_pwrscale_update_stats(device);
|
|
kgsl_pwrscale_update(device);
|
|
kgsl_start_idle_timer(device);
|
|
}
|
|
|
|
trace_kgsl_active_count(device,
|
|
(unsigned long) __builtin_return_address(0));
|
|
|
|
wake_up(&device->active_cnt_wq);
|
|
}
|
|
|
|
static int a6xx_hwsched_notify_slumber(struct adreno_device *adreno_dev)
|
|
{
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
struct kgsl_pwrctrl *pwr = &device->pwrctrl;
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
struct hfi_prep_slumber_cmd req;
|
|
int ret;
|
|
|
|
ret = CMD_MSG_HDR(req, H2F_MSG_PREPARE_SLUMBER);
|
|
if (ret)
|
|
return ret;
|
|
|
|
req.freq = gmu->hfi.dcvs_table.gpu_level_num -
|
|
pwr->default_pwrlevel - 1;
|
|
req.bw = pwr->pwrlevels[pwr->default_pwrlevel].bus_freq;
|
|
|
|
/* Disable the power counter so that the GMU is not busy */
|
|
gmu_core_regwrite(device, A6XX_GMU_CX_GMU_POWER_COUNTER_ENABLE, 0);
|
|
|
|
ret = a6xx_hfi_send_cmd_async(adreno_dev, &req, sizeof(req));
|
|
|
|
/*
|
|
* GEMNOC can enter power collapse state during GPU power down sequence.
|
|
* This could abort CX GDSC collapse. Assert Qactive to avoid this.
|
|
*/
|
|
if ((adreno_is_a662(adreno_dev) || adreno_is_a621(adreno_dev) ||
|
|
adreno_is_a635(adreno_dev)))
|
|
gmu_core_regwrite(device, A6XX_GPU_GMU_CX_GMU_CX_FALNEXT_INTF, 0x1);
|
|
|
|
return ret;
|
|
}
|
|
static int a6xx_hwsched_gmu_power_off(struct adreno_device *adreno_dev)
|
|
{
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
int ret = 0;
|
|
|
|
if (device->gmu_fault)
|
|
goto error;
|
|
|
|
/* Wait for the lowest idle level we requested */
|
|
ret = a6xx_gmu_wait_for_lowest_idle(adreno_dev);
|
|
if (ret)
|
|
goto error;
|
|
|
|
ret = a6xx_hwsched_notify_slumber(adreno_dev);
|
|
if (ret)
|
|
goto error;
|
|
|
|
ret = a6xx_gmu_wait_for_idle(adreno_dev);
|
|
if (ret)
|
|
goto error;
|
|
|
|
ret = a6xx_rscc_sleep_sequence(adreno_dev);
|
|
|
|
a6xx_rdpm_mx_freq_update(gmu, 0);
|
|
|
|
/* Now that we are done with GMU and GPU, Clear the GBIF */
|
|
ret = a6xx_halt_gbif(adreno_dev);
|
|
/* De-assert the halts */
|
|
kgsl_regwrite(device, A6XX_GBIF_HALT, 0x0);
|
|
|
|
a6xx_gmu_irq_disable(adreno_dev);
|
|
|
|
a6xx_hwsched_hfi_stop(adreno_dev);
|
|
|
|
clk_bulk_disable_unprepare(gmu->num_clks, gmu->clks);
|
|
|
|
a6xx_gmu_disable_gdsc(adreno_dev);
|
|
|
|
a6xx_rdpm_cx_freq_update(gmu, 0);
|
|
|
|
kgsl_pwrctrl_set_state(device, KGSL_STATE_NONE);
|
|
|
|
return ret;
|
|
|
|
error:
|
|
a6xx_gmu_irq_disable(adreno_dev);
|
|
a6xx_hwsched_hfi_stop(adreno_dev);
|
|
a6xx_gmu_suspend(adreno_dev);
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int a6xx_hwsched_gpu_boot(struct adreno_device *adreno_dev)
|
|
{
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
int ret;
|
|
|
|
ret = kgsl_mmu_start(device);
|
|
if (ret)
|
|
goto err;
|
|
|
|
ret = a6xx_gmu_oob_set(device, oob_gpu);
|
|
if (ret)
|
|
goto err;
|
|
|
|
/* Clear the busy_data stats - we're starting over from scratch */
|
|
memset(&adreno_dev->busy_data, 0, sizeof(adreno_dev->busy_data));
|
|
|
|
/* Restore performance counter registers with saved values */
|
|
adreno_perfcounter_restore(adreno_dev);
|
|
|
|
a6xx_start(adreno_dev);
|
|
|
|
/* Re-initialize the coresight registers if applicable */
|
|
adreno_coresight_start(adreno_dev);
|
|
|
|
adreno_perfcounter_start(adreno_dev);
|
|
|
|
/* Clear FSR here in case it is set from a previous pagefault */
|
|
kgsl_mmu_clear_fsr(&device->mmu);
|
|
|
|
a6xx_enable_gpu_irq(adreno_dev);
|
|
|
|
ret = a6xx_hwsched_cp_init(adreno_dev);
|
|
if (ret) {
|
|
a6xx_disable_gpu_irq(adreno_dev);
|
|
goto err;
|
|
}
|
|
|
|
/*
|
|
* At this point it is safe to assume that we recovered. Setting
|
|
* this field allows us to take a new snapshot for the next failure
|
|
* if we are prioritizing the first unrecoverable snapshot.
|
|
*/
|
|
if (device->snapshot)
|
|
device->snapshot->recovered = true;
|
|
|
|
device->reset_counter++;
|
|
err:
|
|
a6xx_gmu_oob_clear(device, oob_gpu);
|
|
|
|
if (ret)
|
|
a6xx_hwsched_gmu_power_off(adreno_dev);
|
|
|
|
return ret;
|
|
}
|
|
|
|
static void hwsched_idle_timer(struct timer_list *t)
|
|
{
|
|
struct kgsl_device *device = container_of(t, struct kgsl_device,
|
|
idle_timer);
|
|
|
|
kgsl_schedule_work(&device->idle_check_ws);
|
|
}
|
|
|
|
static int a6xx_hwsched_gmu_memory_init(struct adreno_device *adreno_dev)
|
|
{
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
|
|
/* GMU Virtual register bank */
|
|
if (IS_ERR_OR_NULL(gmu->vrb)) {
|
|
gmu->vrb = reserve_gmu_kernel_block(gmu, 0, GMU_VRB_SIZE,
|
|
GMU_NONCACHED_KERNEL, 0);
|
|
|
|
if (IS_ERR(gmu->vrb))
|
|
return PTR_ERR(gmu->vrb);
|
|
|
|
/* Populate size of the virtual register bank */
|
|
gmu_core_set_vrb_register(gmu->vrb->hostptr, VRB_SIZE_IDX,
|
|
gmu->vrb->size >> 2);
|
|
}
|
|
|
|
/* GMU trace log */
|
|
if (IS_ERR_OR_NULL(gmu->trace.md)) {
|
|
gmu->trace.md = reserve_gmu_kernel_block(gmu, 0,
|
|
GMU_TRACE_SIZE, GMU_NONCACHED_KERNEL, 0);
|
|
|
|
if (IS_ERR(gmu->trace.md))
|
|
return PTR_ERR(gmu->trace.md);
|
|
|
|
/* Pass trace buffer address to GMU through the VRB */
|
|
gmu_core_set_vrb_register(gmu->vrb->hostptr,
|
|
VRB_TRACE_BUFFER_ADDR_IDX,
|
|
gmu->trace.md->gmuaddr);
|
|
|
|
/* Initialize the GMU trace buffer header */
|
|
gmu_core_trace_header_init(&gmu->trace);
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int a6xx_hwsched_gmu_init(struct adreno_device *adreno_dev)
|
|
{
|
|
int ret;
|
|
|
|
ret = a6xx_gmu_parse_fw(adreno_dev);
|
|
if (ret)
|
|
return ret;
|
|
|
|
ret = a6xx_gmu_memory_init(adreno_dev);
|
|
if (ret)
|
|
return ret;
|
|
|
|
ret = a6xx_hwsched_gmu_memory_init(adreno_dev);
|
|
if (ret)
|
|
return ret;
|
|
|
|
return a6xx_hwsched_hfi_init(adreno_dev);
|
|
}
|
|
|
|
static void a6xx_hwsched_touch_wakeup(struct adreno_device *adreno_dev)
|
|
{
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
int ret;
|
|
|
|
/*
|
|
* Do not wake up a suspended device or until the first boot sequence
|
|
* has been completed.
|
|
*/
|
|
if (test_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags) ||
|
|
!test_bit(GMU_PRIV_FIRST_BOOT_DONE, &gmu->flags))
|
|
return;
|
|
|
|
if (test_bit(GMU_PRIV_GPU_STARTED, &gmu->flags))
|
|
goto done;
|
|
|
|
kgsl_pwrctrl_request_state(device, KGSL_STATE_ACTIVE);
|
|
|
|
ret = a6xx_hwsched_gmu_boot(adreno_dev);
|
|
if (ret)
|
|
return;
|
|
|
|
ret = a6xx_hwsched_gpu_boot(adreno_dev);
|
|
if (ret)
|
|
return;
|
|
|
|
kgsl_pwrscale_wake(device);
|
|
|
|
set_bit(GMU_PRIV_GPU_STARTED, &gmu->flags);
|
|
|
|
device->pwrctrl.last_stat_updated = ktime_get();
|
|
|
|
kgsl_pwrctrl_set_state(device, KGSL_STATE_ACTIVE);
|
|
|
|
done:
|
|
/*
|
|
* When waking up from a touch event we want to stay active long enough
|
|
* for the user to send a draw command. The default idle timer timeout
|
|
* is shorter than we want so go ahead and push the idle timer out
|
|
* further for this special case
|
|
*/
|
|
mod_timer(&device->idle_timer, jiffies +
|
|
msecs_to_jiffies(adreno_wake_timeout));
|
|
}
|
|
|
|
static int a6xx_hwsched_boot(struct adreno_device *adreno_dev)
|
|
{
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
int ret;
|
|
|
|
if (test_bit(GMU_PRIV_GPU_STARTED, &gmu->flags))
|
|
return 0;
|
|
|
|
kgsl_pwrctrl_request_state(device, KGSL_STATE_ACTIVE);
|
|
|
|
adreno_hwsched_start(adreno_dev);
|
|
|
|
if (IS_ENABLED(CONFIG_QCOM_KGSL_HIBERNATION) &&
|
|
!test_bit(GMU_PRIV_PDC_RSC_LOADED, &gmu->flags))
|
|
ret = a6xx_hwsched_gmu_first_boot(adreno_dev);
|
|
else
|
|
ret = a6xx_hwsched_gmu_boot(adreno_dev);
|
|
if (ret)
|
|
return ret;
|
|
|
|
ret = a6xx_hwsched_gpu_boot(adreno_dev);
|
|
if (ret)
|
|
return ret;
|
|
|
|
kgsl_start_idle_timer(device);
|
|
|
|
kgsl_pwrscale_wake(device);
|
|
|
|
set_bit(GMU_PRIV_GPU_STARTED, &gmu->flags);
|
|
|
|
device->pwrctrl.last_stat_updated = ktime_get();
|
|
|
|
kgsl_pwrctrl_set_state(device, KGSL_STATE_ACTIVE);
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int a6xx_hwsched_first_boot(struct adreno_device *adreno_dev)
|
|
{
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
int ret;
|
|
|
|
if (test_bit(GMU_PRIV_FIRST_BOOT_DONE, &gmu->flags))
|
|
return a6xx_hwsched_boot(adreno_dev);
|
|
|
|
if (adreno_preemption_feature_set(adreno_dev))
|
|
set_bit(ADRENO_DEVICE_PREEMPTION, &adreno_dev->priv);
|
|
|
|
adreno_hwsched_start(adreno_dev);
|
|
|
|
ret = a6xx_microcode_read(adreno_dev);
|
|
if (ret)
|
|
return ret;
|
|
|
|
ret = a6xx_init(adreno_dev);
|
|
if (ret)
|
|
return ret;
|
|
|
|
ret = a6xx_hwsched_gmu_init(adreno_dev);
|
|
if (ret)
|
|
return ret;
|
|
|
|
kgsl_pwrctrl_request_state(device, KGSL_STATE_ACTIVE);
|
|
|
|
ret = a6xx_hwsched_gmu_first_boot(adreno_dev);
|
|
if (ret)
|
|
return ret;
|
|
|
|
ret = a6xx_hwsched_gpu_boot(adreno_dev);
|
|
if (ret)
|
|
return ret;
|
|
|
|
adreno_get_bus_counters(adreno_dev);
|
|
|
|
adreno_dev->cooperative_reset = ADRENO_FEATURE(adreno_dev,
|
|
ADRENO_COOP_RESET);
|
|
|
|
set_bit(GMU_PRIV_FIRST_BOOT_DONE, &gmu->flags);
|
|
set_bit(GMU_PRIV_GPU_STARTED, &gmu->flags);
|
|
|
|
/*
|
|
* There is a possible deadlock scenario during kgsl firmware reading
|
|
* (request_firmware) and devfreq update calls. During first boot, kgsl
|
|
* device mutex is held and then request_firmware is called for reading
|
|
* firmware. request_firmware internally takes dev_pm_qos_mtx lock.
|
|
* Whereas in case of devfreq update calls triggered by thermal/bcl or
|
|
* devfreq sysfs, it first takes the same dev_pm_qos_mtx lock and then
|
|
* tries to take kgsl device mutex as part of get_dev_status/target
|
|
* calls. This results in deadlock when both thread are unable to acquire
|
|
* the mutex held by other thread. Enable devfreq updates now as we are
|
|
* done reading all firmware files.
|
|
*/
|
|
device->pwrscale.devfreq_enabled = true;
|
|
|
|
device->pwrctrl.last_stat_updated = ktime_get();
|
|
|
|
kgsl_pwrctrl_set_state(device, KGSL_STATE_ACTIVE);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int a6xx_hwsched_power_off(struct adreno_device *adreno_dev)
|
|
{
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
int ret;
|
|
|
|
if (!test_bit(GMU_PRIV_GPU_STARTED, &gmu->flags))
|
|
return 0;
|
|
|
|
kgsl_pwrctrl_request_state(device, KGSL_STATE_SLUMBER);
|
|
|
|
ret = a6xx_gmu_oob_set(device, oob_gpu);
|
|
if (ret) {
|
|
a6xx_gmu_oob_clear(device, oob_gpu);
|
|
goto no_gx_power;
|
|
}
|
|
|
|
kgsl_pwrscale_update_stats(device);
|
|
|
|
/* Save active coresight registers if applicable */
|
|
adreno_coresight_stop(adreno_dev);
|
|
|
|
/* Save physical performance counter values before GPU power down*/
|
|
adreno_perfcounter_save(adreno_dev);
|
|
|
|
adreno_irqctrl(adreno_dev, 0);
|
|
|
|
a6xx_gmu_oob_clear(device, oob_gpu);
|
|
|
|
no_gx_power:
|
|
kgsl_pwrctrl_irq(device, false);
|
|
|
|
a6xx_hwsched_gmu_power_off(adreno_dev);
|
|
|
|
adreno_hwsched_unregister_contexts(adreno_dev);
|
|
|
|
adreno_llcc_slice_deactivate(adreno_dev);
|
|
|
|
clear_bit(GMU_PRIV_GPU_STARTED, &gmu->flags);
|
|
|
|
del_timer_sync(&device->idle_timer);
|
|
|
|
kgsl_pwrscale_sleep(device);
|
|
|
|
kgsl_pwrctrl_clear_l3_vote(device);
|
|
|
|
kgsl_pwrctrl_set_state(device, KGSL_STATE_SLUMBER);
|
|
|
|
return ret;
|
|
}
|
|
|
|
static void hwsched_idle_check(struct work_struct *work)
|
|
{
|
|
struct kgsl_device *device = container_of(work,
|
|
struct kgsl_device, idle_check_ws);
|
|
struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
|
|
|
|
mutex_lock(&device->mutex);
|
|
|
|
if (test_bit(GMU_DISABLE_SLUMBER, &device->gmu_core.flags))
|
|
goto done;
|
|
|
|
if (atomic_read(&device->active_cnt) || time_is_after_jiffies(device->idle_jiffies)) {
|
|
kgsl_pwrscale_update(device);
|
|
kgsl_start_idle_timer(device);
|
|
goto done;
|
|
}
|
|
|
|
spin_lock(&device->submit_lock);
|
|
if (device->submit_now) {
|
|
spin_unlock(&device->submit_lock);
|
|
kgsl_pwrscale_update(device);
|
|
kgsl_start_idle_timer(device);
|
|
goto done;
|
|
}
|
|
|
|
device->skip_inline_submit = true;
|
|
spin_unlock(&device->submit_lock);
|
|
|
|
if (!a6xx_hw_isidle(adreno_dev)) {
|
|
dev_err(device->dev, "GPU isn't idle before SLUMBER\n");
|
|
gmu_core_fault_snapshot(device);
|
|
}
|
|
|
|
a6xx_hwsched_power_off(adreno_dev);
|
|
|
|
done:
|
|
mutex_unlock(&device->mutex);
|
|
}
|
|
|
|
static int a6xx_hwsched_first_open(struct adreno_device *adreno_dev)
|
|
{
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
int ret;
|
|
|
|
/*
|
|
* Do the one time settings that need to happen when we
|
|
* attempt to boot the gpu the very first time
|
|
*/
|
|
ret = a6xx_hwsched_first_boot(adreno_dev);
|
|
if (ret)
|
|
return ret;
|
|
|
|
/*
|
|
* A client that does a first_open but never closes the device
|
|
* may prevent us from going back to SLUMBER. So trigger the idle
|
|
* check by incrementing the active count and immediately releasing it.
|
|
*/
|
|
atomic_inc(&device->active_cnt);
|
|
a6xx_hwsched_active_count_put(adreno_dev);
|
|
|
|
return 0;
|
|
}
|
|
|
|
int a6xx_hwsched_active_count_get(struct adreno_device *adreno_dev)
|
|
{
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
int ret = 0;
|
|
|
|
if (WARN_ON(!mutex_is_locked(&device->mutex)))
|
|
return -EINVAL;
|
|
|
|
if (test_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags))
|
|
return -EINVAL;
|
|
|
|
if ((atomic_read(&device->active_cnt) == 0))
|
|
ret = a6xx_hwsched_boot(adreno_dev);
|
|
|
|
if (ret == 0)
|
|
atomic_inc(&device->active_cnt);
|
|
|
|
trace_kgsl_active_count(device,
|
|
(unsigned long) __builtin_return_address(0));
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int a6xx_hwsched_dcvs_set(struct adreno_device *adreno_dev,
|
|
int gpu_pwrlevel, int bus_level)
|
|
{
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
struct kgsl_pwrctrl *pwr = &device->pwrctrl;
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
struct hfi_dcvstable_cmd *table = &gmu->hfi.dcvs_table;
|
|
struct hfi_gx_bw_perf_vote_cmd req = {
|
|
.ack_type = DCVS_ACK_BLOCK,
|
|
.freq = INVALID_DCVS_IDX,
|
|
.bw = INVALID_DCVS_IDX,
|
|
};
|
|
int ret;
|
|
|
|
if (!test_bit(GMU_PRIV_HFI_STARTED, &gmu->flags))
|
|
return 0;
|
|
|
|
/* Do not set to XO and lower GPU clock vote from GMU */
|
|
if ((gpu_pwrlevel != INVALID_DCVS_IDX) &&
|
|
(gpu_pwrlevel >= table->gpu_level_num - 1)) {
|
|
dev_err(&gmu->pdev->dev, "Invalid gpu dcvs request: %d\n",
|
|
gpu_pwrlevel);
|
|
return -EINVAL;
|
|
}
|
|
|
|
if (gpu_pwrlevel < table->gpu_level_num - 1)
|
|
req.freq = table->gpu_level_num - gpu_pwrlevel - 1;
|
|
|
|
if (bus_level < pwr->ddr_table_count && bus_level > 0)
|
|
req.bw = bus_level;
|
|
|
|
/* GMU will vote for slumber levels through the sleep sequence */
|
|
if ((req.freq == INVALID_DCVS_IDX) && (req.bw == INVALID_DCVS_IDX))
|
|
return 0;
|
|
|
|
ret = CMD_MSG_HDR(req, H2F_MSG_GX_BW_PERF_VOTE);
|
|
if (ret)
|
|
return ret;
|
|
|
|
ret = a6xx_hfi_send_cmd_async(adreno_dev, &req, sizeof(req));
|
|
|
|
if (ret) {
|
|
dev_err_ratelimited(&gmu->pdev->dev,
|
|
"Failed to set GPU perf idx %u, bw idx %u\n",
|
|
req.freq, req.bw);
|
|
|
|
/*
|
|
* If this was a dcvs request along side an active gpu, request
|
|
* dispatcher based reset and recovery.
|
|
*/
|
|
if (test_bit(GMU_PRIV_GPU_STARTED, &gmu->flags))
|
|
adreno_hwsched_fault(adreno_dev, ADRENO_GMU_FAULT);
|
|
}
|
|
|
|
if (req.freq != INVALID_DCVS_IDX)
|
|
a6xx_rdpm_mx_freq_update(gmu,
|
|
gmu->hfi.dcvs_table.gx_votes[req.freq].freq);
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int a6xx_hwsched_clock_set(struct adreno_device *adreno_dev,
|
|
u32 pwrlevel)
|
|
{
|
|
return a6xx_hwsched_dcvs_set(adreno_dev, pwrlevel, INVALID_DCVS_IDX);
|
|
}
|
|
|
|
static void scale_gmu_frequency(struct adreno_device *adreno_dev, int buslevel)
|
|
{
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
struct kgsl_pwrctrl *pwr = &device->pwrctrl;
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
static unsigned long prev_freq;
|
|
unsigned long freq = gmu->freqs[0];
|
|
|
|
if (!gmu->perf_ddr_bw)
|
|
return;
|
|
|
|
/*
|
|
* Scale the GMU if DDR is at a CX corner at which GMU can run at
|
|
* a higher frequency
|
|
*/
|
|
if (pwr->ddr_table[buslevel] >= gmu->perf_ddr_bw)
|
|
freq = gmu->freqs[GMU_MAX_PWRLEVELS - 1];
|
|
|
|
if (prev_freq == freq)
|
|
return;
|
|
|
|
if (kgsl_clk_set_rate(gmu->clks, gmu->num_clks, "gmu_clk", freq)) {
|
|
dev_err(&gmu->pdev->dev, "Unable to set the GMU clock to %ld\n",
|
|
freq);
|
|
return;
|
|
}
|
|
|
|
a6xx_rdpm_cx_freq_update(gmu, freq / 1000);
|
|
|
|
trace_kgsl_gmu_pwrlevel(freq, prev_freq);
|
|
|
|
prev_freq = freq;
|
|
}
|
|
|
|
static int a6xx_hwsched_bus_set(struct adreno_device *adreno_dev, int buslevel,
|
|
u32 ab)
|
|
{
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
struct kgsl_pwrctrl *pwr = &device->pwrctrl;
|
|
int ret = 0;
|
|
|
|
kgsl_icc_set_tag(pwr, buslevel);
|
|
|
|
if (buslevel != pwr->cur_buslevel) {
|
|
ret = a6xx_hwsched_dcvs_set(adreno_dev, INVALID_DCVS_IDX,
|
|
buslevel);
|
|
if (ret)
|
|
return ret;
|
|
|
|
scale_gmu_frequency(adreno_dev, buslevel);
|
|
|
|
pwr->cur_buslevel = buslevel;
|
|
}
|
|
|
|
if (ab != pwr->cur_ab) {
|
|
icc_set_bw(pwr->icc_path, MBps_to_icc(ab), 0);
|
|
pwr->cur_ab = ab;
|
|
}
|
|
|
|
trace_kgsl_buslevel(device, pwr->active_pwrlevel, pwr->cur_buslevel, pwr->cur_ab);
|
|
return ret;
|
|
}
|
|
|
|
static int a6xx_hwsched_pm_suspend(struct adreno_device *adreno_dev)
|
|
{
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
int ret;
|
|
|
|
if (test_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags))
|
|
return 0;
|
|
|
|
kgsl_pwrctrl_request_state(device, KGSL_STATE_SUSPEND);
|
|
|
|
/* Halt any new submissions */
|
|
reinit_completion(&device->halt_gate);
|
|
|
|
/**
|
|
* Wait for the dispatcher to retire everything by waiting
|
|
* for the active count to go to zero.
|
|
*/
|
|
ret = kgsl_active_count_wait(device, 0, msecs_to_jiffies(100));
|
|
if (ret) {
|
|
dev_err(device->dev, "Timed out waiting for the active count\n");
|
|
goto err;
|
|
}
|
|
|
|
ret = adreno_hwsched_idle(adreno_dev);
|
|
if (ret)
|
|
goto err;
|
|
|
|
a6xx_hwsched_power_off(adreno_dev);
|
|
|
|
adreno_get_gpu_halt(adreno_dev);
|
|
|
|
set_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags);
|
|
|
|
kgsl_pwrctrl_set_state(device, KGSL_STATE_SUSPEND);
|
|
|
|
return 0;
|
|
|
|
err:
|
|
adreno_hwsched_start(adreno_dev);
|
|
|
|
return ret;
|
|
}
|
|
|
|
void a6xx_hwsched_handle_watchdog(struct adreno_device *adreno_dev)
|
|
{
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
|
|
u32 mask;
|
|
|
|
/* Temporarily mask the watchdog interrupt to prevent a storm */
|
|
gmu_core_regread(device, A6XX_GMU_AO_HOST_INTERRUPT_MASK,
|
|
&mask);
|
|
gmu_core_regwrite(device, A6XX_GMU_AO_HOST_INTERRUPT_MASK,
|
|
(mask | GMU_INT_WDOG_BITE));
|
|
|
|
a6xx_gmu_send_nmi(device, false);
|
|
|
|
dev_err_ratelimited(&gmu->pdev->dev,
|
|
"GMU watchdog expired interrupt received\n");
|
|
|
|
adreno_hwsched_fault(adreno_dev, ADRENO_GMU_FAULT);
|
|
}
|
|
|
|
static void a6xx_hwsched_pm_resume(struct adreno_device *adreno_dev)
|
|
{
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
|
|
if (WARN(!test_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags),
|
|
"resume invoked without a suspend\n"))
|
|
return;
|
|
|
|
adreno_put_gpu_halt(adreno_dev);
|
|
|
|
adreno_hwsched_start(adreno_dev);
|
|
|
|
clear_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags);
|
|
}
|
|
|
|
static void a6xx_hwsched_drain_ctxt_unregister(struct adreno_device *adreno_dev)
|
|
{
|
|
struct a6xx_hwsched_hfi *hfi = to_a6xx_hwsched_hfi(adreno_dev);
|
|
struct pending_cmd *cmd = NULL;
|
|
|
|
read_lock(&hfi->msglock);
|
|
|
|
list_for_each_entry(cmd, &hfi->msglist, node) {
|
|
if (MSG_HDR_GET_ID(cmd->sent_hdr) == H2F_MSG_UNREGISTER_CONTEXT)
|
|
complete(&cmd->complete);
|
|
}
|
|
|
|
read_unlock(&hfi->msglock);
|
|
}
|
|
|
|
int a6xx_hwsched_reset_replay(struct adreno_device *adreno_dev)
|
|
{
|
|
struct a6xx_gmu_device *gmu = to_a6xx_gmu(adreno_dev);
|
|
int ret;
|
|
|
|
/*
|
|
* Any pending context unregister packets will be lost
|
|
* since we hard reset the GMU. This means any threads waiting
|
|
* for context unregister hfi ack will timeout. Wake them
|
|
* to avoid false positive ack timeout messages later.
|
|
*/
|
|
a6xx_hwsched_drain_ctxt_unregister(adreno_dev);
|
|
|
|
adreno_hwsched_unregister_contexts(adreno_dev);
|
|
|
|
if (!test_bit(GMU_PRIV_GPU_STARTED, &gmu->flags))
|
|
return 0;
|
|
|
|
a6xx_disable_gpu_irq(adreno_dev);
|
|
|
|
a6xx_gmu_irq_disable(adreno_dev);
|
|
|
|
a6xx_hwsched_hfi_stop(adreno_dev);
|
|
|
|
a6xx_gmu_suspend(adreno_dev);
|
|
|
|
adreno_llcc_slice_deactivate(adreno_dev);
|
|
|
|
clear_bit(GMU_PRIV_GPU_STARTED, &gmu->flags);
|
|
|
|
ret = a6xx_hwsched_boot(adreno_dev);
|
|
|
|
if (!ret)
|
|
adreno_hwsched_replay(adreno_dev);
|
|
|
|
BUG_ON(ret);
|
|
|
|
return ret;
|
|
}
|
|
|
|
const struct adreno_power_ops a6xx_hwsched_power_ops = {
|
|
.first_open = a6xx_hwsched_first_open,
|
|
.last_close = a6xx_hwsched_power_off,
|
|
.active_count_get = a6xx_hwsched_active_count_get,
|
|
.active_count_put = a6xx_hwsched_active_count_put,
|
|
.touch_wakeup = a6xx_hwsched_touch_wakeup,
|
|
.pm_suspend = a6xx_hwsched_pm_suspend,
|
|
.pm_resume = a6xx_hwsched_pm_resume,
|
|
.gpu_clock_set = a6xx_hwsched_clock_set,
|
|
.gpu_bus_set = a6xx_hwsched_bus_set,
|
|
};
|
|
|
|
const struct adreno_hwsched_ops a6xx_hwsched_ops = {
|
|
.submit_drawobj = a6xx_hwsched_submit_drawobj,
|
|
.preempt_count = a6xx_hwsched_preempt_count_get,
|
|
};
|
|
|
|
int a6xx_hwsched_probe(struct platform_device *pdev,
|
|
u32 chipid, const struct adreno_gpu_core *gpucore)
|
|
{
|
|
struct adreno_device *adreno_dev;
|
|
struct kgsl_device *device;
|
|
struct a6xx_hwsched_device *a6xx_hwsched_dev;
|
|
int ret;
|
|
|
|
a6xx_hwsched_dev = devm_kzalloc(&pdev->dev, sizeof(*a6xx_hwsched_dev),
|
|
GFP_KERNEL);
|
|
if (!a6xx_hwsched_dev)
|
|
return -ENOMEM;
|
|
|
|
adreno_dev = &a6xx_hwsched_dev->a6xx_dev.adreno_dev;
|
|
|
|
adreno_dev->hwsched_enabled = true;
|
|
|
|
adreno_dev->irq_mask = A6XX_HWSCHED_INT_MASK;
|
|
|
|
ret = a6xx_probe_common(pdev, adreno_dev, chipid, gpucore);
|
|
if (ret)
|
|
return ret;
|
|
|
|
device = KGSL_DEVICE(adreno_dev);
|
|
|
|
INIT_WORK(&device->idle_check_ws, hwsched_idle_check);
|
|
|
|
timer_setup(&device->idle_timer, hwsched_idle_timer, 0);
|
|
|
|
return adreno_hwsched_init(adreno_dev, &a6xx_hwsched_ops);
|
|
}
|
|
|
|
int a6xx_hwsched_add_to_minidump(struct adreno_device *adreno_dev)
|
|
{
|
|
struct a6xx_device *a6xx_dev = container_of(adreno_dev,
|
|
struct a6xx_device, adreno_dev);
|
|
struct a6xx_hwsched_device *a6xx_hwsched = container_of(a6xx_dev,
|
|
struct a6xx_hwsched_device, a6xx_dev);
|
|
struct a6xx_hwsched_hfi *hw_hfi = &a6xx_hwsched->hwsched_hfi;
|
|
int ret, i;
|
|
|
|
ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev, KGSL_HWSCHED_DEVICE,
|
|
(void *)(a6xx_hwsched), sizeof(struct a6xx_hwsched_device));
|
|
if (ret)
|
|
return ret;
|
|
|
|
if (!IS_ERR_OR_NULL(a6xx_dev->gmu.gmu_log)) {
|
|
ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
|
|
KGSL_GMU_LOG_ENTRY,
|
|
a6xx_dev->gmu.gmu_log->hostptr,
|
|
a6xx_dev->gmu.gmu_log->size);
|
|
if (ret)
|
|
return ret;
|
|
}
|
|
|
|
if (!IS_ERR_OR_NULL(a6xx_dev->gmu.hfi.hfi_mem)) {
|
|
ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
|
|
KGSL_HFIMEM_ENTRY,
|
|
a6xx_dev->gmu.hfi.hfi_mem->hostptr,
|
|
a6xx_dev->gmu.hfi.hfi_mem->size);
|
|
if (ret)
|
|
return ret;
|
|
}
|
|
|
|
if (!IS_ERR_OR_NULL(a6xx_dev->gmu.vrb)) {
|
|
ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
|
|
KGSL_GMU_VRB_ENTRY,
|
|
a6xx_dev->gmu.vrb->hostptr,
|
|
a6xx_dev->gmu.vrb->size);
|
|
if (ret)
|
|
return ret;
|
|
}
|
|
|
|
if (!IS_ERR_OR_NULL(a6xx_dev->gmu.dump_mem)) {
|
|
ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
|
|
KGSL_GMU_DUMPMEM_ENTRY,
|
|
a6xx_dev->gmu.dump_mem->hostptr,
|
|
a6xx_dev->gmu.dump_mem->size);
|
|
if (ret)
|
|
return ret;
|
|
}
|
|
|
|
if (!IS_ERR_OR_NULL(a6xx_dev->gmu.trace.md)) {
|
|
ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
|
|
KGSL_GMU_TRACE_ENTRY,
|
|
a6xx_dev->gmu.trace.md->hostptr,
|
|
a6xx_dev->gmu.trace.md->size);
|
|
if (ret)
|
|
return ret;
|
|
}
|
|
|
|
/* Dump HFI hwsched global mem alloc entries */
|
|
for (i = 0; i < hw_hfi->mem_alloc_entries; i++) {
|
|
struct hfi_mem_alloc_entry *entry = &hw_hfi->mem_alloc_table[i];
|
|
char hfi_minidump_str[MAX_VA_MINIDUMP_STR_LEN] = {0};
|
|
u32 rb_id = 0;
|
|
|
|
if (!hfi_get_minidump_string(entry->desc.mem_kind,
|
|
&hfi_minidump_str[0],
|
|
sizeof(hfi_minidump_str), &rb_id)) {
|
|
ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
|
|
hfi_minidump_str,
|
|
entry->md->hostptr,
|
|
entry->md->size);
|
|
if (ret)
|
|
return ret;
|
|
}
|
|
}
|
|
|
|
if (!IS_ERR_OR_NULL(hw_hfi->big_ib)) {
|
|
ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
|
|
KGSL_HFI_BIG_IB_ENTRY,
|
|
hw_hfi->big_ib->hostptr,
|
|
hw_hfi->big_ib->size);
|
|
if (ret)
|
|
return ret;
|
|
}
|
|
|
|
if (!IS_ERR_OR_NULL(hw_hfi->big_ib_recurring))
|
|
ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
|
|
KGSL_HFI_BIG_IB_REC_ENTRY,
|
|
hw_hfi->big_ib_recurring->hostptr,
|
|
hw_hfi->big_ib_recurring->size);
|
|
|
|
return ret;
|
|
}
|