12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905 |
- // SPDX-License-Identifier: GPL-2.0-only
- /*
- * Copyright (c) 2021, The Linux Foundation. All rights reserved.
- * Copyright (c) 2023-2024, Qualcomm Innovation Center, Inc. All rights reserved.
- */
- #include <linux/clk.h>
- #include <linux/component.h>
- #include <linux/interconnect.h>
- #include <linux/soc/qcom/llcc-qcom.h>
- #include "adreno.h"
- #include "adreno_gen8.h"
- #include "adreno_gen8_hwsched.h"
- #include "adreno_snapshot.h"
- #include "kgsl_bus.h"
- #include "kgsl_device.h"
- #include "kgsl_trace.h"
- static void _wakeup_hw_fence_waiters(struct adreno_device *adreno_dev, u32 fault)
- {
- struct gen8_hwsched_hfi *hfi = to_gen8_hwsched_hfi(adreno_dev);
- bool lock = !in_interrupt();
- if (!test_bit(ADRENO_HWSCHED_HW_FENCE, &adreno_dev->hwsched.flags))
- return;
- /*
- * We could be in interrupt context here, which means we need to use spin_lock_irqsave
- * (which disables interrupts) everywhere we take this lock. Instead of that, simply
- * avoid taking this lock if we are recording a fault from an interrupt handler.
- */
- if (lock)
- spin_lock(&hfi->hw_fence.lock);
- clear_bit(GEN8_HWSCHED_HW_FENCE_SLEEP_BIT, &hfi->hw_fence.flags);
- /* Avoid creating new hardware fences until recovery is complete */
- set_bit(GEN8_HWSCHED_HW_FENCE_ABORT_BIT, &hfi->hw_fence.flags);
- if (!lock) {
- /*
- * This barrier ensures that the above bitops complete before we wake up the waiters
- */
- smp_wmb();
- } else {
- spin_unlock(&hfi->hw_fence.lock);
- }
- wake_up_all(&hfi->hw_fence.unack_wq);
- del_timer_sync(&hfi->hw_fence_timer);
- }
- void gen8_hwsched_fault(struct adreno_device *adreno_dev, u32 fault)
- {
- /*
- * Wake up any threads that may be sleeping waiting for the hardware fence unack count to
- * drop to a desired threshold.
- */
- _wakeup_hw_fence_waiters(adreno_dev, fault);
- adreno_hwsched_fault(adreno_dev, fault);
- }
- static size_t gen8_hwsched_snapshot_rb(struct kgsl_device *device, u8 *buf,
- size_t remain, void *priv)
- {
- struct kgsl_snapshot_rb_v2 *header = (struct kgsl_snapshot_rb_v2 *)buf;
- u32 *data = (u32 *)(buf + sizeof(*header));
- struct kgsl_memdesc *rb = (struct kgsl_memdesc *)priv;
- if (remain < rb->size + sizeof(*header)) {
- SNAPSHOT_ERR_NOMEM(device, "RB");
- return 0;
- }
- header->start = 0;
- header->end = rb->size >> 2;
- header->rptr = 0;
- header->rbsize = rb->size >> 2;
- header->count = rb->size >> 2;
- header->timestamp_queued = 0;
- header->timestamp_retired = 0;
- header->gpuaddr = rb->gpuaddr;
- header->id = 0;
- memcpy(data, rb->hostptr, rb->size);
- return rb->size + sizeof(*header);
- }
- static void gen8_hwsched_snapshot_preemption_record(struct kgsl_device *device,
- struct kgsl_snapshot *snapshot, struct kgsl_memdesc *md, u64 offset)
- {
- struct kgsl_snapshot_section_header *section_header =
- (struct kgsl_snapshot_section_header *)snapshot->ptr;
- u8 *dest = snapshot->ptr + sizeof(*section_header);
- struct kgsl_snapshot_gpu_object_v2 *header =
- (struct kgsl_snapshot_gpu_object_v2 *)dest;
- u64 ctxt_record_size = max_t(u64, GEN8_SNAPSHOT_CTXRECORD_SIZE_IN_BYTES,
- device->snapshot_ctxt_record_size);
- size_t section_size;
- section_size = sizeof(*section_header) + sizeof(*header) + ctxt_record_size;
- if (snapshot->remain < section_size) {
- SNAPSHOT_ERR_NOMEM(device, "PREEMPTION RECORD");
- return;
- }
- section_header->magic = SNAPSHOT_SECTION_MAGIC;
- section_header->id = KGSL_SNAPSHOT_SECTION_GPU_OBJECT_V2;
- section_header->size = section_size;
- header->size = ctxt_record_size >> 2;
- header->gpuaddr = md->gpuaddr + offset;
- header->ptbase =
- kgsl_mmu_pagetable_get_ttbr0(device->mmu.defaultpagetable);
- header->type = SNAPSHOT_GPU_OBJECT_GLOBAL;
- dest += sizeof(*header);
- memcpy(dest, md->hostptr + offset, ctxt_record_size);
- snapshot->ptr += section_header->size;
- snapshot->remain -= section_header->size;
- snapshot->size += section_header->size;
- }
- static void snapshot_preemption_records(struct kgsl_device *device,
- struct kgsl_snapshot *snapshot, struct kgsl_memdesc *md)
- {
- u64 ctxt_record_size = md->size;
- u64 offset;
- do_div(ctxt_record_size, KGSL_PRIORITY_MAX_RB_LEVELS);
- /* All preemption records exist as a single mem alloc entry */
- for (offset = 0; offset < md->size; offset += ctxt_record_size)
- gen8_hwsched_snapshot_preemption_record(device, snapshot, md,
- offset);
- }
- static void *get_rb_hostptr(struct adreno_device *adreno_dev,
- u64 gpuaddr, u32 size)
- {
- struct gen8_hwsched_hfi *hw_hfi = to_gen8_hwsched_hfi(adreno_dev);
- u64 offset;
- u32 i;
- for (i = 0; i < hw_hfi->mem_alloc_entries; i++) {
- struct kgsl_memdesc *md = hw_hfi->mem_alloc_table[i].md;
- if (md && (gpuaddr >= md->gpuaddr) &&
- ((gpuaddr + size) <= (md->gpuaddr + md->size))) {
- offset = gpuaddr - md->gpuaddr;
- return md->hostptr + offset;
- }
- }
- return NULL;
- }
- static u32 gen8_copy_gpu_global(void *out, void *in, u32 size)
- {
- if (out && in) {
- memcpy(out, in, size);
- return size;
- }
- return 0;
- }
- static void adreno_hwsched_snapshot_rb_payload(struct adreno_device *adreno_dev,
- struct kgsl_snapshot *snapshot, struct payload_section *payload)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct kgsl_snapshot_section_header *section_header =
- (struct kgsl_snapshot_section_header *)snapshot->ptr;
- u8 *buf = snapshot->ptr + sizeof(*section_header);
- struct kgsl_snapshot_rb_v2 *header = (struct kgsl_snapshot_rb_v2 *)buf;
- u32 *data = (u32 *)(buf + sizeof(*header));
- u32 size = gen8_hwsched_parse_payload(payload, KEY_RB_SIZEDWORDS) << 2;
- u64 lo, hi, gpuaddr;
- void *rb_hostptr;
- char str[16];
- lo = gen8_hwsched_parse_payload(payload, KEY_RB_GPUADDR_LO);
- hi = gen8_hwsched_parse_payload(payload, KEY_RB_GPUADDR_HI);
- gpuaddr = hi << 32 | lo;
- /* Sanity check to make sure there is enough for the header */
- if (snapshot->remain < sizeof(*section_header))
- goto err;
- rb_hostptr = get_rb_hostptr(adreno_dev, gpuaddr, size);
- /* If the gpuaddress and size don't match any allocation, then abort */
- if (((snapshot->remain - sizeof(*section_header)) <
- (size + sizeof(*header))) ||
- !gen8_copy_gpu_global(data, rb_hostptr, size))
- goto err;
- if (device->dump_all_ibs) {
- u64 rbaddr, lpac_rbaddr;
- kgsl_regread64(device, GEN8_CP_RB_BASE_LO_GC,
- GEN8_CP_RB_BASE_HI_GC, &rbaddr);
- kgsl_regread64(device, GEN8_CP_RB_BASE_LO_LPAC,
- GEN8_CP_RB_BASE_HI_LPAC, &lpac_rbaddr);
- /* Parse all IBs from current RB */
- if ((rbaddr == gpuaddr) || (lpac_rbaddr == gpuaddr))
- adreno_snapshot_dump_all_ibs(device, rb_hostptr, snapshot);
- }
- header->start = 0;
- header->end = size >> 2;
- header->rptr = gen8_hwsched_parse_payload(payload, KEY_RB_RPTR);
- header->wptr = gen8_hwsched_parse_payload(payload, KEY_RB_WPTR);
- header->rbsize = size >> 2;
- header->count = size >> 2;
- header->timestamp_queued = gen8_hwsched_parse_payload(payload,
- KEY_RB_QUEUED_TS);
- header->timestamp_retired = gen8_hwsched_parse_payload(payload,
- KEY_RB_RETIRED_TS);
- header->gpuaddr = gpuaddr;
- header->id = gen8_hwsched_parse_payload(payload, KEY_RB_ID);
- section_header->magic = SNAPSHOT_SECTION_MAGIC;
- section_header->id = KGSL_SNAPSHOT_SECTION_RB_V2;
- section_header->size = size + sizeof(*header) + sizeof(*section_header);
- snapshot->ptr += section_header->size;
- snapshot->remain -= section_header->size;
- snapshot->size += section_header->size;
- return;
- err:
- snprintf(str, sizeof(str), "RB addr:0x%llx", gpuaddr);
- SNAPSHOT_ERR_NOMEM(device, str);
- }
- static bool parse_payload_rb(struct adreno_device *adreno_dev,
- struct kgsl_snapshot *snapshot)
- {
- struct hfi_context_bad_cmd *cmd = adreno_dev->hwsched.ctxt_bad;
- u32 i = 0, payload_bytes;
- void *start;
- bool ret = false;
- /* Skip if we didn't receive a context bad HFI */
- if (!cmd->hdr)
- return false;
- payload_bytes = (MSG_HDR_GET_SIZE(cmd->hdr) << 2) -
- offsetof(struct hfi_context_bad_cmd, payload);
- start = &cmd->payload[0];
- while (i < payload_bytes) {
- struct payload_section *payload = start + i;
- if (payload->type == PAYLOAD_RB) {
- adreno_hwsched_snapshot_rb_payload(adreno_dev,
- snapshot, payload);
- ret = true;
- }
- i += sizeof(*payload) + (payload->dwords << 2);
- }
- return ret;
- }
- static int snapshot_context_queue(int id, void *ptr, void *data)
- {
- struct kgsl_snapshot *snapshot = data;
- struct kgsl_context *context = ptr;
- struct adreno_context *drawctxt = ADRENO_CONTEXT(context);
- struct gmu_mem_type_desc desc;
- if (!context->gmu_registered)
- return 0;
- desc.memdesc = &drawctxt->gmu_context_queue;
- desc.type = SNAPSHOT_GMU_MEM_CONTEXT_QUEUE;
- kgsl_snapshot_add_section(context->device,
- KGSL_SNAPSHOT_SECTION_GMU_MEMORY,
- snapshot, gen8_snapshot_gmu_mem, &desc);
- return 0;
- }
- /* Snapshot AQE buffer */
- static size_t snapshot_aqe_buffer(struct kgsl_device *device, u8 *buf,
- size_t remain, void *priv)
- {
- struct kgsl_memdesc *memdesc = priv;
- struct kgsl_snapshot_gpu_object_v2 *header =
- (struct kgsl_snapshot_gpu_object_v2 *)buf;
- u8 *ptr = buf + sizeof(*header);
- if (IS_ERR_OR_NULL(memdesc) || memdesc->size == 0)
- return 0;
- if (remain < (memdesc->size + sizeof(*header))) {
- SNAPSHOT_ERR_NOMEM(device, "AQE BUFFER");
- return 0;
- }
- header->size = memdesc->size >> 2;
- header->gpuaddr = memdesc->gpuaddr;
- header->ptbase = MMU_DEFAULT_TTBR0(device);
- header->type = SNAPSHOT_GPU_OBJECT_GLOBAL;
- memcpy(ptr, memdesc->hostptr, memdesc->size);
- return memdesc->size + sizeof(*header);
- }
- void gen8_hwsched_snapshot(struct adreno_device *adreno_dev,
- struct kgsl_snapshot *snapshot)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct gen8_hwsched_hfi *hw_hfi = to_gen8_hwsched_hfi(adreno_dev);
- bool skip_memkind_rb = false;
- u32 i;
- bool parse_payload;
- gen8_gmu_snapshot(adreno_dev, snapshot);
- adreno_hwsched_parse_fault_cmdobj(adreno_dev, snapshot);
- /*
- * First try to dump ringbuffers using context bad HFI payloads
- * because they have all the ringbuffer parameters. If ringbuffer
- * payloads are not present, fall back to dumping ringbuffers
- * based on MEMKIND_RB
- */
- parse_payload = parse_payload_rb(adreno_dev, snapshot);
- if (parse_payload)
- skip_memkind_rb = true;
- for (i = 0; i < hw_hfi->mem_alloc_entries; i++) {
- struct hfi_mem_alloc_entry *entry = &hw_hfi->mem_alloc_table[i];
- if (entry->desc.mem_kind == HFI_MEMKIND_RB && !skip_memkind_rb)
- kgsl_snapshot_add_section(device,
- KGSL_SNAPSHOT_SECTION_RB_V2,
- snapshot, gen8_hwsched_snapshot_rb,
- entry->md);
- if (entry->desc.mem_kind == HFI_MEMKIND_SCRATCH)
- kgsl_snapshot_add_section(device,
- KGSL_SNAPSHOT_SECTION_GPU_OBJECT_V2,
- snapshot, adreno_snapshot_global,
- entry->md);
- if (entry->desc.mem_kind == HFI_MEMKIND_PROFILE)
- kgsl_snapshot_add_section(device,
- KGSL_SNAPSHOT_SECTION_GPU_OBJECT_V2,
- snapshot, adreno_snapshot_global,
- entry->md);
- if (entry->desc.mem_kind == HFI_MEMKIND_CSW_SMMU_INFO)
- kgsl_snapshot_add_section(device,
- KGSL_SNAPSHOT_SECTION_GPU_OBJECT_V2,
- snapshot, adreno_snapshot_global,
- entry->md);
- if (entry->desc.mem_kind == HFI_MEMKIND_CSW_PRIV_NON_SECURE)
- snapshot_preemption_records(device, snapshot,
- entry->md);
- if (entry->desc.mem_kind == HFI_MEMKIND_PREEMPT_SCRATCH)
- kgsl_snapshot_add_section(device,
- KGSL_SNAPSHOT_SECTION_GPU_OBJECT_V2,
- snapshot, adreno_snapshot_global,
- entry->md);
- if (entry->desc.mem_kind == HFI_MEMKIND_AQE_BUFFER)
- kgsl_snapshot_add_section(device,
- KGSL_SNAPSHOT_SECTION_GPU_OBJECT_V2,
- snapshot, snapshot_aqe_buffer,
- entry->md);
- if (entry->desc.mem_kind == HFI_MEMKIND_HW_FENCE) {
- struct gmu_mem_type_desc desc;
- desc.memdesc = entry->md;
- desc.type = SNAPSHOT_GMU_MEM_HW_FENCE;
- kgsl_snapshot_add_section(device,
- KGSL_SNAPSHOT_SECTION_GMU_MEMORY,
- snapshot, gen8_snapshot_gmu_mem, &desc);
- }
- }
- if (!adreno_hwsched_context_queue_enabled(adreno_dev))
- return;
- read_lock(&device->context_lock);
- idr_for_each(&device->context_idr, snapshot_context_queue, snapshot);
- read_unlock(&device->context_lock);
- }
- static int gmu_clock_set_rate(struct adreno_device *adreno_dev)
- {
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- int ret = 0;
- /* Switch to min GMU clock */
- gen8_rdpm_cx_freq_update(gmu, gmu->freqs[0] / 1000);
- ret = kgsl_clk_set_rate(gmu->clks, gmu->num_clks, "gmu_clk",
- gmu->freqs[0]);
- if (ret)
- dev_err(&gmu->pdev->dev, "GMU clock:%d set failed:%d\n",
- gmu->freqs[0], ret);
- trace_kgsl_gmu_pwrlevel(gmu->freqs[0], gmu->freqs[GMU_MAX_PWRLEVELS - 1]);
- return ret;
- }
- static int gen8_hwsched_gmu_first_boot(struct adreno_device *adreno_dev)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct kgsl_pwrctrl *pwr = &device->pwrctrl;
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- int level, ret = 0;
- kgsl_pwrctrl_request_state(device, KGSL_STATE_AWARE);
- gen8_gmu_aop_send_acd_state(gmu, adreno_dev->acd_enabled);
- ret = kgsl_pwrctrl_enable_cx_gdsc(device);
- if (ret)
- return ret;
- ret = gen8_gmu_enable_clks(adreno_dev, GMU_MAX_PWRLEVELS - 1);
- if (ret)
- goto gdsc_off;
- /*
- * Enable AHB timeout detection to catch any register access taking longer
- * time before NOC timeout gets detected. Enable this logic before any
- * register access which happens to be just after enabling clocks.
- */
- gen8_enable_ahb_timeout_detection(adreno_dev);
- /* Initialize the CX timer */
- gen8_cx_timer_init(adreno_dev);
- ret = gen8_gmu_load_fw(adreno_dev);
- if (ret)
- goto clks_gdsc_off;
- ret = gen8_gmu_itcm_shadow(adreno_dev);
- if (ret)
- goto clks_gdsc_off;
- ret = gen8_scm_gpu_init_cx_regs(adreno_dev);
- if (ret)
- goto clks_gdsc_off;
- gen8_gmu_register_config(adreno_dev);
- ret = gen8_gmu_version_info(adreno_dev);
- if (ret)
- goto clks_gdsc_off;
- gen8_gmu_irq_enable(adreno_dev);
- /* Vote for minimal DDR BW for GMU to init */
- level = pwr->pwrlevels[pwr->default_pwrlevel].bus_min;
- icc_set_bw(pwr->icc_path, 0, kBps_to_icc(pwr->ddr_table[level]));
- /* From this GMU FW all RBBM interrupts are handled at GMU */
- if (gmu->ver.core >= GMU_VERSION(5, 01, 06))
- adreno_irq_free(adreno_dev);
- /* Clear any hwsched faults that might have been left over */
- adreno_hwsched_clear_fault(adreno_dev);
- ret = gen8_gmu_device_start(adreno_dev);
- if (ret)
- goto err;
- gen8_get_gpu_feature_info(adreno_dev);
- ret = gen8_hwsched_hfi_start(adreno_dev);
- if (ret)
- goto err;
- ret = gmu_clock_set_rate(adreno_dev);
- if (ret) {
- gen8_hwsched_hfi_stop(adreno_dev);
- goto err;
- }
- if (gen8_hwsched_hfi_get_value(adreno_dev, HFI_VALUE_GMU_AB_VOTE) == 1 &&
- !WARN_ONCE(!adreno_dev->gpucore->num_ddr_channels,
- "Number of DDR channel is not specified in gpu core")) {
- adreno_dev->gmu_ab = true;
- set_bit(ADRENO_DEVICE_GMU_AB, &adreno_dev->priv);
- }
- icc_set_bw(pwr->icc_path, 0, 0);
- device->gmu_fault = false;
- kgsl_pwrctrl_set_state(device, KGSL_STATE_AWARE);
- return 0;
- err:
- gen8_gmu_irq_disable(adreno_dev);
- if (device->gmu_fault) {
- gen8_gmu_suspend(adreno_dev);
- return ret;
- }
- clks_gdsc_off:
- clk_bulk_disable_unprepare(gmu->num_clks, gmu->clks);
- gdsc_off:
- kgsl_pwrctrl_disable_cx_gdsc(device);
- gen8_rdpm_cx_freq_update(gmu, 0);
- return ret;
- }
- static int gen8_hwsched_gmu_boot(struct adreno_device *adreno_dev)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- int ret = 0;
- kgsl_pwrctrl_request_state(device, KGSL_STATE_AWARE);
- ret = kgsl_pwrctrl_enable_cx_gdsc(device);
- if (ret)
- return ret;
- ret = gen8_gmu_enable_clks(adreno_dev, GMU_MAX_PWRLEVELS - 1);
- if (ret)
- goto gdsc_off;
- /*
- * Enable AHB timeout detection to catch any register access taking longer
- * time before NOC timeout gets detected. Enable this logic before any
- * register access which happens to be just after enabling clocks.
- */
- gen8_enable_ahb_timeout_detection(adreno_dev);
- /* Initialize the CX timer */
- gen8_cx_timer_init(adreno_dev);
- ret = gen8_rscc_wakeup_sequence(adreno_dev);
- if (ret)
- goto clks_gdsc_off;
- ret = gen8_gmu_load_fw(adreno_dev);
- if (ret)
- goto clks_gdsc_off;
- gen8_gmu_register_config(adreno_dev);
- gen8_gmu_irq_enable(adreno_dev);
- /* Clear any hwsched faults that might have been left over */
- adreno_hwsched_clear_fault(adreno_dev);
- ret = gen8_gmu_device_start(adreno_dev);
- if (ret)
- goto err;
- ret = gen8_hwsched_hfi_start(adreno_dev);
- if (ret)
- goto err;
- ret = gmu_clock_set_rate(adreno_dev);
- if (ret) {
- gen8_hwsched_hfi_stop(adreno_dev);
- goto err;
- }
- device->gmu_fault = false;
- kgsl_pwrctrl_set_state(device, KGSL_STATE_AWARE);
- return 0;
- err:
- gen8_gmu_irq_disable(adreno_dev);
- if (device->gmu_fault) {
- gen8_gmu_suspend(adreno_dev);
- return ret;
- }
- clks_gdsc_off:
- clk_bulk_disable_unprepare(gmu->num_clks, gmu->clks);
- gdsc_off:
- kgsl_pwrctrl_disable_cx_gdsc(device);
- gen8_rdpm_cx_freq_update(gmu, 0);
- return ret;
- }
- void gen8_hwsched_active_count_put(struct adreno_device *adreno_dev)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- if (WARN_ON(!mutex_is_locked(&device->mutex)))
- return;
- if (WARN(atomic_read(&device->active_cnt) == 0,
- "Unbalanced get/put calls to KGSL active count\n"))
- return;
- if (atomic_dec_and_test(&device->active_cnt)) {
- kgsl_pwrscale_update_stats(device);
- kgsl_pwrscale_update(device);
- kgsl_start_idle_timer(device);
- }
- trace_kgsl_active_count(device,
- (unsigned long) __builtin_return_address(0));
- wake_up(&device->active_cnt_wq);
- }
- static int gen8_hwsched_notify_slumber(struct adreno_device *adreno_dev)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct kgsl_pwrctrl *pwr = &device->pwrctrl;
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- struct hfi_prep_slumber_cmd req;
- int ret;
- ret = CMD_MSG_HDR(req, H2F_MSG_PREPARE_SLUMBER);
- if (ret)
- return ret;
- req.freq = gmu->dcvs_table.gpu_level_num - pwr->default_pwrlevel - 1;
- req.bw = pwr->pwrlevels[pwr->default_pwrlevel].bus_freq;
- req.bw |= gen8_bus_ab_quantize(adreno_dev, 0);
- /* Disable the power counter so that the GMU is not busy */
- gmu_core_regwrite(device, GEN8_GMUCX_POWER_COUNTER_ENABLE, 0);
- ret = gen8_hfi_send_cmd_async(adreno_dev, &req, sizeof(req));
- /*
- * GEMNOC can enter power collapse state during GPU power down sequence.
- * This could abort CX GDSC collapse. Assert Qactive to avoid this.
- */
- gmu_core_regwrite(device, GEN8_GMUCX_CX_FALNEXT_INTF, 0x1);
- return ret;
- }
- static int gen8_hwsched_gmu_power_off(struct adreno_device *adreno_dev)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- int ret = 0;
- if (device->gmu_fault)
- goto error;
- /* Wait for the lowest idle level we requested */
- ret = gen8_gmu_wait_for_lowest_idle(adreno_dev);
- if (ret)
- goto error;
- ret = gen8_hwsched_notify_slumber(adreno_dev);
- if (ret)
- goto error;
- ret = gen8_gmu_wait_for_idle(adreno_dev);
- if (ret)
- goto error;
- ret = gen8_rscc_sleep_sequence(adreno_dev);
- gen8_rdpm_mx_freq_update(gmu, 0);
- /* Now that we are done with GMU and GPU, Clear the GBIF */
- ret = gen8_halt_gbif(adreno_dev);
- gen8_gmu_irq_disable(adreno_dev);
- gen8_hwsched_hfi_stop(adreno_dev);
- clk_bulk_disable_unprepare(gmu->num_clks, gmu->clks);
- kgsl_pwrctrl_disable_cx_gdsc(device);
- gen8_rdpm_cx_freq_update(gmu, 0);
- kgsl_pwrctrl_set_state(device, KGSL_STATE_NONE);
- return ret;
- error:
- gen8_gmu_irq_disable(adreno_dev);
- gen8_hwsched_hfi_stop(adreno_dev);
- gen8_gmu_suspend(adreno_dev);
- return ret;
- }
- static void gen8_hwsched_init_ucode_regs(struct adreno_device *adreno_dev)
- {
- struct adreno_firmware *fw = ADRENO_FW(adreno_dev, ADRENO_FW_SQE);
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- /* Program the ucode base for CP */
- kgsl_regwrite(device, GEN8_CP_SQE_INSTR_BASE_LO,
- lower_32_bits(fw->memdesc->gpuaddr));
- kgsl_regwrite(device, GEN8_CP_SQE_INSTR_BASE_HI,
- upper_32_bits(fw->memdesc->gpuaddr));
- if (ADRENO_FEATURE(adreno_dev, ADRENO_AQE)) {
- fw = ADRENO_FW(adreno_dev, ADRENO_FW_AQE);
- /* Program the ucode base for AQE0 (BV coprocessor) */
- kgsl_regwrite(device, GEN8_CP_AQE_INSTR_BASE_LO_0,
- lower_32_bits(fw->memdesc->gpuaddr));
- kgsl_regwrite(device, GEN8_CP_AQE_INSTR_BASE_HI_0,
- upper_32_bits(fw->memdesc->gpuaddr));
- /* Program the ucode base for AQE1 (LPAC coprocessor) */
- if (adreno_dev->lpac_enabled) {
- kgsl_regwrite(device, GEN8_CP_AQE_INSTR_BASE_LO_1,
- lower_32_bits(fw->memdesc->gpuaddr));
- kgsl_regwrite(device, GEN8_CP_AQE_INSTR_BASE_HI_1,
- upper_32_bits(fw->memdesc->gpuaddr));
- }
- }
- }
- static int gen8_hwsched_gpu_boot(struct adreno_device *adreno_dev)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- int ret;
- ret = kgsl_mmu_start(device);
- if (ret)
- goto err;
- ret = gen8_gmu_oob_set(device, oob_gpu);
- if (ret)
- goto err;
- /* Clear the busy_data stats - we're starting over from scratch */
- memset(&adreno_dev->busy_data, 0, sizeof(adreno_dev->busy_data));
- gen8_start(adreno_dev);
- /* Re-initialize the coresight registers if applicable */
- adreno_coresight_start(adreno_dev);
- adreno_perfcounter_start(adreno_dev);
- /* Clear FSR here in case it is set from a previous pagefault */
- kgsl_mmu_clear_fsr(&device->mmu);
- gen8_enable_gpu_irq(adreno_dev);
- gen8_hwsched_init_ucode_regs(adreno_dev);
- ret = gen8_hwsched_boot_gpu(adreno_dev);
- if (ret)
- goto err;
- /*
- * At this point it is safe to assume that we recovered. Setting
- * this field allows us to take a new snapshot for the next failure
- * if we are prioritizing the first unrecoverable snapshot.
- */
- if (device->snapshot)
- device->snapshot->recovered = true;
- device->reset_counter++;
- /*
- * If warmboot is enabled and we switched a sysfs node, we will do a coldboot
- * in the subseqent slumber exit. Once that is done we need to mark this bool
- * as false so that in the next run we can do warmboot
- */
- clear_bit(ADRENO_DEVICE_FORCE_COLDBOOT, &adreno_dev->priv);
- err:
- gen8_gmu_oob_clear(device, oob_gpu);
- if (ret)
- gen8_hwsched_gmu_power_off(adreno_dev);
- return ret;
- }
- static void hwsched_idle_timer(struct timer_list *t)
- {
- struct kgsl_device *device = container_of(t, struct kgsl_device,
- idle_timer);
- kgsl_schedule_work(&device->idle_check_ws);
- }
- static int gen8_gmu_warmboot_init(struct adreno_device *adreno_dev)
- {
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- int ret = 0;
- if (!ADRENO_FEATURE(adreno_dev, ADRENO_GMU_WARMBOOT))
- return ret;
- if (IS_ERR_OR_NULL(gmu->gmu_init_scratch)) {
- gmu->gmu_init_scratch = gen8_reserve_gmu_kernel_block(gmu, 0,
- SZ_4K, GMU_CACHE, 0);
- ret = PTR_ERR_OR_ZERO(gmu->gmu_init_scratch);
- if (ret)
- return ret;
- }
- if (IS_ERR_OR_NULL(gmu->gpu_boot_scratch)) {
- gmu->gpu_boot_scratch = gen8_reserve_gmu_kernel_block(gmu, 0,
- SZ_4K, GMU_CACHE, 0);
- ret = PTR_ERR_OR_ZERO(gmu->gpu_boot_scratch);
- }
- return ret;
- }
- static int gen8_hwsched_gmu_memory_init(struct adreno_device *adreno_dev)
- {
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- /* GMU Virtual register bank */
- if (IS_ERR_OR_NULL(gmu->vrb)) {
- gmu->vrb = gen8_reserve_gmu_kernel_block(gmu, 0, GMU_VRB_SIZE,
- GMU_NONCACHED_KERNEL, 0);
- if (IS_ERR(gmu->vrb))
- return PTR_ERR(gmu->vrb);
- /* Populate size of the virtual register bank */
- gmu_core_set_vrb_register(gmu->vrb->hostptr, VRB_SIZE_IDX,
- gmu->vrb->size >> 2);
- }
- /* GMU trace log */
- if (IS_ERR_OR_NULL(gmu->trace.md)) {
- gmu->trace.md = gen8_reserve_gmu_kernel_block(gmu, 0,
- GMU_TRACE_SIZE, GMU_NONCACHED_KERNEL, 0);
- if (IS_ERR(gmu->trace.md))
- return PTR_ERR(gmu->trace.md);
- /* Pass trace buffer address to GMU through the VRB */
- gmu_core_set_vrb_register(gmu->vrb->hostptr,
- VRB_TRACE_BUFFER_ADDR_IDX,
- gmu->trace.md->gmuaddr);
- /* Initialize the GMU trace buffer header */
- gmu_core_trace_header_init(&gmu->trace);
- }
- return 0;
- }
/*
 * One-time GMU initialization for hwsched: parse the firmware, set up the GMU
 * memory, the warmboot scratch blocks and the hwsched specific GMU memory,
 * then initialize HFI. The steps run in that order and stop at the first
 * failure.
 *
 * Return: 0 on success or the error of the first failing step.
 */
static int gen8_hwsched_gmu_init(struct adreno_device *adreno_dev)
{
	int ret = gen8_gmu_parse_fw(adreno_dev);

	if (!ret)
		ret = gen8_gmu_memory_init(adreno_dev);

	if (!ret)
		ret = gen8_gmu_warmboot_init(adreno_dev);

	if (!ret)
		ret = gen8_hwsched_gmu_memory_init(adreno_dev);

	if (ret)
		return ret;

	return gen8_hwsched_hfi_init(adreno_dev);
}
- static void gen8_hwsched_touch_wakeup(struct adreno_device *adreno_dev)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- int ret;
- /*
- * Do not wake up a suspended device or until the first boot sequence
- * has been completed.
- */
- if (test_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags) ||
- !test_bit(GMU_PRIV_FIRST_BOOT_DONE, &gmu->flags))
- return;
- if (test_bit(GMU_PRIV_GPU_STARTED, &gmu->flags))
- goto done;
- kgsl_pwrctrl_request_state(device, KGSL_STATE_ACTIVE);
- ret = gen8_hwsched_gmu_boot(adreno_dev);
- if (ret)
- return;
- ret = gen8_hwsched_gpu_boot(adreno_dev);
- if (ret)
- return;
- kgsl_pwrscale_wake(device);
- set_bit(GMU_PRIV_GPU_STARTED, &gmu->flags);
- device->pwrctrl.last_stat_updated = ktime_get();
- kgsl_pwrctrl_set_state(device, KGSL_STATE_ACTIVE);
- done:
- /*
- * When waking up from a touch event we want to stay active long enough
- * for the user to send a draw command. The default idle timer timeout
- * is shorter than we want so go ahead and push the idle timer out
- * further for this special case
- */
- mod_timer(&device->idle_timer, jiffies +
- msecs_to_jiffies(adreno_wake_timeout));
- }
- static int gen8_hwsched_boot(struct adreno_device *adreno_dev)
- {
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- int ret;
- if (test_bit(GMU_PRIV_GPU_STARTED, &gmu->flags))
- return 0;
- kgsl_pwrctrl_request_state(device, KGSL_STATE_ACTIVE);
- adreno_hwsched_start(adreno_dev);
- ret = gen8_hwsched_gmu_boot(adreno_dev);
- if (ret)
- return ret;
- ret = gen8_hwsched_gpu_boot(adreno_dev);
- if (ret)
- return ret;
- kgsl_start_idle_timer(device);
- kgsl_pwrscale_wake(device);
- set_bit(GMU_PRIV_GPU_STARTED, &gmu->flags);
- device->pwrctrl.last_stat_updated = ktime_get();
- kgsl_pwrctrl_set_state(device, KGSL_STATE_ACTIVE);
- return ret;
- }
- static int gen8_aqe_microcode_read(struct adreno_device *adreno_dev)
- {
- struct adreno_firmware *aqe_fw = ADRENO_FW(adreno_dev, ADRENO_FW_AQE);
- const struct adreno_gen8_core *gen8_core = to_gen8_core(adreno_dev);
- if (!ADRENO_FEATURE(adreno_dev, ADRENO_AQE))
- return 0;
- return adreno_get_firmware(adreno_dev, gen8_core->aqefw_name, aqe_fw);
- }
- static int gen8_hwsched_first_boot(struct adreno_device *adreno_dev)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- int ret;
- if (test_bit(GMU_PRIV_FIRST_BOOT_DONE, &gmu->flags))
- return gen8_hwsched_boot(adreno_dev);
- adreno_hwsched_start(adreno_dev);
- ret = gen8_microcode_read(adreno_dev);
- if (ret)
- return ret;
- ret = gen8_aqe_microcode_read(adreno_dev);
- if (ret)
- return ret;
- ret = gen8_init(adreno_dev);
- if (ret)
- return ret;
- ret = gen8_hwsched_gmu_init(adreno_dev);
- if (ret)
- return ret;
- kgsl_pwrctrl_request_state(device, KGSL_STATE_ACTIVE);
- ret = gen8_hwsched_gmu_first_boot(adreno_dev);
- if (ret)
- return ret;
- ret = gen8_hwsched_gpu_boot(adreno_dev);
- if (ret)
- return ret;
- adreno_get_bus_counters(adreno_dev);
- adreno_dev->cooperative_reset = ADRENO_FEATURE(adreno_dev,
- ADRENO_COOP_RESET);
- set_bit(GMU_PRIV_FIRST_BOOT_DONE, &gmu->flags);
- set_bit(GMU_PRIV_GPU_STARTED, &gmu->flags);
- /*
- * BCL needs respective Central Broadcast register to
- * be programed from TZ. This programing happens only
- * when zap shader firmware load is successful. Zap firmware
- * load can fail in boot up path hence enable BCL only after we
- * successfully complete first boot to ensure that Central
- * Broadcast register was programed before enabling BCL.
- */
- if (ADRENO_FEATURE(adreno_dev, ADRENO_BCL))
- adreno_dev->bcl_enabled = true;
- /*
- * There is a possible deadlock scenario during kgsl firmware reading
- * (request_firmware) and devfreq update calls. During first boot, kgsl
- * device mutex is held and then request_firmware is called for reading
- * firmware. request_firmware internally takes dev_pm_qos_mtx lock.
- * Whereas in case of devfreq update calls triggered by thermal/bcl or
- * devfreq sysfs, it first takes the same dev_pm_qos_mtx lock and then
- * tries to take kgsl device mutex as part of get_dev_status/target
- * calls. This results in deadlock when both thread are unable to acquire
- * the mutex held by other thread. Enable devfreq updates now as we are
- * done reading all firmware files.
- */
- device->pwrscale.devfreq_enabled = true;
- device->pwrctrl.last_stat_updated = ktime_get();
- kgsl_pwrctrl_set_state(device, KGSL_STATE_ACTIVE);
- return 0;
- }
- /**
- * drain_ctx_hw_fences_cpu - Force trigger the hardware fences that
- * were not sent to TxQueue by the GMU
- */
- static void drain_ctx_hw_fences_cpu(struct adreno_device *adreno_dev,
- struct adreno_context *drawctxt)
- {
- struct adreno_hw_fence_entry *entry, *tmp;
- spin_lock(&drawctxt->lock);
- list_for_each_entry_safe(entry, tmp, &drawctxt->hw_fence_inflight_list, node) {
- gen8_trigger_hw_fence_cpu(adreno_dev, entry);
- gen8_remove_hw_fence_entry(adreno_dev, entry);
- }
- spin_unlock(&drawctxt->lock);
- }
- static void drain_hw_fences_cpu(struct adreno_device *adreno_dev)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct kgsl_context *context;
- int id;
- read_lock(&device->context_lock);
- idr_for_each_entry(&device->context_idr, context, id) {
- if (context->gmu_registered)
- drain_ctx_hw_fences_cpu(adreno_dev, ADRENO_CONTEXT(context));
- }
- read_unlock(&device->context_lock);
- }
- /**
- * check_inflight_hw_fences - During SLUMBER entry, we must make sure all hardware fences across
- * all registered contexts have been sent to TxQueue. If not, take a snapshot
- */
- static int check_inflight_hw_fences(struct adreno_device *adreno_dev)
- {
- struct adreno_hwsched *hwsched = &adreno_dev->hwsched;
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct kgsl_context *context;
- int id, ret = 0;
- if (!test_bit(ADRENO_HWSCHED_HW_FENCE, &hwsched->flags))
- return 0;
- read_lock(&device->context_lock);
- idr_for_each_entry(&device->context_idr, context, id) {
- if (context->gmu_registered) {
- ret = gen8_hwsched_check_context_inflight_hw_fences(adreno_dev,
- ADRENO_CONTEXT(context));
- if (ret)
- break;
- }
- }
- read_unlock(&device->context_lock);
- if (ret)
- gmu_core_fault_snapshot(device);
- return ret;
- }
- static int gen8_hwsched_power_off(struct adreno_device *adreno_dev)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- int ret = 0;
- bool drain_cpu = false;
- if (!test_bit(GMU_PRIV_GPU_STARTED, &gmu->flags))
- return 0;
- kgsl_pwrctrl_request_state(device, KGSL_STATE_SLUMBER);
- ret = gen8_gmu_oob_set(device, oob_gpu);
- if (ret) {
- gen8_gmu_oob_clear(device, oob_gpu);
- goto no_gx_power;
- }
- kgsl_pwrscale_update_stats(device);
- /* Save active coresight registers if applicable */
- adreno_coresight_stop(adreno_dev);
- adreno_irqctrl(adreno_dev, 0);
- gen8_gmu_oob_clear(device, oob_gpu);
- no_gx_power:
- kgsl_pwrctrl_irq(device, false);
- /* Make sure GMU has sent all hardware fences to TxQueue */
- if (check_inflight_hw_fences(adreno_dev))
- drain_cpu = true;
- gen8_hwsched_gmu_power_off(adreno_dev);
- /* Now that we are sure that GMU is powered off, drain pending fences */
- if (drain_cpu)
- drain_hw_fences_cpu(adreno_dev);
- adreno_hwsched_unregister_contexts(adreno_dev);
- if (!IS_ERR_OR_NULL(adreno_dev->gpu_llc_slice))
- llcc_slice_deactivate(adreno_dev->gpu_llc_slice);
- if (!IS_ERR_OR_NULL(adreno_dev->gpuhtw_llc_slice))
- llcc_slice_deactivate(adreno_dev->gpuhtw_llc_slice);
- clear_bit(GMU_PRIV_GPU_STARTED, &gmu->flags);
- del_timer_sync(&device->idle_timer);
- kgsl_pwrscale_sleep(device);
- kgsl_pwrctrl_clear_l3_vote(device);
- kgsl_pwrctrl_set_state(device, KGSL_STATE_SLUMBER);
- return ret;
- }
- static void check_hw_fence_unack_count(struct adreno_device *adreno_dev)
- {
- struct gen8_hwsched_hfi *hfi = to_gen8_hwsched_hfi(adreno_dev);
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- u32 unack_count;
- if (!test_bit(ADRENO_HWSCHED_HW_FENCE, &adreno_dev->hwsched.flags))
- return;
- gen8_hwsched_process_msgq(adreno_dev);
- spin_lock(&hfi->hw_fence.lock);
- unack_count = hfi->hw_fence.unack_count;
- spin_unlock(&hfi->hw_fence.lock);
- if (!unack_count)
- return;
- dev_err(&gmu->pdev->dev, "hardware fence unack_count(%d) isn't zero before SLUMBER\n",
- unack_count);
- gmu_core_fault_snapshot(device);
- }
- static void hwsched_idle_check(struct work_struct *work)
- {
- struct kgsl_device *device = container_of(work,
- struct kgsl_device, idle_check_ws);
- struct adreno_device *adreno_dev = ADRENO_DEVICE(device);
- mutex_lock(&device->mutex);
- if (test_bit(GMU_DISABLE_SLUMBER, &device->gmu_core.flags))
- goto done;
- if (atomic_read(&device->active_cnt) || time_is_after_jiffies(device->idle_jiffies)) {
- kgsl_pwrscale_update(device);
- kgsl_start_idle_timer(device);
- goto done;
- }
- spin_lock(&device->submit_lock);
- if (device->submit_now) {
- spin_unlock(&device->submit_lock);
- kgsl_pwrscale_update(device);
- kgsl_start_idle_timer(device);
- goto done;
- }
- device->skip_inline_submit = true;
- spin_unlock(&device->submit_lock);
- if (!gen8_hw_isidle(adreno_dev)) {
- dev_err(device->dev, "GPU isn't idle before SLUMBER\n");
- gmu_core_fault_snapshot(device);
- }
- check_hw_fence_unack_count(adreno_dev);
- gen8_hwsched_power_off(adreno_dev);
- done:
- mutex_unlock(&device->mutex);
- }
- static int gen8_hwsched_first_open(struct adreno_device *adreno_dev)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- int ret;
- /*
- * Do the one time settings that need to happen when we
- * attempt to boot the gpu the very first time
- */
- ret = gen8_hwsched_first_boot(adreno_dev);
- if (ret)
- return ret;
- /*
- * A client that does a first_open but never closes the device
- * may prevent us from going back to SLUMBER. So trigger the idle
- * check by incrementing the active count and immediately releasing it.
- */
- atomic_inc(&device->active_cnt);
- gen8_hwsched_active_count_put(adreno_dev);
- return 0;
- }
- int gen8_hwsched_active_count_get(struct adreno_device *adreno_dev)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- int ret = 0;
- if (WARN_ON(!mutex_is_locked(&device->mutex)))
- return -EINVAL;
- if (test_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags))
- return -EINVAL;
- if ((atomic_read(&device->active_cnt) == 0))
- ret = gen8_hwsched_boot(adreno_dev);
- if (ret == 0)
- atomic_inc(&device->active_cnt);
- trace_kgsl_active_count(device,
- (unsigned long) __builtin_return_address(0));
- return ret;
- }
- static int gen8_hwsched_dcvs_set(struct adreno_device *adreno_dev,
- int gpu_pwrlevel, int bus_level, u32 ab)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct kgsl_pwrctrl *pwr = &device->pwrctrl;
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- struct gen8_dcvs_table *table = &gmu->dcvs_table;
- struct hfi_gx_bw_perf_vote_cmd req = {
- .ack_type = DCVS_ACK_BLOCK,
- .freq = INVALID_DCVS_IDX,
- .bw = INVALID_DCVS_IDX,
- };
- int ret;
- if (!test_bit(GMU_PRIV_HFI_STARTED, &gmu->flags))
- return 0;
- /* Do not set to XO and lower GPU clock vote from GMU */
- if ((gpu_pwrlevel != INVALID_DCVS_IDX) &&
- (gpu_pwrlevel >= table->gpu_level_num - 1)) {
- dev_err(&gmu->pdev->dev, "Invalid gpu dcvs request: %d\n",
- gpu_pwrlevel);
- return -EINVAL;
- }
- if (gpu_pwrlevel < table->gpu_level_num - 1)
- req.freq = table->gpu_level_num - gpu_pwrlevel - 1;
- if (bus_level < pwr->ddr_table_count && bus_level > 0)
- req.bw = bus_level;
- req.bw |= gen8_bus_ab_quantize(adreno_dev, ab);
- /* GMU will vote for slumber levels through the sleep sequence */
- if ((req.freq == INVALID_DCVS_IDX) && (req.bw == INVALID_BW_VOTE))
- return 0;
- ret = CMD_MSG_HDR(req, H2F_MSG_GX_BW_PERF_VOTE);
- if (ret)
- return ret;
- ret = gen8_hfi_send_cmd_async(adreno_dev, &req, sizeof(req));
- if (ret) {
- dev_err_ratelimited(&gmu->pdev->dev,
- "Failed to set GPU perf idx %d, bw idx %d\n",
- req.freq, req.bw);
- /*
- * If this was a dcvs request along side an active gpu, request
- * dispatcher based reset and recovery.
- */
- if (test_bit(GMU_PRIV_GPU_STARTED, &gmu->flags))
- gen8_hwsched_fault(adreno_dev, ADRENO_GMU_FAULT);
- }
- if (req.freq != INVALID_DCVS_IDX)
- gen8_rdpm_mx_freq_update(gmu, gmu->dcvs_table.gx_votes[req.freq].freq);
- return ret;
- }
- static int gen8_hwsched_clock_set(struct adreno_device *adreno_dev,
- u32 pwrlevel)
- {
- return gen8_hwsched_dcvs_set(adreno_dev, pwrlevel, INVALID_DCVS_IDX, INVALID_AB_VALUE);
- }
- static void scale_gmu_frequency(struct adreno_device *adreno_dev, int buslevel)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct kgsl_pwrctrl *pwr = &device->pwrctrl;
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- static unsigned long prev_freq;
- unsigned long freq = gmu->freqs[0];
- if (!gmu->perf_ddr_bw)
- return;
- /*
- * Scale the GMU if DDR is at a CX corner at which GMU can run at
- * a higher frequency
- */
- if (pwr->ddr_table[buslevel] >= gmu->perf_ddr_bw)
- freq = gmu->freqs[GMU_MAX_PWRLEVELS - 1];
- if (prev_freq == freq)
- return;
- if (kgsl_clk_set_rate(gmu->clks, gmu->num_clks, "gmu_clk", freq)) {
- dev_err(&gmu->pdev->dev, "Unable to set the GMU clock to %ld\n",
- freq);
- return;
- }
- gen8_rdpm_cx_freq_update(gmu, freq / 1000);
- trace_kgsl_gmu_pwrlevel(freq, prev_freq);
- prev_freq = freq;
- }
- static int gen8_hwsched_bus_set(struct adreno_device *adreno_dev, int buslevel,
- u32 ab)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct kgsl_pwrctrl *pwr = &device->pwrctrl;
- int ret = 0;
- if (buslevel == pwr->cur_buslevel)
- buslevel = INVALID_DCVS_IDX;
- if ((ab == pwr->cur_ab) || (ab == 0))
- ab = INVALID_AB_VALUE;
- if ((ab == INVALID_AB_VALUE) && (buslevel == INVALID_DCVS_IDX))
- return 0;
- ret = gen8_hwsched_dcvs_set(adreno_dev, INVALID_DCVS_IDX,
- buslevel, ab);
- if (ret)
- return ret;
- if (buslevel != INVALID_DCVS_IDX) {
- scale_gmu_frequency(adreno_dev, buslevel);
- pwr->cur_buslevel = buslevel;
- }
- if (ab != INVALID_AB_VALUE) {
- if (!adreno_dev->gmu_ab)
- icc_set_bw(pwr->icc_path, MBps_to_icc(ab), 0);
- pwr->cur_ab = ab;
- }
- trace_kgsl_buslevel(device, pwr->active_pwrlevel, pwr->cur_buslevel, pwr->cur_ab);
- return ret;
- }
- static int gen8_hwsched_pm_suspend(struct adreno_device *adreno_dev)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- int ret;
- if (test_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags))
- return 0;
- kgsl_pwrctrl_request_state(device, KGSL_STATE_SUSPEND);
- /* Halt any new submissions */
- reinit_completion(&device->halt_gate);
- /**
- * Wait for the dispatcher to retire everything by waiting
- * for the active count to go to zero.
- */
- ret = kgsl_active_count_wait(device, 0, msecs_to_jiffies(100));
- if (ret) {
- dev_err(device->dev, "Timed out waiting for the active count\n");
- goto err;
- }
- ret = adreno_hwsched_idle(adreno_dev);
- if (ret)
- goto err;
- gen8_hwsched_power_off(adreno_dev);
- adreno_get_gpu_halt(adreno_dev);
- set_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags);
- kgsl_pwrctrl_set_state(device, KGSL_STATE_SUSPEND);
- return 0;
- err:
- adreno_hwsched_start(adreno_dev);
- return ret;
- }
- static void gen8_hwsched_pm_resume(struct adreno_device *adreno_dev)
- {
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- if (WARN(!test_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags),
- "resume invoked without a suspend\n"))
- return;
- adreno_put_gpu_halt(adreno_dev);
- adreno_hwsched_start(adreno_dev);
- clear_bit(GMU_PRIV_PM_SUSPEND, &gmu->flags);
- }
- void gen8_hwsched_handle_watchdog(struct adreno_device *adreno_dev)
- {
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- u32 mask;
- /* Temporarily mask the watchdog interrupt to prevent a storm */
- gmu_core_regread(device, GEN8_GMUAO_AO_HOST_INTERRUPT_MASK,
- &mask);
- gmu_core_regwrite(device, GEN8_GMUAO_AO_HOST_INTERRUPT_MASK,
- (mask | GMU_INT_WDOG_BITE));
- gen8_gmu_send_nmi(device, false);
- dev_err_ratelimited(&gmu->pdev->dev,
- "GMU watchdog expired interrupt received\n");
- gen8_hwsched_fault(adreno_dev, ADRENO_GMU_FAULT);
- }
- static void gen8_hwsched_drain_ctxt_unregister(struct adreno_device *adreno_dev)
- {
- struct gen8_hwsched_hfi *hfi = to_gen8_hwsched_hfi(adreno_dev);
- struct pending_cmd *cmd = NULL;
- read_lock(&hfi->msglock);
- list_for_each_entry(cmd, &hfi->msglist, node) {
- if (MSG_HDR_GET_ID(cmd->sent_hdr) == H2F_MSG_UNREGISTER_CONTEXT)
- complete(&cmd->complete);
- }
- read_unlock(&hfi->msglock);
- }
- /**
- * process_context_hw_fences_after_reset - This function processes all hardware fences that were
- * sent to GMU prior to recovery. If a fence is not retired by the GPU, and the context is still
- * good, then move them to the reset list.
- */
- static void process_context_hw_fences_after_reset(struct adreno_device *adreno_dev,
- struct adreno_context *drawctxt, struct list_head *reset_list)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct adreno_hw_fence_entry *entry, *tmp;
- spin_lock(&drawctxt->lock);
- list_for_each_entry_safe(entry, tmp, &drawctxt->hw_fence_inflight_list, node) {
- struct adreno_context *drawctxt = entry->drawctxt;
- struct gmu_context_queue_header *hdr = drawctxt->gmu_context_queue.hostptr;
- bool retired = kgsl_check_timestamp(device, &drawctxt->base, (u32)entry->cmd.ts);
- /* Delete the fences that GMU has sent to the TxQueue */
- if (timestamp_cmp(hdr->out_fence_ts, (u32)entry->cmd.ts) >= 0) {
- gen8_remove_hw_fence_entry(adreno_dev, entry);
- continue;
- }
- /*
- * Force retire the fences if the corresponding submission is retired by GPU
- * or if the context has gone bad
- */
- if (retired || kgsl_context_is_bad(&drawctxt->base))
- entry->cmd.flags |= HW_FENCE_FLAG_SKIP_MEMSTORE;
- list_add_tail(&entry->reset_node, reset_list);
- }
- spin_unlock(&drawctxt->lock);
- }
- /**
- * process_inflight_hw_fences_after_reset - Send hardware fences from all contexts back to the GMU
- * after fault recovery. We must wait for ack when sending each of these fences to GMU so as to
- * avoid sending a large number of hardware fences in a short span of time.
- */
- static int process_inflight_hw_fences_after_reset(struct adreno_device *adreno_dev)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct kgsl_context *context = NULL;
- int id, ret = 0;
- struct list_head hw_fence_list;
- struct adreno_hw_fence_entry *entry, *tmp;
- /**
- * Since we need to wait for ack from GMU when sending each inflight fence back to GMU, we
- * cannot send them from within atomic context. Hence, walk list of such hardware fences
- * for each context and add it to this local list and then walk this list to send all these
- * fences to GMU.
- */
- INIT_LIST_HEAD(&hw_fence_list);
- read_lock(&device->context_lock);
- idr_for_each_entry(&device->context_idr, context, id) {
- process_context_hw_fences_after_reset(adreno_dev, ADRENO_CONTEXT(context),
- &hw_fence_list);
- }
- read_unlock(&device->context_lock);
- list_for_each_entry_safe(entry, tmp, &hw_fence_list, reset_node) {
- /*
- * This is part of the reset sequence and any error in this path will be handled by
- * the caller.
- */
- ret = gen8_send_hw_fence_hfi_wait_ack(adreno_dev, entry, 0);
- if (ret)
- break;
- list_del_init(&entry->reset_node);
- }
- return ret;
- }
- /**
- * process_detached_hw_fences_after_reset - Send fences that couldn't be sent to GMU when a context
- * got detached. We must wait for ack when sending each of these fences to GMU so as to avoid
- * sending a large number of hardware fences in a short span of time.
- */
- static int process_detached_hw_fences_after_reset(struct adreno_device *adreno_dev)
- {
- struct adreno_hw_fence_entry *entry, *tmp;
- struct gen8_hwsched_hfi *hfi = to_gen8_hwsched_hfi(adreno_dev);
- struct kgsl_context *context = NULL;
- int ret = 0;
- list_for_each_entry_safe(entry, tmp, &hfi->detached_hw_fence_list, node) {
- /*
- * This is part of the reset sequence and any error in this path will be handled by
- * the caller.
- */
- ret = gen8_send_hw_fence_hfi_wait_ack(adreno_dev, entry,
- HW_FENCE_FLAG_SKIP_MEMSTORE);
- if (ret)
- return ret;
- context = &entry->drawctxt->base;
- gen8_remove_hw_fence_entry(adreno_dev, entry);
- kgsl_context_put(context);
- }
- return ret;
- }
- static int drain_guilty_context_hw_fences(struct adreno_device *adreno_dev)
- {
- struct kgsl_device *device = KGSL_DEVICE(adreno_dev);
- struct kgsl_context *context = NULL;
- struct adreno_context *guilty = NULL;
- int id, ret = 0;
- read_lock(&device->context_lock);
- idr_for_each_entry(&device->context_idr, context, id) {
- if (test_bit(KGSL_CONTEXT_PRIV_INVALID, &context->priv) &&
- _kgsl_context_get(context)) {
- guilty = ADRENO_CONTEXT(context);
- break;
- }
- }
- read_unlock(&device->context_lock);
- if (!guilty)
- return 0;
- /*
- * We don't need drawctxt spinlock to signal these fences since the only other place
- * which can retire these fences is the context detach path and device mutex
- * ensures mutual exclusion between recovery thread and detach thread.
- */
- ret = gen8_hwsched_drain_context_hw_fences(adreno_dev, guilty);
- kgsl_context_put(&guilty->base);
- return ret;
- }
/*
 * handle_hw_fences_after_reset - Run the hardware fence recovery steps in
 * order, stopping at the first one that returns an error.
 */
static int handle_hw_fences_after_reset(struct adreno_device *adreno_dev)
{
	int status = drain_guilty_context_hw_fences(adreno_dev);

	/*
	 * We must do this after adreno_hwsched_replay() so that context
	 * registration is done before we re-send the un-retired hardware
	 * fences to the GMU
	 */
	if (!status)
		status = process_inflight_hw_fences_after_reset(adreno_dev);

	if (!status)
		status = process_detached_hw_fences_after_reset(adreno_dev);

	if (!status)
		status = gen8_hwsched_disable_hw_fence_throttle(adreno_dev);

	return status;
}
- int gen8_hwsched_reset_replay(struct adreno_device *adreno_dev)
- {
- struct gen8_gmu_device *gmu = to_gen8_gmu(adreno_dev);
- struct gen8_hwsched_hfi *hfi = to_gen8_hwsched_hfi(adreno_dev);
- int ret;
- /*
- * Any pending context unregister packets will be lost
- * since we hard reset the GMU. This means any threads waiting
- * for context unregister hfi ack will timeout. Wake them
- * to avoid false positive ack timeout messages later.
- */
- gen8_hwsched_drain_ctxt_unregister(adreno_dev);
- if (!test_bit(GMU_PRIV_GPU_STARTED, &gmu->flags))
- return 0;
- gen8_disable_gpu_irq(adreno_dev);
- gen8_gmu_irq_disable(adreno_dev);
- gen8_hwsched_hfi_stop(adreno_dev);
- gen8_gmu_suspend(adreno_dev);
- adreno_hwsched_unregister_contexts(adreno_dev);
- clear_bit(GMU_PRIV_GPU_STARTED, &gmu->flags);
- spin_lock(&hfi->hw_fence.lock);
- /* Reset the unack count back to zero as we start afresh */
- hfi->hw_fence.unack_count = 0;
- spin_unlock(&hfi->hw_fence.lock);
- /*
- * When we reset, we want to coldboot incase any scratch corruption
- * has occurred before we faulted.
- */
- adreno_mark_for_coldboot(adreno_dev);
- ret = gen8_hwsched_boot(adreno_dev);
- if (ret)
- goto done;
- adreno_hwsched_replay(adreno_dev);
- ret = handle_hw_fences_after_reset(adreno_dev);
- done:
- BUG_ON(ret);
- return ret;
- }
- const struct adreno_power_ops gen8_hwsched_power_ops = {
- .first_open = gen8_hwsched_first_open,
- .last_close = gen8_hwsched_power_off,
- .active_count_get = gen8_hwsched_active_count_get,
- .active_count_put = gen8_hwsched_active_count_put,
- .touch_wakeup = gen8_hwsched_touch_wakeup,
- .pm_suspend = gen8_hwsched_pm_suspend,
- .pm_resume = gen8_hwsched_pm_resume,
- .gpu_clock_set = gen8_hwsched_clock_set,
- .gpu_bus_set = gen8_hwsched_bus_set,
- };
- const struct adreno_hwsched_ops gen8_hwsched_ops = {
- .submit_drawobj = gen8_hwsched_submit_drawobj,
- .preempt_count = gen8_hwsched_preempt_count_get,
- .create_hw_fence = gen8_hwsched_create_hw_fence,
- };
- int gen8_hwsched_probe(struct platform_device *pdev,
- u32 chipid, const struct adreno_gpu_core *gpucore)
- {
- struct adreno_device *adreno_dev;
- struct kgsl_device *device;
- struct gen8_hwsched_device *gen8_hwsched_dev;
- int ret;
- gen8_hwsched_dev = devm_kzalloc(&pdev->dev, sizeof(*gen8_hwsched_dev),
- GFP_KERNEL);
- if (!gen8_hwsched_dev)
- return -ENOMEM;
- adreno_dev = &gen8_hwsched_dev->gen8_dev.adreno_dev;
- adreno_dev->hwsched_enabled = true;
- adreno_dev->irq_mask = GEN8_HWSCHED_INT_MASK;
- ret = gen8_probe_common(pdev, adreno_dev, chipid, gpucore);
- if (ret)
- return ret;
- device = KGSL_DEVICE(adreno_dev);
- INIT_WORK(&device->idle_check_ws, hwsched_idle_check);
- timer_setup(&device->idle_timer, hwsched_idle_timer, 0);
- if (ADRENO_FEATURE(adreno_dev, ADRENO_LPAC))
- adreno_dev->lpac_enabled = true;
- kgsl_mmu_set_feature(device, KGSL_MMU_PAGEFAULT_TERMINATE);
- return adreno_hwsched_init(adreno_dev, &gen8_hwsched_ops);
- }
- int gen8_hwsched_add_to_minidump(struct adreno_device *adreno_dev)
- {
- struct gen8_device *gen8_dev = container_of(adreno_dev,
- struct gen8_device, adreno_dev);
- struct gen8_hwsched_device *gen8_hwsched = container_of(gen8_dev,
- struct gen8_hwsched_device, gen8_dev);
- struct gen8_hwsched_hfi *hw_hfi = &gen8_hwsched->hwsched_hfi;
- int ret, i;
- ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev, KGSL_HWSCHED_DEVICE,
- (void *)(gen8_hwsched), sizeof(struct gen8_hwsched_device));
- if (ret)
- return ret;
- if (!IS_ERR_OR_NULL(gen8_dev->gmu.gmu_log)) {
- ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
- KGSL_GMU_LOG_ENTRY,
- gen8_dev->gmu.gmu_log->hostptr,
- gen8_dev->gmu.gmu_log->size);
- if (ret)
- return ret;
- }
- if (!IS_ERR_OR_NULL(gen8_dev->gmu.hfi.hfi_mem)) {
- ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
- KGSL_HFIMEM_ENTRY,
- gen8_dev->gmu.hfi.hfi_mem->hostptr,
- gen8_dev->gmu.hfi.hfi_mem->size);
- if (ret)
- return ret;
- }
- if (!IS_ERR_OR_NULL(gen8_dev->gmu.vrb)) {
- ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
- KGSL_GMU_VRB_ENTRY,
- gen8_dev->gmu.vrb->hostptr,
- gen8_dev->gmu.vrb->size);
- if (ret)
- return ret;
- }
- if (!IS_ERR_OR_NULL(gen8_dev->gmu.trace.md)) {
- ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
- KGSL_GMU_TRACE_ENTRY,
- gen8_dev->gmu.trace.md->hostptr,
- gen8_dev->gmu.trace.md->size);
- if (ret)
- return ret;
- }
- /* Dump HFI hwsched global mem alloc entries */
- for (i = 0; i < hw_hfi->mem_alloc_entries; i++) {
- struct hfi_mem_alloc_entry *entry = &hw_hfi->mem_alloc_table[i];
- char hfi_minidump_str[MAX_VA_MINIDUMP_STR_LEN] = {0};
- u32 rb_id = 0;
- if (!hfi_get_minidump_string(entry->desc.mem_kind,
- &hfi_minidump_str[0],
- sizeof(hfi_minidump_str), &rb_id)) {
- ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
- hfi_minidump_str,
- entry->md->hostptr,
- entry->md->size);
- if (ret)
- return ret;
- }
- }
- if (!IS_ERR_OR_NULL(hw_hfi->big_ib)) {
- ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
- KGSL_HFI_BIG_IB_ENTRY,
- hw_hfi->big_ib->hostptr,
- hw_hfi->big_ib->size);
- if (ret)
- return ret;
- }
- if (!IS_ERR_OR_NULL(hw_hfi->big_ib_recurring))
- ret = kgsl_add_va_to_minidump(adreno_dev->dev.dev,
- KGSL_HFI_BIG_IB_REC_ENTRY,
- hw_hfi->big_ib_recurring->hostptr,
- hw_hfi->big_ib_recurring->size);
- return ret;
- }
|