Blame - marvell/linux/drivers/gpu/drm/etnaviv/etnaviv_gpu.c - T108

blob: 0b7e360fed42c083bd0954c77641af310a6e1e6e [file] [log] [blame]

b.liu	e958203	2025-04-17 19:18:16 +0800	[diff] [blame^]	1	// SPDX-License-Identifier: GPL-2.0
				2	/*
				3	* Copyright (C) 2015-2018 Etnaviv Project
				4	*/
				5
				6	#include <linux/clk.h>
				7	#include <linux/component.h>
				8	#include <linux/delay.h>
				9	#include <linux/dma-fence.h>
				10	#include <linux/dma-mapping.h>
				11	#include <linux/module.h>
				12	#include <linux/of_device.h>
				13	#include <linux/platform_device.h>
				14	#include <linux/pm_runtime.h>
				15	#include <linux/regulator/consumer.h>
				16	#include <linux/thermal.h>
				17
				18	#include "etnaviv_cmdbuf.h"
				19	#include "etnaviv_dump.h"
				20	#include "etnaviv_gpu.h"
				21	#include "etnaviv_gem.h"
				22	#include "etnaviv_mmu.h"
				23	#include "etnaviv_perfmon.h"
				24	#include "etnaviv_sched.h"
				25	#include "common.xml.h"
				26	#include "state.xml.h"
				27	#include "state_hi.xml.h"
				28	#include "cmdstream.xml.h"
				29
				30	#ifndef PHYS_OFFSET
				31	#define PHYS_OFFSET 0
				32	#endif
				33
				34	static const struct platform_device_id gpu_ids[] = {
				35	{ .name = "etnaviv-gpu,2d" },
				36	{ },
				37	};
				38
				39	/*
				40	* Driver functions:
				41	*/
				42
				43	int etnaviv_gpu_get_param(struct etnaviv_gpu gpu, u32 param, u64 value)
				44	{
				45	struct etnaviv_drm_private *priv = gpu->drm->dev_private;
				46
				47	switch (param) {
				48	case ETNAVIV_PARAM_GPU_MODEL:
				49	*value = gpu->identity.model;
				50	break;
				51
				52	case ETNAVIV_PARAM_GPU_REVISION:
				53	*value = gpu->identity.revision;
				54	break;
				55
				56	case ETNAVIV_PARAM_GPU_FEATURES_0:
				57	*value = gpu->identity.features;
				58	break;
				59
				60	case ETNAVIV_PARAM_GPU_FEATURES_1:
				61	*value = gpu->identity.minor_features0;
				62	break;
				63
				64	case ETNAVIV_PARAM_GPU_FEATURES_2:
				65	*value = gpu->identity.minor_features1;
				66	break;
				67
				68	case ETNAVIV_PARAM_GPU_FEATURES_3:
				69	*value = gpu->identity.minor_features2;
				70	break;
				71
				72	case ETNAVIV_PARAM_GPU_FEATURES_4:
				73	*value = gpu->identity.minor_features3;
				74	break;
				75
				76	case ETNAVIV_PARAM_GPU_FEATURES_5:
				77	*value = gpu->identity.minor_features4;
				78	break;
				79
				80	case ETNAVIV_PARAM_GPU_FEATURES_6:
				81	*value = gpu->identity.minor_features5;
				82	break;
				83
				84	case ETNAVIV_PARAM_GPU_FEATURES_7:
				85	*value = gpu->identity.minor_features6;
				86	break;
				87
				88	case ETNAVIV_PARAM_GPU_FEATURES_8:
				89	*value = gpu->identity.minor_features7;
				90	break;
				91
				92	case ETNAVIV_PARAM_GPU_FEATURES_9:
				93	*value = gpu->identity.minor_features8;
				94	break;
				95
				96	case ETNAVIV_PARAM_GPU_FEATURES_10:
				97	*value = gpu->identity.minor_features9;
				98	break;
				99
				100	case ETNAVIV_PARAM_GPU_FEATURES_11:
				101	*value = gpu->identity.minor_features10;
				102	break;
				103
				104	case ETNAVIV_PARAM_GPU_FEATURES_12:
				105	*value = gpu->identity.minor_features11;
				106	break;
				107
				108	case ETNAVIV_PARAM_GPU_STREAM_COUNT:
				109	*value = gpu->identity.stream_count;
				110	break;
				111
				112	case ETNAVIV_PARAM_GPU_REGISTER_MAX:
				113	*value = gpu->identity.register_max;
				114	break;
				115
				116	case ETNAVIV_PARAM_GPU_THREAD_COUNT:
				117	*value = gpu->identity.thread_count;
				118	break;
				119
				120	case ETNAVIV_PARAM_GPU_VERTEX_CACHE_SIZE:
				121	*value = gpu->identity.vertex_cache_size;
				122	break;
				123
				124	case ETNAVIV_PARAM_GPU_SHADER_CORE_COUNT:
				125	*value = gpu->identity.shader_core_count;
				126	break;
				127
				128	case ETNAVIV_PARAM_GPU_PIXEL_PIPES:
				129	*value = gpu->identity.pixel_pipes;
				130	break;
				131
				132	case ETNAVIV_PARAM_GPU_VERTEX_OUTPUT_BUFFER_SIZE:
				133	*value = gpu->identity.vertex_output_buffer_size;
				134	break;
				135
				136	case ETNAVIV_PARAM_GPU_BUFFER_SIZE:
				137	*value = gpu->identity.buffer_size;
				138	break;
				139
				140	case ETNAVIV_PARAM_GPU_INSTRUCTION_COUNT:
				141	*value = gpu->identity.instruction_count;
				142	break;
				143
				144	case ETNAVIV_PARAM_GPU_NUM_CONSTANTS:
				145	*value = gpu->identity.num_constants;
				146	break;
				147
				148	case ETNAVIV_PARAM_GPU_NUM_VARYINGS:
				149	*value = gpu->identity.varyings_count;
				150	break;
				151
				152	case ETNAVIV_PARAM_SOFTPIN_START_ADDR:
				153	if (priv->mmu_global->version == ETNAVIV_IOMMU_V2)
				154	*value = ETNAVIV_SOFTPIN_START_ADDRESS;
				155	else
				156	*value = ~0ULL;
				157	break;
				158
				159	default:
				160	DBG("%s: invalid param: %u", dev_name(gpu->dev), param);
				161	return -EINVAL;
				162	}
				163
				164	return 0;
				165	}
				166
				167
				168	#define etnaviv_is_model_rev(gpu, mod, rev) \
				169	((gpu)->identity.model == chipModel_##mod && \
				170	(gpu)->identity.revision == rev)
				171	#define etnaviv_field(val, field) \
				172	(((val) & field##__MASK) >> field##__SHIFT)
				173
				174	static void etnaviv_hw_specs(struct etnaviv_gpu *gpu)
				175	{
				176	if (gpu->identity.minor_features0 &
				177	chipMinorFeatures0_MORE_MINOR_FEATURES) {
				178	u32 specs[4];
				179	unsigned int streams;
				180
				181	specs[0] = gpu_read(gpu, VIVS_HI_CHIP_SPECS);
				182	specs[1] = gpu_read(gpu, VIVS_HI_CHIP_SPECS_2);
				183	specs[2] = gpu_read(gpu, VIVS_HI_CHIP_SPECS_3);
				184	specs[3] = gpu_read(gpu, VIVS_HI_CHIP_SPECS_4);
				185
				186	gpu->identity.stream_count = etnaviv_field(specs[0],
				187	VIVS_HI_CHIP_SPECS_STREAM_COUNT);
				188	gpu->identity.register_max = etnaviv_field(specs[0],
				189	VIVS_HI_CHIP_SPECS_REGISTER_MAX);
				190	gpu->identity.thread_count = etnaviv_field(specs[0],
				191	VIVS_HI_CHIP_SPECS_THREAD_COUNT);
				192	gpu->identity.vertex_cache_size = etnaviv_field(specs[0],
				193	VIVS_HI_CHIP_SPECS_VERTEX_CACHE_SIZE);
				194	gpu->identity.shader_core_count = etnaviv_field(specs[0],
				195	VIVS_HI_CHIP_SPECS_SHADER_CORE_COUNT);
				196	gpu->identity.pixel_pipes = etnaviv_field(specs[0],
				197	VIVS_HI_CHIP_SPECS_PIXEL_PIPES);
				198	gpu->identity.vertex_output_buffer_size =
				199	etnaviv_field(specs[0],
				200	VIVS_HI_CHIP_SPECS_VERTEX_OUTPUT_BUFFER_SIZE);
				201
				202	gpu->identity.buffer_size = etnaviv_field(specs[1],
				203	VIVS_HI_CHIP_SPECS_2_BUFFER_SIZE);
				204	gpu->identity.instruction_count = etnaviv_field(specs[1],
				205	VIVS_HI_CHIP_SPECS_2_INSTRUCTION_COUNT);
				206	gpu->identity.num_constants = etnaviv_field(specs[1],
				207	VIVS_HI_CHIP_SPECS_2_NUM_CONSTANTS);
				208
				209	gpu->identity.varyings_count = etnaviv_field(specs[2],
				210	VIVS_HI_CHIP_SPECS_3_VARYINGS_COUNT);
				211
				212	/* This overrides the value from older register if non-zero */
				213	streams = etnaviv_field(specs[3],
				214	VIVS_HI_CHIP_SPECS_4_STREAM_COUNT);
				215	if (streams)
				216	gpu->identity.stream_count = streams;
				217	}
				218
				219	/* Fill in the stream count if not specified */
				220	if (gpu->identity.stream_count == 0) {
				221	if (gpu->identity.model >= 0x1000)
				222	gpu->identity.stream_count = 4;
				223	else
				224	gpu->identity.stream_count = 1;
				225	}
				226
				227	/* Convert the register max value */
				228	if (gpu->identity.register_max)
				229	gpu->identity.register_max = 1 << gpu->identity.register_max;
				230	else if (gpu->identity.model == chipModel_GC400)
				231	gpu->identity.register_max = 32;
				232	else
				233	gpu->identity.register_max = 64;
				234
				235	/* Convert thread count */
				236	if (gpu->identity.thread_count)
				237	gpu->identity.thread_count = 1 << gpu->identity.thread_count;
				238	else if (gpu->identity.model == chipModel_GC400)
				239	gpu->identity.thread_count = 64;
				240	else if (gpu->identity.model == chipModel_GC500 \|\|
				241	gpu->identity.model == chipModel_GC530)
				242	gpu->identity.thread_count = 128;
				243	else
				244	gpu->identity.thread_count = 256;
				245
				246	if (gpu->identity.vertex_cache_size == 0)
				247	gpu->identity.vertex_cache_size = 8;
				248
				249	if (gpu->identity.shader_core_count == 0) {
				250	if (gpu->identity.model >= 0x1000)
				251	gpu->identity.shader_core_count = 2;
				252	else
				253	gpu->identity.shader_core_count = 1;
				254	}
				255
				256	if (gpu->identity.pixel_pipes == 0)
				257	gpu->identity.pixel_pipes = 1;
				258
				259	/* Convert virtex buffer size */
				260	if (gpu->identity.vertex_output_buffer_size) {
				261	gpu->identity.vertex_output_buffer_size =
				262	1 << gpu->identity.vertex_output_buffer_size;
				263	} else if (gpu->identity.model == chipModel_GC400) {
				264	if (gpu->identity.revision < 0x4000)
				265	gpu->identity.vertex_output_buffer_size = 512;
				266	else if (gpu->identity.revision < 0x4200)
				267	gpu->identity.vertex_output_buffer_size = 256;
				268	else
				269	gpu->identity.vertex_output_buffer_size = 128;
				270	} else {
				271	gpu->identity.vertex_output_buffer_size = 512;
				272	}
				273
				274	switch (gpu->identity.instruction_count) {
				275	case 0:
				276	if (etnaviv_is_model_rev(gpu, GC2000, 0x5108) \|\|
				277	gpu->identity.model == chipModel_GC880)
				278	gpu->identity.instruction_count = 512;
				279	else
				280	gpu->identity.instruction_count = 256;
				281	break;
				282
				283	case 1:
				284	gpu->identity.instruction_count = 1024;
				285	break;
				286
				287	case 2:
				288	gpu->identity.instruction_count = 2048;
				289	break;
				290
				291	default:
				292	gpu->identity.instruction_count = 256;
				293	break;
				294	}
				295
				296	if (gpu->identity.num_constants == 0)
				297	gpu->identity.num_constants = 168;
				298
				299	if (gpu->identity.varyings_count == 0) {
				300	if (gpu->identity.minor_features1 & chipMinorFeatures1_HALTI0)
				301	gpu->identity.varyings_count = 12;
				302	else
				303	gpu->identity.varyings_count = 8;
				304	}
				305
				306	/*
				307	* For some cores, two varyings are consumed for position, so the
				308	* maximum varying count needs to be reduced by one.
				309	*/
				310	if (etnaviv_is_model_rev(gpu, GC5000, 0x5434) \|\|
				311	etnaviv_is_model_rev(gpu, GC4000, 0x5222) \|\|
				312	etnaviv_is_model_rev(gpu, GC4000, 0x5245) \|\|
				313	etnaviv_is_model_rev(gpu, GC4000, 0x5208) \|\|
				314	etnaviv_is_model_rev(gpu, GC3000, 0x5435) \|\|
				315	etnaviv_is_model_rev(gpu, GC2200, 0x5244) \|\|
				316	etnaviv_is_model_rev(gpu, GC2100, 0x5108) \|\|
				317	etnaviv_is_model_rev(gpu, GC2000, 0x5108) \|\|
				318	etnaviv_is_model_rev(gpu, GC1500, 0x5246) \|\|
				319	etnaviv_is_model_rev(gpu, GC880, 0x5107) \|\|
				320	etnaviv_is_model_rev(gpu, GC880, 0x5106))
				321	gpu->identity.varyings_count -= 1;
				322	}
				323
				324	static void etnaviv_hw_identify(struct etnaviv_gpu *gpu)
				325	{
				326	u32 chipIdentity;
				327
				328	chipIdentity = gpu_read(gpu, VIVS_HI_CHIP_IDENTITY);
				329
				330	/* Special case for older graphic cores. */
				331	if (etnaviv_field(chipIdentity, VIVS_HI_CHIP_IDENTITY_FAMILY) == 0x01) {
				332	gpu->identity.model = chipModel_GC500;
				333	gpu->identity.revision = etnaviv_field(chipIdentity,
				334	VIVS_HI_CHIP_IDENTITY_REVISION);
				335	} else {
				336
				337	gpu->identity.model = gpu_read(gpu, VIVS_HI_CHIP_MODEL);
				338	gpu->identity.revision = gpu_read(gpu, VIVS_HI_CHIP_REV);
				339
				340	/*
				341	* !!!! HACK ALERT !!!!
				342	* Because people change device IDs without letting software
				343	* know about it - here is the hack to make it all look the
				344	* same. Only for GC400 family.
				345	*/
				346	if ((gpu->identity.model & 0xff00) == 0x0400 &&
				347	gpu->identity.model != chipModel_GC420) {
				348	gpu->identity.model = gpu->identity.model & 0x0400;
				349	}
				350
				351	/* Another special case */
				352	if (etnaviv_is_model_rev(gpu, GC300, 0x2201)) {
				353	u32 chipDate = gpu_read(gpu, VIVS_HI_CHIP_DATE);
				354	u32 chipTime = gpu_read(gpu, VIVS_HI_CHIP_TIME);
				355
				356	if (chipDate == 0x20080814 && chipTime == 0x12051100) {
				357	/*
				358	* This IP has an ECO; put the correct
				359	* revision in it.
				360	*/
				361	gpu->identity.revision = 0x1051;
				362	}
				363	}
				364
				365	/*
				366	* NXP likes to call the GPU on the i.MX6QP GC2000+, but in
				367	* reality it's just a re-branded GC3000. We can identify this
				368	* core by the upper half of the revision register being all 1.
				369	* Fix model/rev here, so all other places can refer to this
				370	* core by its real identity.
				371	*/
				372	if (etnaviv_is_model_rev(gpu, GC2000, 0xffff5450)) {
				373	gpu->identity.model = chipModel_GC3000;
				374	gpu->identity.revision &= 0xffff;
				375	}
				376	}
				377
				378	dev_info(gpu->dev, "model: GC%x, revision: %x\n",
				379	gpu->identity.model, gpu->identity.revision);
				380
				381	gpu->idle_mask = ~VIVS_HI_IDLE_STATE_AXI_LP;
				382	/*
				383	* If there is a match in the HWDB, we aren't interested in the
				384	* remaining register values, as they might be wrong.
				385	*/
				386	if (etnaviv_fill_identity_from_hwdb(gpu))
				387	return;
				388
				389	gpu->identity.features = gpu_read(gpu, VIVS_HI_CHIP_FEATURE);
				390
				391	/* Disable fast clear on GC700. */
				392	if (gpu->identity.model == chipModel_GC700)
				393	gpu->identity.features &= ~chipFeatures_FAST_CLEAR;
				394
				395	/* These models/revisions don't have the 2D pipe bit */
				396	if ((gpu->identity.model == chipModel_GC500 &&
				397	gpu->identity.revision <= 2) \|\|
				398	gpu->identity.model == chipModel_GC300)
				399	gpu->identity.features \|= chipFeatures_PIPE_2D;
				400
				401	if ((gpu->identity.model == chipModel_GC500 &&
				402	gpu->identity.revision < 2) \|\|
				403	(gpu->identity.model == chipModel_GC300 &&
				404	gpu->identity.revision < 0x2000)) {
				405
				406	/*
				407	* GC500 rev 1.x and GC300 rev < 2.0 doesn't have these
				408	* registers.
				409	*/
				410	gpu->identity.minor_features0 = 0;
				411	gpu->identity.minor_features1 = 0;
				412	gpu->identity.minor_features2 = 0;
				413	gpu->identity.minor_features3 = 0;
				414	gpu->identity.minor_features4 = 0;
				415	gpu->identity.minor_features5 = 0;
				416	} else
				417	gpu->identity.minor_features0 =
				418	gpu_read(gpu, VIVS_HI_CHIP_MINOR_FEATURE_0);
				419
				420	if (gpu->identity.minor_features0 &
				421	chipMinorFeatures0_MORE_MINOR_FEATURES) {
				422	gpu->identity.minor_features1 =
				423	gpu_read(gpu, VIVS_HI_CHIP_MINOR_FEATURE_1);
				424	gpu->identity.minor_features2 =
				425	gpu_read(gpu, VIVS_HI_CHIP_MINOR_FEATURE_2);
				426	gpu->identity.minor_features3 =
				427	gpu_read(gpu, VIVS_HI_CHIP_MINOR_FEATURE_3);
				428	gpu->identity.minor_features4 =
				429	gpu_read(gpu, VIVS_HI_CHIP_MINOR_FEATURE_4);
				430	gpu->identity.minor_features5 =
				431	gpu_read(gpu, VIVS_HI_CHIP_MINOR_FEATURE_5);
				432	}
				433
				434	/* GC600/300 idle register reports zero bits where modules aren't present */
				435	if (gpu->identity.model == chipModel_GC600 \|\|
				436	gpu->identity.model == chipModel_GC300)
				437	gpu->idle_mask = VIVS_HI_IDLE_STATE_TX \|
				438	VIVS_HI_IDLE_STATE_RA \|
				439	VIVS_HI_IDLE_STATE_SE \|
				440	VIVS_HI_IDLE_STATE_PA \|
				441	VIVS_HI_IDLE_STATE_SH \|
				442	VIVS_HI_IDLE_STATE_PE \|
				443	VIVS_HI_IDLE_STATE_DE \|
				444	VIVS_HI_IDLE_STATE_FE;
				445
				446	etnaviv_hw_specs(gpu);
				447	}
				448
				449	static void etnaviv_gpu_load_clock(struct etnaviv_gpu *gpu, u32 clock)
				450	{
				451	gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, clock \|
				452	VIVS_HI_CLOCK_CONTROL_FSCALE_CMD_LOAD);
				453	gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, clock);
				454	}
				455
				456	static void etnaviv_gpu_update_clock(struct etnaviv_gpu *gpu)
				457	{
				458	if (gpu->identity.minor_features2 &
				459	chipMinorFeatures2_DYNAMIC_FREQUENCY_SCALING) {
				460	clk_set_rate(gpu->clk_core,
				461	gpu->base_rate_core >> gpu->freq_scale);
				462	clk_set_rate(gpu->clk_shader,
				463	gpu->base_rate_shader >> gpu->freq_scale);
				464	} else {
				465	unsigned int fscale = 1 << (6 - gpu->freq_scale);
				466	u32 clock = gpu_read(gpu, VIVS_HI_CLOCK_CONTROL);
				467
				468	clock &= ~VIVS_HI_CLOCK_CONTROL_FSCALE_VAL__MASK;
				469	clock \|= VIVS_HI_CLOCK_CONTROL_FSCALE_VAL(fscale);
				470	etnaviv_gpu_load_clock(gpu, clock);
				471	}
				472	}
				473
				474	static int etnaviv_hw_reset(struct etnaviv_gpu *gpu)
				475	{
				476	u32 control, idle;
				477	unsigned long timeout;
				478	bool failed = true;
				479
				480	/* We hope that the GPU resets in under one second */
				481	timeout = jiffies + msecs_to_jiffies(1000);
				482
				483	while (time_is_after_jiffies(timeout)) {
				484	/* enable clock */
				485	unsigned int fscale = 1 << (6 - gpu->freq_scale);
				486	control = VIVS_HI_CLOCK_CONTROL_FSCALE_VAL(fscale);
				487	etnaviv_gpu_load_clock(gpu, control);
				488
				489	/* isolate the GPU. */
				490	control \|= VIVS_HI_CLOCK_CONTROL_ISOLATE_GPU;
				491	gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, control);
				492
				493	if (gpu->sec_mode == ETNA_SEC_KERNEL) {
				494	gpu_write(gpu, VIVS_MMUv2_AHB_CONTROL,
				495	VIVS_MMUv2_AHB_CONTROL_RESET);
				496	} else {
				497	/* set soft reset. */
				498	control \|= VIVS_HI_CLOCK_CONTROL_SOFT_RESET;
				499	gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, control);
				500	}
				501
				502	/* wait for reset. */
				503	usleep_range(10, 20);
				504
				505	/* reset soft reset bit. */
				506	control &= ~VIVS_HI_CLOCK_CONTROL_SOFT_RESET;
				507	gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, control);
				508
				509	/* reset GPU isolation. */
				510	control &= ~VIVS_HI_CLOCK_CONTROL_ISOLATE_GPU;
				511	gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, control);
				512
				513	/* read idle register. */
				514	idle = gpu_read(gpu, VIVS_HI_IDLE_STATE);
				515
				516	/* try reseting again if FE it not idle */
				517	if ((idle & VIVS_HI_IDLE_STATE_FE) == 0) {
				518	dev_dbg(gpu->dev, "FE is not idle\n");
				519	continue;
				520	}
				521
				522	/* read reset register. */
				523	control = gpu_read(gpu, VIVS_HI_CLOCK_CONTROL);
				524
				525	/* is the GPU idle? */
				526	if (((control & VIVS_HI_CLOCK_CONTROL_IDLE_3D) == 0) \|\|
				527	((control & VIVS_HI_CLOCK_CONTROL_IDLE_2D) == 0)) {
				528	dev_dbg(gpu->dev, "GPU is not idle\n");
				529	continue;
				530	}
				531
				532	/* disable debug registers, as they are not normally needed */
				533	control \|= VIVS_HI_CLOCK_CONTROL_DISABLE_DEBUG_REGISTERS;
				534	gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, control);
				535
				536	failed = false;
				537	break;
				538	}
				539
				540	if (failed) {
				541	idle = gpu_read(gpu, VIVS_HI_IDLE_STATE);
				542	control = gpu_read(gpu, VIVS_HI_CLOCK_CONTROL);
				543
				544	dev_err(gpu->dev, "GPU failed to reset: FE %sidle, 3D %sidle, 2D %sidle\n",
				545	idle & VIVS_HI_IDLE_STATE_FE ? "" : "not ",
				546	control & VIVS_HI_CLOCK_CONTROL_IDLE_3D ? "" : "not ",
				547	control & VIVS_HI_CLOCK_CONTROL_IDLE_2D ? "" : "not ");
				548
				549	return -EBUSY;
				550	}
				551
				552	/* We rely on the GPU running, so program the clock */
				553	etnaviv_gpu_update_clock(gpu);
				554
				555	gpu->fe_running = false;
				556	gpu->exec_state = -1;
				557	if (gpu->mmu_context)
				558	etnaviv_iommu_context_put(gpu->mmu_context);
				559	gpu->mmu_context = NULL;
				560
				561	return 0;
				562	}
				563
				564	static void etnaviv_gpu_enable_mlcg(struct etnaviv_gpu *gpu)
				565	{
				566	u32 pmc, ppc;
				567
				568	/* enable clock gating */
				569	ppc = gpu_read_power(gpu, VIVS_PM_POWER_CONTROLS);
				570	ppc \|= VIVS_PM_POWER_CONTROLS_ENABLE_MODULE_CLOCK_GATING;
				571
				572	/* Disable stall module clock gating for 4.3.0.1 and 4.3.0.2 revs */
				573	if (gpu->identity.revision == 0x4301 \|\|
				574	gpu->identity.revision == 0x4302)
				575	ppc \|= VIVS_PM_POWER_CONTROLS_DISABLE_STALL_MODULE_CLOCK_GATING;
				576
				577	gpu_write_power(gpu, VIVS_PM_POWER_CONTROLS, ppc);
				578
				579	pmc = gpu_read_power(gpu, VIVS_PM_MODULE_CONTROLS);
				580
				581	/* Disable PA clock gating for GC400+ without bugfix except for GC420 */
				582	if (gpu->identity.model >= chipModel_GC400 &&
				583	gpu->identity.model != chipModel_GC420 &&
				584	!(gpu->identity.minor_features3 & chipMinorFeatures3_BUG_FIXES12))
				585	pmc \|= VIVS_PM_MODULE_CONTROLS_DISABLE_MODULE_CLOCK_GATING_PA;
				586
				587	/*
				588	* Disable PE clock gating on revs < 5.0.0.0 when HZ is
				589	* present without a bug fix.
				590	*/
				591	if (gpu->identity.revision < 0x5000 &&
				592	gpu->identity.minor_features0 & chipMinorFeatures0_HZ &&
				593	!(gpu->identity.minor_features1 &
				594	chipMinorFeatures1_DISABLE_PE_GATING))
				595	pmc \|= VIVS_PM_MODULE_CONTROLS_DISABLE_MODULE_CLOCK_GATING_PE;
				596
				597	if (gpu->identity.revision < 0x5422)
				598	pmc \|= BIT(15); /* Unknown bit */
				599
				600	/* Disable TX clock gating on affected core revisions. */
				601	if (etnaviv_is_model_rev(gpu, GC4000, 0x5222) \|\|
				602	etnaviv_is_model_rev(gpu, GC2000, 0x5108))
				603	pmc \|= VIVS_PM_MODULE_CONTROLS_DISABLE_MODULE_CLOCK_GATING_TX;
				604
				605	pmc \|= VIVS_PM_MODULE_CONTROLS_DISABLE_MODULE_CLOCK_GATING_RA_HZ;
				606	pmc \|= VIVS_PM_MODULE_CONTROLS_DISABLE_MODULE_CLOCK_GATING_RA_EZ;
				607
				608	gpu_write_power(gpu, VIVS_PM_MODULE_CONTROLS, pmc);
				609	}
				610
				611	void etnaviv_gpu_start_fe(struct etnaviv_gpu *gpu, u32 address, u16 prefetch)
				612	{
				613	gpu_write(gpu, VIVS_FE_COMMAND_ADDRESS, address);
				614	gpu_write(gpu, VIVS_FE_COMMAND_CONTROL,
				615	VIVS_FE_COMMAND_CONTROL_ENABLE \|
				616	VIVS_FE_COMMAND_CONTROL_PREFETCH(prefetch));
				617
				618	if (gpu->sec_mode == ETNA_SEC_KERNEL) {
				619	gpu_write(gpu, VIVS_MMUv2_SEC_COMMAND_CONTROL,
				620	VIVS_MMUv2_SEC_COMMAND_CONTROL_ENABLE \|
				621	VIVS_MMUv2_SEC_COMMAND_CONTROL_PREFETCH(prefetch));
				622	}
				623
				624	gpu->fe_running = true;
				625	}
				626
				627	static void etnaviv_gpu_start_fe_idleloop(struct etnaviv_gpu *gpu,
				628	struct etnaviv_iommu_context *context)
				629	{
				630	u16 prefetch;
				631	u32 address;
				632
				633	/* setup the MMU */
				634	etnaviv_iommu_restore(gpu, context);
				635
				636	/* Start command processor */
				637	prefetch = etnaviv_buffer_init(gpu);
				638	address = etnaviv_cmdbuf_get_va(&gpu->buffer,
				639	&gpu->mmu_context->cmdbuf_mapping);
				640
				641	etnaviv_gpu_start_fe(gpu, address, prefetch);
				642	}
				643
				644	static void etnaviv_gpu_setup_pulse_eater(struct etnaviv_gpu *gpu)
				645	{
				646	/*
				647	* Base value for VIVS_PM_PULSE_EATER register on models where it
				648	* cannot be read, extracted from vivante kernel driver.
				649	*/
				650	u32 pulse_eater = 0x01590880;
				651
				652	if (etnaviv_is_model_rev(gpu, GC4000, 0x5208) \|\|
				653	etnaviv_is_model_rev(gpu, GC4000, 0x5222)) {
				654	pulse_eater \|= BIT(23);
				655
				656	}
				657
				658	if (etnaviv_is_model_rev(gpu, GC1000, 0x5039) \|\|
				659	etnaviv_is_model_rev(gpu, GC1000, 0x5040)) {
				660	pulse_eater &= ~BIT(16);
				661	pulse_eater \|= BIT(17);
				662	}
				663
				664	if ((gpu->identity.revision > 0x5420) &&
				665	(gpu->identity.features & chipFeatures_PIPE_3D))
				666	{
				667	/* Performance fix: disable internal DFS */
				668	pulse_eater = gpu_read_power(gpu, VIVS_PM_PULSE_EATER);
				669	pulse_eater \|= BIT(18);
				670	}
				671
				672	gpu_write_power(gpu, VIVS_PM_PULSE_EATER, pulse_eater);
				673	}
				674
				675	static void etnaviv_gpu_hw_init(struct etnaviv_gpu *gpu)
				676	{
				677	if ((etnaviv_is_model_rev(gpu, GC320, 0x5007) \|\|
				678	etnaviv_is_model_rev(gpu, GC320, 0x5220)) &&
				679	gpu_read(gpu, VIVS_HI_CHIP_TIME) != 0x2062400) {
				680	u32 mc_memory_debug;
				681
				682	mc_memory_debug = gpu_read(gpu, VIVS_MC_DEBUG_MEMORY) & ~0xff;
				683
				684	if (gpu->identity.revision == 0x5007)
				685	mc_memory_debug \|= 0x0c;
				686	else
				687	mc_memory_debug \|= 0x08;
				688
				689	gpu_write(gpu, VIVS_MC_DEBUG_MEMORY, mc_memory_debug);
				690	}
				691
				692	/* enable module-level clock gating */
				693	etnaviv_gpu_enable_mlcg(gpu);
				694
				695	/*
				696	* Update GPU AXI cache atttribute to "cacheable, no allocate".
				697	* This is necessary to prevent the iMX6 SoC locking up.
				698	*/
				699	gpu_write(gpu, VIVS_HI_AXI_CONFIG,
				700	VIVS_HI_AXI_CONFIG_AWCACHE(2) \|
				701	VIVS_HI_AXI_CONFIG_ARCACHE(2));
				702
				703	/* GC2000 rev 5108 needs a special bus config */
				704	if (etnaviv_is_model_rev(gpu, GC2000, 0x5108)) {
				705	u32 bus_config = gpu_read(gpu, VIVS_MC_BUS_CONFIG);
				706	bus_config &= ~(VIVS_MC_BUS_CONFIG_FE_BUS_CONFIG__MASK \|
				707	VIVS_MC_BUS_CONFIG_TX_BUS_CONFIG__MASK);
				708	bus_config \|= VIVS_MC_BUS_CONFIG_FE_BUS_CONFIG(1) \|
				709	VIVS_MC_BUS_CONFIG_TX_BUS_CONFIG(0);
				710	gpu_write(gpu, VIVS_MC_BUS_CONFIG, bus_config);
				711	}
				712
				713	if (gpu->sec_mode == ETNA_SEC_KERNEL) {
				714	u32 val = gpu_read(gpu, VIVS_MMUv2_AHB_CONTROL);
				715	val \|= VIVS_MMUv2_AHB_CONTROL_NONSEC_ACCESS;
				716	gpu_write(gpu, VIVS_MMUv2_AHB_CONTROL, val);
				717	}
				718
				719	/* setup the pulse eater */
				720	etnaviv_gpu_setup_pulse_eater(gpu);
				721
				722	gpu_write(gpu, VIVS_HI_INTR_ENBL, ~0U);
				723	}
				724
				725	int etnaviv_gpu_init(struct etnaviv_gpu *gpu)
				726	{
				727	struct etnaviv_drm_private *priv = gpu->drm->dev_private;
				728	int ret, i;
				729
				730	ret = pm_runtime_get_sync(gpu->dev);
				731	if (ret < 0) {
				732	dev_err(gpu->dev, "Failed to enable GPU power domain\n");
				733	goto pm_put;
				734	}
				735
				736	etnaviv_hw_identify(gpu);
				737
				738	if (gpu->identity.model == 0) {
				739	dev_err(gpu->dev, "Unknown GPU model\n");
				740	ret = -ENXIO;
				741	goto fail;
				742	}
				743
				744	/* Exclude VG cores with FE2.0 */
				745	if (gpu->identity.features & chipFeatures_PIPE_VG &&
				746	gpu->identity.features & chipFeatures_FE20) {
				747	dev_info(gpu->dev, "Ignoring GPU with VG and FE2.0\n");
				748	ret = -ENXIO;
				749	goto fail;
				750	}
				751
				752	/*
				753	* On cores with security features supported, we claim control over the
				754	* security states.
				755	*/
				756	if ((gpu->identity.minor_features7 & chipMinorFeatures7_BIT_SECURITY) &&
				757	(gpu->identity.minor_features10 & chipMinorFeatures10_SECURITY_AHB))
				758	gpu->sec_mode = ETNA_SEC_KERNEL;
				759
				760	ret = etnaviv_hw_reset(gpu);
				761	if (ret) {
				762	dev_err(gpu->dev, "GPU reset failed\n");
				763	goto fail;
				764	}
				765
				766	ret = etnaviv_iommu_global_init(gpu);
				767	if (ret)
				768	goto fail;
				769
				770	/*
				771	* Set the GPU linear window to be at the end of the DMA window, where
				772	* the CMA area is likely to reside. This ensures that we are able to
				773	* map the command buffers while having the linear window overlap as
				774	* much RAM as possible, so we can optimize mappings for other buffers.
				775	*
				776	* For 3D cores only do this if MC2.0 is present, as with MC1.0 it leads
				777	* to different views of the memory on the individual engines.
				778	*/
				779	if (!(gpu->identity.features & chipFeatures_PIPE_3D) \|\|
				780	(gpu->identity.minor_features0 & chipMinorFeatures0_MC20)) {
				781	u32 dma_mask = (u32)dma_get_required_mask(gpu->dev);
				782	if (dma_mask < PHYS_OFFSET + SZ_2G)
				783	priv->mmu_global->memory_base = PHYS_OFFSET;
				784	else
				785	priv->mmu_global->memory_base = dma_mask - SZ_2G + 1;
				786	} else if (PHYS_OFFSET >= SZ_2G) {
				787	dev_info(gpu->dev, "Need to move linear window on MC1.0, disabling TS\n");
				788	priv->mmu_global->memory_base = PHYS_OFFSET;
				789	gpu->identity.features &= ~chipFeatures_FAST_CLEAR;
				790	}
				791
				792	/* Create buffer: */
				793	ret = etnaviv_cmdbuf_init(priv->cmdbuf_suballoc, &gpu->buffer,
				794	PAGE_SIZE);
				795	if (ret) {
				796	dev_err(gpu->dev, "could not create command buffer\n");
				797	goto fail;
				798	}
				799
				800	/* Setup event management */
				801	spin_lock_init(&gpu->event_spinlock);
				802	init_completion(&gpu->event_free);
				803	bitmap_zero(gpu->event_bitmap, ETNA_NR_EVENTS);
				804	for (i = 0; i < ARRAY_SIZE(gpu->event); i++)
				805	complete(&gpu->event_free);
				806
				807	/* Now program the hardware */
				808	mutex_lock(&gpu->lock);
				809	etnaviv_gpu_hw_init(gpu);
				810	mutex_unlock(&gpu->lock);
				811
				812	pm_runtime_mark_last_busy(gpu->dev);
				813	pm_runtime_put_autosuspend(gpu->dev);
				814
				815	gpu->initialized = true;
				816
				817	return 0;
				818
				819	fail:
				820	pm_runtime_mark_last_busy(gpu->dev);
				821	pm_put:
				822	pm_runtime_put_autosuspend(gpu->dev);
				823
				824	return ret;
				825	}
				826
				827	#ifdef CONFIG_DEBUG_FS
				828	struct dma_debug {
				829	u32 address[2];
				830	u32 state[2];
				831	};
				832
				833	static void verify_dma(struct etnaviv_gpu gpu, struct dma_debug debug)
				834	{
				835	u32 i;
				836
				837	debug->address[0] = gpu_read(gpu, VIVS_FE_DMA_ADDRESS);
				838	debug->state[0] = gpu_read(gpu, VIVS_FE_DMA_DEBUG_STATE);
				839
				840	for (i = 0; i < 500; i++) {
				841	debug->address[1] = gpu_read(gpu, VIVS_FE_DMA_ADDRESS);
				842	debug->state[1] = gpu_read(gpu, VIVS_FE_DMA_DEBUG_STATE);
				843
				844	if (debug->address[0] != debug->address[1])
				845	break;
				846
				847	if (debug->state[0] != debug->state[1])
				848	break;
				849	}
				850	}
				851
				852	int etnaviv_gpu_debugfs(struct etnaviv_gpu gpu, struct seq_file m)
				853	{
				854	struct dma_debug debug;
				855	u32 dma_lo, dma_hi, axi, idle;
				856	int ret;
				857
				858	seq_printf(m, "%s Status:\n", dev_name(gpu->dev));
				859
				860	ret = pm_runtime_get_sync(gpu->dev);
				861	if (ret < 0)
				862	goto pm_put;
				863
				864	dma_lo = gpu_read(gpu, VIVS_FE_DMA_LOW);
				865	dma_hi = gpu_read(gpu, VIVS_FE_DMA_HIGH);
				866	axi = gpu_read(gpu, VIVS_HI_AXI_STATUS);
				867	idle = gpu_read(gpu, VIVS_HI_IDLE_STATE);
				868
				869	verify_dma(gpu, &debug);
				870
				871	seq_puts(m, "\tfeatures\n");
				872	seq_printf(m, "\t major_features: 0x%08x\n",
				873	gpu->identity.features);
				874	seq_printf(m, "\t minor_features0: 0x%08x\n",
				875	gpu->identity.minor_features0);
				876	seq_printf(m, "\t minor_features1: 0x%08x\n",
				877	gpu->identity.minor_features1);
				878	seq_printf(m, "\t minor_features2: 0x%08x\n",
				879	gpu->identity.minor_features2);
				880	seq_printf(m, "\t minor_features3: 0x%08x\n",
				881	gpu->identity.minor_features3);
				882	seq_printf(m, "\t minor_features4: 0x%08x\n",
				883	gpu->identity.minor_features4);
				884	seq_printf(m, "\t minor_features5: 0x%08x\n",
				885	gpu->identity.minor_features5);
				886	seq_printf(m, "\t minor_features6: 0x%08x\n",
				887	gpu->identity.minor_features6);
				888	seq_printf(m, "\t minor_features7: 0x%08x\n",
				889	gpu->identity.minor_features7);
				890	seq_printf(m, "\t minor_features8: 0x%08x\n",
				891	gpu->identity.minor_features8);
				892	seq_printf(m, "\t minor_features9: 0x%08x\n",
				893	gpu->identity.minor_features9);
				894	seq_printf(m, "\t minor_features10: 0x%08x\n",
				895	gpu->identity.minor_features10);
				896	seq_printf(m, "\t minor_features11: 0x%08x\n",
				897	gpu->identity.minor_features11);
				898
				899	seq_puts(m, "\tspecs\n");
				900	seq_printf(m, "\t stream_count: %d\n",
				901	gpu->identity.stream_count);
				902	seq_printf(m, "\t register_max: %d\n",
				903	gpu->identity.register_max);
				904	seq_printf(m, "\t thread_count: %d\n",
				905	gpu->identity.thread_count);
				906	seq_printf(m, "\t vertex_cache_size: %d\n",
				907	gpu->identity.vertex_cache_size);
				908	seq_printf(m, "\t shader_core_count: %d\n",
				909	gpu->identity.shader_core_count);
				910	seq_printf(m, "\t pixel_pipes: %d\n",
				911	gpu->identity.pixel_pipes);
				912	seq_printf(m, "\t vertex_output_buffer_size: %d\n",
				913	gpu->identity.vertex_output_buffer_size);
				914	seq_printf(m, "\t buffer_size: %d\n",
				915	gpu->identity.buffer_size);
				916	seq_printf(m, "\t instruction_count: %d\n",
				917	gpu->identity.instruction_count);
				918	seq_printf(m, "\t num_constants: %d\n",
				919	gpu->identity.num_constants);
				920	seq_printf(m, "\t varyings_count: %d\n",
				921	gpu->identity.varyings_count);
				922
				923	seq_printf(m, "\taxi: 0x%08x\n", axi);
				924	seq_printf(m, "\tidle: 0x%08x\n", idle);
				925	idle \|= ~gpu->idle_mask & ~VIVS_HI_IDLE_STATE_AXI_LP;
				926	if ((idle & VIVS_HI_IDLE_STATE_FE) == 0)
				927	seq_puts(m, "\t FE is not idle\n");
				928	if ((idle & VIVS_HI_IDLE_STATE_DE) == 0)
				929	seq_puts(m, "\t DE is not idle\n");
				930	if ((idle & VIVS_HI_IDLE_STATE_PE) == 0)
				931	seq_puts(m, "\t PE is not idle\n");
				932	if ((idle & VIVS_HI_IDLE_STATE_SH) == 0)
				933	seq_puts(m, "\t SH is not idle\n");
				934	if ((idle & VIVS_HI_IDLE_STATE_PA) == 0)
				935	seq_puts(m, "\t PA is not idle\n");
				936	if ((idle & VIVS_HI_IDLE_STATE_SE) == 0)
				937	seq_puts(m, "\t SE is not idle\n");
				938	if ((idle & VIVS_HI_IDLE_STATE_RA) == 0)
				939	seq_puts(m, "\t RA is not idle\n");
				940	if ((idle & VIVS_HI_IDLE_STATE_TX) == 0)
				941	seq_puts(m, "\t TX is not idle\n");
				942	if ((idle & VIVS_HI_IDLE_STATE_VG) == 0)
				943	seq_puts(m, "\t VG is not idle\n");
				944	if ((idle & VIVS_HI_IDLE_STATE_IM) == 0)
				945	seq_puts(m, "\t IM is not idle\n");
				946	if ((idle & VIVS_HI_IDLE_STATE_FP) == 0)
				947	seq_puts(m, "\t FP is not idle\n");
				948	if ((idle & VIVS_HI_IDLE_STATE_TS) == 0)
				949	seq_puts(m, "\t TS is not idle\n");
				950	if (idle & VIVS_HI_IDLE_STATE_AXI_LP)
				951	seq_puts(m, "\t AXI low power mode\n");
				952
				953	if (gpu->identity.features & chipFeatures_DEBUG_MODE) {
				954	u32 read0 = gpu_read(gpu, VIVS_MC_DEBUG_READ0);
				955	u32 read1 = gpu_read(gpu, VIVS_MC_DEBUG_READ1);
				956	u32 write = gpu_read(gpu, VIVS_MC_DEBUG_WRITE);
				957
				958	seq_puts(m, "\tMC\n");
				959	seq_printf(m, "\t read0: 0x%08x\n", read0);
				960	seq_printf(m, "\t read1: 0x%08x\n", read1);
				961	seq_printf(m, "\t write: 0x%08x\n", write);
				962	}
				963
				964	seq_puts(m, "\tDMA ");
				965
				966	if (debug.address[0] == debug.address[1] &&
				967	debug.state[0] == debug.state[1]) {
				968	seq_puts(m, "seems to be stuck\n");
				969	} else if (debug.address[0] == debug.address[1]) {
				970	seq_puts(m, "address is constant\n");
				971	} else {
				972	seq_puts(m, "is running\n");
				973	}
				974
				975	seq_printf(m, "\t address 0: 0x%08x\n", debug.address[0]);
				976	seq_printf(m, "\t address 1: 0x%08x\n", debug.address[1]);
				977	seq_printf(m, "\t state 0: 0x%08x\n", debug.state[0]);
				978	seq_printf(m, "\t state 1: 0x%08x\n", debug.state[1]);
				979	seq_printf(m, "\t last fetch 64 bit word: 0x%08x 0x%08x\n",
				980	dma_lo, dma_hi);
				981
				982	ret = 0;
				983
				984	pm_runtime_mark_last_busy(gpu->dev);
				985	pm_put:
				986	pm_runtime_put_autosuspend(gpu->dev);
				987
				988	return ret;
				989	}
				990	#endif
				991
				992	void etnaviv_gpu_recover_hang(struct etnaviv_gpu *gpu)
				993	{
				994	unsigned int i = 0;
				995
				996	dev_err(gpu->dev, "recover hung GPU!\n");
				997
				998	if (pm_runtime_get_sync(gpu->dev) < 0)
				999	goto pm_put;
				1000
				1001	mutex_lock(&gpu->lock);
				1002
				1003	etnaviv_hw_reset(gpu);
				1004
				1005	/* complete all events, the GPU won't do it after the reset */
				1006	spin_lock(&gpu->event_spinlock);
				1007	for_each_set_bit_from(i, gpu->event_bitmap, ETNA_NR_EVENTS)
				1008	complete(&gpu->event_free);
				1009	bitmap_zero(gpu->event_bitmap, ETNA_NR_EVENTS);
				1010	spin_unlock(&gpu->event_spinlock);
				1011
				1012	etnaviv_gpu_hw_init(gpu);
				1013
				1014	mutex_unlock(&gpu->lock);
				1015	pm_runtime_mark_last_busy(gpu->dev);
				1016	pm_put:
				1017	pm_runtime_put_autosuspend(gpu->dev);
				1018	}
				1019
				1020	/* fence object management */
				1021	struct etnaviv_fence {
				1022	struct etnaviv_gpu *gpu;
				1023	struct dma_fence base;
				1024	};
				1025
				1026	static inline struct etnaviv_fence to_etnaviv_fence(struct dma_fence fence)
				1027	{
				1028	return container_of(fence, struct etnaviv_fence, base);
				1029	}
				1030
				1031	static const char etnaviv_fence_get_driver_name(struct dma_fence fence)
				1032	{
				1033	return "etnaviv";
				1034	}
				1035
				1036	static const char etnaviv_fence_get_timeline_name(struct dma_fence fence)
				1037	{
				1038	struct etnaviv_fence *f = to_etnaviv_fence(fence);
				1039
				1040	return dev_name(f->gpu->dev);
				1041	}
				1042
				1043	static bool etnaviv_fence_signaled(struct dma_fence *fence)
				1044	{
				1045	struct etnaviv_fence *f = to_etnaviv_fence(fence);
				1046
				1047	return (s32)(f->gpu->completed_fence - f->base.seqno) >= 0;
				1048	}
				1049
				1050	static void etnaviv_fence_release(struct dma_fence *fence)
				1051	{
				1052	struct etnaviv_fence *f = to_etnaviv_fence(fence);
				1053
				1054	kfree_rcu(f, base.rcu);
				1055	}
				1056
				1057	static const struct dma_fence_ops etnaviv_fence_ops = {
				1058	.get_driver_name = etnaviv_fence_get_driver_name,
				1059	.get_timeline_name = etnaviv_fence_get_timeline_name,
				1060	.signaled = etnaviv_fence_signaled,
				1061	.release = etnaviv_fence_release,
				1062	};
				1063
				1064	static struct dma_fence etnaviv_gpu_fence_alloc(struct etnaviv_gpu gpu)
				1065	{
				1066	struct etnaviv_fence *f;
				1067
				1068	/*
				1069	* GPU lock must already be held, otherwise fence completion order might
				1070	* not match the seqno order assigned here.
				1071	*/
				1072	lockdep_assert_held(&gpu->lock);
				1073
				1074	f = kzalloc(sizeof(*f), GFP_KERNEL);
				1075	if (!f)
				1076	return NULL;
				1077
				1078	f->gpu = gpu;
				1079
				1080	dma_fence_init(&f->base, &etnaviv_fence_ops, &gpu->fence_spinlock,
				1081	gpu->fence_context, ++gpu->next_fence);
				1082
				1083	return &f->base;
				1084	}
				1085
				1086	/* returns true if fence a comes after fence b */
				1087	static inline bool fence_after(u32 a, u32 b)
				1088	{
				1089	return (s32)(a - b) > 0;
				1090	}
				1091
				1092	/*
				1093	* event management:
				1094	*/
				1095
				1096	static int event_alloc(struct etnaviv_gpu *gpu, unsigned nr_events,
				1097	unsigned int *events)
				1098	{
				1099	unsigned long timeout = msecs_to_jiffies(10 * 10000);
				1100	unsigned i, acquired = 0;
				1101
				1102	for (i = 0; i < nr_events; i++) {
				1103	unsigned long ret;
				1104
				1105	ret = wait_for_completion_timeout(&gpu->event_free, timeout);
				1106
				1107	if (!ret) {
				1108	dev_err(gpu->dev, "wait_for_completion_timeout failed");
				1109	goto out;
				1110	}
				1111
				1112	acquired++;
				1113	timeout = ret;
				1114	}
				1115
				1116	spin_lock(&gpu->event_spinlock);
				1117
				1118	for (i = 0; i < nr_events; i++) {
				1119	int event = find_first_zero_bit(gpu->event_bitmap, ETNA_NR_EVENTS);
				1120
				1121	events[i] = event;
				1122	memset(&gpu->event[event], 0, sizeof(struct etnaviv_event));
				1123	set_bit(event, gpu->event_bitmap);
				1124	}
				1125
				1126	spin_unlock(&gpu->event_spinlock);
				1127
				1128	return 0;
				1129
				1130	out:
				1131	for (i = 0; i < acquired; i++)
				1132	complete(&gpu->event_free);
				1133
				1134	return -EBUSY;
				1135	}
				1136
				1137	static void event_free(struct etnaviv_gpu *gpu, unsigned int event)
				1138	{
				1139	if (!test_bit(event, gpu->event_bitmap)) {
				1140	dev_warn(gpu->dev, "event %u is already marked as free",
				1141	event);
				1142	} else {
				1143	clear_bit(event, gpu->event_bitmap);
				1144	complete(&gpu->event_free);
				1145	}
				1146	}
				1147
				1148	/*
				1149	* Cmdstream submission/retirement:
				1150	*/
				1151	int etnaviv_gpu_wait_fence_interruptible(struct etnaviv_gpu *gpu,
				1152	u32 id, struct drm_etnaviv_timespec *timeout)
				1153	{
				1154	struct dma_fence *fence;
				1155	int ret;
				1156
				1157	/*
				1158	* Look up the fence and take a reference. We might still find a fence
				1159	* whose refcount has already dropped to zero. dma_fence_get_rcu
				1160	* pretends we didn't find a fence in that case.
				1161	*/
				1162	rcu_read_lock();
				1163	fence = idr_find(&gpu->fence_idr, id);
				1164	if (fence)
				1165	fence = dma_fence_get_rcu(fence);
				1166	rcu_read_unlock();
				1167
				1168	if (!fence)
				1169	return 0;
				1170
				1171	if (!timeout) {
				1172	/* No timeout was requested: just test for completion */
				1173	ret = dma_fence_is_signaled(fence) ? 0 : -EBUSY;
				1174	} else {
				1175	unsigned long remaining = etnaviv_timeout_to_jiffies(timeout);
				1176
				1177	ret = dma_fence_wait_timeout(fence, true, remaining);
				1178	if (ret == 0)
				1179	ret = -ETIMEDOUT;
				1180	else if (ret != -ERESTARTSYS)
				1181	ret = 0;
				1182
				1183	}
				1184
				1185	dma_fence_put(fence);
				1186	return ret;
				1187	}
				1188
				1189	/*
				1190	* Wait for an object to become inactive. This, on it's own, is not race
				1191	* free: the object is moved by the scheduler off the active list, and
				1192	* then the iova is put. Moreover, the object could be re-submitted just
				1193	* after we notice that it's become inactive.
				1194	*
				1195	* Although the retirement happens under the gpu lock, we don't want to hold
				1196	* that lock in this function while waiting.
				1197	*/
				1198	int etnaviv_gpu_wait_obj_inactive(struct etnaviv_gpu *gpu,
				1199	struct etnaviv_gem_object *etnaviv_obj,
				1200	struct drm_etnaviv_timespec *timeout)
				1201	{
				1202	unsigned long remaining;
				1203	long ret;
				1204
				1205	if (!timeout)
				1206	return !is_active(etnaviv_obj) ? 0 : -EBUSY;
				1207
				1208	remaining = etnaviv_timeout_to_jiffies(timeout);
				1209
				1210	ret = wait_event_interruptible_timeout(gpu->fence_event,
				1211	!is_active(etnaviv_obj),
				1212	remaining);
				1213	if (ret > 0)
				1214	return 0;
				1215	else if (ret == -ERESTARTSYS)
				1216	return -ERESTARTSYS;
				1217	else
				1218	return -ETIMEDOUT;
				1219	}
				1220
				1221	static void sync_point_perfmon_sample(struct etnaviv_gpu *gpu,
				1222	struct etnaviv_event *event, unsigned int flags)
				1223	{
				1224	const struct etnaviv_gem_submit *submit = event->submit;
				1225	unsigned int i;
				1226
				1227	for (i = 0; i < submit->nr_pmrs; i++) {
				1228	const struct etnaviv_perfmon_request *pmr = submit->pmrs + i;
				1229
				1230	if (pmr->flags == flags)
				1231	etnaviv_perfmon_process(gpu, pmr, submit->exec_state);
				1232	}
				1233	}
				1234
				1235	static void sync_point_perfmon_sample_pre(struct etnaviv_gpu *gpu,
				1236	struct etnaviv_event *event)
				1237	{
				1238	u32 val;
				1239
				1240	mutex_lock(&gpu->lock);
				1241
				1242	/* disable clock gating */
				1243	val = gpu_read_power(gpu, VIVS_PM_POWER_CONTROLS);
				1244	val &= ~VIVS_PM_POWER_CONTROLS_ENABLE_MODULE_CLOCK_GATING;
				1245	gpu_write_power(gpu, VIVS_PM_POWER_CONTROLS, val);
				1246
				1247	/* enable debug register */
				1248	val = gpu_read(gpu, VIVS_HI_CLOCK_CONTROL);
				1249	val &= ~VIVS_HI_CLOCK_CONTROL_DISABLE_DEBUG_REGISTERS;
				1250	gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, val);
				1251
				1252	sync_point_perfmon_sample(gpu, event, ETNA_PM_PROCESS_PRE);
				1253
				1254	mutex_unlock(&gpu->lock);
				1255	}
				1256
				1257	static void sync_point_perfmon_sample_post(struct etnaviv_gpu *gpu,
				1258	struct etnaviv_event *event)
				1259	{
				1260	const struct etnaviv_gem_submit *submit = event->submit;
				1261	unsigned int i;
				1262	u32 val;
				1263
				1264	mutex_lock(&gpu->lock);
				1265
				1266	sync_point_perfmon_sample(gpu, event, ETNA_PM_PROCESS_POST);
				1267
				1268	/* disable debug register */
				1269	val = gpu_read(gpu, VIVS_HI_CLOCK_CONTROL);
				1270	val \|= VIVS_HI_CLOCK_CONTROL_DISABLE_DEBUG_REGISTERS;
				1271	gpu_write(gpu, VIVS_HI_CLOCK_CONTROL, val);
				1272
				1273	/* enable clock gating */
				1274	val = gpu_read_power(gpu, VIVS_PM_POWER_CONTROLS);
				1275	val \|= VIVS_PM_POWER_CONTROLS_ENABLE_MODULE_CLOCK_GATING;
				1276	gpu_write_power(gpu, VIVS_PM_POWER_CONTROLS, val);
				1277
				1278	mutex_unlock(&gpu->lock);
				1279
				1280	for (i = 0; i < submit->nr_pmrs; i++) {
				1281	const struct etnaviv_perfmon_request *pmr = submit->pmrs + i;
				1282
				1283	*pmr->bo_vma = pmr->sequence;
				1284	}
				1285	}
				1286
				1287
				1288	/* add bo's to gpu's ring, and kick gpu: */
				1289	struct dma_fence etnaviv_gpu_submit(struct etnaviv_gem_submit submit)
				1290	{
				1291	struct etnaviv_gpu *gpu = submit->gpu;
				1292	struct dma_fence *gpu_fence;
				1293	unsigned int i, nr_events = 1, event[3];
				1294	int ret;
				1295
				1296	if (!submit->runtime_resumed) {
				1297	ret = pm_runtime_get_sync(gpu->dev);
				1298	if (ret < 0) {
				1299	pm_runtime_put_noidle(gpu->dev);
				1300	return NULL;
				1301	}
				1302	submit->runtime_resumed = true;
				1303	}
				1304
				1305	/*
				1306	* if there are performance monitor requests we need to have
				1307	* - a sync point to re-configure gpu and process ETNA_PM_PROCESS_PRE
				1308	* requests.
				1309	* - a sync point to re-configure gpu, process ETNA_PM_PROCESS_POST requests
				1310	* and update the sequence number for userspace.
				1311	*/
				1312	if (submit->nr_pmrs)
				1313	nr_events = 3;
				1314
				1315	ret = event_alloc(gpu, nr_events, event);
				1316	if (ret) {
				1317	DRM_ERROR("no free events\n");
				1318	pm_runtime_put_noidle(gpu->dev);
				1319	return NULL;
				1320	}
				1321
				1322	mutex_lock(&gpu->lock);
				1323
				1324	gpu_fence = etnaviv_gpu_fence_alloc(gpu);
				1325	if (!gpu_fence) {
				1326	for (i = 0; i < nr_events; i++)
				1327	event_free(gpu, event[i]);
				1328
				1329	goto out_unlock;
				1330	}
				1331
				1332	if (!gpu->fe_running)
				1333	etnaviv_gpu_start_fe_idleloop(gpu, submit->mmu_context);
				1334
				1335	if (submit->prev_mmu_context)
				1336	etnaviv_iommu_context_put(submit->prev_mmu_context);
				1337	submit->prev_mmu_context = etnaviv_iommu_context_get(gpu->mmu_context);
				1338
				1339	if (submit->nr_pmrs) {
				1340	gpu->event[event[1]].sync_point = &sync_point_perfmon_sample_pre;
				1341	kref_get(&submit->refcount);
				1342	gpu->event[event[1]].submit = submit;
				1343	etnaviv_sync_point_queue(gpu, event[1]);
				1344	}
				1345
				1346	gpu->event[event[0]].fence = gpu_fence;
				1347	submit->cmdbuf.user_size = submit->cmdbuf.size - 8;
				1348	etnaviv_buffer_queue(gpu, submit->exec_state, submit->mmu_context,
				1349	event[0], &submit->cmdbuf);
				1350
				1351	if (submit->nr_pmrs) {
				1352	gpu->event[event[2]].sync_point = &sync_point_perfmon_sample_post;
				1353	kref_get(&submit->refcount);
				1354	gpu->event[event[2]].submit = submit;
				1355	etnaviv_sync_point_queue(gpu, event[2]);
				1356	}
				1357
				1358	out_unlock:
				1359	mutex_unlock(&gpu->lock);
				1360
				1361	return gpu_fence;
				1362	}
				1363
				1364	static void sync_point_worker(struct work_struct *work)
				1365	{
				1366	struct etnaviv_gpu *gpu = container_of(work, struct etnaviv_gpu,
				1367	sync_point_work);
				1368	struct etnaviv_event *event = &gpu->event[gpu->sync_point_event];
				1369	u32 addr = gpu_read(gpu, VIVS_FE_DMA_ADDRESS);
				1370
				1371	event->sync_point(gpu, event);
				1372	etnaviv_submit_put(event->submit);
				1373	event_free(gpu, gpu->sync_point_event);
				1374
				1375	/* restart FE last to avoid GPU and IRQ racing against this worker */
				1376	etnaviv_gpu_start_fe(gpu, addr + 2, 2);
				1377	}
				1378
				1379	static void dump_mmu_fault(struct etnaviv_gpu *gpu)
				1380	{
				1381	u32 status_reg, status;
				1382	int i;
				1383
				1384	if (gpu->sec_mode == ETNA_SEC_NONE)
				1385	status_reg = VIVS_MMUv2_STATUS;
				1386	else
				1387	status_reg = VIVS_MMUv2_SEC_STATUS;
				1388
				1389	status = gpu_read(gpu, status_reg);
				1390	dev_err_ratelimited(gpu->dev, "MMU fault status 0x%08x\n", status);
				1391
				1392	for (i = 0; i < 4; i++) {
				1393	u32 address_reg;
				1394
				1395	if (!(status & (VIVS_MMUv2_STATUS_EXCEPTION0__MASK << (i * 4))))
				1396	continue;
				1397
				1398	if (gpu->sec_mode == ETNA_SEC_NONE)
				1399	address_reg = VIVS_MMUv2_EXCEPTION_ADDR(i);
				1400	else
				1401	address_reg = VIVS_MMUv2_SEC_EXCEPTION_ADDR;
				1402
				1403	dev_err_ratelimited(gpu->dev, "MMU %d fault addr 0x%08x\n", i,
				1404	gpu_read(gpu, address_reg));
				1405	}
				1406	}
				1407
				1408	static irqreturn_t irq_handler(int irq, void *data)
				1409	{
				1410	struct etnaviv_gpu *gpu = data;
				1411	irqreturn_t ret = IRQ_NONE;
				1412
				1413	u32 intr = gpu_read(gpu, VIVS_HI_INTR_ACKNOWLEDGE);
				1414
				1415	if (intr != 0) {
				1416	int event;
				1417
				1418	pm_runtime_mark_last_busy(gpu->dev);
				1419
				1420	dev_dbg(gpu->dev, "intr 0x%08x\n", intr);
				1421
				1422	if (intr & VIVS_HI_INTR_ACKNOWLEDGE_AXI_BUS_ERROR) {
				1423	dev_err(gpu->dev, "AXI bus error\n");
				1424	intr &= ~VIVS_HI_INTR_ACKNOWLEDGE_AXI_BUS_ERROR;
				1425	}
				1426
				1427	if (intr & VIVS_HI_INTR_ACKNOWLEDGE_MMU_EXCEPTION) {
				1428	dump_mmu_fault(gpu);
				1429	intr &= ~VIVS_HI_INTR_ACKNOWLEDGE_MMU_EXCEPTION;
				1430	}
				1431
				1432	while ((event = ffs(intr)) != 0) {
				1433	struct dma_fence *fence;
				1434
				1435	event -= 1;
				1436
				1437	intr &= ~(1 << event);
				1438
				1439	dev_dbg(gpu->dev, "event %u\n", event);
				1440
				1441	if (gpu->event[event].sync_point) {
				1442	gpu->sync_point_event = event;
				1443	queue_work(gpu->wq, &gpu->sync_point_work);
				1444	}
				1445
				1446	fence = gpu->event[event].fence;
				1447	if (!fence)
				1448	continue;
				1449
				1450	gpu->event[event].fence = NULL;
				1451
				1452	/*
				1453	* Events can be processed out of order. Eg,
				1454	* - allocate and queue event 0
				1455	* - allocate event 1
				1456	* - event 0 completes, we process it
				1457	* - allocate and queue event 0
				1458	* - event 1 and event 0 complete
				1459	* we can end up processing event 0 first, then 1.
				1460	*/
				1461	if (fence_after(fence->seqno, gpu->completed_fence))
				1462	gpu->completed_fence = fence->seqno;
				1463	dma_fence_signal(fence);
				1464
				1465	event_free(gpu, event);
				1466	}
				1467
				1468	ret = IRQ_HANDLED;
				1469	}
				1470
				1471	return ret;
				1472	}
				1473
				1474	static int etnaviv_gpu_clk_enable(struct etnaviv_gpu *gpu)
				1475	{
				1476	int ret;
				1477
				1478	if (gpu->clk_reg) {
				1479	ret = clk_prepare_enable(gpu->clk_reg);
				1480	if (ret)
				1481	return ret;
				1482	}
				1483
				1484	if (gpu->clk_bus) {
				1485	ret = clk_prepare_enable(gpu->clk_bus);
				1486	if (ret)
				1487	goto disable_clk_reg;
				1488	}
				1489
				1490	if (gpu->clk_core) {
				1491	ret = clk_prepare_enable(gpu->clk_core);
				1492	if (ret)
				1493	goto disable_clk_bus;
				1494	}
				1495
				1496	if (gpu->clk_shader) {
				1497	ret = clk_prepare_enable(gpu->clk_shader);
				1498	if (ret)
				1499	goto disable_clk_core;
				1500	}
				1501
				1502	return 0;
				1503
				1504	disable_clk_core:
				1505	if (gpu->clk_core)
				1506	clk_disable_unprepare(gpu->clk_core);
				1507	disable_clk_bus:
				1508	if (gpu->clk_bus)
				1509	clk_disable_unprepare(gpu->clk_bus);
				1510	disable_clk_reg:
				1511	if (gpu->clk_reg)
				1512	clk_disable_unprepare(gpu->clk_reg);
				1513
				1514	return ret;
				1515	}
				1516
				1517	static int etnaviv_gpu_clk_disable(struct etnaviv_gpu *gpu)
				1518	{
				1519	if (gpu->clk_shader)
				1520	clk_disable_unprepare(gpu->clk_shader);
				1521	if (gpu->clk_core)
				1522	clk_disable_unprepare(gpu->clk_core);
				1523	if (gpu->clk_bus)
				1524	clk_disable_unprepare(gpu->clk_bus);
				1525	if (gpu->clk_reg)
				1526	clk_disable_unprepare(gpu->clk_reg);
				1527
				1528	return 0;
				1529	}
				1530
				1531	int etnaviv_gpu_wait_idle(struct etnaviv_gpu *gpu, unsigned int timeout_ms)
				1532	{
				1533	unsigned long timeout = jiffies + msecs_to_jiffies(timeout_ms);
				1534
				1535	do {
				1536	u32 idle = gpu_read(gpu, VIVS_HI_IDLE_STATE);
				1537
				1538	if ((idle & gpu->idle_mask) == gpu->idle_mask)
				1539	return 0;
				1540
				1541	if (time_is_before_jiffies(timeout)) {
				1542	dev_warn(gpu->dev,
				1543	"timed out waiting for idle: idle=0x%x\n",
				1544	idle);
				1545	return -ETIMEDOUT;
				1546	}
				1547
				1548	udelay(5);
				1549	} while (1);
				1550	}
				1551
				1552	static int etnaviv_gpu_hw_suspend(struct etnaviv_gpu *gpu)
				1553	{
				1554	if (gpu->initialized && gpu->fe_running) {
				1555	/* Replace the last WAIT with END */
				1556	mutex_lock(&gpu->lock);
				1557	etnaviv_buffer_end(gpu);
				1558	mutex_unlock(&gpu->lock);
				1559
				1560	/*
				1561	* We know that only the FE is busy here, this should
				1562	* happen quickly (as the WAIT is only 200 cycles). If
				1563	* we fail, just warn and continue.
				1564	*/
				1565	etnaviv_gpu_wait_idle(gpu, 100);
				1566
				1567	gpu->fe_running = false;
				1568	}
				1569
				1570	gpu->exec_state = -1;
				1571
				1572	return etnaviv_gpu_clk_disable(gpu);
				1573	}
				1574
				1575	#ifdef CONFIG_PM
				1576	static int etnaviv_gpu_hw_resume(struct etnaviv_gpu *gpu)
				1577	{
				1578	int ret;
				1579
				1580	ret = mutex_lock_killable(&gpu->lock);
				1581	if (ret)
				1582	return ret;
				1583
				1584	etnaviv_gpu_update_clock(gpu);
				1585	etnaviv_gpu_hw_init(gpu);
				1586
				1587	mutex_unlock(&gpu->lock);
				1588
				1589	return 0;
				1590	}
				1591	#endif
				1592
				1593	static int
				1594	etnaviv_gpu_cooling_get_max_state(struct thermal_cooling_device *cdev,
				1595	unsigned long *state)
				1596	{
				1597	*state = 6;
				1598
				1599	return 0;
				1600	}
				1601
				1602	static int
				1603	etnaviv_gpu_cooling_get_cur_state(struct thermal_cooling_device *cdev,
				1604	unsigned long *state)
				1605	{
				1606	struct etnaviv_gpu *gpu = cdev->devdata;
				1607
				1608	*state = gpu->freq_scale;
				1609
				1610	return 0;
				1611	}
				1612
				1613	static int
				1614	etnaviv_gpu_cooling_set_cur_state(struct thermal_cooling_device *cdev,
				1615	unsigned long state)
				1616	{
				1617	struct etnaviv_gpu *gpu = cdev->devdata;
				1618
				1619	mutex_lock(&gpu->lock);
				1620	gpu->freq_scale = state;
				1621	if (!pm_runtime_suspended(gpu->dev))
				1622	etnaviv_gpu_update_clock(gpu);
				1623	mutex_unlock(&gpu->lock);
				1624
				1625	return 0;
				1626	}
				1627
				1628	static struct thermal_cooling_device_ops cooling_ops = {
				1629	.get_max_state = etnaviv_gpu_cooling_get_max_state,
				1630	.get_cur_state = etnaviv_gpu_cooling_get_cur_state,
				1631	.set_cur_state = etnaviv_gpu_cooling_set_cur_state,
				1632	};
				1633
				1634	static int etnaviv_gpu_bind(struct device dev, struct device master,
				1635	void *data)
				1636	{
				1637	struct drm_device *drm = data;
				1638	struct etnaviv_drm_private *priv = drm->dev_private;
				1639	struct etnaviv_gpu *gpu = dev_get_drvdata(dev);
				1640	int ret;
				1641
				1642	if (IS_ENABLED(CONFIG_DRM_ETNAVIV_THERMAL)) {
				1643	gpu->cooling = thermal_of_cooling_device_register(dev->of_node,
				1644	(char *)dev_name(dev), gpu, &cooling_ops);
				1645	if (IS_ERR(gpu->cooling))
				1646	return PTR_ERR(gpu->cooling);
				1647	}
				1648
				1649	gpu->wq = alloc_ordered_workqueue(dev_name(dev), 0);
				1650	if (!gpu->wq) {
				1651	ret = -ENOMEM;
				1652	goto out_thermal;
				1653	}
				1654
				1655	ret = etnaviv_sched_init(gpu);
				1656	if (ret)
				1657	goto out_workqueue;
				1658
				1659	#ifdef CONFIG_PM
				1660	ret = pm_runtime_get_sync(gpu->dev);
				1661	#else
				1662	ret = etnaviv_gpu_clk_enable(gpu);
				1663	#endif
				1664	if (ret < 0)
				1665	goto out_sched;
				1666
				1667
				1668	gpu->drm = drm;
				1669	gpu->fence_context = dma_fence_context_alloc(1);
				1670	idr_init(&gpu->fence_idr);
				1671	spin_lock_init(&gpu->fence_spinlock);
				1672
				1673	INIT_WORK(&gpu->sync_point_work, sync_point_worker);
				1674	init_waitqueue_head(&gpu->fence_event);
				1675
				1676	priv->gpu[priv->num_gpus++] = gpu;
				1677
				1678	pm_runtime_mark_last_busy(gpu->dev);
				1679	pm_runtime_put_autosuspend(gpu->dev);
				1680
				1681	return 0;
				1682
				1683	out_sched:
				1684	etnaviv_sched_fini(gpu);
				1685
				1686	out_workqueue:
				1687	destroy_workqueue(gpu->wq);
				1688
				1689	out_thermal:
				1690	if (IS_ENABLED(CONFIG_DRM_ETNAVIV_THERMAL))
				1691	thermal_cooling_device_unregister(gpu->cooling);
				1692
				1693	return ret;
				1694	}
				1695
				1696	static void etnaviv_gpu_unbind(struct device dev, struct device master,
				1697	void *data)
				1698	{
				1699	struct etnaviv_gpu *gpu = dev_get_drvdata(dev);
				1700
				1701	DBG("%s", dev_name(gpu->dev));
				1702
				1703	flush_workqueue(gpu->wq);
				1704	destroy_workqueue(gpu->wq);
				1705
				1706	etnaviv_sched_fini(gpu);
				1707
				1708	#ifdef CONFIG_PM
				1709	pm_runtime_get_sync(gpu->dev);
				1710	pm_runtime_put_sync_suspend(gpu->dev);
				1711	#else
				1712	etnaviv_gpu_hw_suspend(gpu);
				1713	#endif
				1714
				1715	if (gpu->mmu_context)
				1716	etnaviv_iommu_context_put(gpu->mmu_context);
				1717
				1718	if (gpu->initialized) {
				1719	etnaviv_cmdbuf_free(&gpu->buffer);
				1720	etnaviv_iommu_global_fini(gpu);
				1721	gpu->initialized = false;
				1722	}
				1723
				1724	gpu->drm = NULL;
				1725	idr_destroy(&gpu->fence_idr);
				1726
				1727	if (IS_ENABLED(CONFIG_DRM_ETNAVIV_THERMAL))
				1728	thermal_cooling_device_unregister(gpu->cooling);
				1729	gpu->cooling = NULL;
				1730	}
				1731
				1732	static const struct component_ops gpu_ops = {
				1733	.bind = etnaviv_gpu_bind,
				1734	.unbind = etnaviv_gpu_unbind,
				1735	};
				1736
				1737	static const struct of_device_id etnaviv_gpu_match[] = {
				1738	{
				1739	.compatible = "vivante,gc"
				1740	},
				1741	{ /* sentinel */ }
				1742	};
				1743	MODULE_DEVICE_TABLE(of, etnaviv_gpu_match);
				1744
				1745	static int etnaviv_gpu_platform_probe(struct platform_device *pdev)
				1746	{
				1747	struct device *dev = &pdev->dev;
				1748	struct etnaviv_gpu *gpu;
				1749	int err;
				1750
				1751	gpu = devm_kzalloc(dev, sizeof(*gpu), GFP_KERNEL);
				1752	if (!gpu)
				1753	return -ENOMEM;
				1754
				1755	gpu->dev = &pdev->dev;
				1756	mutex_init(&gpu->lock);
				1757	mutex_init(&gpu->fence_lock);
				1758
				1759	/* Map registers: */
				1760	gpu->mmio = devm_platform_ioremap_resource(pdev, 0);
				1761	if (IS_ERR(gpu->mmio))
				1762	return PTR_ERR(gpu->mmio);
				1763
				1764	/* Get Interrupt: */
				1765	gpu->irq = platform_get_irq(pdev, 0);
				1766	if (gpu->irq < 0) {
				1767	dev_err(dev, "failed to get irq: %d\n", gpu->irq);
				1768	return gpu->irq;
				1769	}
				1770
				1771	err = devm_request_irq(&pdev->dev, gpu->irq, irq_handler, 0,
				1772	dev_name(gpu->dev), gpu);
				1773	if (err) {
				1774	dev_err(dev, "failed to request IRQ%u: %d\n", gpu->irq, err);
				1775	return err;
				1776	}
				1777
				1778	/* Get Clocks: */
				1779	gpu->clk_reg = devm_clk_get(&pdev->dev, "reg");
				1780	DBG("clk_reg: %p", gpu->clk_reg);
				1781	if (IS_ERR(gpu->clk_reg))
				1782	gpu->clk_reg = NULL;
				1783
				1784	gpu->clk_bus = devm_clk_get(&pdev->dev, "bus");
				1785	DBG("clk_bus: %p", gpu->clk_bus);
				1786	if (IS_ERR(gpu->clk_bus))
				1787	gpu->clk_bus = NULL;
				1788
				1789	gpu->clk_core = devm_clk_get(&pdev->dev, "core");
				1790	DBG("clk_core: %p", gpu->clk_core);
				1791	if (IS_ERR(gpu->clk_core))
				1792	gpu->clk_core = NULL;
				1793	gpu->base_rate_core = clk_get_rate(gpu->clk_core);
				1794
				1795	gpu->clk_shader = devm_clk_get(&pdev->dev, "shader");
				1796	DBG("clk_shader: %p", gpu->clk_shader);
				1797	if (IS_ERR(gpu->clk_shader))
				1798	gpu->clk_shader = NULL;
				1799	gpu->base_rate_shader = clk_get_rate(gpu->clk_shader);
				1800
				1801	/* TODO: figure out max mapped size */
				1802	dev_set_drvdata(dev, gpu);
				1803
				1804	/*
				1805	* We treat the device as initially suspended. The runtime PM
				1806	* autosuspend delay is rather arbitary: no measurements have
				1807	* yet been performed to determine an appropriate value.
				1808	*/
				1809	pm_runtime_use_autosuspend(gpu->dev);
				1810	pm_runtime_set_autosuspend_delay(gpu->dev, 200);
				1811	pm_runtime_enable(gpu->dev);
				1812
				1813	err = component_add(&pdev->dev, &gpu_ops);
				1814	if (err < 0) {
				1815	dev_err(&pdev->dev, "failed to register component: %d\n", err);
				1816	return err;
				1817	}
				1818
				1819	return 0;
				1820	}
				1821
				1822	static int etnaviv_gpu_platform_remove(struct platform_device *pdev)
				1823	{
				1824	component_del(&pdev->dev, &gpu_ops);
				1825	pm_runtime_disable(&pdev->dev);
				1826	return 0;
				1827	}
				1828
				1829	#ifdef CONFIG_PM
				1830	static int etnaviv_gpu_rpm_suspend(struct device *dev)
				1831	{
				1832	struct etnaviv_gpu *gpu = dev_get_drvdata(dev);
				1833	u32 idle, mask;
				1834
				1835	/* If there are any jobs in the HW queue, we're not idle */
				1836	if (atomic_read(&gpu->sched.hw_rq_count))
				1837	return -EBUSY;
				1838
				1839	/* Check whether the hardware (except FE) is idle */
				1840	mask = gpu->idle_mask & ~VIVS_HI_IDLE_STATE_FE;
				1841	idle = gpu_read(gpu, VIVS_HI_IDLE_STATE) & mask;
				1842	if (idle != mask)
				1843	return -EBUSY;
				1844
				1845	return etnaviv_gpu_hw_suspend(gpu);
				1846	}
				1847
				1848	static int etnaviv_gpu_rpm_resume(struct device *dev)
				1849	{
				1850	struct etnaviv_gpu *gpu = dev_get_drvdata(dev);
				1851	int ret;
				1852
				1853	ret = etnaviv_gpu_clk_enable(gpu);
				1854	if (ret)
				1855	return ret;
				1856
				1857	/* Re-initialise the basic hardware state */
				1858	if (gpu->drm && gpu->initialized) {
				1859	ret = etnaviv_gpu_hw_resume(gpu);
				1860	if (ret) {
				1861	etnaviv_gpu_clk_disable(gpu);
				1862	return ret;
				1863	}
				1864	}
				1865
				1866	return 0;
				1867	}
				1868	#endif
				1869
				1870	static const struct dev_pm_ops etnaviv_gpu_pm_ops = {
				1871	SET_RUNTIME_PM_OPS(etnaviv_gpu_rpm_suspend, etnaviv_gpu_rpm_resume,
				1872	NULL)
				1873	};
				1874
				1875	struct platform_driver etnaviv_gpu_driver = {
				1876	.driver = {
				1877	.name = "etnaviv-gpu",
				1878	.owner = THIS_MODULE,
				1879	.pm = &etnaviv_gpu_pm_ops,
				1880	.of_match_table = etnaviv_gpu_match,
				1881	},
				1882	.probe = etnaviv_gpu_platform_probe,
				1883	.remove = etnaviv_gpu_platform_remove,
				1884	.id_table = gpu_ids,
				1885	};