1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3  * Tegra host1x driver
4  *
5  * Copyright (c) 2010-2013, NVIDIA Corporation.
6  */
7 
8 #include <linux/clk.h>
9 #include <linux/delay.h>
10 #include <linux/dma-mapping.h>
11 #include <linux/io.h>
12 #include <linux/list.h>
13 #include <linux/module.h>
14 #include <linux/of.h>
15 #include <linux/of_platform.h>
16 #include <linux/platform_device.h>
17 #include <linux/pm_runtime.h>
18 #include <linux/slab.h>
19 
20 #include <soc/tegra/common.h>
21 
22 #define CREATE_TRACE_POINTS
23 #include <trace/events/host1x.h>
24 #undef CREATE_TRACE_POINTS
25 
26 #if IS_ENABLED(CONFIG_ARM_DMA_USE_IOMMU)
27 #include <asm/dma-iommu.h>
28 #endif
29 
30 #include "bus.h"
31 #include "channel.h"
32 #include "context.h"
33 #include "debug.h"
34 #include "dev.h"
35 #include "intr.h"
36 
37 #include "hw/host1x01.h"
38 #include "hw/host1x02.h"
39 #include "hw/host1x04.h"
40 #include "hw/host1x05.h"
41 #include "hw/host1x06.h"
42 #include "hw/host1x07.h"
43 #include "hw/host1x08.h"
44 
host1x_common_writel(struct host1x * host1x,u32 v,u32 r)45 void host1x_common_writel(struct host1x *host1x, u32 v, u32 r)
46 {
47 	writel(v, host1x->common_regs + r);
48 }
49 
host1x_hypervisor_writel(struct host1x * host1x,u32 v,u32 r)50 void host1x_hypervisor_writel(struct host1x *host1x, u32 v, u32 r)
51 {
52 	writel(v, host1x->hv_regs + r);
53 }
54 
host1x_hypervisor_readl(struct host1x * host1x,u32 r)55 u32 host1x_hypervisor_readl(struct host1x *host1x, u32 r)
56 {
57 	return readl(host1x->hv_regs + r);
58 }
59 
host1x_sync_writel(struct host1x * host1x,u32 v,u32 r)60 void host1x_sync_writel(struct host1x *host1x, u32 v, u32 r)
61 {
62 	void __iomem *sync_regs = host1x->regs + host1x->info->sync_offset;
63 
64 	writel(v, sync_regs + r);
65 }
66 
host1x_sync_readl(struct host1x * host1x,u32 r)67 u32 host1x_sync_readl(struct host1x *host1x, u32 r)
68 {
69 	void __iomem *sync_regs = host1x->regs + host1x->info->sync_offset;
70 
71 	return readl(sync_regs + r);
72 }
73 
host1x_ch_writel(struct host1x_channel * ch,u32 v,u32 r)74 void host1x_ch_writel(struct host1x_channel *ch, u32 v, u32 r)
75 {
76 	writel(v, ch->regs + r);
77 }
78 
host1x_ch_readl(struct host1x_channel * ch,u32 r)79 u32 host1x_ch_readl(struct host1x_channel *ch, u32 r)
80 {
81 	return readl(ch->regs + r);
82 }
83 
84 static const struct host1x_info host1x01_info = {
85 	.nb_channels = 8,
86 	.nb_pts = 32,
87 	.nb_mlocks = 16,
88 	.nb_bases = 8,
89 	.init = host1x01_init,
90 	.sync_offset = 0x3000,
91 	.dma_mask = DMA_BIT_MASK(32),
92 	.has_wide_gather = false,
93 	.has_hypervisor = false,
94 	.num_sid_entries = 0,
95 	.sid_table = NULL,
96 	.reserve_vblank_syncpts = true,
97 };
98 
99 static const struct host1x_info host1x02_info = {
100 	.nb_channels = 9,
101 	.nb_pts = 32,
102 	.nb_mlocks = 16,
103 	.nb_bases = 12,
104 	.init = host1x02_init,
105 	.sync_offset = 0x3000,
106 	.dma_mask = DMA_BIT_MASK(32),
107 	.has_wide_gather = false,
108 	.has_hypervisor = false,
109 	.num_sid_entries = 0,
110 	.sid_table = NULL,
111 	.reserve_vblank_syncpts = true,
112 };
113 
114 static const struct host1x_info host1x04_info = {
115 	.nb_channels = 12,
116 	.nb_pts = 192,
117 	.nb_mlocks = 16,
118 	.nb_bases = 64,
119 	.init = host1x04_init,
120 	.sync_offset = 0x2100,
121 	.dma_mask = DMA_BIT_MASK(34),
122 	.has_wide_gather = false,
123 	.has_hypervisor = false,
124 	.num_sid_entries = 0,
125 	.sid_table = NULL,
126 	.reserve_vblank_syncpts = false,
127 };
128 
129 static const struct host1x_info host1x05_info = {
130 	.nb_channels = 14,
131 	.nb_pts = 192,
132 	.nb_mlocks = 16,
133 	.nb_bases = 64,
134 	.init = host1x05_init,
135 	.sync_offset = 0x2100,
136 	.dma_mask = DMA_BIT_MASK(34),
137 	.has_wide_gather = false,
138 	.has_hypervisor = false,
139 	.num_sid_entries = 0,
140 	.sid_table = NULL,
141 	.reserve_vblank_syncpts = false,
142 };
143 
144 static const struct host1x_sid_entry tegra186_sid_table[] = {
145 	{
146 		/* VIC */
147 		.base = 0x1af0,
148 		.offset = 0x30,
149 		.limit = 0x34
150 	},
151 	{
152 		/* NVDEC */
153 		.base = 0x1b00,
154 		.offset = 0x30,
155 		.limit = 0x34
156 	},
157 };
158 
159 static const struct host1x_info host1x06_info = {
160 	.nb_channels = 63,
161 	.nb_pts = 576,
162 	.nb_mlocks = 24,
163 	.nb_bases = 16,
164 	.init = host1x06_init,
165 	.sync_offset = 0x0,
166 	.dma_mask = DMA_BIT_MASK(40),
167 	.has_wide_gather = true,
168 	.has_hypervisor = true,
169 	.num_sid_entries = ARRAY_SIZE(tegra186_sid_table),
170 	.sid_table = tegra186_sid_table,
171 	.reserve_vblank_syncpts = false,
172 	.skip_reset_assert = true,
173 };
174 
175 static const struct host1x_sid_entry tegra194_sid_table[] = {
176 	{
177 		/* VIC */
178 		.base = 0x1af0,
179 		.offset = 0x30,
180 		.limit = 0x34
181 	},
182 	{
183 		/* NVDEC */
184 		.base = 0x1b00,
185 		.offset = 0x30,
186 		.limit = 0x34
187 	},
188 	{
189 		/* NVDEC1 */
190 		.base = 0x1bc0,
191 		.offset = 0x30,
192 		.limit = 0x34
193 	},
194 };
195 
196 static const struct host1x_info host1x07_info = {
197 	.nb_channels = 63,
198 	.nb_pts = 704,
199 	.nb_mlocks = 32,
200 	.nb_bases = 0,
201 	.init = host1x07_init,
202 	.sync_offset = 0x0,
203 	.dma_mask = DMA_BIT_MASK(40),
204 	.has_wide_gather = true,
205 	.has_hypervisor = true,
206 	.num_sid_entries = ARRAY_SIZE(tegra194_sid_table),
207 	.sid_table = tegra194_sid_table,
208 	.reserve_vblank_syncpts = false,
209 };
210 
211 /*
212  * Tegra234 has two stream ID protection tables, one for setting stream IDs
213  * through the channel path via SETSTREAMID, and one for setting them via
214  * MMIO. We program each engine's data stream ID in the channel path table
215  * and firmware stream ID in the MMIO path table.
216  */
217 static const struct host1x_sid_entry tegra234_sid_table[] = {
218 	{
219 		/* SE2 MMIO */
220 		.base = 0x1658,
221 		.offset = 0x90,
222 		.limit = 0x90
223 	},
224 	{
225 		/* SE4 MMIO */
226 		.base = 0x1660,
227 		.offset = 0x90,
228 		.limit = 0x90
229 	},
230 	{
231 		/* SE2 channel */
232 		.base = 0x1738,
233 		.offset = 0x90,
234 		.limit = 0x90
235 	},
236 	{
237 		/* SE4 channel */
238 		.base = 0x1740,
239 		.offset = 0x90,
240 		.limit = 0x90
241 	},
242 	{
243 		/* VIC channel */
244 		.base = 0x17b8,
245 		.offset = 0x30,
246 		.limit = 0x30
247 	},
248 	{
249 		/* VIC MMIO */
250 		.base = 0x1688,
251 		.offset = 0x34,
252 		.limit = 0x34
253 	},
254 	{
255 		/* NVDEC channel */
256 		.base = 0x17c8,
257 		.offset = 0x30,
258 		.limit = 0x30,
259 	},
260 	{
261 		/* NVDEC MMIO */
262 		.base = 0x1698,
263 		.offset = 0x34,
264 		.limit = 0x34,
265 	},
266 };
267 
268 static const struct host1x_info host1x08_info = {
269 	.nb_channels = 63,
270 	.nb_pts = 1024,
271 	.nb_mlocks = 24,
272 	.nb_bases = 0,
273 	.init = host1x08_init,
274 	.sync_offset = 0x0,
275 	.dma_mask = DMA_BIT_MASK(40),
276 	.has_wide_gather = true,
277 	.has_hypervisor = true,
278 	.has_common = true,
279 	.num_sid_entries = ARRAY_SIZE(tegra234_sid_table),
280 	.sid_table = tegra234_sid_table,
281 	.streamid_vm_table = { 0x1004, 128 },
282 	.classid_vm_table = { 0x1404, 25 },
283 	.mmio_vm_table = { 0x1504, 25 },
284 	.reserve_vblank_syncpts = false,
285 };
286 
287 static const struct of_device_id host1x_of_match[] = {
288 	{ .compatible = "nvidia,tegra234-host1x", .data = &host1x08_info, },
289 	{ .compatible = "nvidia,tegra194-host1x", .data = &host1x07_info, },
290 	{ .compatible = "nvidia,tegra186-host1x", .data = &host1x06_info, },
291 	{ .compatible = "nvidia,tegra210-host1x", .data = &host1x05_info, },
292 	{ .compatible = "nvidia,tegra124-host1x", .data = &host1x04_info, },
293 	{ .compatible = "nvidia,tegra114-host1x", .data = &host1x02_info, },
294 	{ .compatible = "nvidia,tegra30-host1x", .data = &host1x01_info, },
295 	{ .compatible = "nvidia,tegra20-host1x", .data = &host1x01_info, },
296 	{ },
297 };
298 MODULE_DEVICE_TABLE(of, host1x_of_match);
299 
host1x_setup_virtualization_tables(struct host1x * host)300 static void host1x_setup_virtualization_tables(struct host1x *host)
301 {
302 	const struct host1x_info *info = host->info;
303 	unsigned int i;
304 
305 	if (!info->has_hypervisor)
306 		return;
307 
308 	for (i = 0; i < info->num_sid_entries; i++) {
309 		const struct host1x_sid_entry *entry = &info->sid_table[i];
310 
311 		host1x_hypervisor_writel(host, entry->offset, entry->base);
312 		host1x_hypervisor_writel(host, entry->limit, entry->base + 4);
313 	}
314 
315 	for (i = 0; i < info->streamid_vm_table.count; i++) {
316 		/* Allow access to all stream IDs to all VMs. */
317 		host1x_hypervisor_writel(host, 0xff, info->streamid_vm_table.base + 4 * i);
318 	}
319 
320 	for (i = 0; i < info->classid_vm_table.count; i++) {
321 		/* Allow access to all classes to all VMs. */
322 		host1x_hypervisor_writel(host, 0xff, info->classid_vm_table.base + 4 * i);
323 	}
324 
325 	for (i = 0; i < info->mmio_vm_table.count; i++) {
326 		/* Use VM1 (that's us) as originator VMID for engine MMIO accesses. */
327 		host1x_hypervisor_writel(host, 0x1, info->mmio_vm_table.base + 4 * i);
328 	}
329 }
330 
host1x_wants_iommu(struct host1x * host1x)331 static bool host1x_wants_iommu(struct host1x *host1x)
332 {
333 	/* Our IOMMU usage policy doesn't currently play well with GART */
334 	if (of_machine_is_compatible("nvidia,tegra20"))
335 		return false;
336 
337 	/*
338 	 * If we support addressing a maximum of 32 bits of physical memory
339 	 * and if the host1x firewall is enabled, there's no need to enable
340 	 * IOMMU support. This can happen for example on Tegra20, Tegra30
341 	 * and Tegra114.
342 	 *
343 	 * Tegra124 and later can address up to 34 bits of physical memory and
344 	 * many platforms come equipped with more than 2 GiB of system memory,
345 	 * which requires crossing the 4 GiB boundary. But there's a catch: on
346 	 * SoCs before Tegra186 (i.e. Tegra124 and Tegra210), the host1x can
347 	 * only address up to 32 bits of memory in GATHER opcodes, which means
348 	 * that command buffers need to either be in the first 2 GiB of system
349 	 * memory (which could quickly lead to memory exhaustion), or command
350 	 * buffers need to be treated differently from other buffers (which is
351 	 * not possible with the current ABI).
352 	 *
353 	 * A third option is to use the IOMMU in these cases to make sure all
354 	 * buffers will be mapped into a 32-bit IOVA space that host1x can
355 	 * address. This allows all of the system memory to be used and works
356 	 * within the limitations of the host1x on these SoCs.
357 	 *
358 	 * In summary, default to enable IOMMU on Tegra124 and later. For any
359 	 * of the earlier SoCs, only use the IOMMU for additional safety when
360 	 * the host1x firewall is disabled.
361 	 */
362 	if (host1x->info->dma_mask <= DMA_BIT_MASK(32)) {
363 		if (IS_ENABLED(CONFIG_TEGRA_HOST1X_FIREWALL))
364 			return false;
365 	}
366 
367 	return true;
368 }
369 
host1x_iommu_attach(struct host1x * host)370 static struct iommu_domain *host1x_iommu_attach(struct host1x *host)
371 {
372 	struct iommu_domain *domain = iommu_get_domain_for_dev(host->dev);
373 	int err;
374 
375 #if IS_ENABLED(CONFIG_ARM_DMA_USE_IOMMU)
376 	if (host->dev->archdata.mapping) {
377 		struct dma_iommu_mapping *mapping =
378 				to_dma_iommu_mapping(host->dev);
379 		arm_iommu_detach_device(host->dev);
380 		arm_iommu_release_mapping(mapping);
381 
382 		domain = iommu_get_domain_for_dev(host->dev);
383 	}
384 #endif
385 
386 	/*
387 	 * We may not always want to enable IOMMU support (for example if the
388 	 * host1x firewall is already enabled and we don't support addressing
389 	 * more than 32 bits of physical memory), so check for that first.
390 	 *
391 	 * Similarly, if host1x is already attached to an IOMMU (via the DMA
392 	 * API), don't try to attach again.
393 	 */
394 	if (!host1x_wants_iommu(host) || domain)
395 		return domain;
396 
397 	host->group = iommu_group_get(host->dev);
398 	if (host->group) {
399 		struct iommu_domain_geometry *geometry;
400 		dma_addr_t start, end;
401 		unsigned long order;
402 
403 		err = iova_cache_get();
404 		if (err < 0)
405 			goto put_group;
406 
407 		host->domain = iommu_paging_domain_alloc(host->dev);
408 		if (IS_ERR(host->domain)) {
409 			err = PTR_ERR(host->domain);
410 			host->domain = NULL;
411 			goto put_cache;
412 		}
413 
414 		err = iommu_attach_group(host->domain, host->group);
415 		if (err) {
416 			if (err == -ENODEV)
417 				err = 0;
418 
419 			goto free_domain;
420 		}
421 
422 		geometry = &host->domain->geometry;
423 		start = geometry->aperture_start & host->info->dma_mask;
424 		end = geometry->aperture_end & host->info->dma_mask;
425 
426 		order = __ffs(host->domain->pgsize_bitmap);
427 		init_iova_domain(&host->iova, 1UL << order, start >> order);
428 		host->iova_end = end;
429 
430 		domain = host->domain;
431 	}
432 
433 	return domain;
434 
435 free_domain:
436 	iommu_domain_free(host->domain);
437 	host->domain = NULL;
438 put_cache:
439 	iova_cache_put();
440 put_group:
441 	iommu_group_put(host->group);
442 	host->group = NULL;
443 
444 	return ERR_PTR(err);
445 }
446 
host1x_iommu_init(struct host1x * host)447 static int host1x_iommu_init(struct host1x *host)
448 {
449 	u64 mask = host->info->dma_mask;
450 	struct iommu_domain *domain;
451 	int err;
452 
453 	domain = host1x_iommu_attach(host);
454 	if (IS_ERR(domain)) {
455 		err = PTR_ERR(domain);
456 		dev_err(host->dev, "failed to attach to IOMMU: %d\n", err);
457 		return err;
458 	}
459 
460 	/*
461 	 * If we're not behind an IOMMU make sure we don't get push buffers
462 	 * that are allocated outside of the range addressable by the GATHER
463 	 * opcode.
464 	 *
465 	 * Newer generations of Tegra (Tegra186 and later) support a wide
466 	 * variant of the GATHER opcode that allows addressing more bits.
467 	 */
468 	if (!domain && !host->info->has_wide_gather)
469 		mask = DMA_BIT_MASK(32);
470 
471 	err = dma_coerce_mask_and_coherent(host->dev, mask);
472 	if (err < 0) {
473 		dev_err(host->dev, "failed to set DMA mask: %d\n", err);
474 		return err;
475 	}
476 
477 	return 0;
478 }
479 
host1x_iommu_exit(struct host1x * host)480 static void host1x_iommu_exit(struct host1x *host)
481 {
482 	if (host->domain) {
483 		put_iova_domain(&host->iova);
484 		iommu_detach_group(host->domain, host->group);
485 
486 		iommu_domain_free(host->domain);
487 		host->domain = NULL;
488 
489 		iova_cache_put();
490 
491 		iommu_group_put(host->group);
492 		host->group = NULL;
493 	}
494 }
495 
host1x_get_resets(struct host1x * host)496 static int host1x_get_resets(struct host1x *host)
497 {
498 	int err;
499 
500 	host->resets[0].id = "mc";
501 	host->resets[1].id = "host1x";
502 	host->nresets = ARRAY_SIZE(host->resets);
503 
504 	err = devm_reset_control_bulk_get_optional_exclusive_released(
505 				host->dev, host->nresets, host->resets);
506 	if (err) {
507 		dev_err(host->dev, "failed to get reset: %d\n", err);
508 		return err;
509 	}
510 
511 	return 0;
512 }
513 
host1x_probe(struct platform_device * pdev)514 static int host1x_probe(struct platform_device *pdev)
515 {
516 	struct host1x *host;
517 	int err, i;
518 
519 	host = devm_kzalloc(&pdev->dev, sizeof(*host), GFP_KERNEL);
520 	if (!host)
521 		return -ENOMEM;
522 
523 	host->info = of_device_get_match_data(&pdev->dev);
524 
525 	if (host->info->has_hypervisor) {
526 		host->regs = devm_platform_ioremap_resource_byname(pdev, "vm");
527 		if (IS_ERR(host->regs))
528 			return PTR_ERR(host->regs);
529 
530 		host->hv_regs = devm_platform_ioremap_resource_byname(pdev, "hypervisor");
531 		if (IS_ERR(host->hv_regs))
532 			return PTR_ERR(host->hv_regs);
533 
534 		if (host->info->has_common) {
535 			host->common_regs = devm_platform_ioremap_resource_byname(pdev, "common");
536 			if (IS_ERR(host->common_regs))
537 				return PTR_ERR(host->common_regs);
538 		}
539 	} else {
540 		host->regs = devm_platform_ioremap_resource(pdev, 0);
541 		if (IS_ERR(host->regs))
542 			return PTR_ERR(host->regs);
543 	}
544 
545 	for (i = 0; i < ARRAY_SIZE(host->syncpt_irqs); i++) {
546 		char irq_name[] = "syncptX";
547 
548 		sprintf(irq_name, "syncpt%d", i);
549 
550 		err = platform_get_irq_byname_optional(pdev, irq_name);
551 		if (err == -ENXIO)
552 			break;
553 		if (err < 0)
554 			return err;
555 
556 		host->syncpt_irqs[i] = err;
557 	}
558 
559 	host->num_syncpt_irqs = i;
560 
561 	/* Device tree without irq names */
562 	if (i == 0) {
563 		host->syncpt_irqs[0] = platform_get_irq(pdev, 0);
564 		if (host->syncpt_irqs[0] < 0)
565 			return host->syncpt_irqs[0];
566 
567 		host->num_syncpt_irqs = 1;
568 	}
569 
570 	mutex_init(&host->devices_lock);
571 	INIT_LIST_HEAD(&host->devices);
572 	INIT_LIST_HEAD(&host->list);
573 	host->dev = &pdev->dev;
574 
575 	/* set common host1x device data */
576 	platform_set_drvdata(pdev, host);
577 
578 	host->dev->dma_parms = &host->dma_parms;
579 	dma_set_max_seg_size(host->dev, UINT_MAX);
580 
581 	if (host->info->init) {
582 		err = host->info->init(host);
583 		if (err)
584 			return err;
585 	}
586 
587 	host->clk = devm_clk_get(&pdev->dev, NULL);
588 	if (IS_ERR(host->clk)) {
589 		err = PTR_ERR(host->clk);
590 
591 		if (err != -EPROBE_DEFER)
592 			dev_err(&pdev->dev, "failed to get clock: %d\n", err);
593 
594 		return err;
595 	}
596 
597 	err = host1x_get_resets(host);
598 	if (err)
599 		return err;
600 
601 	host1x_bo_cache_init(&host->cache);
602 
603 	err = host1x_iommu_init(host);
604 	if (err < 0) {
605 		dev_err(&pdev->dev, "failed to setup IOMMU: %d\n", err);
606 		goto destroy_cache;
607 	}
608 
609 	err = host1x_channel_list_init(&host->channel_list,
610 				       host->info->nb_channels);
611 	if (err) {
612 		dev_err(&pdev->dev, "failed to initialize channel list\n");
613 		goto iommu_exit;
614 	}
615 
616 	err = host1x_memory_context_list_init(host);
617 	if (err) {
618 		dev_err(&pdev->dev, "failed to initialize context list\n");
619 		goto free_channels;
620 	}
621 
622 	err = host1x_syncpt_init(host);
623 	if (err) {
624 		dev_err(&pdev->dev, "failed to initialize syncpts\n");
625 		goto free_contexts;
626 	}
627 
628 	pm_runtime_enable(&pdev->dev);
629 
630 	err = devm_tegra_core_dev_init_opp_table_common(&pdev->dev);
631 	if (err)
632 		goto pm_disable;
633 
634 	/* the driver's code isn't ready yet for the dynamic RPM */
635 	err = pm_runtime_resume_and_get(&pdev->dev);
636 	if (err)
637 		goto pm_disable;
638 
639 	err = host1x_intr_init(host);
640 	if (err) {
641 		dev_err(&pdev->dev, "failed to initialize interrupts\n");
642 		goto pm_put;
643 	}
644 
645 	host1x_debug_init(host);
646 
647 	err = host1x_register(host);
648 	if (err < 0)
649 		goto deinit_debugfs;
650 
651 	err = devm_of_platform_populate(&pdev->dev);
652 	if (err < 0)
653 		goto unregister;
654 
655 	return 0;
656 
657 unregister:
658 	host1x_unregister(host);
659 deinit_debugfs:
660 	host1x_debug_deinit(host);
661 	host1x_intr_deinit(host);
662 pm_put:
663 	pm_runtime_put_sync_suspend(&pdev->dev);
664 pm_disable:
665 	pm_runtime_disable(&pdev->dev);
666 	host1x_syncpt_deinit(host);
667 free_contexts:
668 	host1x_memory_context_list_free(&host->context_list);
669 free_channels:
670 	host1x_channel_list_free(&host->channel_list);
671 iommu_exit:
672 	host1x_iommu_exit(host);
673 destroy_cache:
674 	host1x_bo_cache_destroy(&host->cache);
675 
676 	return err;
677 }
678 
host1x_remove(struct platform_device * pdev)679 static void host1x_remove(struct platform_device *pdev)
680 {
681 	struct host1x *host = platform_get_drvdata(pdev);
682 
683 	host1x_unregister(host);
684 	host1x_debug_deinit(host);
685 
686 	pm_runtime_force_suspend(&pdev->dev);
687 
688 	host1x_intr_deinit(host);
689 	host1x_syncpt_deinit(host);
690 	host1x_memory_context_list_free(&host->context_list);
691 	host1x_channel_list_free(&host->channel_list);
692 	host1x_iommu_exit(host);
693 	host1x_bo_cache_destroy(&host->cache);
694 }
695 
host1x_runtime_suspend(struct device * dev)696 static int __maybe_unused host1x_runtime_suspend(struct device *dev)
697 {
698 	struct host1x *host = dev_get_drvdata(dev);
699 	int err;
700 
701 	host1x_channel_stop_all(host);
702 	host1x_intr_stop(host);
703 	host1x_syncpt_save(host);
704 
705 	if (!host->info->skip_reset_assert) {
706 		err = reset_control_bulk_assert(host->nresets, host->resets);
707 		if (err) {
708 			dev_err(dev, "failed to assert reset: %d\n", err);
709 			goto resume_host1x;
710 		}
711 
712 		usleep_range(1000, 2000);
713 	}
714 
715 	clk_disable_unprepare(host->clk);
716 	reset_control_bulk_release(host->nresets, host->resets);
717 
718 	return 0;
719 
720 resume_host1x:
721 	host1x_setup_virtualization_tables(host);
722 	host1x_syncpt_restore(host);
723 	host1x_intr_start(host);
724 
725 	return err;
726 }
727 
host1x_runtime_resume(struct device * dev)728 static int __maybe_unused host1x_runtime_resume(struct device *dev)
729 {
730 	struct host1x *host = dev_get_drvdata(dev);
731 	int err;
732 
733 	err = reset_control_bulk_acquire(host->nresets, host->resets);
734 	if (err) {
735 		dev_err(dev, "failed to acquire reset: %d\n", err);
736 		return err;
737 	}
738 
739 	err = clk_prepare_enable(host->clk);
740 	if (err) {
741 		dev_err(dev, "failed to enable clock: %d\n", err);
742 		goto release_reset;
743 	}
744 
745 	err = reset_control_bulk_deassert(host->nresets, host->resets);
746 	if (err < 0) {
747 		dev_err(dev, "failed to deassert reset: %d\n", err);
748 		goto disable_clk;
749 	}
750 
751 	host1x_setup_virtualization_tables(host);
752 	host1x_syncpt_restore(host);
753 	host1x_intr_start(host);
754 
755 	return 0;
756 
757 disable_clk:
758 	clk_disable_unprepare(host->clk);
759 release_reset:
760 	reset_control_bulk_release(host->nresets, host->resets);
761 
762 	return err;
763 }
764 
765 static const struct dev_pm_ops host1x_pm_ops = {
766 	SET_RUNTIME_PM_OPS(host1x_runtime_suspend, host1x_runtime_resume,
767 			   NULL)
768 	SET_SYSTEM_SLEEP_PM_OPS(pm_runtime_force_suspend, pm_runtime_force_resume)
769 };
770 
771 static struct platform_driver tegra_host1x_driver = {
772 	.driver = {
773 		.name = "tegra-host1x",
774 		.of_match_table = host1x_of_match,
775 		.pm = &host1x_pm_ops,
776 	},
777 	.probe = host1x_probe,
778 	.remove_new = host1x_remove,
779 };
780 
781 static struct platform_driver * const drivers[] = {
782 	&tegra_host1x_driver,
783 	&tegra_mipi_driver,
784 };
785 
tegra_host1x_init(void)786 static int __init tegra_host1x_init(void)
787 {
788 	int err;
789 
790 	err = bus_register(&host1x_bus_type);
791 	if (err < 0)
792 		return err;
793 
794 	err = platform_register_drivers(drivers, ARRAY_SIZE(drivers));
795 	if (err < 0)
796 		bus_unregister(&host1x_bus_type);
797 
798 	return err;
799 }
800 module_init(tegra_host1x_init);
801 
tegra_host1x_exit(void)802 static void __exit tegra_host1x_exit(void)
803 {
804 	platform_unregister_drivers(drivers, ARRAY_SIZE(drivers));
805 	bus_unregister(&host1x_bus_type);
806 }
807 module_exit(tegra_host1x_exit);
808 
809 /**
810  * host1x_get_dma_mask() - query the supported DMA mask for host1x
811  * @host1x: host1x instance
812  *
813  * Note that this returns the supported DMA mask for host1x, which can be
814  * different from the applicable DMA mask under certain circumstances.
815  */
host1x_get_dma_mask(struct host1x * host1x)816 u64 host1x_get_dma_mask(struct host1x *host1x)
817 {
818 	return host1x->info->dma_mask;
819 }
820 EXPORT_SYMBOL(host1x_get_dma_mask);
821 
822 MODULE_AUTHOR("Thierry Reding <thierry.reding@avionic-design.de>");
823 MODULE_AUTHOR("Terje Bergstrom <tbergstrom@nvidia.com>");
824 MODULE_DESCRIPTION("Host1x driver for Tegra products");
825 MODULE_LICENSE("GPL");
826