1  /* SPDX-License-Identifier: GPL-2.0
2   *
3   * Copyright 2016-2022 HabanaLabs, Ltd.
4   * All Rights Reserved.
5   *
6   */
7  
8  #ifndef GOYAP_H_
9  #define GOYAP_H_
10  
11  #include <uapi/drm/habanalabs_accel.h>
12  #include <linux/habanalabs/hl_boot_if.h>
13  #include "../common/habanalabs.h"
14  #include "../include/goya/goya_packets.h"
15  #include "../include/goya/goya.h"
16  #include "../include/goya/goya_async_events.h"
17  #include "../include/goya/goya_fw_if.h"
18  
19  #define NUMBER_OF_CMPLT_QUEUES		5
20  #define NUMBER_OF_EXT_HW_QUEUES		5
21  #define NUMBER_OF_CPU_HW_QUEUES		1
22  #define NUMBER_OF_INT_HW_QUEUES		9
23  #define NUMBER_OF_HW_QUEUES		(NUMBER_OF_EXT_HW_QUEUES + \
24  					NUMBER_OF_CPU_HW_QUEUES + \
25  					NUMBER_OF_INT_HW_QUEUES)
26  
27  /*
28   * Number of MSIX interrupts IDS:
29   * Each completion queue has 1 ID
30   * The event queue has 1 ID
31   */
32  #define NUMBER_OF_INTERRUPTS		(NUMBER_OF_CMPLT_QUEUES + 1)
33  
34  #if (NUMBER_OF_INTERRUPTS > GOYA_MSIX_ENTRIES)
35  #error "Number of MSIX interrupts must be smaller or equal to GOYA_MSIX_ENTRIES"
36  #endif
37  
38  #define QMAN_FENCE_TIMEOUT_USEC		10000		/* 10 ms */
39  
40  #define QMAN_STOP_TIMEOUT_USEC		100000		/* 100 ms */
41  
42  #define CORESIGHT_TIMEOUT_USEC		100000		/* 100 ms */
43  
44  #define GOYA_CPU_TIMEOUT_USEC		15000000	/* 15s */
45  
46  #define TPC_ENABLED_MASK		0xFF
47  
48  #define PLL_HIGH_DEFAULT		1575000000	/* 1.575 GHz */
49  
50  #define MAX_POWER_DEFAULT		200000		/* 200W */
51  
52  #define DC_POWER_DEFAULT		20000		/* 20W */
53  
54  #define DRAM_PHYS_DEFAULT_SIZE		0x100000000ull	/* 4GB */
55  
56  #define GOYA_DEFAULT_CARD_NAME		"HL1000"
57  
58  #define GOYA_MAX_PENDING_CS		64
59  
60  #if !IS_MAX_PENDING_CS_VALID(GOYA_MAX_PENDING_CS)
61  #error "GOYA_MAX_PENDING_CS must be power of 2 and greater than 1"
62  #endif
63  
64  /* DRAM Memory Map */
65  
66  #define CPU_FW_IMAGE_SIZE		0x10000000	/* 256MB */
67  #define MMU_PAGE_TABLES_SIZE		0x0FC00000	/* 252MB */
68  #define MMU_DRAM_DEFAULT_PAGE_SIZE	0x00200000	/* 2MB */
69  #define MMU_CACHE_MNG_SIZE		0x00001000	/* 4KB */
70  
71  #define CPU_FW_IMAGE_ADDR		DRAM_PHYS_BASE
72  #define MMU_PAGE_TABLES_ADDR		(CPU_FW_IMAGE_ADDR + CPU_FW_IMAGE_SIZE)
73  #define MMU_DRAM_DEFAULT_PAGE_ADDR	(MMU_PAGE_TABLES_ADDR + \
74  						MMU_PAGE_TABLES_SIZE)
75  #define MMU_CACHE_MNG_ADDR		(MMU_DRAM_DEFAULT_PAGE_ADDR + \
76  					MMU_DRAM_DEFAULT_PAGE_SIZE)
77  #define DRAM_DRIVER_END_ADDR		(MMU_CACHE_MNG_ADDR + \
78  						MMU_CACHE_MNG_SIZE)
79  
80  #define DRAM_BASE_ADDR_USER		0x20000000
81  
82  #if (DRAM_DRIVER_END_ADDR > DRAM_BASE_ADDR_USER)
83  #error "Driver must reserve no more than 512MB"
84  #endif
85  
86  /*
87   * SRAM Memory Map for Driver
88   *
89   * Driver occupies DRIVER_SRAM_SIZE bytes from the start of SRAM. It is used for
90   * MME/TPC QMANs
91   *
92   */
93  
94  #define MME_QMAN_BASE_OFFSET	0x000000	/* Must be 0 */
95  #define MME_QMAN_LENGTH		64
96  #define TPC_QMAN_LENGTH		64
97  
98  #define TPC0_QMAN_BASE_OFFSET	(MME_QMAN_BASE_OFFSET + \
99  				(MME_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
100  #define TPC1_QMAN_BASE_OFFSET	(TPC0_QMAN_BASE_OFFSET + \
101  				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
102  #define TPC2_QMAN_BASE_OFFSET	(TPC1_QMAN_BASE_OFFSET + \
103  				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
104  #define TPC3_QMAN_BASE_OFFSET	(TPC2_QMAN_BASE_OFFSET + \
105  				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
106  #define TPC4_QMAN_BASE_OFFSET	(TPC3_QMAN_BASE_OFFSET + \
107  				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
108  #define TPC5_QMAN_BASE_OFFSET	(TPC4_QMAN_BASE_OFFSET + \
109  				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
110  #define TPC6_QMAN_BASE_OFFSET	(TPC5_QMAN_BASE_OFFSET + \
111  				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
112  #define TPC7_QMAN_BASE_OFFSET	(TPC6_QMAN_BASE_OFFSET + \
113  				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
114  
115  #define SRAM_DRIVER_RES_OFFSET	(TPC7_QMAN_BASE_OFFSET + \
116  				(TPC_QMAN_LENGTH * QMAN_PQ_ENTRY_SIZE))
117  
118  #if (SRAM_DRIVER_RES_OFFSET >= GOYA_KMD_SRAM_RESERVED_SIZE_FROM_START)
119  #error "MME/TPC QMANs SRAM space exceeds limit"
120  #endif
121  
122  #define SRAM_USER_BASE_OFFSET	GOYA_KMD_SRAM_RESERVED_SIZE_FROM_START
123  
124  /* Virtual address space */
125  #define VA_HOST_SPACE_START	0x1000000000000ull	/* 256TB */
126  #define VA_HOST_SPACE_END	0x3FF8000000000ull	/* 1PB - 1TB */
127  #define VA_HOST_SPACE_SIZE	(VA_HOST_SPACE_END - \
128  					VA_HOST_SPACE_START) /* 767TB */
129  
130  #define VA_DDR_SPACE_START	0x800000000ull		/* 32GB */
131  #define VA_DDR_SPACE_END	0x2000000000ull		/* 128GB */
132  #define VA_DDR_SPACE_SIZE	(VA_DDR_SPACE_END - \
133  					VA_DDR_SPACE_START)	/* 128GB */
134  
135  #if (HL_CPU_ACCESSIBLE_MEM_SIZE != SZ_2M)
136  #error "HL_CPU_ACCESSIBLE_MEM_SIZE must be exactly 2MB to enable MMU mapping"
137  #endif
138  
139  #define VA_CPU_ACCESSIBLE_MEM_ADDR	0x8000000000ull
140  
141  #define DMA_MAX_TRANSFER_SIZE	U32_MAX
142  
143  #define HW_CAP_PLL		0x00000001
144  #define HW_CAP_DDR_0		0x00000002
145  #define HW_CAP_DDR_1		0x00000004
146  #define HW_CAP_MME		0x00000008
147  #define HW_CAP_CPU		0x00000010
148  #define HW_CAP_DMA		0x00000020
149  #define HW_CAP_MSIX		0x00000040
150  #define HW_CAP_CPU_Q		0x00000080
151  #define HW_CAP_MMU		0x00000100
152  #define HW_CAP_TPC_MBIST	0x00000200
153  #define HW_CAP_GOLDEN		0x00000400
154  #define HW_CAP_TPC		0x00000800
155  
156  struct goya_work_freq {
157  	struct hl_device *hdev;
158  	struct delayed_work work_freq;
159  };
160  
161  struct goya_device {
162  	/* TODO: remove hw_queues_lock after moving to scheduler code */
163  	spinlock_t	hw_queues_lock;
164  	struct goya_work_freq	*goya_work;
165  
166  	u64		mme_clk;
167  	u64		tpc_clk;
168  	u64		ic_clk;
169  
170  	u64		ddr_bar_cur_addr;
171  	u32		events_stat[GOYA_ASYNC_EVENT_ID_SIZE];
172  	u32		events_stat_aggregate[GOYA_ASYNC_EVENT_ID_SIZE];
173  	u32		hw_cap_initialized;
174  	u8		device_cpu_mmu_mappings_done;
175  
176  	enum hl_pll_frequency		curr_pll_profile;
177  	enum hl_pm_mng_profile		pm_mng_profile;
178  };
179  
180  int goya_set_fixed_properties(struct hl_device *hdev);
181  int goya_mmu_init(struct hl_device *hdev);
182  void goya_init_dma_qmans(struct hl_device *hdev);
183  void goya_init_mme_qmans(struct hl_device *hdev);
184  void goya_init_tpc_qmans(struct hl_device *hdev);
185  int goya_init_cpu_queues(struct hl_device *hdev);
186  void goya_init_security(struct hl_device *hdev);
187  void goya_ack_protection_bits_errors(struct hl_device *hdev);
188  int goya_late_init(struct hl_device *hdev);
189  void goya_late_fini(struct hl_device *hdev);
190  
191  void goya_ring_doorbell(struct hl_device *hdev, u32 hw_queue_id, u32 pi);
192  void goya_pqe_write(struct hl_device *hdev, __le64 *pqe, struct hl_bd *bd);
193  void goya_update_eq_ci(struct hl_device *hdev, u32 val);
194  void goya_restore_phase_topology(struct hl_device *hdev);
195  int goya_context_switch(struct hl_device *hdev, u32 asid);
196  
197  int goya_debugfs_i2c_read(struct hl_device *hdev, u8 i2c_bus,
198  			u8 i2c_addr, u8 i2c_reg, u32 *val);
199  int goya_debugfs_i2c_write(struct hl_device *hdev, u8 i2c_bus,
200  			u8 i2c_addr, u8 i2c_reg, u32 val);
201  void goya_debugfs_led_set(struct hl_device *hdev, u8 led, u8 state);
202  
203  int goya_test_queue(struct hl_device *hdev, u32 hw_queue_id);
204  int goya_test_queues(struct hl_device *hdev);
205  int goya_test_cpu_queue(struct hl_device *hdev);
206  int goya_send_cpu_message(struct hl_device *hdev, u32 *msg, u16 len,
207  				u32 timeout, u64 *result);
208  
209  long goya_get_temperature(struct hl_device *hdev, int sensor_index, u32 attr);
210  long goya_get_voltage(struct hl_device *hdev, int sensor_index, u32 attr);
211  long goya_get_current(struct hl_device *hdev, int sensor_index, u32 attr);
212  long goya_get_fan_speed(struct hl_device *hdev, int sensor_index, u32 attr);
213  long goya_get_pwm_info(struct hl_device *hdev, int sensor_index, u32 attr);
214  void goya_set_pwm_info(struct hl_device *hdev, int sensor_index, u32 attr,
215  			long value);
216  u64 goya_get_max_power(struct hl_device *hdev);
217  void goya_set_max_power(struct hl_device *hdev, u64 value);
218  
219  void goya_set_pll_profile(struct hl_device *hdev, enum hl_pll_frequency freq);
220  void goya_add_device_attr(struct hl_device *hdev, struct attribute_group *dev_clk_attr_grp,
221  				struct attribute_group *dev_vrm_attr_grp);
222  int goya_cpucp_info_get(struct hl_device *hdev);
223  int goya_debug_coresight(struct hl_device *hdev, struct hl_ctx *ctx, void *data);
224  void goya_halt_coresight(struct hl_device *hdev, struct hl_ctx *ctx);
225  
226  int goya_suspend(struct hl_device *hdev);
227  int goya_resume(struct hl_device *hdev);
228  
229  void goya_handle_eqe(struct hl_device *hdev, struct hl_eq_entry *eq_entry);
230  void *goya_get_events_stat(struct hl_device *hdev, bool aggregate, u32 *size);
231  
232  void goya_add_end_of_cb_packets(struct hl_device *hdev, void *kernel_address,
233  				u32 len, u32 original_len, u64 cq_addr, u32 cq_val,
234  				u32 msix_vec, bool eb);
235  int goya_cs_parser(struct hl_device *hdev, struct hl_cs_parser *parser);
236  int goya_scrub_device_mem(struct hl_device *hdev);
237  void *goya_get_int_queue_base(struct hl_device *hdev, u32 queue_id,
238  				dma_addr_t *dma_handle,	u16 *queue_len);
239  u32 goya_get_dma_desc_list_size(struct hl_device *hdev, struct sg_table *sgt);
240  int goya_send_heartbeat(struct hl_device *hdev);
241  void *goya_cpu_accessible_dma_pool_alloc(struct hl_device *hdev, size_t size,
242  					dma_addr_t *dma_handle);
243  void goya_cpu_accessible_dma_pool_free(struct hl_device *hdev, size_t size,
244  					void *vaddr);
245  void goya_mmu_remove_device_cpu_mappings(struct hl_device *hdev);
246  
247  u32 goya_get_queue_id_for_cq(struct hl_device *hdev, u32 cq_idx);
248  u64 goya_get_device_time(struct hl_device *hdev);
249  int goya_set_frequency(struct hl_device *hdev, enum hl_pll_frequency freq);
250  
251  #endif /* GOYAP_H_ */
252