1/*	$NetBSD: amdgpu_navi10_ih.c,v 1.2 2021/12/18 23:44:58 riastradh Exp $	*/
2
3/*
4 * Copyright 2019 Advanced Micro Devices, Inc.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
19 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
20 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22 * OTHER DEALINGS IN THE SOFTWARE.
23 *
24 */
25
26#include <sys/cdefs.h>
27__KERNEL_RCSID(0, "$NetBSD: amdgpu_navi10_ih.c,v 1.2 2021/12/18 23:44:58 riastradh Exp $");
28
29#include <linux/pci.h>
30
31#include "amdgpu.h"
32#include "amdgpu_ih.h"
33
34#include "oss/osssys_5_0_0_offset.h"
35#include "oss/osssys_5_0_0_sh_mask.h"
36
37#include "soc15_common.h"
38#include "navi10_ih.h"
39
40
41static void navi10_ih_set_interrupt_funcs(struct amdgpu_device *adev);
42
43/**
44 * navi10_ih_enable_interrupts - Enable the interrupt ring buffer
45 *
46 * @adev: amdgpu_device pointer
47 *
48 * Enable the interrupt ring buffer (NAVI10).
49 */
50static void navi10_ih_enable_interrupts(struct amdgpu_device *adev)
51{
52	u32 ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL);
53
54	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RB_ENABLE, 1);
55	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, ENABLE_INTR, 1);
56	WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL, ih_rb_cntl);
57	adev->irq.ih.enabled = true;
58}
59
60/**
61 * navi10_ih_disable_interrupts - Disable the interrupt ring buffer
62 *
63 * @adev: amdgpu_device pointer
64 *
65 * Disable the interrupt ring buffer (NAVI10).
66 */
67static void navi10_ih_disable_interrupts(struct amdgpu_device *adev)
68{
69	u32 ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL);
70
71	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RB_ENABLE, 0);
72	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, ENABLE_INTR, 0);
73	WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL, ih_rb_cntl);
74	/* set rptr, wptr to 0 */
75	WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR, 0);
76	WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR, 0);
77	adev->irq.ih.enabled = false;
78	adev->irq.ih.rptr = 0;
79}
80
81static uint32_t navi10_ih_rb_cntl(struct amdgpu_ih_ring *ih, uint32_t ih_rb_cntl)
82{
83	int rb_bufsz = order_base_2(ih->ring_size / 4);
84
85	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
86				   MC_SPACE, ih->use_bus_addr ? 1 : 4);
87	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
88				   WPTR_OVERFLOW_CLEAR, 1);
89	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
90				   WPTR_OVERFLOW_ENABLE, 1);
91	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RB_SIZE, rb_bufsz);
92	/* Ring Buffer write pointer writeback. If enabled, IH_RB_WPTR register
93	 * value is written to memory
94	 */
95	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
96				   WPTR_WRITEBACK_ENABLE, 1);
97	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, MC_SNOOP, 1);
98	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, MC_RO, 0);
99	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, MC_VMID, 0);
100
101	return ih_rb_cntl;
102}
103
104/**
105 * navi10_ih_irq_init - init and enable the interrupt ring
106 *
107 * @adev: amdgpu_device pointer
108 *
109 * Allocate a ring buffer for the interrupt controller,
110 * enable the RLC, disable interrupts, enable the IH
111 * ring buffer and enable it (NAVI).
112 * Called at device load and reume.
113 * Returns 0 for success, errors for failure.
114 */
115static int navi10_ih_irq_init(struct amdgpu_device *adev)
116{
117	struct amdgpu_ih_ring *ih = &adev->irq.ih;
118	u32 ih_rb_cntl, ih_doorbell_rtpr, ih_chicken;
119	u32 tmp;
120
121	/* disable irqs */
122	navi10_ih_disable_interrupts(adev);
123
124	adev->nbio.funcs->ih_control(adev);
125
126	/* Ring Buffer base. [39:8] of 40-bit address of the beginning of the ring buffer*/
127	WREG32_SOC15(OSSSYS, 0, mmIH_RB_BASE, ih->gpu_addr >> 8);
128	WREG32_SOC15(OSSSYS, 0, mmIH_RB_BASE_HI, (ih->gpu_addr >> 40) & 0xff);
129
130	ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL);
131	ih_rb_cntl = navi10_ih_rb_cntl(ih, ih_rb_cntl);
132	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RPTR_REARM,
133				   !!adev->irq.msi_enabled);
134
135	if (unlikely(adev->firmware.load_type == AMDGPU_FW_LOAD_DIRECT)) {
136		if (ih->use_bus_addr) {
137			ih_chicken = RREG32_SOC15(OSSSYS, 0, mmIH_CHICKEN);
138			ih_chicken = REG_SET_FIELD(ih_chicken,
139					IH_CHICKEN, MC_SPACE_GPA_ENABLE, 1);
140			WREG32_SOC15(OSSSYS, 0, mmIH_CHICKEN, ih_chicken);
141		}
142	}
143
144	WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL, ih_rb_cntl);
145
146	/* set the writeback address whether it's enabled or not */
147	WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR_ADDR_LO,
148		     lower_32_bits(ih->wptr_addr));
149	WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR_ADDR_HI,
150		     upper_32_bits(ih->wptr_addr) & 0xFFFF);
151
152	/* set rptr, wptr to 0 */
153	WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR, 0);
154	WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR, 0);
155
156	ih_doorbell_rtpr = RREG32_SOC15(OSSSYS, 0, mmIH_DOORBELL_RPTR);
157	if (ih->use_doorbell) {
158		ih_doorbell_rtpr = REG_SET_FIELD(ih_doorbell_rtpr,
159						 IH_DOORBELL_RPTR, OFFSET,
160						 ih->doorbell_index);
161		ih_doorbell_rtpr = REG_SET_FIELD(ih_doorbell_rtpr,
162						 IH_DOORBELL_RPTR, ENABLE, 1);
163	} else {
164		ih_doorbell_rtpr = REG_SET_FIELD(ih_doorbell_rtpr,
165						 IH_DOORBELL_RPTR, ENABLE, 0);
166	}
167	WREG32_SOC15(OSSSYS, 0, mmIH_DOORBELL_RPTR, ih_doorbell_rtpr);
168
169	adev->nbio.funcs->ih_doorbell_range(adev, ih->use_doorbell,
170					    ih->doorbell_index);
171
172	tmp = RREG32_SOC15(OSSSYS, 0, mmIH_STORM_CLIENT_LIST_CNTL);
173	tmp = REG_SET_FIELD(tmp, IH_STORM_CLIENT_LIST_CNTL,
174			    CLIENT18_IS_STORM_CLIENT, 1);
175	WREG32_SOC15(OSSSYS, 0, mmIH_STORM_CLIENT_LIST_CNTL, tmp);
176
177	tmp = RREG32_SOC15(OSSSYS, 0, mmIH_INT_FLOOD_CNTL);
178	tmp = REG_SET_FIELD(tmp, IH_INT_FLOOD_CNTL, FLOOD_CNTL_ENABLE, 1);
179	WREG32_SOC15(OSSSYS, 0, mmIH_INT_FLOOD_CNTL, tmp);
180
181	pci_set_master(adev->pdev);
182
183	/* enable interrupts */
184	navi10_ih_enable_interrupts(adev);
185
186	return 0;
187}
188
189/**
190 * navi10_ih_irq_disable - disable interrupts
191 *
192 * @adev: amdgpu_device pointer
193 *
194 * Disable interrupts on the hw (NAVI10).
195 */
196static void navi10_ih_irq_disable(struct amdgpu_device *adev)
197{
198	navi10_ih_disable_interrupts(adev);
199
200	/* Wait and acknowledge irq */
201	mdelay(1);
202}
203
204/**
205 * navi10_ih_get_wptr - get the IH ring buffer wptr
206 *
207 * @adev: amdgpu_device pointer
208 *
209 * Get the IH ring buffer wptr from either the register
210 * or the writeback memory buffer (NAVI10).  Also check for
211 * ring buffer overflow and deal with it.
212 * Returns the value of the wptr.
213 */
214static u32 navi10_ih_get_wptr(struct amdgpu_device *adev,
215			      struct amdgpu_ih_ring *ih)
216{
217	u32 wptr, reg, tmp;
218
219	wptr = le32_to_cpu(*ih->wptr_cpu);
220
221	if (!REG_GET_FIELD(wptr, IH_RB_WPTR, RB_OVERFLOW))
222		goto out;
223
224	reg = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_WPTR);
225	wptr = RREG32_NO_KIQ(reg);
226	if (!REG_GET_FIELD(wptr, IH_RB_WPTR, RB_OVERFLOW))
227		goto out;
228	wptr = REG_SET_FIELD(wptr, IH_RB_WPTR, RB_OVERFLOW, 0);
229
230	/* When a ring buffer overflow happen start parsing interrupt
231	 * from the last not overwritten vector (wptr + 32). Hopefully
232	 * this should allow us to catch up.
233	 */
234	tmp = (wptr + 32) & ih->ptr_mask;
235	dev_warn(adev->dev, "IH ring buffer overflow "
236		 "(0x%08X, 0x%08X, 0x%08X)\n",
237		 wptr, ih->rptr, tmp);
238	ih->rptr = tmp;
239
240	reg = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_CNTL);
241	tmp = RREG32_NO_KIQ(reg);
242	tmp = REG_SET_FIELD(tmp, IH_RB_CNTL, WPTR_OVERFLOW_CLEAR, 1);
243	WREG32_NO_KIQ(reg, tmp);
244out:
245	return (wptr & ih->ptr_mask);
246}
247
248/**
249 * navi10_ih_decode_iv - decode an interrupt vector
250 *
251 * @adev: amdgpu_device pointer
252 *
253 * Decodes the interrupt vector at the current rptr
254 * position and also advance the position.
255 */
256static void navi10_ih_decode_iv(struct amdgpu_device *adev,
257				struct amdgpu_ih_ring *ih,
258				struct amdgpu_iv_entry *entry)
259{
260	/* wptr/rptr are in bytes! */
261	u32 ring_index = ih->rptr >> 2;
262	uint32_t dw[8];
263
264	dw[0] = le32_to_cpu(ih->ring[ring_index + 0]);
265	dw[1] = le32_to_cpu(ih->ring[ring_index + 1]);
266	dw[2] = le32_to_cpu(ih->ring[ring_index + 2]);
267	dw[3] = le32_to_cpu(ih->ring[ring_index + 3]);
268	dw[4] = le32_to_cpu(ih->ring[ring_index + 4]);
269	dw[5] = le32_to_cpu(ih->ring[ring_index + 5]);
270	dw[6] = le32_to_cpu(ih->ring[ring_index + 6]);
271	dw[7] = le32_to_cpu(ih->ring[ring_index + 7]);
272
273	entry->client_id = dw[0] & 0xff;
274	entry->src_id = (dw[0] >> 8) & 0xff;
275	entry->ring_id = (dw[0] >> 16) & 0xff;
276	entry->vmid = (dw[0] >> 24) & 0xf;
277	entry->vmid_src = (dw[0] >> 31);
278	entry->timestamp = dw[1] | ((u64)(dw[2] & 0xffff) << 32);
279	entry->timestamp_src = dw[2] >> 31;
280	entry->pasid = dw[3] & 0xffff;
281	entry->pasid_src = dw[3] >> 31;
282	entry->src_data[0] = dw[4];
283	entry->src_data[1] = dw[5];
284	entry->src_data[2] = dw[6];
285	entry->src_data[3] = dw[7];
286
287	/* wptr/rptr are in bytes! */
288	ih->rptr += 32;
289}
290
291/**
292 * navi10_ih_set_rptr - set the IH ring buffer rptr
293 *
294 * @adev: amdgpu_device pointer
295 *
296 * Set the IH ring buffer rptr.
297 */
298static void navi10_ih_set_rptr(struct amdgpu_device *adev,
299			       struct amdgpu_ih_ring *ih)
300{
301	if (ih->use_doorbell) {
302		/* XXX check if swapping is necessary on BE */
303		*ih->rptr_cpu = ih->rptr;
304		WDOORBELL32(ih->doorbell_index, ih->rptr);
305	} else
306		WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR, ih->rptr);
307}
308
309static int navi10_ih_early_init(void *handle)
310{
311	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
312
313	navi10_ih_set_interrupt_funcs(adev);
314	return 0;
315}
316
317static int navi10_ih_sw_init(void *handle)
318{
319	int r;
320	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
321	bool use_bus_addr;
322
323	/* use gpu virtual address for ih ring
324	 * until ih_checken is programmed to allow
325	 * use bus address for ih ring by psp bl */
326	use_bus_addr =
327		(adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) ? false : true;
328	r = amdgpu_ih_ring_init(adev, &adev->irq.ih, 256 * 1024, use_bus_addr);
329	if (r)
330		return r;
331
332	adev->irq.ih.use_doorbell = true;
333	adev->irq.ih.doorbell_index = adev->doorbell_index.ih << 1;
334
335	r = amdgpu_irq_init(adev);
336
337	return r;
338}
339
340static int navi10_ih_sw_fini(void *handle)
341{
342	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
343
344	amdgpu_irq_fini(adev);
345	amdgpu_ih_ring_fini(adev, &adev->irq.ih);
346
347	return 0;
348}
349
350static int navi10_ih_hw_init(void *handle)
351{
352	int r;
353	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
354
355	r = navi10_ih_irq_init(adev);
356	if (r)
357		return r;
358
359	return 0;
360}
361
362static int navi10_ih_hw_fini(void *handle)
363{
364	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
365
366	navi10_ih_irq_disable(adev);
367
368	return 0;
369}
370
371static int navi10_ih_suspend(void *handle)
372{
373	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
374
375	return navi10_ih_hw_fini(adev);
376}
377
378static int navi10_ih_resume(void *handle)
379{
380	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
381
382	return navi10_ih_hw_init(adev);
383}
384
385static bool navi10_ih_is_idle(void *handle)
386{
387	/* todo */
388	return true;
389}
390
391static int navi10_ih_wait_for_idle(void *handle)
392{
393	/* todo */
394	return -ETIMEDOUT;
395}
396
397static int navi10_ih_soft_reset(void *handle)
398{
399	/* todo */
400	return 0;
401}
402
403static void navi10_ih_update_clockgating_state(struct amdgpu_device *adev,
404					       bool enable)
405{
406	uint32_t data, def, field_val;
407
408	if (adev->cg_flags & AMD_CG_SUPPORT_IH_CG) {
409		def = data = RREG32_SOC15(OSSSYS, 0, mmIH_CLK_CTRL);
410		field_val = enable ? 0 : 1;
411		data = REG_SET_FIELD(data, IH_CLK_CTRL,
412				     DBUS_MUX_CLK_SOFT_OVERRIDE, field_val);
413		data = REG_SET_FIELD(data, IH_CLK_CTRL,
414				     OSSSYS_SHARE_CLK_SOFT_OVERRIDE, field_val);
415		data = REG_SET_FIELD(data, IH_CLK_CTRL,
416				     LIMIT_SMN_CLK_SOFT_OVERRIDE, field_val);
417		data = REG_SET_FIELD(data, IH_CLK_CTRL,
418				     DYN_CLK_SOFT_OVERRIDE, field_val);
419		data = REG_SET_FIELD(data, IH_CLK_CTRL,
420				     REG_CLK_SOFT_OVERRIDE, field_val);
421		if (def != data)
422			WREG32_SOC15(OSSSYS, 0, mmIH_CLK_CTRL, data);
423	}
424
425	return;
426}
427
428static int navi10_ih_set_clockgating_state(void *handle,
429					   enum amd_clockgating_state state)
430{
431	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
432
433	navi10_ih_update_clockgating_state(adev,
434				state == AMD_CG_STATE_GATE);
435	return 0;
436}
437
438static int navi10_ih_set_powergating_state(void *handle,
439					   enum amd_powergating_state state)
440{
441	return 0;
442}
443
444static void navi10_ih_get_clockgating_state(void *handle, u32 *flags)
445{
446	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
447
448	if (!RREG32_SOC15(OSSSYS, 0, mmIH_CLK_CTRL))
449		*flags |= AMD_CG_SUPPORT_IH_CG;
450
451	return;
452}
453
454static const struct amd_ip_funcs navi10_ih_ip_funcs = {
455	.name = "navi10_ih",
456	.early_init = navi10_ih_early_init,
457	.late_init = NULL,
458	.sw_init = navi10_ih_sw_init,
459	.sw_fini = navi10_ih_sw_fini,
460	.hw_init = navi10_ih_hw_init,
461	.hw_fini = navi10_ih_hw_fini,
462	.suspend = navi10_ih_suspend,
463	.resume = navi10_ih_resume,
464	.is_idle = navi10_ih_is_idle,
465	.wait_for_idle = navi10_ih_wait_for_idle,
466	.soft_reset = navi10_ih_soft_reset,
467	.set_clockgating_state = navi10_ih_set_clockgating_state,
468	.set_powergating_state = navi10_ih_set_powergating_state,
469	.get_clockgating_state = navi10_ih_get_clockgating_state,
470};
471
472static const struct amdgpu_ih_funcs navi10_ih_funcs = {
473	.get_wptr = navi10_ih_get_wptr,
474	.decode_iv = navi10_ih_decode_iv,
475	.set_rptr = navi10_ih_set_rptr
476};
477
478static void navi10_ih_set_interrupt_funcs(struct amdgpu_device *adev)
479{
480	if (adev->irq.ih_funcs == NULL)
481		adev->irq.ih_funcs = &navi10_ih_funcs;
482}
483
484const struct amdgpu_ip_block_version navi10_ih_ip_block =
485{
486	.type = AMD_IP_BLOCK_TYPE_IH,
487	.major = 5,
488	.minor = 0,
489	.rev = 0,
490	.funcs = &navi10_ih_ip_funcs,
491};
492