1/*
2 * Copyright 2012 Advanced Micro Devices, Inc.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
21 *
22 */
23
24#include <linux/math64.h>
25#include <linux/pci.h>
26#include <linux/seq_file.h>
27
28#include "atom.h"
29#include "evergreen.h"
30#include "ni_dpm.h"
31#include "nid.h"
32#include "r600_dpm.h"
33#include "rv770.h"
34#include "radeon.h"
35#include "radeon_asic.h"
36
37#define MC_CG_ARB_FREQ_F0           0x0a
38#define MC_CG_ARB_FREQ_F1           0x0b
39#define MC_CG_ARB_FREQ_F2           0x0c
40#define MC_CG_ARB_FREQ_F3           0x0d
41
42#define SMC_RAM_END 0xC000
43
44static const struct ni_cac_weights cac_weights_cayman_xt =
45{
46	0x15,
47	0x2,
48	0x19,
49	0x2,
50	0x8,
51	0x14,
52	0x2,
53	0x16,
54	0xE,
55	0x17,
56	0x13,
57	0x2B,
58	0x10,
59	0x7,
60	0x5,
61	0x5,
62	0x5,
63	0x2,
64	0x3,
65	0x9,
66	0x10,
67	0x10,
68	0x2B,
69	0xA,
70	0x9,
71	0x4,
72	0xD,
73	0xD,
74	0x3E,
75	0x18,
76	0x14,
77	0,
78	0x3,
79	0x3,
80	0x5,
81	0,
82	0x2,
83	0,
84	0,
85	0,
86	0,
87	0,
88	0,
89	0,
90	0,
91	0,
92	0x1CC,
93	0,
94	0x164,
95	1,
96	1,
97	1,
98	1,
99	12,
100	12,
101	12,
102	0x12,
103	0x1F,
104	132,
105	5,
106	7,
107	0,
108	{ 0, 0, 0, 0, 0, 0, 0, 0 },
109	{ 0, 0, 0, 0 },
110	true
111};
112
113static const struct ni_cac_weights cac_weights_cayman_pro =
114{
115	0x16,
116	0x4,
117	0x10,
118	0x2,
119	0xA,
120	0x16,
121	0x2,
122	0x18,
123	0x10,
124	0x1A,
125	0x16,
126	0x2D,
127	0x12,
128	0xA,
129	0x6,
130	0x6,
131	0x6,
132	0x2,
133	0x4,
134	0xB,
135	0x11,
136	0x11,
137	0x2D,
138	0xC,
139	0xC,
140	0x7,
141	0x10,
142	0x10,
143	0x3F,
144	0x1A,
145	0x16,
146	0,
147	0x7,
148	0x4,
149	0x6,
150	1,
151	0x2,
152	0x1,
153	0,
154	0,
155	0,
156	0,
157	0,
158	0,
159	0x30,
160	0,
161	0x1CF,
162	0,
163	0x166,
164	1,
165	1,
166	1,
167	1,
168	12,
169	12,
170	12,
171	0x15,
172	0x1F,
173	132,
174	6,
175	6,
176	0,
177	{ 0, 0, 0, 0, 0, 0, 0, 0 },
178	{ 0, 0, 0, 0 },
179	true
180};
181
182static const struct ni_cac_weights cac_weights_cayman_le =
183{
184	0x7,
185	0xE,
186	0x1,
187	0xA,
188	0x1,
189	0x3F,
190	0x2,
191	0x18,
192	0x10,
193	0x1A,
194	0x1,
195	0x3F,
196	0x1,
197	0xE,
198	0x6,
199	0x6,
200	0x6,
201	0x2,
202	0x4,
203	0x9,
204	0x1A,
205	0x1A,
206	0x2C,
207	0xA,
208	0x11,
209	0x8,
210	0x19,
211	0x19,
212	0x1,
213	0x1,
214	0x1A,
215	0,
216	0x8,
217	0x5,
218	0x8,
219	0x1,
220	0x3,
221	0x1,
222	0,
223	0,
224	0,
225	0,
226	0,
227	0,
228	0x38,
229	0x38,
230	0x239,
231	0x3,
232	0x18A,
233	1,
234	1,
235	1,
236	1,
237	12,
238	12,
239	12,
240	0x15,
241	0x22,
242	132,
243	6,
244	6,
245	0,
246	{ 0, 0, 0, 0, 0, 0, 0, 0 },
247	{ 0, 0, 0, 0 },
248	true
249};
250
251#define NISLANDS_MGCG_SEQUENCE  300
252
253static const u32 cayman_cgcg_cgls_default[] =
254{
255	0x000008f8, 0x00000010, 0xffffffff,
256	0x000008fc, 0x00000000, 0xffffffff,
257	0x000008f8, 0x00000011, 0xffffffff,
258	0x000008fc, 0x00000000, 0xffffffff,
259	0x000008f8, 0x00000012, 0xffffffff,
260	0x000008fc, 0x00000000, 0xffffffff,
261	0x000008f8, 0x00000013, 0xffffffff,
262	0x000008fc, 0x00000000, 0xffffffff,
263	0x000008f8, 0x00000014, 0xffffffff,
264	0x000008fc, 0x00000000, 0xffffffff,
265	0x000008f8, 0x00000015, 0xffffffff,
266	0x000008fc, 0x00000000, 0xffffffff,
267	0x000008f8, 0x00000016, 0xffffffff,
268	0x000008fc, 0x00000000, 0xffffffff,
269	0x000008f8, 0x00000017, 0xffffffff,
270	0x000008fc, 0x00000000, 0xffffffff,
271	0x000008f8, 0x00000018, 0xffffffff,
272	0x000008fc, 0x00000000, 0xffffffff,
273	0x000008f8, 0x00000019, 0xffffffff,
274	0x000008fc, 0x00000000, 0xffffffff,
275	0x000008f8, 0x0000001a, 0xffffffff,
276	0x000008fc, 0x00000000, 0xffffffff,
277	0x000008f8, 0x0000001b, 0xffffffff,
278	0x000008fc, 0x00000000, 0xffffffff,
279	0x000008f8, 0x00000020, 0xffffffff,
280	0x000008fc, 0x00000000, 0xffffffff,
281	0x000008f8, 0x00000021, 0xffffffff,
282	0x000008fc, 0x00000000, 0xffffffff,
283	0x000008f8, 0x00000022, 0xffffffff,
284	0x000008fc, 0x00000000, 0xffffffff,
285	0x000008f8, 0x00000023, 0xffffffff,
286	0x000008fc, 0x00000000, 0xffffffff,
287	0x000008f8, 0x00000024, 0xffffffff,
288	0x000008fc, 0x00000000, 0xffffffff,
289	0x000008f8, 0x00000025, 0xffffffff,
290	0x000008fc, 0x00000000, 0xffffffff,
291	0x000008f8, 0x00000026, 0xffffffff,
292	0x000008fc, 0x00000000, 0xffffffff,
293	0x000008f8, 0x00000027, 0xffffffff,
294	0x000008fc, 0x00000000, 0xffffffff,
295	0x000008f8, 0x00000028, 0xffffffff,
296	0x000008fc, 0x00000000, 0xffffffff,
297	0x000008f8, 0x00000029, 0xffffffff,
298	0x000008fc, 0x00000000, 0xffffffff,
299	0x000008f8, 0x0000002a, 0xffffffff,
300	0x000008fc, 0x00000000, 0xffffffff,
301	0x000008f8, 0x0000002b, 0xffffffff,
302	0x000008fc, 0x00000000, 0xffffffff
303};
304#define CAYMAN_CGCG_CGLS_DEFAULT_LENGTH sizeof(cayman_cgcg_cgls_default) / (3 * sizeof(u32))
305
306static const u32 cayman_cgcg_cgls_disable[] =
307{
308	0x000008f8, 0x00000010, 0xffffffff,
309	0x000008fc, 0xffffffff, 0xffffffff,
310	0x000008f8, 0x00000011, 0xffffffff,
311	0x000008fc, 0xffffffff, 0xffffffff,
312	0x000008f8, 0x00000012, 0xffffffff,
313	0x000008fc, 0xffffffff, 0xffffffff,
314	0x000008f8, 0x00000013, 0xffffffff,
315	0x000008fc, 0xffffffff, 0xffffffff,
316	0x000008f8, 0x00000014, 0xffffffff,
317	0x000008fc, 0xffffffff, 0xffffffff,
318	0x000008f8, 0x00000015, 0xffffffff,
319	0x000008fc, 0xffffffff, 0xffffffff,
320	0x000008f8, 0x00000016, 0xffffffff,
321	0x000008fc, 0xffffffff, 0xffffffff,
322	0x000008f8, 0x00000017, 0xffffffff,
323	0x000008fc, 0xffffffff, 0xffffffff,
324	0x000008f8, 0x00000018, 0xffffffff,
325	0x000008fc, 0xffffffff, 0xffffffff,
326	0x000008f8, 0x00000019, 0xffffffff,
327	0x000008fc, 0xffffffff, 0xffffffff,
328	0x000008f8, 0x0000001a, 0xffffffff,
329	0x000008fc, 0xffffffff, 0xffffffff,
330	0x000008f8, 0x0000001b, 0xffffffff,
331	0x000008fc, 0xffffffff, 0xffffffff,
332	0x000008f8, 0x00000020, 0xffffffff,
333	0x000008fc, 0x00000000, 0xffffffff,
334	0x000008f8, 0x00000021, 0xffffffff,
335	0x000008fc, 0x00000000, 0xffffffff,
336	0x000008f8, 0x00000022, 0xffffffff,
337	0x000008fc, 0x00000000, 0xffffffff,
338	0x000008f8, 0x00000023, 0xffffffff,
339	0x000008fc, 0x00000000, 0xffffffff,
340	0x000008f8, 0x00000024, 0xffffffff,
341	0x000008fc, 0x00000000, 0xffffffff,
342	0x000008f8, 0x00000025, 0xffffffff,
343	0x000008fc, 0x00000000, 0xffffffff,
344	0x000008f8, 0x00000026, 0xffffffff,
345	0x000008fc, 0x00000000, 0xffffffff,
346	0x000008f8, 0x00000027, 0xffffffff,
347	0x000008fc, 0x00000000, 0xffffffff,
348	0x000008f8, 0x00000028, 0xffffffff,
349	0x000008fc, 0x00000000, 0xffffffff,
350	0x000008f8, 0x00000029, 0xffffffff,
351	0x000008fc, 0x00000000, 0xffffffff,
352	0x000008f8, 0x0000002a, 0xffffffff,
353	0x000008fc, 0x00000000, 0xffffffff,
354	0x000008f8, 0x0000002b, 0xffffffff,
355	0x000008fc, 0x00000000, 0xffffffff,
356	0x00000644, 0x000f7902, 0x001f4180,
357	0x00000644, 0x000f3802, 0x001f4180
358};
359#define CAYMAN_CGCG_CGLS_DISABLE_LENGTH sizeof(cayman_cgcg_cgls_disable) / (3 * sizeof(u32))
360
361static const u32 cayman_cgcg_cgls_enable[] =
362{
363	0x00000644, 0x000f7882, 0x001f4080,
364	0x000008f8, 0x00000010, 0xffffffff,
365	0x000008fc, 0x00000000, 0xffffffff,
366	0x000008f8, 0x00000011, 0xffffffff,
367	0x000008fc, 0x00000000, 0xffffffff,
368	0x000008f8, 0x00000012, 0xffffffff,
369	0x000008fc, 0x00000000, 0xffffffff,
370	0x000008f8, 0x00000013, 0xffffffff,
371	0x000008fc, 0x00000000, 0xffffffff,
372	0x000008f8, 0x00000014, 0xffffffff,
373	0x000008fc, 0x00000000, 0xffffffff,
374	0x000008f8, 0x00000015, 0xffffffff,
375	0x000008fc, 0x00000000, 0xffffffff,
376	0x000008f8, 0x00000016, 0xffffffff,
377	0x000008fc, 0x00000000, 0xffffffff,
378	0x000008f8, 0x00000017, 0xffffffff,
379	0x000008fc, 0x00000000, 0xffffffff,
380	0x000008f8, 0x00000018, 0xffffffff,
381	0x000008fc, 0x00000000, 0xffffffff,
382	0x000008f8, 0x00000019, 0xffffffff,
383	0x000008fc, 0x00000000, 0xffffffff,
384	0x000008f8, 0x0000001a, 0xffffffff,
385	0x000008fc, 0x00000000, 0xffffffff,
386	0x000008f8, 0x0000001b, 0xffffffff,
387	0x000008fc, 0x00000000, 0xffffffff,
388	0x000008f8, 0x00000020, 0xffffffff,
389	0x000008fc, 0xffffffff, 0xffffffff,
390	0x000008f8, 0x00000021, 0xffffffff,
391	0x000008fc, 0xffffffff, 0xffffffff,
392	0x000008f8, 0x00000022, 0xffffffff,
393	0x000008fc, 0xffffffff, 0xffffffff,
394	0x000008f8, 0x00000023, 0xffffffff,
395	0x000008fc, 0xffffffff, 0xffffffff,
396	0x000008f8, 0x00000024, 0xffffffff,
397	0x000008fc, 0xffffffff, 0xffffffff,
398	0x000008f8, 0x00000025, 0xffffffff,
399	0x000008fc, 0xffffffff, 0xffffffff,
400	0x000008f8, 0x00000026, 0xffffffff,
401	0x000008fc, 0xffffffff, 0xffffffff,
402	0x000008f8, 0x00000027, 0xffffffff,
403	0x000008fc, 0xffffffff, 0xffffffff,
404	0x000008f8, 0x00000028, 0xffffffff,
405	0x000008fc, 0xffffffff, 0xffffffff,
406	0x000008f8, 0x00000029, 0xffffffff,
407	0x000008fc, 0xffffffff, 0xffffffff,
408	0x000008f8, 0x0000002a, 0xffffffff,
409	0x000008fc, 0xffffffff, 0xffffffff,
410	0x000008f8, 0x0000002b, 0xffffffff,
411	0x000008fc, 0xffffffff, 0xffffffff
412};
413#define CAYMAN_CGCG_CGLS_ENABLE_LENGTH  sizeof(cayman_cgcg_cgls_enable) / (3 * sizeof(u32))
414
415static const u32 cayman_mgcg_default[] =
416{
417	0x0000802c, 0xc0000000, 0xffffffff,
418	0x00003fc4, 0xc0000000, 0xffffffff,
419	0x00005448, 0x00000100, 0xffffffff,
420	0x000055e4, 0x00000100, 0xffffffff,
421	0x0000160c, 0x00000100, 0xffffffff,
422	0x00008984, 0x06000100, 0xffffffff,
423	0x0000c164, 0x00000100, 0xffffffff,
424	0x00008a18, 0x00000100, 0xffffffff,
425	0x0000897c, 0x06000100, 0xffffffff,
426	0x00008b28, 0x00000100, 0xffffffff,
427	0x00009144, 0x00800200, 0xffffffff,
428	0x00009a60, 0x00000100, 0xffffffff,
429	0x00009868, 0x00000100, 0xffffffff,
430	0x00008d58, 0x00000100, 0xffffffff,
431	0x00009510, 0x00000100, 0xffffffff,
432	0x0000949c, 0x00000100, 0xffffffff,
433	0x00009654, 0x00000100, 0xffffffff,
434	0x00009030, 0x00000100, 0xffffffff,
435	0x00009034, 0x00000100, 0xffffffff,
436	0x00009038, 0x00000100, 0xffffffff,
437	0x0000903c, 0x00000100, 0xffffffff,
438	0x00009040, 0x00000100, 0xffffffff,
439	0x0000a200, 0x00000100, 0xffffffff,
440	0x0000a204, 0x00000100, 0xffffffff,
441	0x0000a208, 0x00000100, 0xffffffff,
442	0x0000a20c, 0x00000100, 0xffffffff,
443	0x00009744, 0x00000100, 0xffffffff,
444	0x00003f80, 0x00000100, 0xffffffff,
445	0x0000a210, 0x00000100, 0xffffffff,
446	0x0000a214, 0x00000100, 0xffffffff,
447	0x000004d8, 0x00000100, 0xffffffff,
448	0x00009664, 0x00000100, 0xffffffff,
449	0x00009698, 0x00000100, 0xffffffff,
450	0x000004d4, 0x00000200, 0xffffffff,
451	0x000004d0, 0x00000000, 0xffffffff,
452	0x000030cc, 0x00000104, 0xffffffff,
453	0x0000d0c0, 0x00000100, 0xffffffff,
454	0x0000d8c0, 0x00000100, 0xffffffff,
455	0x0000802c, 0x40000000, 0xffffffff,
456	0x00003fc4, 0x40000000, 0xffffffff,
457	0x0000915c, 0x00010000, 0xffffffff,
458	0x00009160, 0x00030002, 0xffffffff,
459	0x00009164, 0x00050004, 0xffffffff,
460	0x00009168, 0x00070006, 0xffffffff,
461	0x00009178, 0x00070000, 0xffffffff,
462	0x0000917c, 0x00030002, 0xffffffff,
463	0x00009180, 0x00050004, 0xffffffff,
464	0x0000918c, 0x00010006, 0xffffffff,
465	0x00009190, 0x00090008, 0xffffffff,
466	0x00009194, 0x00070000, 0xffffffff,
467	0x00009198, 0x00030002, 0xffffffff,
468	0x0000919c, 0x00050004, 0xffffffff,
469	0x000091a8, 0x00010006, 0xffffffff,
470	0x000091ac, 0x00090008, 0xffffffff,
471	0x000091b0, 0x00070000, 0xffffffff,
472	0x000091b4, 0x00030002, 0xffffffff,
473	0x000091b8, 0x00050004, 0xffffffff,
474	0x000091c4, 0x00010006, 0xffffffff,
475	0x000091c8, 0x00090008, 0xffffffff,
476	0x000091cc, 0x00070000, 0xffffffff,
477	0x000091d0, 0x00030002, 0xffffffff,
478	0x000091d4, 0x00050004, 0xffffffff,
479	0x000091e0, 0x00010006, 0xffffffff,
480	0x000091e4, 0x00090008, 0xffffffff,
481	0x000091e8, 0x00000000, 0xffffffff,
482	0x000091ec, 0x00070000, 0xffffffff,
483	0x000091f0, 0x00030002, 0xffffffff,
484	0x000091f4, 0x00050004, 0xffffffff,
485	0x00009200, 0x00010006, 0xffffffff,
486	0x00009204, 0x00090008, 0xffffffff,
487	0x00009208, 0x00070000, 0xffffffff,
488	0x0000920c, 0x00030002, 0xffffffff,
489	0x00009210, 0x00050004, 0xffffffff,
490	0x0000921c, 0x00010006, 0xffffffff,
491	0x00009220, 0x00090008, 0xffffffff,
492	0x00009224, 0x00070000, 0xffffffff,
493	0x00009228, 0x00030002, 0xffffffff,
494	0x0000922c, 0x00050004, 0xffffffff,
495	0x00009238, 0x00010006, 0xffffffff,
496	0x0000923c, 0x00090008, 0xffffffff,
497	0x00009240, 0x00070000, 0xffffffff,
498	0x00009244, 0x00030002, 0xffffffff,
499	0x00009248, 0x00050004, 0xffffffff,
500	0x00009254, 0x00010006, 0xffffffff,
501	0x00009258, 0x00090008, 0xffffffff,
502	0x0000925c, 0x00070000, 0xffffffff,
503	0x00009260, 0x00030002, 0xffffffff,
504	0x00009264, 0x00050004, 0xffffffff,
505	0x00009270, 0x00010006, 0xffffffff,
506	0x00009274, 0x00090008, 0xffffffff,
507	0x00009278, 0x00070000, 0xffffffff,
508	0x0000927c, 0x00030002, 0xffffffff,
509	0x00009280, 0x00050004, 0xffffffff,
510	0x0000928c, 0x00010006, 0xffffffff,
511	0x00009290, 0x00090008, 0xffffffff,
512	0x000092a8, 0x00070000, 0xffffffff,
513	0x000092ac, 0x00030002, 0xffffffff,
514	0x000092b0, 0x00050004, 0xffffffff,
515	0x000092bc, 0x00010006, 0xffffffff,
516	0x000092c0, 0x00090008, 0xffffffff,
517	0x000092c4, 0x00070000, 0xffffffff,
518	0x000092c8, 0x00030002, 0xffffffff,
519	0x000092cc, 0x00050004, 0xffffffff,
520	0x000092d8, 0x00010006, 0xffffffff,
521	0x000092dc, 0x00090008, 0xffffffff,
522	0x00009294, 0x00000000, 0xffffffff,
523	0x0000802c, 0x40010000, 0xffffffff,
524	0x00003fc4, 0x40010000, 0xffffffff,
525	0x0000915c, 0x00010000, 0xffffffff,
526	0x00009160, 0x00030002, 0xffffffff,
527	0x00009164, 0x00050004, 0xffffffff,
528	0x00009168, 0x00070006, 0xffffffff,
529	0x00009178, 0x00070000, 0xffffffff,
530	0x0000917c, 0x00030002, 0xffffffff,
531	0x00009180, 0x00050004, 0xffffffff,
532	0x0000918c, 0x00010006, 0xffffffff,
533	0x00009190, 0x00090008, 0xffffffff,
534	0x00009194, 0x00070000, 0xffffffff,
535	0x00009198, 0x00030002, 0xffffffff,
536	0x0000919c, 0x00050004, 0xffffffff,
537	0x000091a8, 0x00010006, 0xffffffff,
538	0x000091ac, 0x00090008, 0xffffffff,
539	0x000091b0, 0x00070000, 0xffffffff,
540	0x000091b4, 0x00030002, 0xffffffff,
541	0x000091b8, 0x00050004, 0xffffffff,
542	0x000091c4, 0x00010006, 0xffffffff,
543	0x000091c8, 0x00090008, 0xffffffff,
544	0x000091cc, 0x00070000, 0xffffffff,
545	0x000091d0, 0x00030002, 0xffffffff,
546	0x000091d4, 0x00050004, 0xffffffff,
547	0x000091e0, 0x00010006, 0xffffffff,
548	0x000091e4, 0x00090008, 0xffffffff,
549	0x000091e8, 0x00000000, 0xffffffff,
550	0x000091ec, 0x00070000, 0xffffffff,
551	0x000091f0, 0x00030002, 0xffffffff,
552	0x000091f4, 0x00050004, 0xffffffff,
553	0x00009200, 0x00010006, 0xffffffff,
554	0x00009204, 0x00090008, 0xffffffff,
555	0x00009208, 0x00070000, 0xffffffff,
556	0x0000920c, 0x00030002, 0xffffffff,
557	0x00009210, 0x00050004, 0xffffffff,
558	0x0000921c, 0x00010006, 0xffffffff,
559	0x00009220, 0x00090008, 0xffffffff,
560	0x00009224, 0x00070000, 0xffffffff,
561	0x00009228, 0x00030002, 0xffffffff,
562	0x0000922c, 0x00050004, 0xffffffff,
563	0x00009238, 0x00010006, 0xffffffff,
564	0x0000923c, 0x00090008, 0xffffffff,
565	0x00009240, 0x00070000, 0xffffffff,
566	0x00009244, 0x00030002, 0xffffffff,
567	0x00009248, 0x00050004, 0xffffffff,
568	0x00009254, 0x00010006, 0xffffffff,
569	0x00009258, 0x00090008, 0xffffffff,
570	0x0000925c, 0x00070000, 0xffffffff,
571	0x00009260, 0x00030002, 0xffffffff,
572	0x00009264, 0x00050004, 0xffffffff,
573	0x00009270, 0x00010006, 0xffffffff,
574	0x00009274, 0x00090008, 0xffffffff,
575	0x00009278, 0x00070000, 0xffffffff,
576	0x0000927c, 0x00030002, 0xffffffff,
577	0x00009280, 0x00050004, 0xffffffff,
578	0x0000928c, 0x00010006, 0xffffffff,
579	0x00009290, 0x00090008, 0xffffffff,
580	0x000092a8, 0x00070000, 0xffffffff,
581	0x000092ac, 0x00030002, 0xffffffff,
582	0x000092b0, 0x00050004, 0xffffffff,
583	0x000092bc, 0x00010006, 0xffffffff,
584	0x000092c0, 0x00090008, 0xffffffff,
585	0x000092c4, 0x00070000, 0xffffffff,
586	0x000092c8, 0x00030002, 0xffffffff,
587	0x000092cc, 0x00050004, 0xffffffff,
588	0x000092d8, 0x00010006, 0xffffffff,
589	0x000092dc, 0x00090008, 0xffffffff,
590	0x00009294, 0x00000000, 0xffffffff,
591	0x0000802c, 0xc0000000, 0xffffffff,
592	0x00003fc4, 0xc0000000, 0xffffffff,
593	0x000008f8, 0x00000010, 0xffffffff,
594	0x000008fc, 0x00000000, 0xffffffff,
595	0x000008f8, 0x00000011, 0xffffffff,
596	0x000008fc, 0x00000000, 0xffffffff,
597	0x000008f8, 0x00000012, 0xffffffff,
598	0x000008fc, 0x00000000, 0xffffffff,
599	0x000008f8, 0x00000013, 0xffffffff,
600	0x000008fc, 0x00000000, 0xffffffff,
601	0x000008f8, 0x00000014, 0xffffffff,
602	0x000008fc, 0x00000000, 0xffffffff,
603	0x000008f8, 0x00000015, 0xffffffff,
604	0x000008fc, 0x00000000, 0xffffffff,
605	0x000008f8, 0x00000016, 0xffffffff,
606	0x000008fc, 0x00000000, 0xffffffff,
607	0x000008f8, 0x00000017, 0xffffffff,
608	0x000008fc, 0x00000000, 0xffffffff,
609	0x000008f8, 0x00000018, 0xffffffff,
610	0x000008fc, 0x00000000, 0xffffffff,
611	0x000008f8, 0x00000019, 0xffffffff,
612	0x000008fc, 0x00000000, 0xffffffff,
613	0x000008f8, 0x0000001a, 0xffffffff,
614	0x000008fc, 0x00000000, 0xffffffff,
615	0x000008f8, 0x0000001b, 0xffffffff,
616	0x000008fc, 0x00000000, 0xffffffff
617};
618#define CAYMAN_MGCG_DEFAULT_LENGTH sizeof(cayman_mgcg_default) / (3 * sizeof(u32))
619
620static const u32 cayman_mgcg_disable[] =
621{
622	0x0000802c, 0xc0000000, 0xffffffff,
623	0x000008f8, 0x00000000, 0xffffffff,
624	0x000008fc, 0xffffffff, 0xffffffff,
625	0x000008f8, 0x00000001, 0xffffffff,
626	0x000008fc, 0xffffffff, 0xffffffff,
627	0x000008f8, 0x00000002, 0xffffffff,
628	0x000008fc, 0xffffffff, 0xffffffff,
629	0x000008f8, 0x00000003, 0xffffffff,
630	0x000008fc, 0xffffffff, 0xffffffff,
631	0x00009150, 0x00600000, 0xffffffff
632};
633#define CAYMAN_MGCG_DISABLE_LENGTH   sizeof(cayman_mgcg_disable) / (3 * sizeof(u32))
634
635static const u32 cayman_mgcg_enable[] =
636{
637	0x0000802c, 0xc0000000, 0xffffffff,
638	0x000008f8, 0x00000000, 0xffffffff,
639	0x000008fc, 0x00000000, 0xffffffff,
640	0x000008f8, 0x00000001, 0xffffffff,
641	0x000008fc, 0x00000000, 0xffffffff,
642	0x000008f8, 0x00000002, 0xffffffff,
643	0x000008fc, 0x00600000, 0xffffffff,
644	0x000008f8, 0x00000003, 0xffffffff,
645	0x000008fc, 0x00000000, 0xffffffff,
646	0x00009150, 0x96944200, 0xffffffff
647};
648
649#define CAYMAN_MGCG_ENABLE_LENGTH   sizeof(cayman_mgcg_enable) / (3 * sizeof(u32))
650
651#define NISLANDS_SYSLS_SEQUENCE  100
652
653static const u32 cayman_sysls_default[] =
654{
655	/* Register,   Value,     Mask bits */
656	0x000055e8, 0x00000000, 0xffffffff,
657	0x0000d0bc, 0x00000000, 0xffffffff,
658	0x0000d8bc, 0x00000000, 0xffffffff,
659	0x000015c0, 0x000c1401, 0xffffffff,
660	0x0000264c, 0x000c0400, 0xffffffff,
661	0x00002648, 0x000c0400, 0xffffffff,
662	0x00002650, 0x000c0400, 0xffffffff,
663	0x000020b8, 0x000c0400, 0xffffffff,
664	0x000020bc, 0x000c0400, 0xffffffff,
665	0x000020c0, 0x000c0c80, 0xffffffff,
666	0x0000f4a0, 0x000000c0, 0xffffffff,
667	0x0000f4a4, 0x00680fff, 0xffffffff,
668	0x00002f50, 0x00000404, 0xffffffff,
669	0x000004c8, 0x00000001, 0xffffffff,
670	0x000064ec, 0x00000000, 0xffffffff,
671	0x00000c7c, 0x00000000, 0xffffffff,
672	0x00008dfc, 0x00000000, 0xffffffff
673};
674#define CAYMAN_SYSLS_DEFAULT_LENGTH sizeof(cayman_sysls_default) / (3 * sizeof(u32))
675
676static const u32 cayman_sysls_disable[] =
677{
678	/* Register,   Value,     Mask bits */
679	0x0000d0c0, 0x00000000, 0xffffffff,
680	0x0000d8c0, 0x00000000, 0xffffffff,
681	0x000055e8, 0x00000000, 0xffffffff,
682	0x0000d0bc, 0x00000000, 0xffffffff,
683	0x0000d8bc, 0x00000000, 0xffffffff,
684	0x000015c0, 0x00041401, 0xffffffff,
685	0x0000264c, 0x00040400, 0xffffffff,
686	0x00002648, 0x00040400, 0xffffffff,
687	0x00002650, 0x00040400, 0xffffffff,
688	0x000020b8, 0x00040400, 0xffffffff,
689	0x000020bc, 0x00040400, 0xffffffff,
690	0x000020c0, 0x00040c80, 0xffffffff,
691	0x0000f4a0, 0x000000c0, 0xffffffff,
692	0x0000f4a4, 0x00680000, 0xffffffff,
693	0x00002f50, 0x00000404, 0xffffffff,
694	0x000004c8, 0x00000001, 0xffffffff,
695	0x000064ec, 0x00007ffd, 0xffffffff,
696	0x00000c7c, 0x0000ff00, 0xffffffff,
697	0x00008dfc, 0x0000007f, 0xffffffff
698};
699#define CAYMAN_SYSLS_DISABLE_LENGTH sizeof(cayman_sysls_disable) / (3 * sizeof(u32))
700
701static const u32 cayman_sysls_enable[] =
702{
703	/* Register,   Value,     Mask bits */
704	0x000055e8, 0x00000001, 0xffffffff,
705	0x0000d0bc, 0x00000100, 0xffffffff,
706	0x0000d8bc, 0x00000100, 0xffffffff,
707	0x000015c0, 0x000c1401, 0xffffffff,
708	0x0000264c, 0x000c0400, 0xffffffff,
709	0x00002648, 0x000c0400, 0xffffffff,
710	0x00002650, 0x000c0400, 0xffffffff,
711	0x000020b8, 0x000c0400, 0xffffffff,
712	0x000020bc, 0x000c0400, 0xffffffff,
713	0x000020c0, 0x000c0c80, 0xffffffff,
714	0x0000f4a0, 0x000000c0, 0xffffffff,
715	0x0000f4a4, 0x00680fff, 0xffffffff,
716	0x00002f50, 0x00000903, 0xffffffff,
717	0x000004c8, 0x00000000, 0xffffffff,
718	0x000064ec, 0x00000000, 0xffffffff,
719	0x00000c7c, 0x00000000, 0xffffffff,
720	0x00008dfc, 0x00000000, 0xffffffff
721};
722#define CAYMAN_SYSLS_ENABLE_LENGTH sizeof(cayman_sysls_enable) / (3 * sizeof(u32))
723
724extern int ni_mc_load_microcode(struct radeon_device *rdev);
725
726struct ni_power_info *ni_get_pi(struct radeon_device *rdev)
727{
728	struct ni_power_info *pi = rdev->pm.dpm.priv;
729
730	return pi;
731}
732
733struct ni_ps *ni_get_ps(struct radeon_ps *rps)
734{
735	struct ni_ps *ps = rps->ps_priv;
736
737	return ps;
738}
739
740static void ni_calculate_leakage_for_v_and_t_formula(const struct ni_leakage_coeffients *coeff,
741						     u16 v, s32 t,
742						     u32 ileakage,
743						     u32 *leakage)
744{
745	s64 kt, kv, leakage_w, i_leakage, vddc, temperature;
746
747	i_leakage = div64_s64(drm_int2fixp(ileakage), 1000);
748	vddc = div64_s64(drm_int2fixp(v), 1000);
749	temperature = div64_s64(drm_int2fixp(t), 1000);
750
751	kt = drm_fixp_mul(div64_s64(drm_int2fixp(coeff->at), 1000),
752			  drm_fixp_exp(drm_fixp_mul(div64_s64(drm_int2fixp(coeff->bt), 1000), temperature)));
753	kv = drm_fixp_mul(div64_s64(drm_int2fixp(coeff->av), 1000),
754			  drm_fixp_exp(drm_fixp_mul(div64_s64(drm_int2fixp(coeff->bv), 1000), vddc)));
755
756	leakage_w = drm_fixp_mul(drm_fixp_mul(drm_fixp_mul(i_leakage, kt), kv), vddc);
757
758	*leakage = drm_fixp2int(leakage_w * 1000);
759}
760
761static void ni_calculate_leakage_for_v_and_t(struct radeon_device *rdev,
762					     const struct ni_leakage_coeffients *coeff,
763					     u16 v,
764					     s32 t,
765					     u32 i_leakage,
766					     u32 *leakage)
767{
768	ni_calculate_leakage_for_v_and_t_formula(coeff, v, t, i_leakage, leakage);
769}
770
771bool ni_dpm_vblank_too_short(struct radeon_device *rdev)
772{
773	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
774	u32 vblank_time = r600_dpm_get_vblank_time(rdev);
775	/* we never hit the non-gddr5 limit so disable it */
776	u32 switch_limit = pi->mem_gddr5 ? 450 : 0;
777
778	if (vblank_time < switch_limit)
779		return true;
780	else
781		return false;
782
783}
784
785static void ni_apply_state_adjust_rules(struct radeon_device *rdev,
786					struct radeon_ps *rps)
787{
788	struct ni_ps *ps = ni_get_ps(rps);
789	struct radeon_clock_and_voltage_limits *max_limits;
790	bool disable_mclk_switching;
791	u32 mclk;
792	u16 vddci;
793	int i;
794
795	if ((rdev->pm.dpm.new_active_crtc_count > 1) ||
796	    ni_dpm_vblank_too_short(rdev))
797		disable_mclk_switching = true;
798	else
799		disable_mclk_switching = false;
800
801	if (rdev->pm.dpm.ac_power)
802		max_limits = &rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac;
803	else
804		max_limits = &rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc;
805
806	if (rdev->pm.dpm.ac_power == false) {
807		for (i = 0; i < ps->performance_level_count; i++) {
808			if (ps->performance_levels[i].mclk > max_limits->mclk)
809				ps->performance_levels[i].mclk = max_limits->mclk;
810			if (ps->performance_levels[i].sclk > max_limits->sclk)
811				ps->performance_levels[i].sclk = max_limits->sclk;
812			if (ps->performance_levels[i].vddc > max_limits->vddc)
813				ps->performance_levels[i].vddc = max_limits->vddc;
814			if (ps->performance_levels[i].vddci > max_limits->vddci)
815				ps->performance_levels[i].vddci = max_limits->vddci;
816		}
817	}
818
819	/* XXX validate the min clocks required for display */
820
821	/* adjust low state */
822	if (disable_mclk_switching) {
823		ps->performance_levels[0].mclk =
824			ps->performance_levels[ps->performance_level_count - 1].mclk;
825		ps->performance_levels[0].vddci =
826			ps->performance_levels[ps->performance_level_count - 1].vddci;
827	}
828
829	btc_skip_blacklist_clocks(rdev, max_limits->sclk, max_limits->mclk,
830				  &ps->performance_levels[0].sclk,
831				  &ps->performance_levels[0].mclk);
832
833	for (i = 1; i < ps->performance_level_count; i++) {
834		if (ps->performance_levels[i].sclk < ps->performance_levels[i - 1].sclk)
835			ps->performance_levels[i].sclk = ps->performance_levels[i - 1].sclk;
836		if (ps->performance_levels[i].vddc < ps->performance_levels[i - 1].vddc)
837			ps->performance_levels[i].vddc = ps->performance_levels[i - 1].vddc;
838	}
839
840	/* adjust remaining states */
841	if (disable_mclk_switching) {
842		mclk = ps->performance_levels[0].mclk;
843		vddci = ps->performance_levels[0].vddci;
844		for (i = 1; i < ps->performance_level_count; i++) {
845			if (mclk < ps->performance_levels[i].mclk)
846				mclk = ps->performance_levels[i].mclk;
847			if (vddci < ps->performance_levels[i].vddci)
848				vddci = ps->performance_levels[i].vddci;
849		}
850		for (i = 0; i < ps->performance_level_count; i++) {
851			ps->performance_levels[i].mclk = mclk;
852			ps->performance_levels[i].vddci = vddci;
853		}
854	} else {
855		for (i = 1; i < ps->performance_level_count; i++) {
856			if (ps->performance_levels[i].mclk < ps->performance_levels[i - 1].mclk)
857				ps->performance_levels[i].mclk = ps->performance_levels[i - 1].mclk;
858			if (ps->performance_levels[i].vddci < ps->performance_levels[i - 1].vddci)
859				ps->performance_levels[i].vddci = ps->performance_levels[i - 1].vddci;
860		}
861	}
862
863	for (i = 1; i < ps->performance_level_count; i++)
864		btc_skip_blacklist_clocks(rdev, max_limits->sclk, max_limits->mclk,
865					  &ps->performance_levels[i].sclk,
866					  &ps->performance_levels[i].mclk);
867
868	for (i = 0; i < ps->performance_level_count; i++)
869		btc_adjust_clock_combinations(rdev, max_limits,
870					      &ps->performance_levels[i]);
871
872	for (i = 0; i < ps->performance_level_count; i++) {
873		btc_apply_voltage_dependency_rules(&rdev->pm.dpm.dyn_state.vddc_dependency_on_sclk,
874						   ps->performance_levels[i].sclk,
875						   max_limits->vddc,  &ps->performance_levels[i].vddc);
876		btc_apply_voltage_dependency_rules(&rdev->pm.dpm.dyn_state.vddci_dependency_on_mclk,
877						   ps->performance_levels[i].mclk,
878						   max_limits->vddci, &ps->performance_levels[i].vddci);
879		btc_apply_voltage_dependency_rules(&rdev->pm.dpm.dyn_state.vddc_dependency_on_mclk,
880						   ps->performance_levels[i].mclk,
881						   max_limits->vddc,  &ps->performance_levels[i].vddc);
882		btc_apply_voltage_dependency_rules(&rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk,
883						   rdev->clock.current_dispclk,
884						   max_limits->vddc,  &ps->performance_levels[i].vddc);
885	}
886
887	for (i = 0; i < ps->performance_level_count; i++) {
888		btc_apply_voltage_delta_rules(rdev,
889					      max_limits->vddc, max_limits->vddci,
890					      &ps->performance_levels[i].vddc,
891					      &ps->performance_levels[i].vddci);
892	}
893
894	ps->dc_compatible = true;
895	for (i = 0; i < ps->performance_level_count; i++) {
896		if (ps->performance_levels[i].vddc > rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc.vddc)
897			ps->dc_compatible = false;
898
899		if (ps->performance_levels[i].vddc < rdev->pm.dpm.dyn_state.min_vddc_for_pcie_gen2)
900			ps->performance_levels[i].flags &= ~ATOM_PPLIB_R600_FLAGS_PCIEGEN2;
901	}
902}
903
904static void ni_cg_clockgating_default(struct radeon_device *rdev)
905{
906	u32 count;
907	const u32 *ps = NULL;
908
909	ps = (const u32 *)&cayman_cgcg_cgls_default;
910	count = CAYMAN_CGCG_CGLS_DEFAULT_LENGTH;
911
912	btc_program_mgcg_hw_sequence(rdev, ps, count);
913}
914
915static void ni_gfx_clockgating_enable(struct radeon_device *rdev,
916				      bool enable)
917{
918	u32 count;
919	const u32 *ps = NULL;
920
921	if (enable) {
922		ps = (const u32 *)&cayman_cgcg_cgls_enable;
923		count = CAYMAN_CGCG_CGLS_ENABLE_LENGTH;
924	} else {
925		ps = (const u32 *)&cayman_cgcg_cgls_disable;
926		count = CAYMAN_CGCG_CGLS_DISABLE_LENGTH;
927	}
928
929	btc_program_mgcg_hw_sequence(rdev, ps, count);
930}
931
932static void ni_mg_clockgating_default(struct radeon_device *rdev)
933{
934	u32 count;
935	const u32 *ps = NULL;
936
937	ps = (const u32 *)&cayman_mgcg_default;
938	count = CAYMAN_MGCG_DEFAULT_LENGTH;
939
940	btc_program_mgcg_hw_sequence(rdev, ps, count);
941}
942
943static void ni_mg_clockgating_enable(struct radeon_device *rdev,
944				     bool enable)
945{
946	u32 count;
947	const u32 *ps = NULL;
948
949	if (enable) {
950		ps = (const u32 *)&cayman_mgcg_enable;
951		count = CAYMAN_MGCG_ENABLE_LENGTH;
952	} else {
953		ps = (const u32 *)&cayman_mgcg_disable;
954		count = CAYMAN_MGCG_DISABLE_LENGTH;
955	}
956
957	btc_program_mgcg_hw_sequence(rdev, ps, count);
958}
959
960static void ni_ls_clockgating_default(struct radeon_device *rdev)
961{
962	u32 count;
963	const u32 *ps = NULL;
964
965	ps = (const u32 *)&cayman_sysls_default;
966	count = CAYMAN_SYSLS_DEFAULT_LENGTH;
967
968	btc_program_mgcg_hw_sequence(rdev, ps, count);
969}
970
971static void ni_ls_clockgating_enable(struct radeon_device *rdev,
972				     bool enable)
973{
974	u32 count;
975	const u32 *ps = NULL;
976
977	if (enable) {
978		ps = (const u32 *)&cayman_sysls_enable;
979		count = CAYMAN_SYSLS_ENABLE_LENGTH;
980	} else {
981		ps = (const u32 *)&cayman_sysls_disable;
982		count = CAYMAN_SYSLS_DISABLE_LENGTH;
983	}
984
985	btc_program_mgcg_hw_sequence(rdev, ps, count);
986
987}
988
989static int ni_patch_single_dependency_table_based_on_leakage(struct radeon_device *rdev,
990							     struct radeon_clock_voltage_dependency_table *table)
991{
992	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
993	u32 i;
994
995	if (table) {
996		for (i = 0; i < table->count; i++) {
997			if (0xff01 == table->entries[i].v) {
998				if (pi->max_vddc == 0)
999					return -EINVAL;
1000				table->entries[i].v = pi->max_vddc;
1001			}
1002		}
1003	}
1004	return 0;
1005}
1006
1007static int ni_patch_dependency_tables_based_on_leakage(struct radeon_device *rdev)
1008{
1009	int ret = 0;
1010
1011	ret = ni_patch_single_dependency_table_based_on_leakage(rdev,
1012								&rdev->pm.dpm.dyn_state.vddc_dependency_on_sclk);
1013
1014	ret = ni_patch_single_dependency_table_based_on_leakage(rdev,
1015								&rdev->pm.dpm.dyn_state.vddc_dependency_on_mclk);
1016	return ret;
1017}
1018
1019static void ni_stop_dpm(struct radeon_device *rdev)
1020{
1021	WREG32_P(GENERAL_PWRMGT, 0, ~GLOBAL_PWRMGT_EN);
1022}
1023
1024#if 0
1025static int ni_notify_hw_of_power_source(struct radeon_device *rdev,
1026					bool ac_power)
1027{
1028	if (ac_power)
1029		return (rv770_send_msg_to_smc(rdev, PPSMC_MSG_RunningOnAC) == PPSMC_Result_OK) ?
1030			0 : -EINVAL;
1031
1032	return 0;
1033}
1034#endif
1035
1036static PPSMC_Result ni_send_msg_to_smc_with_parameter(struct radeon_device *rdev,
1037						      PPSMC_Msg msg, u32 parameter)
1038{
1039	WREG32(SMC_SCRATCH0, parameter);
1040	return rv770_send_msg_to_smc(rdev, msg);
1041}
1042
1043static int ni_restrict_performance_levels_before_switch(struct radeon_device *rdev)
1044{
1045	if (rv770_send_msg_to_smc(rdev, PPSMC_MSG_NoForcedLevel) != PPSMC_Result_OK)
1046		return -EINVAL;
1047
1048	return (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetEnabledLevels, 1) == PPSMC_Result_OK) ?
1049		0 : -EINVAL;
1050}
1051
1052int ni_dpm_force_performance_level(struct radeon_device *rdev,
1053				   enum radeon_dpm_forced_level level)
1054{
1055	if (level == RADEON_DPM_FORCED_LEVEL_HIGH) {
1056		if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetEnabledLevels, 0) != PPSMC_Result_OK)
1057			return -EINVAL;
1058
1059		if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetForcedLevels, 1) != PPSMC_Result_OK)
1060			return -EINVAL;
1061	} else if (level == RADEON_DPM_FORCED_LEVEL_LOW) {
1062		if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetForcedLevels, 0) != PPSMC_Result_OK)
1063			return -EINVAL;
1064
1065		if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetEnabledLevels, 1) != PPSMC_Result_OK)
1066			return -EINVAL;
1067	} else if (level == RADEON_DPM_FORCED_LEVEL_AUTO) {
1068		if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetForcedLevels, 0) != PPSMC_Result_OK)
1069			return -EINVAL;
1070
1071		if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetEnabledLevels, 0) != PPSMC_Result_OK)
1072			return -EINVAL;
1073	}
1074
1075	rdev->pm.dpm.forced_level = level;
1076
1077	return 0;
1078}
1079
1080static void ni_stop_smc(struct radeon_device *rdev)
1081{
1082	u32 tmp;
1083	int i;
1084
1085	for (i = 0; i < rdev->usec_timeout; i++) {
1086		tmp = RREG32(LB_SYNC_RESET_SEL) & LB_SYNC_RESET_SEL_MASK;
1087		if (tmp != 1)
1088			break;
1089		udelay(1);
1090	}
1091
1092	udelay(100);
1093
1094	r7xx_stop_smc(rdev);
1095}
1096
1097static int ni_process_firmware_header(struct radeon_device *rdev)
1098{
1099	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1100	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
1101	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1102	u32 tmp;
1103	int ret;
1104
1105	ret = rv770_read_smc_sram_dword(rdev,
1106					NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1107					NISLANDS_SMC_FIRMWARE_HEADER_stateTable,
1108					&tmp, pi->sram_end);
1109
1110	if (ret)
1111		return ret;
1112
1113	pi->state_table_start = (u16)tmp;
1114
1115	ret = rv770_read_smc_sram_dword(rdev,
1116					NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1117					NISLANDS_SMC_FIRMWARE_HEADER_softRegisters,
1118					&tmp, pi->sram_end);
1119
1120	if (ret)
1121		return ret;
1122
1123	pi->soft_regs_start = (u16)tmp;
1124
1125	ret = rv770_read_smc_sram_dword(rdev,
1126					NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1127					NISLANDS_SMC_FIRMWARE_HEADER_mcRegisterTable,
1128					&tmp, pi->sram_end);
1129
1130	if (ret)
1131		return ret;
1132
1133	eg_pi->mc_reg_table_start = (u16)tmp;
1134
1135	ret = rv770_read_smc_sram_dword(rdev,
1136					NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1137					NISLANDS_SMC_FIRMWARE_HEADER_fanTable,
1138					&tmp, pi->sram_end);
1139
1140	if (ret)
1141		return ret;
1142
1143	ni_pi->fan_table_start = (u16)tmp;
1144
1145	ret = rv770_read_smc_sram_dword(rdev,
1146					NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1147					NISLANDS_SMC_FIRMWARE_HEADER_mcArbDramAutoRefreshTable,
1148					&tmp, pi->sram_end);
1149
1150	if (ret)
1151		return ret;
1152
1153	ni_pi->arb_table_start = (u16)tmp;
1154
1155	ret = rv770_read_smc_sram_dword(rdev,
1156					NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1157					NISLANDS_SMC_FIRMWARE_HEADER_cacTable,
1158					&tmp, pi->sram_end);
1159
1160	if (ret)
1161		return ret;
1162
1163	ni_pi->cac_table_start = (u16)tmp;
1164
1165	ret = rv770_read_smc_sram_dword(rdev,
1166					NISLANDS_SMC_FIRMWARE_HEADER_LOCATION +
1167					NISLANDS_SMC_FIRMWARE_HEADER_spllTable,
1168					&tmp, pi->sram_end);
1169
1170	if (ret)
1171		return ret;
1172
1173	ni_pi->spll_table_start = (u16)tmp;
1174
1175
1176	return ret;
1177}
1178
1179static void ni_read_clock_registers(struct radeon_device *rdev)
1180{
1181	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1182
1183	ni_pi->clock_registers.cg_spll_func_cntl = RREG32(CG_SPLL_FUNC_CNTL);
1184	ni_pi->clock_registers.cg_spll_func_cntl_2 = RREG32(CG_SPLL_FUNC_CNTL_2);
1185	ni_pi->clock_registers.cg_spll_func_cntl_3 = RREG32(CG_SPLL_FUNC_CNTL_3);
1186	ni_pi->clock_registers.cg_spll_func_cntl_4 = RREG32(CG_SPLL_FUNC_CNTL_4);
1187	ni_pi->clock_registers.cg_spll_spread_spectrum = RREG32(CG_SPLL_SPREAD_SPECTRUM);
1188	ni_pi->clock_registers.cg_spll_spread_spectrum_2 = RREG32(CG_SPLL_SPREAD_SPECTRUM_2);
1189	ni_pi->clock_registers.mpll_ad_func_cntl = RREG32(MPLL_AD_FUNC_CNTL);
1190	ni_pi->clock_registers.mpll_ad_func_cntl_2 = RREG32(MPLL_AD_FUNC_CNTL_2);
1191	ni_pi->clock_registers.mpll_dq_func_cntl = RREG32(MPLL_DQ_FUNC_CNTL);
1192	ni_pi->clock_registers.mpll_dq_func_cntl_2 = RREG32(MPLL_DQ_FUNC_CNTL_2);
1193	ni_pi->clock_registers.mclk_pwrmgt_cntl = RREG32(MCLK_PWRMGT_CNTL);
1194	ni_pi->clock_registers.dll_cntl = RREG32(DLL_CNTL);
1195	ni_pi->clock_registers.mpll_ss1 = RREG32(MPLL_SS1);
1196	ni_pi->clock_registers.mpll_ss2 = RREG32(MPLL_SS2);
1197}
1198
1199#if 0
1200static int ni_enter_ulp_state(struct radeon_device *rdev)
1201{
1202	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1203
1204	if (pi->gfx_clock_gating) {
1205		WREG32_P(SCLK_PWRMGT_CNTL, 0, ~DYN_GFX_CLK_OFF_EN);
1206		WREG32_P(SCLK_PWRMGT_CNTL, GFX_CLK_FORCE_ON, ~GFX_CLK_FORCE_ON);
1207		WREG32_P(SCLK_PWRMGT_CNTL, 0, ~GFX_CLK_FORCE_ON);
1208		RREG32(GB_ADDR_CONFIG);
1209	}
1210
1211	WREG32_P(SMC_MSG, HOST_SMC_MSG(PPSMC_MSG_SwitchToMinimumPower),
1212		 ~HOST_SMC_MSG_MASK);
1213
1214	udelay(25000);
1215
1216	return 0;
1217}
1218#endif
1219
1220static void ni_program_response_times(struct radeon_device *rdev)
1221{
1222	u32 voltage_response_time, backbias_response_time, acpi_delay_time, vbi_time_out;
1223	u32 vddc_dly, bb_dly, acpi_dly, vbi_dly, mclk_switch_limit;
1224	u32 reference_clock;
1225
1226	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_mvdd_chg_time, 1);
1227
1228	voltage_response_time = (u32)rdev->pm.dpm.voltage_response_time;
1229	backbias_response_time = (u32)rdev->pm.dpm.backbias_response_time;
1230
1231	if (voltage_response_time == 0)
1232		voltage_response_time = 1000;
1233
1234	if (backbias_response_time == 0)
1235		backbias_response_time = 1000;
1236
1237	acpi_delay_time = 15000;
1238	vbi_time_out = 100000;
1239
1240	reference_clock = radeon_get_xclk(rdev);
1241
1242	vddc_dly = (voltage_response_time  * reference_clock) / 1600;
1243	bb_dly   = (backbias_response_time * reference_clock) / 1600;
1244	acpi_dly = (acpi_delay_time * reference_clock) / 1600;
1245	vbi_dly  = (vbi_time_out * reference_clock) / 1600;
1246
1247	mclk_switch_limit = (460 * reference_clock) / 100;
1248
1249	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_delay_vreg,  vddc_dly);
1250	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_delay_bbias, bb_dly);
1251	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_delay_acpi,  acpi_dly);
1252	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_mclk_chg_timeout, vbi_dly);
1253	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_mc_block_delay, 0xAA);
1254	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_mclk_switch_lim, mclk_switch_limit);
1255}
1256
1257static void ni_populate_smc_voltage_table(struct radeon_device *rdev,
1258					  struct atom_voltage_table *voltage_table,
1259					  NISLANDS_SMC_STATETABLE *table)
1260{
1261	unsigned int i;
1262
1263	for (i = 0; i < voltage_table->count; i++) {
1264		table->highSMIO[i] = 0;
1265		table->lowSMIO[i] |= cpu_to_be32(voltage_table->entries[i].smio_low);
1266	}
1267}
1268
1269static void ni_populate_smc_voltage_tables(struct radeon_device *rdev,
1270					   NISLANDS_SMC_STATETABLE *table)
1271{
1272	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1273	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
1274	unsigned char i;
1275
1276	if (eg_pi->vddc_voltage_table.count) {
1277		ni_populate_smc_voltage_table(rdev, &eg_pi->vddc_voltage_table, table);
1278		table->voltageMaskTable.highMask[NISLANDS_SMC_VOLTAGEMASK_VDDC] = 0;
1279		table->voltageMaskTable.lowMask[NISLANDS_SMC_VOLTAGEMASK_VDDC] =
1280			cpu_to_be32(eg_pi->vddc_voltage_table.mask_low);
1281
1282		for (i = 0; i < eg_pi->vddc_voltage_table.count; i++) {
1283			if (pi->max_vddc_in_table <= eg_pi->vddc_voltage_table.entries[i].value) {
1284				table->maxVDDCIndexInPPTable = i;
1285				break;
1286			}
1287		}
1288	}
1289
1290	if (eg_pi->vddci_voltage_table.count) {
1291		ni_populate_smc_voltage_table(rdev, &eg_pi->vddci_voltage_table, table);
1292
1293		table->voltageMaskTable.highMask[NISLANDS_SMC_VOLTAGEMASK_VDDCI] = 0;
1294		table->voltageMaskTable.lowMask[NISLANDS_SMC_VOLTAGEMASK_VDDCI] =
1295			cpu_to_be32(eg_pi->vddci_voltage_table.mask_low);
1296	}
1297}
1298
1299static int ni_populate_voltage_value(struct radeon_device *rdev,
1300				     struct atom_voltage_table *table,
1301				     u16 value,
1302				     NISLANDS_SMC_VOLTAGE_VALUE *voltage)
1303{
1304	unsigned int i;
1305
1306	for (i = 0; i < table->count; i++) {
1307		if (value <= table->entries[i].value) {
1308			voltage->index = (u8)i;
1309			voltage->value = cpu_to_be16(table->entries[i].value);
1310			break;
1311		}
1312	}
1313
1314	if (i >= table->count)
1315		return -EINVAL;
1316
1317	return 0;
1318}
1319
1320static void ni_populate_mvdd_value(struct radeon_device *rdev,
1321				   u32 mclk,
1322				   NISLANDS_SMC_VOLTAGE_VALUE *voltage)
1323{
1324	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1325	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
1326
1327	if (!pi->mvdd_control) {
1328		voltage->index = eg_pi->mvdd_high_index;
1329		voltage->value = cpu_to_be16(MVDD_HIGH_VALUE);
1330		return;
1331	}
1332
1333	if (mclk <= pi->mvdd_split_frequency) {
1334		voltage->index = eg_pi->mvdd_low_index;
1335		voltage->value = cpu_to_be16(MVDD_LOW_VALUE);
1336	} else {
1337		voltage->index = eg_pi->mvdd_high_index;
1338		voltage->value = cpu_to_be16(MVDD_HIGH_VALUE);
1339	}
1340}
1341
1342static int ni_get_std_voltage_value(struct radeon_device *rdev,
1343				    NISLANDS_SMC_VOLTAGE_VALUE *voltage,
1344				    u16 *std_voltage)
1345{
1346	if (rdev->pm.dpm.dyn_state.cac_leakage_table.entries &&
1347	    ((u32)voltage->index < rdev->pm.dpm.dyn_state.cac_leakage_table.count))
1348		*std_voltage = rdev->pm.dpm.dyn_state.cac_leakage_table.entries[voltage->index].vddc;
1349	else
1350		*std_voltage = be16_to_cpu(voltage->value);
1351
1352	return 0;
1353}
1354
1355static void ni_populate_std_voltage_value(struct radeon_device *rdev,
1356					  u16 value, u8 index,
1357					  NISLANDS_SMC_VOLTAGE_VALUE *voltage)
1358{
1359	voltage->index = index;
1360	voltage->value = cpu_to_be16(value);
1361}
1362
1363static u32 ni_get_smc_power_scaling_factor(struct radeon_device *rdev)
1364{
1365	u32 xclk_period;
1366	u32 xclk = radeon_get_xclk(rdev);
1367	u32 tmp = RREG32(CG_CAC_CTRL) & TID_CNT_MASK;
1368
1369	xclk_period = (1000000000UL / xclk);
1370	xclk_period /= 10000UL;
1371
1372	return tmp * xclk_period;
1373}
1374
1375static u32 ni_scale_power_for_smc(u32 power_in_watts, u32 scaling_factor)
1376{
1377	return (power_in_watts * scaling_factor) << 2;
1378}
1379
1380static u32 ni_calculate_power_boost_limit(struct radeon_device *rdev,
1381					  struct radeon_ps *radeon_state,
1382					  u32 near_tdp_limit)
1383{
1384	struct ni_ps *state = ni_get_ps(radeon_state);
1385	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
1386	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1387	u32 power_boost_limit = 0;
1388	int ret;
1389
1390	if (ni_pi->enable_power_containment &&
1391	    ni_pi->use_power_boost_limit) {
1392		NISLANDS_SMC_VOLTAGE_VALUE vddc;
1393		u16 std_vddc_med;
1394		u16 std_vddc_high;
1395		u64 tmp, n, d;
1396
1397		if (state->performance_level_count < 3)
1398			return 0;
1399
1400		ret = ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table,
1401						state->performance_levels[state->performance_level_count - 2].vddc,
1402						&vddc);
1403		if (ret)
1404			return 0;
1405
1406		ret = ni_get_std_voltage_value(rdev, &vddc, &std_vddc_med);
1407		if (ret)
1408			return 0;
1409
1410		ret = ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table,
1411						state->performance_levels[state->performance_level_count - 1].vddc,
1412						&vddc);
1413		if (ret)
1414			return 0;
1415
1416		ret = ni_get_std_voltage_value(rdev, &vddc, &std_vddc_high);
1417		if (ret)
1418			return 0;
1419
1420		n = ((u64)near_tdp_limit * ((u64)std_vddc_med * (u64)std_vddc_med) * 90);
1421		d = ((u64)std_vddc_high * (u64)std_vddc_high * 100);
1422		tmp = div64_u64(n, d);
1423
1424		if (tmp >> 32)
1425			return 0;
1426		power_boost_limit = (u32)tmp;
1427	}
1428
1429	return power_boost_limit;
1430}
1431
1432static int ni_calculate_adjusted_tdp_limits(struct radeon_device *rdev,
1433					    bool adjust_polarity,
1434					    u32 tdp_adjustment,
1435					    u32 *tdp_limit,
1436					    u32 *near_tdp_limit)
1437{
1438	if (tdp_adjustment > (u32)rdev->pm.dpm.tdp_od_limit)
1439		return -EINVAL;
1440
1441	if (adjust_polarity) {
1442		*tdp_limit = ((100 + tdp_adjustment) * rdev->pm.dpm.tdp_limit) / 100;
1443		*near_tdp_limit = rdev->pm.dpm.near_tdp_limit + (*tdp_limit - rdev->pm.dpm.tdp_limit);
1444	} else {
1445		*tdp_limit = ((100 - tdp_adjustment) * rdev->pm.dpm.tdp_limit) / 100;
1446		*near_tdp_limit = rdev->pm.dpm.near_tdp_limit - (rdev->pm.dpm.tdp_limit - *tdp_limit);
1447	}
1448
1449	return 0;
1450}
1451
1452static int ni_populate_smc_tdp_limits(struct radeon_device *rdev,
1453				      struct radeon_ps *radeon_state)
1454{
1455	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1456	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1457
1458	if (ni_pi->enable_power_containment) {
1459		NISLANDS_SMC_STATETABLE *smc_table = &ni_pi->smc_statetable;
1460		u32 scaling_factor = ni_get_smc_power_scaling_factor(rdev);
1461		u32 tdp_limit;
1462		u32 near_tdp_limit;
1463		u32 power_boost_limit;
1464		int ret;
1465
1466		if (scaling_factor == 0)
1467			return -EINVAL;
1468
1469		memset(smc_table, 0, sizeof(NISLANDS_SMC_STATETABLE));
1470
1471		ret = ni_calculate_adjusted_tdp_limits(rdev,
1472						       false, /* ??? */
1473						       rdev->pm.dpm.tdp_adjustment,
1474						       &tdp_limit,
1475						       &near_tdp_limit);
1476		if (ret)
1477			return ret;
1478
1479		power_boost_limit = ni_calculate_power_boost_limit(rdev, radeon_state,
1480								   near_tdp_limit);
1481
1482		smc_table->dpm2Params.TDPLimit =
1483			cpu_to_be32(ni_scale_power_for_smc(tdp_limit, scaling_factor));
1484		smc_table->dpm2Params.NearTDPLimit =
1485			cpu_to_be32(ni_scale_power_for_smc(near_tdp_limit, scaling_factor));
1486		smc_table->dpm2Params.SafePowerLimit =
1487			cpu_to_be32(ni_scale_power_for_smc((near_tdp_limit * NISLANDS_DPM2_TDP_SAFE_LIMIT_PERCENT) / 100,
1488							   scaling_factor));
1489		smc_table->dpm2Params.PowerBoostLimit =
1490			cpu_to_be32(ni_scale_power_for_smc(power_boost_limit, scaling_factor));
1491
1492		ret = rv770_copy_bytes_to_smc(rdev,
1493					      (u16)(pi->state_table_start + offsetof(NISLANDS_SMC_STATETABLE, dpm2Params) +
1494						    offsetof(PP_NIslands_DPM2Parameters, TDPLimit)),
1495					      (u8 *)(&smc_table->dpm2Params.TDPLimit),
1496					      sizeof(u32) * 4, pi->sram_end);
1497		if (ret)
1498			return ret;
1499	}
1500
1501	return 0;
1502}
1503
1504int ni_copy_and_switch_arb_sets(struct radeon_device *rdev,
1505				u32 arb_freq_src, u32 arb_freq_dest)
1506{
1507	u32 mc_arb_dram_timing;
1508	u32 mc_arb_dram_timing2;
1509	u32 burst_time;
1510	u32 mc_cg_config;
1511
1512	switch (arb_freq_src) {
1513	case MC_CG_ARB_FREQ_F0:
1514		mc_arb_dram_timing  = RREG32(MC_ARB_DRAM_TIMING);
1515		mc_arb_dram_timing2 = RREG32(MC_ARB_DRAM_TIMING2);
1516		burst_time = (RREG32(MC_ARB_BURST_TIME) & STATE0_MASK) >> STATE0_SHIFT;
1517		break;
1518	case MC_CG_ARB_FREQ_F1:
1519		mc_arb_dram_timing  = RREG32(MC_ARB_DRAM_TIMING_1);
1520		mc_arb_dram_timing2 = RREG32(MC_ARB_DRAM_TIMING2_1);
1521		burst_time = (RREG32(MC_ARB_BURST_TIME) & STATE1_MASK) >> STATE1_SHIFT;
1522		break;
1523	case MC_CG_ARB_FREQ_F2:
1524		mc_arb_dram_timing  = RREG32(MC_ARB_DRAM_TIMING_2);
1525		mc_arb_dram_timing2 = RREG32(MC_ARB_DRAM_TIMING2_2);
1526		burst_time = (RREG32(MC_ARB_BURST_TIME) & STATE2_MASK) >> STATE2_SHIFT;
1527		break;
1528	case MC_CG_ARB_FREQ_F3:
1529		mc_arb_dram_timing  = RREG32(MC_ARB_DRAM_TIMING_3);
1530		mc_arb_dram_timing2 = RREG32(MC_ARB_DRAM_TIMING2_3);
1531		burst_time = (RREG32(MC_ARB_BURST_TIME) & STATE3_MASK) >> STATE3_SHIFT;
1532		break;
1533	default:
1534		return -EINVAL;
1535	}
1536
1537	switch (arb_freq_dest) {
1538	case MC_CG_ARB_FREQ_F0:
1539		WREG32(MC_ARB_DRAM_TIMING, mc_arb_dram_timing);
1540		WREG32(MC_ARB_DRAM_TIMING2, mc_arb_dram_timing2);
1541		WREG32_P(MC_ARB_BURST_TIME, STATE0(burst_time), ~STATE0_MASK);
1542		break;
1543	case MC_CG_ARB_FREQ_F1:
1544		WREG32(MC_ARB_DRAM_TIMING_1, mc_arb_dram_timing);
1545		WREG32(MC_ARB_DRAM_TIMING2_1, mc_arb_dram_timing2);
1546		WREG32_P(MC_ARB_BURST_TIME, STATE1(burst_time), ~STATE1_MASK);
1547		break;
1548	case MC_CG_ARB_FREQ_F2:
1549		WREG32(MC_ARB_DRAM_TIMING_2, mc_arb_dram_timing);
1550		WREG32(MC_ARB_DRAM_TIMING2_2, mc_arb_dram_timing2);
1551		WREG32_P(MC_ARB_BURST_TIME, STATE2(burst_time), ~STATE2_MASK);
1552		break;
1553	case MC_CG_ARB_FREQ_F3:
1554		WREG32(MC_ARB_DRAM_TIMING_3, mc_arb_dram_timing);
1555		WREG32(MC_ARB_DRAM_TIMING2_3, mc_arb_dram_timing2);
1556		WREG32_P(MC_ARB_BURST_TIME, STATE3(burst_time), ~STATE3_MASK);
1557		break;
1558	default:
1559		return -EINVAL;
1560	}
1561
1562	mc_cg_config = RREG32(MC_CG_CONFIG) | 0x0000000F;
1563	WREG32(MC_CG_CONFIG, mc_cg_config);
1564	WREG32_P(MC_ARB_CG, CG_ARB_REQ(arb_freq_dest), ~CG_ARB_REQ_MASK);
1565
1566	return 0;
1567}
1568
1569static int ni_init_arb_table_index(struct radeon_device *rdev)
1570{
1571	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1572	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1573	u32 tmp;
1574	int ret;
1575
1576	ret = rv770_read_smc_sram_dword(rdev, ni_pi->arb_table_start,
1577					&tmp, pi->sram_end);
1578	if (ret)
1579		return ret;
1580
1581	tmp &= 0x00FFFFFF;
1582	tmp |= ((u32)MC_CG_ARB_FREQ_F1) << 24;
1583
1584	return rv770_write_smc_sram_dword(rdev, ni_pi->arb_table_start,
1585					  tmp, pi->sram_end);
1586}
1587
1588static int ni_initial_switch_from_arb_f0_to_f1(struct radeon_device *rdev)
1589{
1590	return ni_copy_and_switch_arb_sets(rdev, MC_CG_ARB_FREQ_F0, MC_CG_ARB_FREQ_F1);
1591}
1592
1593static int ni_force_switch_to_arb_f0(struct radeon_device *rdev)
1594{
1595	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1596	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1597	u32 tmp;
1598	int ret;
1599
1600	ret = rv770_read_smc_sram_dword(rdev, ni_pi->arb_table_start,
1601					&tmp, pi->sram_end);
1602	if (ret)
1603		return ret;
1604
1605	tmp = (tmp >> 24) & 0xff;
1606
1607	if (tmp == MC_CG_ARB_FREQ_F0)
1608		return 0;
1609
1610	return ni_copy_and_switch_arb_sets(rdev, tmp, MC_CG_ARB_FREQ_F0);
1611}
1612
1613static int ni_populate_memory_timing_parameters(struct radeon_device *rdev,
1614						struct rv7xx_pl *pl,
1615						SMC_NIslands_MCArbDramTimingRegisterSet *arb_regs)
1616{
1617	u32 dram_timing;
1618	u32 dram_timing2;
1619
1620	arb_regs->mc_arb_rfsh_rate =
1621		(u8)rv770_calculate_memory_refresh_rate(rdev, pl->sclk);
1622
1623
1624	radeon_atom_set_engine_dram_timings(rdev, pl->sclk, pl->mclk);
1625
1626	dram_timing = RREG32(MC_ARB_DRAM_TIMING);
1627	dram_timing2 = RREG32(MC_ARB_DRAM_TIMING2);
1628
1629	arb_regs->mc_arb_dram_timing  = cpu_to_be32(dram_timing);
1630	arb_regs->mc_arb_dram_timing2 = cpu_to_be32(dram_timing2);
1631
1632	return 0;
1633}
1634
1635static int ni_do_program_memory_timing_parameters(struct radeon_device *rdev,
1636						  struct radeon_ps *radeon_state,
1637						  unsigned int first_arb_set)
1638{
1639	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1640	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1641	struct ni_ps *state = ni_get_ps(radeon_state);
1642	SMC_NIslands_MCArbDramTimingRegisterSet arb_regs = { 0 };
1643	int i, ret = 0;
1644
1645	for (i = 0; i < state->performance_level_count; i++) {
1646		ret = ni_populate_memory_timing_parameters(rdev, &state->performance_levels[i], &arb_regs);
1647		if (ret)
1648			break;
1649
1650		ret = rv770_copy_bytes_to_smc(rdev,
1651					      (u16)(ni_pi->arb_table_start +
1652						    offsetof(SMC_NIslands_MCArbDramTimingRegisters, data) +
1653						    sizeof(SMC_NIslands_MCArbDramTimingRegisterSet) * (first_arb_set + i)),
1654					      (u8 *)&arb_regs,
1655					      (u16)sizeof(SMC_NIslands_MCArbDramTimingRegisterSet),
1656					      pi->sram_end);
1657		if (ret)
1658			break;
1659	}
1660	return ret;
1661}
1662
1663static int ni_program_memory_timing_parameters(struct radeon_device *rdev,
1664					       struct radeon_ps *radeon_new_state)
1665{
1666	return ni_do_program_memory_timing_parameters(rdev, radeon_new_state,
1667						      NISLANDS_DRIVER_STATE_ARB_INDEX);
1668}
1669
1670static void ni_populate_initial_mvdd_value(struct radeon_device *rdev,
1671					   struct NISLANDS_SMC_VOLTAGE_VALUE *voltage)
1672{
1673	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
1674
1675	voltage->index = eg_pi->mvdd_high_index;
1676	voltage->value = cpu_to_be16(MVDD_HIGH_VALUE);
1677}
1678
1679static int ni_populate_smc_initial_state(struct radeon_device *rdev,
1680					 struct radeon_ps *radeon_initial_state,
1681					 NISLANDS_SMC_STATETABLE *table)
1682{
1683	struct ni_ps *initial_state = ni_get_ps(radeon_initial_state);
1684	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1685	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
1686	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1687	u32 reg;
1688	int ret;
1689
1690	table->initialState.level.mclk.vMPLL_AD_FUNC_CNTL =
1691		cpu_to_be32(ni_pi->clock_registers.mpll_ad_func_cntl);
1692	table->initialState.level.mclk.vMPLL_AD_FUNC_CNTL_2 =
1693		cpu_to_be32(ni_pi->clock_registers.mpll_ad_func_cntl_2);
1694	table->initialState.level.mclk.vMPLL_DQ_FUNC_CNTL =
1695		cpu_to_be32(ni_pi->clock_registers.mpll_dq_func_cntl);
1696	table->initialState.level.mclk.vMPLL_DQ_FUNC_CNTL_2 =
1697		cpu_to_be32(ni_pi->clock_registers.mpll_dq_func_cntl_2);
1698	table->initialState.level.mclk.vMCLK_PWRMGT_CNTL =
1699		cpu_to_be32(ni_pi->clock_registers.mclk_pwrmgt_cntl);
1700	table->initialState.level.mclk.vDLL_CNTL =
1701		cpu_to_be32(ni_pi->clock_registers.dll_cntl);
1702	table->initialState.level.mclk.vMPLL_SS =
1703		cpu_to_be32(ni_pi->clock_registers.mpll_ss1);
1704	table->initialState.level.mclk.vMPLL_SS2 =
1705		cpu_to_be32(ni_pi->clock_registers.mpll_ss2);
1706	table->initialState.level.mclk.mclk_value =
1707		cpu_to_be32(initial_state->performance_levels[0].mclk);
1708
1709	table->initialState.level.sclk.vCG_SPLL_FUNC_CNTL =
1710		cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl);
1711	table->initialState.level.sclk.vCG_SPLL_FUNC_CNTL_2 =
1712		cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl_2);
1713	table->initialState.level.sclk.vCG_SPLL_FUNC_CNTL_3 =
1714		cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl_3);
1715	table->initialState.level.sclk.vCG_SPLL_FUNC_CNTL_4 =
1716		cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl_4);
1717	table->initialState.level.sclk.vCG_SPLL_SPREAD_SPECTRUM =
1718		cpu_to_be32(ni_pi->clock_registers.cg_spll_spread_spectrum);
1719	table->initialState.level.sclk.vCG_SPLL_SPREAD_SPECTRUM_2 =
1720		cpu_to_be32(ni_pi->clock_registers.cg_spll_spread_spectrum_2);
1721	table->initialState.level.sclk.sclk_value =
1722		cpu_to_be32(initial_state->performance_levels[0].sclk);
1723	table->initialState.level.arbRefreshState =
1724		NISLANDS_INITIAL_STATE_ARB_INDEX;
1725
1726	table->initialState.level.ACIndex = 0;
1727
1728	ret = ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table,
1729					initial_state->performance_levels[0].vddc,
1730					&table->initialState.level.vddc);
1731	if (!ret) {
1732		u16 std_vddc;
1733
1734		ret = ni_get_std_voltage_value(rdev,
1735					       &table->initialState.level.vddc,
1736					       &std_vddc);
1737		if (!ret)
1738			ni_populate_std_voltage_value(rdev, std_vddc,
1739						      table->initialState.level.vddc.index,
1740						      &table->initialState.level.std_vddc);
1741	}
1742
1743	if (eg_pi->vddci_control)
1744		ni_populate_voltage_value(rdev,
1745					  &eg_pi->vddci_voltage_table,
1746					  initial_state->performance_levels[0].vddci,
1747					  &table->initialState.level.vddci);
1748
1749	ni_populate_initial_mvdd_value(rdev, &table->initialState.level.mvdd);
1750
1751	reg = CG_R(0xffff) | CG_L(0);
1752	table->initialState.level.aT = cpu_to_be32(reg);
1753
1754	table->initialState.level.bSP = cpu_to_be32(pi->dsp);
1755
1756	if (pi->boot_in_gen2)
1757		table->initialState.level.gen2PCIE = 1;
1758	else
1759		table->initialState.level.gen2PCIE = 0;
1760
1761	if (pi->mem_gddr5) {
1762		table->initialState.level.strobeMode =
1763			cypress_get_strobe_mode_settings(rdev,
1764							 initial_state->performance_levels[0].mclk);
1765
1766		if (initial_state->performance_levels[0].mclk > pi->mclk_edc_enable_threshold)
1767			table->initialState.level.mcFlags = NISLANDS_SMC_MC_EDC_RD_FLAG | NISLANDS_SMC_MC_EDC_WR_FLAG;
1768		else
1769			table->initialState.level.mcFlags =  0;
1770	}
1771
1772	table->initialState.levelCount = 1;
1773
1774	table->initialState.flags |= PPSMC_SWSTATE_FLAG_DC;
1775
1776	table->initialState.level.dpm2.MaxPS = 0;
1777	table->initialState.level.dpm2.NearTDPDec = 0;
1778	table->initialState.level.dpm2.AboveSafeInc = 0;
1779	table->initialState.level.dpm2.BelowSafeInc = 0;
1780
1781	reg = MIN_POWER_MASK | MAX_POWER_MASK;
1782	table->initialState.level.SQPowerThrottle = cpu_to_be32(reg);
1783
1784	reg = MAX_POWER_DELTA_MASK | STI_SIZE_MASK | LTI_RATIO_MASK;
1785	table->initialState.level.SQPowerThrottle_2 = cpu_to_be32(reg);
1786
1787	return 0;
1788}
1789
1790static int ni_populate_smc_acpi_state(struct radeon_device *rdev,
1791				      NISLANDS_SMC_STATETABLE *table)
1792{
1793	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1794	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
1795	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1796	u32 mpll_ad_func_cntl   = ni_pi->clock_registers.mpll_ad_func_cntl;
1797	u32 mpll_ad_func_cntl_2 = ni_pi->clock_registers.mpll_ad_func_cntl_2;
1798	u32 mpll_dq_func_cntl   = ni_pi->clock_registers.mpll_dq_func_cntl;
1799	u32 mpll_dq_func_cntl_2 = ni_pi->clock_registers.mpll_dq_func_cntl_2;
1800	u32 spll_func_cntl      = ni_pi->clock_registers.cg_spll_func_cntl;
1801	u32 spll_func_cntl_2    = ni_pi->clock_registers.cg_spll_func_cntl_2;
1802	u32 spll_func_cntl_3    = ni_pi->clock_registers.cg_spll_func_cntl_3;
1803	u32 spll_func_cntl_4    = ni_pi->clock_registers.cg_spll_func_cntl_4;
1804	u32 mclk_pwrmgt_cntl    = ni_pi->clock_registers.mclk_pwrmgt_cntl;
1805	u32 dll_cntl            = ni_pi->clock_registers.dll_cntl;
1806	u32 reg;
1807	int ret;
1808
1809	table->ACPIState = table->initialState;
1810
1811	table->ACPIState.flags &= ~PPSMC_SWSTATE_FLAG_DC;
1812
1813	if (pi->acpi_vddc) {
1814		ret = ni_populate_voltage_value(rdev,
1815						&eg_pi->vddc_voltage_table,
1816						pi->acpi_vddc, &table->ACPIState.level.vddc);
1817		if (!ret) {
1818			u16 std_vddc;
1819
1820			ret = ni_get_std_voltage_value(rdev,
1821						       &table->ACPIState.level.vddc, &std_vddc);
1822			if (!ret)
1823				ni_populate_std_voltage_value(rdev, std_vddc,
1824							      table->ACPIState.level.vddc.index,
1825							      &table->ACPIState.level.std_vddc);
1826		}
1827
1828		if (pi->pcie_gen2) {
1829			if (pi->acpi_pcie_gen2)
1830				table->ACPIState.level.gen2PCIE = 1;
1831			else
1832				table->ACPIState.level.gen2PCIE = 0;
1833		} else {
1834			table->ACPIState.level.gen2PCIE = 0;
1835		}
1836	} else {
1837		ret = ni_populate_voltage_value(rdev,
1838						&eg_pi->vddc_voltage_table,
1839						pi->min_vddc_in_table,
1840						&table->ACPIState.level.vddc);
1841		if (!ret) {
1842			u16 std_vddc;
1843
1844			ret = ni_get_std_voltage_value(rdev,
1845						       &table->ACPIState.level.vddc,
1846						       &std_vddc);
1847			if (!ret)
1848				ni_populate_std_voltage_value(rdev, std_vddc,
1849							      table->ACPIState.level.vddc.index,
1850							      &table->ACPIState.level.std_vddc);
1851		}
1852		table->ACPIState.level.gen2PCIE = 0;
1853	}
1854
1855	if (eg_pi->acpi_vddci) {
1856		if (eg_pi->vddci_control)
1857			ni_populate_voltage_value(rdev,
1858						  &eg_pi->vddci_voltage_table,
1859						  eg_pi->acpi_vddci,
1860						  &table->ACPIState.level.vddci);
1861	}
1862
1863
1864	mpll_ad_func_cntl &= ~PDNB;
1865
1866	mpll_ad_func_cntl_2 |= BIAS_GEN_PDNB | RESET_EN;
1867
1868	if (pi->mem_gddr5)
1869		mpll_dq_func_cntl &= ~PDNB;
1870	mpll_dq_func_cntl_2 |= BIAS_GEN_PDNB | RESET_EN | BYPASS;
1871
1872
1873	mclk_pwrmgt_cntl |= (MRDCKA0_RESET |
1874			     MRDCKA1_RESET |
1875			     MRDCKB0_RESET |
1876			     MRDCKB1_RESET |
1877			     MRDCKC0_RESET |
1878			     MRDCKC1_RESET |
1879			     MRDCKD0_RESET |
1880			     MRDCKD1_RESET);
1881
1882	mclk_pwrmgt_cntl &= ~(MRDCKA0_PDNB |
1883			      MRDCKA1_PDNB |
1884			      MRDCKB0_PDNB |
1885			      MRDCKB1_PDNB |
1886			      MRDCKC0_PDNB |
1887			      MRDCKC1_PDNB |
1888			      MRDCKD0_PDNB |
1889			      MRDCKD1_PDNB);
1890
1891	dll_cntl |= (MRDCKA0_BYPASS |
1892		     MRDCKA1_BYPASS |
1893		     MRDCKB0_BYPASS |
1894		     MRDCKB1_BYPASS |
1895		     MRDCKC0_BYPASS |
1896		     MRDCKC1_BYPASS |
1897		     MRDCKD0_BYPASS |
1898		     MRDCKD1_BYPASS);
1899
1900	spll_func_cntl_2 &= ~SCLK_MUX_SEL_MASK;
1901	spll_func_cntl_2 |= SCLK_MUX_SEL(4);
1902
1903	table->ACPIState.level.mclk.vMPLL_AD_FUNC_CNTL = cpu_to_be32(mpll_ad_func_cntl);
1904	table->ACPIState.level.mclk.vMPLL_AD_FUNC_CNTL_2 = cpu_to_be32(mpll_ad_func_cntl_2);
1905	table->ACPIState.level.mclk.vMPLL_DQ_FUNC_CNTL = cpu_to_be32(mpll_dq_func_cntl);
1906	table->ACPIState.level.mclk.vMPLL_DQ_FUNC_CNTL_2 = cpu_to_be32(mpll_dq_func_cntl_2);
1907	table->ACPIState.level.mclk.vMCLK_PWRMGT_CNTL = cpu_to_be32(mclk_pwrmgt_cntl);
1908	table->ACPIState.level.mclk.vDLL_CNTL = cpu_to_be32(dll_cntl);
1909
1910	table->ACPIState.level.mclk.mclk_value = 0;
1911
1912	table->ACPIState.level.sclk.vCG_SPLL_FUNC_CNTL = cpu_to_be32(spll_func_cntl);
1913	table->ACPIState.level.sclk.vCG_SPLL_FUNC_CNTL_2 = cpu_to_be32(spll_func_cntl_2);
1914	table->ACPIState.level.sclk.vCG_SPLL_FUNC_CNTL_3 = cpu_to_be32(spll_func_cntl_3);
1915	table->ACPIState.level.sclk.vCG_SPLL_FUNC_CNTL_4 = cpu_to_be32(spll_func_cntl_4);
1916
1917	table->ACPIState.level.sclk.sclk_value = 0;
1918
1919	ni_populate_mvdd_value(rdev, 0, &table->ACPIState.level.mvdd);
1920
1921	if (eg_pi->dynamic_ac_timing)
1922		table->ACPIState.level.ACIndex = 1;
1923
1924	table->ACPIState.level.dpm2.MaxPS = 0;
1925	table->ACPIState.level.dpm2.NearTDPDec = 0;
1926	table->ACPIState.level.dpm2.AboveSafeInc = 0;
1927	table->ACPIState.level.dpm2.BelowSafeInc = 0;
1928
1929	reg = MIN_POWER_MASK | MAX_POWER_MASK;
1930	table->ACPIState.level.SQPowerThrottle = cpu_to_be32(reg);
1931
1932	reg = MAX_POWER_DELTA_MASK | STI_SIZE_MASK | LTI_RATIO_MASK;
1933	table->ACPIState.level.SQPowerThrottle_2 = cpu_to_be32(reg);
1934
1935	return 0;
1936}
1937
1938static int ni_init_smc_table(struct radeon_device *rdev)
1939{
1940	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
1941	struct ni_power_info *ni_pi = ni_get_pi(rdev);
1942	int ret;
1943	struct radeon_ps *radeon_boot_state = rdev->pm.dpm.boot_ps;
1944	NISLANDS_SMC_STATETABLE *table = &ni_pi->smc_statetable;
1945
1946	memset(table, 0, sizeof(NISLANDS_SMC_STATETABLE));
1947
1948	ni_populate_smc_voltage_tables(rdev, table);
1949
1950	switch (rdev->pm.int_thermal_type) {
1951	case THERMAL_TYPE_NI:
1952	case THERMAL_TYPE_EMC2103_WITH_INTERNAL:
1953		table->thermalProtectType = PPSMC_THERMAL_PROTECT_TYPE_INTERNAL;
1954		break;
1955	case THERMAL_TYPE_NONE:
1956		table->thermalProtectType = PPSMC_THERMAL_PROTECT_TYPE_NONE;
1957		break;
1958	default:
1959		table->thermalProtectType = PPSMC_THERMAL_PROTECT_TYPE_EXTERNAL;
1960		break;
1961	}
1962
1963	if (rdev->pm.dpm.platform_caps & ATOM_PP_PLATFORM_CAP_HARDWAREDC)
1964		table->systemFlags |= PPSMC_SYSTEMFLAG_GPIO_DC;
1965
1966	if (rdev->pm.dpm.platform_caps & ATOM_PP_PLATFORM_CAP_REGULATOR_HOT)
1967		table->systemFlags |= PPSMC_SYSTEMFLAG_REGULATOR_HOT;
1968
1969	if (rdev->pm.dpm.platform_caps & ATOM_PP_PLATFORM_CAP_STEPVDDC)
1970		table->systemFlags |= PPSMC_SYSTEMFLAG_STEPVDDC;
1971
1972	if (pi->mem_gddr5)
1973		table->systemFlags |= PPSMC_SYSTEMFLAG_GDDR5;
1974
1975	ret = ni_populate_smc_initial_state(rdev, radeon_boot_state, table);
1976	if (ret)
1977		return ret;
1978
1979	ret = ni_populate_smc_acpi_state(rdev, table);
1980	if (ret)
1981		return ret;
1982
1983	table->driverState.flags = table->initialState.flags;
1984	table->driverState.levelCount = table->initialState.levelCount;
1985	table->driverState.levels[0] = table->initialState.level;
1986
1987	table->ULVState = table->initialState;
1988
1989	ret = ni_do_program_memory_timing_parameters(rdev, radeon_boot_state,
1990						     NISLANDS_INITIAL_STATE_ARB_INDEX);
1991	if (ret)
1992		return ret;
1993
1994	return rv770_copy_bytes_to_smc(rdev, pi->state_table_start, (u8 *)table,
1995				       sizeof(NISLANDS_SMC_STATETABLE), pi->sram_end);
1996}
1997
1998static int ni_calculate_sclk_params(struct radeon_device *rdev,
1999				    u32 engine_clock,
2000				    NISLANDS_SMC_SCLK_VALUE *sclk)
2001{
2002	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2003	struct ni_power_info *ni_pi = ni_get_pi(rdev);
2004	struct atom_clock_dividers dividers;
2005	u32 spll_func_cntl = ni_pi->clock_registers.cg_spll_func_cntl;
2006	u32 spll_func_cntl_2 = ni_pi->clock_registers.cg_spll_func_cntl_2;
2007	u32 spll_func_cntl_3 = ni_pi->clock_registers.cg_spll_func_cntl_3;
2008	u32 spll_func_cntl_4 = ni_pi->clock_registers.cg_spll_func_cntl_4;
2009	u32 cg_spll_spread_spectrum = ni_pi->clock_registers.cg_spll_spread_spectrum;
2010	u32 cg_spll_spread_spectrum_2 = ni_pi->clock_registers.cg_spll_spread_spectrum_2;
2011	u64 tmp;
2012	u32 reference_clock = rdev->clock.spll.reference_freq;
2013	u32 reference_divider;
2014	u32 fbdiv;
2015	int ret;
2016
2017	ret = radeon_atom_get_clock_dividers(rdev, COMPUTE_ENGINE_PLL_PARAM,
2018					     engine_clock, false, &dividers);
2019	if (ret)
2020		return ret;
2021
2022	reference_divider = 1 + dividers.ref_div;
2023
2024
2025	tmp = (u64) engine_clock * reference_divider * dividers.post_div * 16834;
2026	do_div(tmp, reference_clock);
2027	fbdiv = (u32) tmp;
2028
2029	spll_func_cntl &= ~(SPLL_PDIV_A_MASK | SPLL_REF_DIV_MASK);
2030	spll_func_cntl |= SPLL_REF_DIV(dividers.ref_div);
2031	spll_func_cntl |= SPLL_PDIV_A(dividers.post_div);
2032
2033	spll_func_cntl_2 &= ~SCLK_MUX_SEL_MASK;
2034	spll_func_cntl_2 |= SCLK_MUX_SEL(2);
2035
2036	spll_func_cntl_3 &= ~SPLL_FB_DIV_MASK;
2037	spll_func_cntl_3 |= SPLL_FB_DIV(fbdiv);
2038	spll_func_cntl_3 |= SPLL_DITHEN;
2039
2040	if (pi->sclk_ss) {
2041		struct radeon_atom_ss ss;
2042		u32 vco_freq = engine_clock * dividers.post_div;
2043
2044		if (radeon_atombios_get_asic_ss_info(rdev, &ss,
2045						     ASIC_INTERNAL_ENGINE_SS, vco_freq)) {
2046			u32 clk_s = reference_clock * 5 / (reference_divider * ss.rate);
2047			u32 clk_v = 4 * ss.percentage * fbdiv / (clk_s * 10000);
2048
2049			cg_spll_spread_spectrum &= ~CLK_S_MASK;
2050			cg_spll_spread_spectrum |= CLK_S(clk_s);
2051			cg_spll_spread_spectrum |= SSEN;
2052
2053			cg_spll_spread_spectrum_2 &= ~CLK_V_MASK;
2054			cg_spll_spread_spectrum_2 |= CLK_V(clk_v);
2055		}
2056	}
2057
2058	sclk->sclk_value = engine_clock;
2059	sclk->vCG_SPLL_FUNC_CNTL = spll_func_cntl;
2060	sclk->vCG_SPLL_FUNC_CNTL_2 = spll_func_cntl_2;
2061	sclk->vCG_SPLL_FUNC_CNTL_3 = spll_func_cntl_3;
2062	sclk->vCG_SPLL_FUNC_CNTL_4 = spll_func_cntl_4;
2063	sclk->vCG_SPLL_SPREAD_SPECTRUM = cg_spll_spread_spectrum;
2064	sclk->vCG_SPLL_SPREAD_SPECTRUM_2 = cg_spll_spread_spectrum_2;
2065
2066	return 0;
2067}
2068
2069static int ni_populate_sclk_value(struct radeon_device *rdev,
2070				  u32 engine_clock,
2071				  NISLANDS_SMC_SCLK_VALUE *sclk)
2072{
2073	NISLANDS_SMC_SCLK_VALUE sclk_tmp;
2074	int ret;
2075
2076	ret = ni_calculate_sclk_params(rdev, engine_clock, &sclk_tmp);
2077	if (!ret) {
2078		sclk->sclk_value = cpu_to_be32(sclk_tmp.sclk_value);
2079		sclk->vCG_SPLL_FUNC_CNTL = cpu_to_be32(sclk_tmp.vCG_SPLL_FUNC_CNTL);
2080		sclk->vCG_SPLL_FUNC_CNTL_2 = cpu_to_be32(sclk_tmp.vCG_SPLL_FUNC_CNTL_2);
2081		sclk->vCG_SPLL_FUNC_CNTL_3 = cpu_to_be32(sclk_tmp.vCG_SPLL_FUNC_CNTL_3);
2082		sclk->vCG_SPLL_FUNC_CNTL_4 = cpu_to_be32(sclk_tmp.vCG_SPLL_FUNC_CNTL_4);
2083		sclk->vCG_SPLL_SPREAD_SPECTRUM = cpu_to_be32(sclk_tmp.vCG_SPLL_SPREAD_SPECTRUM);
2084		sclk->vCG_SPLL_SPREAD_SPECTRUM_2 = cpu_to_be32(sclk_tmp.vCG_SPLL_SPREAD_SPECTRUM_2);
2085	}
2086
2087	return ret;
2088}
2089
2090static int ni_init_smc_spll_table(struct radeon_device *rdev)
2091{
2092	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2093	struct ni_power_info *ni_pi = ni_get_pi(rdev);
2094	SMC_NISLANDS_SPLL_DIV_TABLE *spll_table;
2095	NISLANDS_SMC_SCLK_VALUE sclk_params;
2096	u32 fb_div;
2097	u32 p_div;
2098	u32 clk_s;
2099	u32 clk_v;
2100	u32 sclk = 0;
2101	int i, ret;
2102	u32 tmp;
2103
2104	if (ni_pi->spll_table_start == 0)
2105		return -EINVAL;
2106
2107	spll_table = kzalloc(sizeof(SMC_NISLANDS_SPLL_DIV_TABLE), GFP_KERNEL);
2108	if (spll_table == NULL)
2109		return -ENOMEM;
2110
2111	for (i = 0; i < 256; i++) {
2112		ret = ni_calculate_sclk_params(rdev, sclk, &sclk_params);
2113		if (ret)
2114			break;
2115
2116		p_div = (sclk_params.vCG_SPLL_FUNC_CNTL & SPLL_PDIV_A_MASK) >> SPLL_PDIV_A_SHIFT;
2117		fb_div = (sclk_params.vCG_SPLL_FUNC_CNTL_3 & SPLL_FB_DIV_MASK) >> SPLL_FB_DIV_SHIFT;
2118		clk_s = (sclk_params.vCG_SPLL_SPREAD_SPECTRUM & CLK_S_MASK) >> CLK_S_SHIFT;
2119		clk_v = (sclk_params.vCG_SPLL_SPREAD_SPECTRUM_2 & CLK_V_MASK) >> CLK_V_SHIFT;
2120
2121		fb_div &= ~0x00001FFF;
2122		fb_div >>= 1;
2123		clk_v >>= 6;
2124
2125		if (p_div & ~(SMC_NISLANDS_SPLL_DIV_TABLE_PDIV_MASK >> SMC_NISLANDS_SPLL_DIV_TABLE_PDIV_SHIFT))
2126			ret = -EINVAL;
2127
2128		if (clk_s & ~(SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_MASK >> SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_SHIFT))
2129			ret = -EINVAL;
2130
2131		if (fb_div & ~(SMC_NISLANDS_SPLL_DIV_TABLE_FBDIV_MASK >> SMC_NISLANDS_SPLL_DIV_TABLE_FBDIV_SHIFT))
2132			ret = -EINVAL;
2133
2134		if (clk_v & ~(SMC_NISLANDS_SPLL_DIV_TABLE_CLKV_MASK >> SMC_NISLANDS_SPLL_DIV_TABLE_CLKV_SHIFT))
2135			ret = -EINVAL;
2136
2137		if (ret)
2138			break;
2139
2140		tmp = ((fb_div << SMC_NISLANDS_SPLL_DIV_TABLE_FBDIV_SHIFT) & SMC_NISLANDS_SPLL_DIV_TABLE_FBDIV_MASK) |
2141			((p_div << SMC_NISLANDS_SPLL_DIV_TABLE_PDIV_SHIFT) & SMC_NISLANDS_SPLL_DIV_TABLE_PDIV_MASK);
2142		spll_table->freq[i] = cpu_to_be32(tmp);
2143
2144		tmp = ((clk_v << SMC_NISLANDS_SPLL_DIV_TABLE_CLKV_SHIFT) & SMC_NISLANDS_SPLL_DIV_TABLE_CLKV_MASK) |
2145			((clk_s << SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_SHIFT) & SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_MASK);
2146		spll_table->ss[i] = cpu_to_be32(tmp);
2147
2148		sclk += 512;
2149	}
2150
2151	if (!ret)
2152		ret = rv770_copy_bytes_to_smc(rdev, ni_pi->spll_table_start, (u8 *)spll_table,
2153					      sizeof(SMC_NISLANDS_SPLL_DIV_TABLE), pi->sram_end);
2154
2155	kfree(spll_table);
2156
2157	return ret;
2158}
2159
2160static int ni_populate_mclk_value(struct radeon_device *rdev,
2161				  u32 engine_clock,
2162				  u32 memory_clock,
2163				  NISLANDS_SMC_MCLK_VALUE *mclk,
2164				  bool strobe_mode,
2165				  bool dll_state_on)
2166{
2167	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2168	struct ni_power_info *ni_pi = ni_get_pi(rdev);
2169	u32 mpll_ad_func_cntl = ni_pi->clock_registers.mpll_ad_func_cntl;
2170	u32 mpll_ad_func_cntl_2 = ni_pi->clock_registers.mpll_ad_func_cntl_2;
2171	u32 mpll_dq_func_cntl = ni_pi->clock_registers.mpll_dq_func_cntl;
2172	u32 mpll_dq_func_cntl_2 = ni_pi->clock_registers.mpll_dq_func_cntl_2;
2173	u32 mclk_pwrmgt_cntl = ni_pi->clock_registers.mclk_pwrmgt_cntl;
2174	u32 dll_cntl = ni_pi->clock_registers.dll_cntl;
2175	u32 mpll_ss1 = ni_pi->clock_registers.mpll_ss1;
2176	u32 mpll_ss2 = ni_pi->clock_registers.mpll_ss2;
2177	struct atom_clock_dividers dividers;
2178	u32 ibias;
2179	u32 dll_speed;
2180	int ret;
2181	u32 mc_seq_misc7;
2182
2183	ret = radeon_atom_get_clock_dividers(rdev, COMPUTE_MEMORY_PLL_PARAM,
2184					     memory_clock, strobe_mode, &dividers);
2185	if (ret)
2186		return ret;
2187
2188	if (!strobe_mode) {
2189		mc_seq_misc7 = RREG32(MC_SEQ_MISC7);
2190
2191		if (mc_seq_misc7 & 0x8000000)
2192			dividers.post_div = 1;
2193	}
2194
2195	ibias = cypress_map_clkf_to_ibias(rdev, dividers.whole_fb_div);
2196
2197	mpll_ad_func_cntl &= ~(CLKR_MASK |
2198			       YCLK_POST_DIV_MASK |
2199			       CLKF_MASK |
2200			       CLKFRAC_MASK |
2201			       IBIAS_MASK);
2202	mpll_ad_func_cntl |= CLKR(dividers.ref_div);
2203	mpll_ad_func_cntl |= YCLK_POST_DIV(dividers.post_div);
2204	mpll_ad_func_cntl |= CLKF(dividers.whole_fb_div);
2205	mpll_ad_func_cntl |= CLKFRAC(dividers.frac_fb_div);
2206	mpll_ad_func_cntl |= IBIAS(ibias);
2207
2208	if (dividers.vco_mode)
2209		mpll_ad_func_cntl_2 |= VCO_MODE;
2210	else
2211		mpll_ad_func_cntl_2 &= ~VCO_MODE;
2212
2213	if (pi->mem_gddr5) {
2214		mpll_dq_func_cntl &= ~(CLKR_MASK |
2215				       YCLK_POST_DIV_MASK |
2216				       CLKF_MASK |
2217				       CLKFRAC_MASK |
2218				       IBIAS_MASK);
2219		mpll_dq_func_cntl |= CLKR(dividers.ref_div);
2220		mpll_dq_func_cntl |= YCLK_POST_DIV(dividers.post_div);
2221		mpll_dq_func_cntl |= CLKF(dividers.whole_fb_div);
2222		mpll_dq_func_cntl |= CLKFRAC(dividers.frac_fb_div);
2223		mpll_dq_func_cntl |= IBIAS(ibias);
2224
2225		if (strobe_mode)
2226			mpll_dq_func_cntl &= ~PDNB;
2227		else
2228			mpll_dq_func_cntl |= PDNB;
2229
2230		if (dividers.vco_mode)
2231			mpll_dq_func_cntl_2 |= VCO_MODE;
2232		else
2233			mpll_dq_func_cntl_2 &= ~VCO_MODE;
2234	}
2235
2236	if (pi->mclk_ss) {
2237		struct radeon_atom_ss ss;
2238		u32 vco_freq = memory_clock * dividers.post_div;
2239
2240		if (radeon_atombios_get_asic_ss_info(rdev, &ss,
2241						     ASIC_INTERNAL_MEMORY_SS, vco_freq)) {
2242			u32 reference_clock = rdev->clock.mpll.reference_freq;
2243			u32 decoded_ref = rv740_get_decoded_reference_divider(dividers.ref_div);
2244			u32 clk_s, clk_v;
2245
2246			if (!decoded_ref)
2247				return -EINVAL;
2248			clk_s = reference_clock * 5 / (decoded_ref * ss.rate);
2249			clk_v = ss.percentage *
2250				(0x4000 * dividers.whole_fb_div + 0x800 * dividers.frac_fb_div) / (clk_s * 625);
2251
2252			mpll_ss1 &= ~CLKV_MASK;
2253			mpll_ss1 |= CLKV(clk_v);
2254
2255			mpll_ss2 &= ~CLKS_MASK;
2256			mpll_ss2 |= CLKS(clk_s);
2257		}
2258	}
2259
2260	dll_speed = rv740_get_dll_speed(pi->mem_gddr5,
2261					memory_clock);
2262
2263	mclk_pwrmgt_cntl &= ~DLL_SPEED_MASK;
2264	mclk_pwrmgt_cntl |= DLL_SPEED(dll_speed);
2265	if (dll_state_on)
2266		mclk_pwrmgt_cntl |= (MRDCKA0_PDNB |
2267				     MRDCKA1_PDNB |
2268				     MRDCKB0_PDNB |
2269				     MRDCKB1_PDNB |
2270				     MRDCKC0_PDNB |
2271				     MRDCKC1_PDNB |
2272				     MRDCKD0_PDNB |
2273				     MRDCKD1_PDNB);
2274	else
2275		mclk_pwrmgt_cntl &= ~(MRDCKA0_PDNB |
2276				      MRDCKA1_PDNB |
2277				      MRDCKB0_PDNB |
2278				      MRDCKB1_PDNB |
2279				      MRDCKC0_PDNB |
2280				      MRDCKC1_PDNB |
2281				      MRDCKD0_PDNB |
2282				      MRDCKD1_PDNB);
2283
2284
2285	mclk->mclk_value = cpu_to_be32(memory_clock);
2286	mclk->vMPLL_AD_FUNC_CNTL = cpu_to_be32(mpll_ad_func_cntl);
2287	mclk->vMPLL_AD_FUNC_CNTL_2 = cpu_to_be32(mpll_ad_func_cntl_2);
2288	mclk->vMPLL_DQ_FUNC_CNTL = cpu_to_be32(mpll_dq_func_cntl);
2289	mclk->vMPLL_DQ_FUNC_CNTL_2 = cpu_to_be32(mpll_dq_func_cntl_2);
2290	mclk->vMCLK_PWRMGT_CNTL = cpu_to_be32(mclk_pwrmgt_cntl);
2291	mclk->vDLL_CNTL = cpu_to_be32(dll_cntl);
2292	mclk->vMPLL_SS = cpu_to_be32(mpll_ss1);
2293	mclk->vMPLL_SS2 = cpu_to_be32(mpll_ss2);
2294
2295	return 0;
2296}
2297
2298static void ni_populate_smc_sp(struct radeon_device *rdev,
2299			       struct radeon_ps *radeon_state,
2300			       NISLANDS_SMC_SWSTATE *smc_state)
2301{
2302	struct ni_ps *ps = ni_get_ps(radeon_state);
2303	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2304	int i;
2305
2306	for (i = 0; i < ps->performance_level_count - 1; i++)
2307		smc_state->levels[i].bSP = cpu_to_be32(pi->dsp);
2308
2309	smc_state->levels[ps->performance_level_count - 1].bSP =
2310		cpu_to_be32(pi->psp);
2311}
2312
2313static int ni_convert_power_level_to_smc(struct radeon_device *rdev,
2314					 struct rv7xx_pl *pl,
2315					 NISLANDS_SMC_HW_PERFORMANCE_LEVEL *level)
2316{
2317	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2318	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
2319	struct ni_power_info *ni_pi = ni_get_pi(rdev);
2320	int ret;
2321	bool dll_state_on;
2322	u16 std_vddc;
2323	u32 tmp = RREG32(DC_STUTTER_CNTL);
2324
2325	level->gen2PCIE = pi->pcie_gen2 ?
2326		((pl->flags & ATOM_PPLIB_R600_FLAGS_PCIEGEN2) ? 1 : 0) : 0;
2327
2328	ret = ni_populate_sclk_value(rdev, pl->sclk, &level->sclk);
2329	if (ret)
2330		return ret;
2331
2332	level->mcFlags =  0;
2333	if (pi->mclk_stutter_mode_threshold &&
2334	    (pl->mclk <= pi->mclk_stutter_mode_threshold) &&
2335	    !eg_pi->uvd_enabled &&
2336	    (tmp & DC_STUTTER_ENABLE_A) &&
2337	    (tmp & DC_STUTTER_ENABLE_B))
2338		level->mcFlags |= NISLANDS_SMC_MC_STUTTER_EN;
2339
2340	if (pi->mem_gddr5) {
2341		if (pl->mclk > pi->mclk_edc_enable_threshold)
2342			level->mcFlags |= NISLANDS_SMC_MC_EDC_RD_FLAG;
2343		if (pl->mclk > eg_pi->mclk_edc_wr_enable_threshold)
2344			level->mcFlags |= NISLANDS_SMC_MC_EDC_WR_FLAG;
2345
2346		level->strobeMode = cypress_get_strobe_mode_settings(rdev, pl->mclk);
2347
2348		if (level->strobeMode & NISLANDS_SMC_STROBE_ENABLE) {
2349			if (cypress_get_mclk_frequency_ratio(rdev, pl->mclk, true) >=
2350			    ((RREG32(MC_SEQ_MISC7) >> 16) & 0xf))
2351				dll_state_on = ((RREG32(MC_SEQ_MISC5) >> 1) & 0x1) ? true : false;
2352			else
2353				dll_state_on = ((RREG32(MC_SEQ_MISC6) >> 1) & 0x1) ? true : false;
2354		} else {
2355			dll_state_on = false;
2356			if (pl->mclk > ni_pi->mclk_rtt_mode_threshold)
2357				level->mcFlags |= NISLANDS_SMC_MC_RTT_ENABLE;
2358		}
2359
2360		ret = ni_populate_mclk_value(rdev, pl->sclk, pl->mclk,
2361					     &level->mclk,
2362					     (level->strobeMode & NISLANDS_SMC_STROBE_ENABLE) != 0,
2363					     dll_state_on);
2364	} else
2365		ret = ni_populate_mclk_value(rdev, pl->sclk, pl->mclk, &level->mclk, 1, 1);
2366
2367	if (ret)
2368		return ret;
2369
2370	ret = ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table,
2371					pl->vddc, &level->vddc);
2372	if (ret)
2373		return ret;
2374
2375	ret = ni_get_std_voltage_value(rdev, &level->vddc, &std_vddc);
2376	if (ret)
2377		return ret;
2378
2379	ni_populate_std_voltage_value(rdev, std_vddc,
2380				      level->vddc.index, &level->std_vddc);
2381
2382	if (eg_pi->vddci_control) {
2383		ret = ni_populate_voltage_value(rdev, &eg_pi->vddci_voltage_table,
2384						pl->vddci, &level->vddci);
2385		if (ret)
2386			return ret;
2387	}
2388
2389	ni_populate_mvdd_value(rdev, pl->mclk, &level->mvdd);
2390
2391	return ret;
2392}
2393
2394static int ni_populate_smc_t(struct radeon_device *rdev,
2395			     struct radeon_ps *radeon_state,
2396			     NISLANDS_SMC_SWSTATE *smc_state)
2397{
2398	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2399	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
2400	struct ni_ps *state = ni_get_ps(radeon_state);
2401	u32 a_t;
2402	u32 t_l, t_h;
2403	u32 high_bsp;
2404	int i, ret;
2405
2406	if (state->performance_level_count >= 9)
2407		return -EINVAL;
2408
2409	if (state->performance_level_count < 2) {
2410		a_t = CG_R(0xffff) | CG_L(0);
2411		smc_state->levels[0].aT = cpu_to_be32(a_t);
2412		return 0;
2413	}
2414
2415	smc_state->levels[0].aT = cpu_to_be32(0);
2416
2417	for (i = 0; i <= state->performance_level_count - 2; i++) {
2418		if (eg_pi->uvd_enabled)
2419			ret = r600_calculate_at(
2420				1000 * (i * (eg_pi->smu_uvd_hs ? 2 : 8) + 2),
2421				100 * R600_AH_DFLT,
2422				state->performance_levels[i + 1].sclk,
2423				state->performance_levels[i].sclk,
2424				&t_l,
2425				&t_h);
2426		else
2427			ret = r600_calculate_at(
2428				1000 * (i + 1),
2429				100 * R600_AH_DFLT,
2430				state->performance_levels[i + 1].sclk,
2431				state->performance_levels[i].sclk,
2432				&t_l,
2433				&t_h);
2434
2435		if (ret) {
2436			t_h = (i + 1) * 1000 - 50 * R600_AH_DFLT;
2437			t_l = (i + 1) * 1000 + 50 * R600_AH_DFLT;
2438		}
2439
2440		a_t = be32_to_cpu(smc_state->levels[i].aT) & ~CG_R_MASK;
2441		a_t |= CG_R(t_l * pi->bsp / 20000);
2442		smc_state->levels[i].aT = cpu_to_be32(a_t);
2443
2444		high_bsp = (i == state->performance_level_count - 2) ?
2445			pi->pbsp : pi->bsp;
2446
2447		a_t = CG_R(0xffff) | CG_L(t_h * high_bsp / 20000);
2448		smc_state->levels[i + 1].aT = cpu_to_be32(a_t);
2449	}
2450
2451	return 0;
2452}
2453
2454static int ni_populate_power_containment_values(struct radeon_device *rdev,
2455						struct radeon_ps *radeon_state,
2456						NISLANDS_SMC_SWSTATE *smc_state)
2457{
2458	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2459	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
2460	struct ni_power_info *ni_pi = ni_get_pi(rdev);
2461	struct ni_ps *state = ni_get_ps(radeon_state);
2462	u32 prev_sclk;
2463	u32 max_sclk;
2464	u32 min_sclk;
2465	int i, ret;
2466	u32 tdp_limit;
2467	u32 near_tdp_limit;
2468	u32 power_boost_limit;
2469	u8 max_ps_percent;
2470
2471	if (ni_pi->enable_power_containment == false)
2472		return 0;
2473
2474	if (state->performance_level_count == 0)
2475		return -EINVAL;
2476
2477	if (smc_state->levelCount != state->performance_level_count)
2478		return -EINVAL;
2479
2480	ret = ni_calculate_adjusted_tdp_limits(rdev,
2481					       false, /* ??? */
2482					       rdev->pm.dpm.tdp_adjustment,
2483					       &tdp_limit,
2484					       &near_tdp_limit);
2485	if (ret)
2486		return ret;
2487
2488	power_boost_limit = ni_calculate_power_boost_limit(rdev, radeon_state, near_tdp_limit);
2489
2490	ret = rv770_write_smc_sram_dword(rdev,
2491					 pi->state_table_start +
2492					 offsetof(NISLANDS_SMC_STATETABLE, dpm2Params) +
2493					 offsetof(PP_NIslands_DPM2Parameters, PowerBoostLimit),
2494					 ni_scale_power_for_smc(power_boost_limit, ni_get_smc_power_scaling_factor(rdev)),
2495					 pi->sram_end);
2496	if (ret)
2497		power_boost_limit = 0;
2498
2499	smc_state->levels[0].dpm2.MaxPS = 0;
2500	smc_state->levels[0].dpm2.NearTDPDec = 0;
2501	smc_state->levels[0].dpm2.AboveSafeInc = 0;
2502	smc_state->levels[0].dpm2.BelowSafeInc = 0;
2503	smc_state->levels[0].stateFlags |= power_boost_limit ? PPSMC_STATEFLAG_POWERBOOST : 0;
2504
2505	for (i = 1; i < state->performance_level_count; i++) {
2506		prev_sclk = state->performance_levels[i-1].sclk;
2507		max_sclk  = state->performance_levels[i].sclk;
2508		max_ps_percent = (i != (state->performance_level_count - 1)) ?
2509			NISLANDS_DPM2_MAXPS_PERCENT_M : NISLANDS_DPM2_MAXPS_PERCENT_H;
2510
2511		if (max_sclk < prev_sclk)
2512			return -EINVAL;
2513
2514		if ((max_ps_percent == 0) || (prev_sclk == max_sclk) || eg_pi->uvd_enabled)
2515			min_sclk = max_sclk;
2516		else if (1 == i)
2517			min_sclk = prev_sclk;
2518		else
2519			min_sclk = (prev_sclk * (u32)max_ps_percent) / 100;
2520
2521		if (min_sclk < state->performance_levels[0].sclk)
2522			min_sclk = state->performance_levels[0].sclk;
2523
2524		if (min_sclk == 0)
2525			return -EINVAL;
2526
2527		smc_state->levels[i].dpm2.MaxPS =
2528			(u8)((NISLANDS_DPM2_MAX_PULSE_SKIP * (max_sclk - min_sclk)) / max_sclk);
2529		smc_state->levels[i].dpm2.NearTDPDec = NISLANDS_DPM2_NEAR_TDP_DEC;
2530		smc_state->levels[i].dpm2.AboveSafeInc = NISLANDS_DPM2_ABOVE_SAFE_INC;
2531		smc_state->levels[i].dpm2.BelowSafeInc = NISLANDS_DPM2_BELOW_SAFE_INC;
2532		smc_state->levels[i].stateFlags |=
2533			((i != (state->performance_level_count - 1)) && power_boost_limit) ?
2534			PPSMC_STATEFLAG_POWERBOOST : 0;
2535	}
2536
2537	return 0;
2538}
2539
2540static int ni_populate_sq_ramping_values(struct radeon_device *rdev,
2541					 struct radeon_ps *radeon_state,
2542					 NISLANDS_SMC_SWSTATE *smc_state)
2543{
2544	struct ni_power_info *ni_pi = ni_get_pi(rdev);
2545	struct ni_ps *state = ni_get_ps(radeon_state);
2546	u32 sq_power_throttle;
2547	u32 sq_power_throttle2;
2548	bool enable_sq_ramping = ni_pi->enable_sq_ramping;
2549	int i;
2550
2551	if (state->performance_level_count == 0)
2552		return -EINVAL;
2553
2554	if (smc_state->levelCount != state->performance_level_count)
2555		return -EINVAL;
2556
2557	if (rdev->pm.dpm.sq_ramping_threshold == 0)
2558		return -EINVAL;
2559
2560	if (NISLANDS_DPM2_SQ_RAMP_MAX_POWER > (MAX_POWER_MASK >> MAX_POWER_SHIFT))
2561		enable_sq_ramping = false;
2562
2563	if (NISLANDS_DPM2_SQ_RAMP_MIN_POWER > (MIN_POWER_MASK >> MIN_POWER_SHIFT))
2564		enable_sq_ramping = false;
2565
2566	if (NISLANDS_DPM2_SQ_RAMP_MAX_POWER_DELTA > (MAX_POWER_DELTA_MASK >> MAX_POWER_DELTA_SHIFT))
2567		enable_sq_ramping = false;
2568
2569	if (NISLANDS_DPM2_SQ_RAMP_STI_SIZE > (STI_SIZE_MASK >> STI_SIZE_SHIFT))
2570		enable_sq_ramping = false;
2571
2572	if (NISLANDS_DPM2_SQ_RAMP_LTI_RATIO > (LTI_RATIO_MASK >> LTI_RATIO_SHIFT))
2573		enable_sq_ramping = false;
2574
2575	for (i = 0; i < state->performance_level_count; i++) {
2576		sq_power_throttle  = 0;
2577		sq_power_throttle2 = 0;
2578
2579		if ((state->performance_levels[i].sclk >= rdev->pm.dpm.sq_ramping_threshold) &&
2580		    enable_sq_ramping) {
2581			sq_power_throttle |= MAX_POWER(NISLANDS_DPM2_SQ_RAMP_MAX_POWER);
2582			sq_power_throttle |= MIN_POWER(NISLANDS_DPM2_SQ_RAMP_MIN_POWER);
2583			sq_power_throttle2 |= MAX_POWER_DELTA(NISLANDS_DPM2_SQ_RAMP_MAX_POWER_DELTA);
2584			sq_power_throttle2 |= STI_SIZE(NISLANDS_DPM2_SQ_RAMP_STI_SIZE);
2585			sq_power_throttle2 |= LTI_RATIO(NISLANDS_DPM2_SQ_RAMP_LTI_RATIO);
2586		} else {
2587			sq_power_throttle |= MAX_POWER_MASK | MIN_POWER_MASK;
2588			sq_power_throttle2 |= MAX_POWER_DELTA_MASK | STI_SIZE_MASK | LTI_RATIO_MASK;
2589		}
2590
2591		smc_state->levels[i].SQPowerThrottle   = cpu_to_be32(sq_power_throttle);
2592		smc_state->levels[i].SQPowerThrottle_2 = cpu_to_be32(sq_power_throttle2);
2593	}
2594
2595	return 0;
2596}
2597
2598static int ni_enable_power_containment(struct radeon_device *rdev,
2599				       struct radeon_ps *radeon_new_state,
2600				       bool enable)
2601{
2602	struct ni_power_info *ni_pi = ni_get_pi(rdev);
2603	PPSMC_Result smc_result;
2604	int ret = 0;
2605
2606	if (ni_pi->enable_power_containment) {
2607		if (enable) {
2608			if (!r600_is_uvd_state(radeon_new_state->class, radeon_new_state->class2)) {
2609				smc_result = rv770_send_msg_to_smc(rdev, PPSMC_TDPClampingActive);
2610				if (smc_result != PPSMC_Result_OK) {
2611					ret = -EINVAL;
2612					ni_pi->pc_enabled = false;
2613				} else {
2614					ni_pi->pc_enabled = true;
2615				}
2616			}
2617		} else {
2618			smc_result = rv770_send_msg_to_smc(rdev, PPSMC_TDPClampingInactive);
2619			if (smc_result != PPSMC_Result_OK)
2620				ret = -EINVAL;
2621			ni_pi->pc_enabled = false;
2622		}
2623	}
2624
2625	return ret;
2626}
2627
2628static int ni_convert_power_state_to_smc(struct radeon_device *rdev,
2629					 struct radeon_ps *radeon_state,
2630					 NISLANDS_SMC_SWSTATE *smc_state)
2631{
2632	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
2633	struct ni_power_info *ni_pi = ni_get_pi(rdev);
2634	struct ni_ps *state = ni_get_ps(radeon_state);
2635	int i, ret;
2636	u32 threshold = state->performance_levels[state->performance_level_count - 1].sclk * 100 / 100;
2637
2638	if (!(radeon_state->caps & ATOM_PPLIB_DISALLOW_ON_DC))
2639		smc_state->flags |= PPSMC_SWSTATE_FLAG_DC;
2640
2641	smc_state->levelCount = 0;
2642
2643	if (state->performance_level_count > NISLANDS_MAX_SMC_PERFORMANCE_LEVELS_PER_SWSTATE)
2644		return -EINVAL;
2645
2646	for (i = 0; i < state->performance_level_count; i++) {
2647		ret = ni_convert_power_level_to_smc(rdev, &state->performance_levels[i],
2648						    &smc_state->levels[i]);
2649		smc_state->levels[i].arbRefreshState =
2650			(u8)(NISLANDS_DRIVER_STATE_ARB_INDEX + i);
2651
2652		if (ret)
2653			return ret;
2654
2655		if (ni_pi->enable_power_containment)
2656			smc_state->levels[i].displayWatermark =
2657				(state->performance_levels[i].sclk < threshold) ?
2658				PPSMC_DISPLAY_WATERMARK_LOW : PPSMC_DISPLAY_WATERMARK_HIGH;
2659		else
2660			smc_state->levels[i].displayWatermark = (i < 2) ?
2661				PPSMC_DISPLAY_WATERMARK_LOW : PPSMC_DISPLAY_WATERMARK_HIGH;
2662
2663		if (eg_pi->dynamic_ac_timing)
2664			smc_state->levels[i].ACIndex = NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT + i;
2665		else
2666			smc_state->levels[i].ACIndex = 0;
2667
2668		smc_state->levelCount++;
2669	}
2670
2671	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_watermark_threshold,
2672				      cpu_to_be32(threshold / 512));
2673
2674	ni_populate_smc_sp(rdev, radeon_state, smc_state);
2675
2676	ret = ni_populate_power_containment_values(rdev, radeon_state, smc_state);
2677	if (ret)
2678		ni_pi->enable_power_containment = false;
2679
2680	ret = ni_populate_sq_ramping_values(rdev, radeon_state, smc_state);
2681	if (ret)
2682		ni_pi->enable_sq_ramping = false;
2683
2684	return ni_populate_smc_t(rdev, radeon_state, smc_state);
2685}
2686
2687static int ni_upload_sw_state(struct radeon_device *rdev,
2688			      struct radeon_ps *radeon_new_state)
2689{
2690	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2691	u16 address = pi->state_table_start +
2692		offsetof(NISLANDS_SMC_STATETABLE, driverState);
2693	NISLANDS_SMC_SWSTATE *smc_state;
2694	size_t state_size = struct_size(smc_state, levels,
2695			NISLANDS_MAX_SMC_PERFORMANCE_LEVELS_PER_SWSTATE);
2696	int ret;
2697
2698	smc_state = kzalloc(state_size, GFP_KERNEL);
2699	if (smc_state == NULL)
2700		return -ENOMEM;
2701
2702	ret = ni_convert_power_state_to_smc(rdev, radeon_new_state, smc_state);
2703	if (ret)
2704		goto done;
2705
2706	ret = rv770_copy_bytes_to_smc(rdev, address, (u8 *)smc_state, state_size, pi->sram_end);
2707
2708done:
2709	kfree(smc_state);
2710
2711	return ret;
2712}
2713
2714static int ni_set_mc_special_registers(struct radeon_device *rdev,
2715				       struct ni_mc_reg_table *table)
2716{
2717	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2718	u8 i, j, k;
2719	u32 temp_reg;
2720
2721	for (i = 0, j = table->last; i < table->last; i++) {
2722		switch (table->mc_reg_address[i].s1) {
2723		case MC_SEQ_MISC1 >> 2:
2724			if (j >= SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE)
2725				return -EINVAL;
2726			temp_reg = RREG32(MC_PMG_CMD_EMRS);
2727			table->mc_reg_address[j].s1 = MC_PMG_CMD_EMRS >> 2;
2728			table->mc_reg_address[j].s0 = MC_SEQ_PMG_CMD_EMRS_LP >> 2;
2729			for (k = 0; k < table->num_entries; k++)
2730				table->mc_reg_table_entry[k].mc_data[j] =
2731					((temp_reg & 0xffff0000)) |
2732					((table->mc_reg_table_entry[k].mc_data[i] & 0xffff0000) >> 16);
2733			j++;
2734			if (j >= SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE)
2735				return -EINVAL;
2736
2737			temp_reg = RREG32(MC_PMG_CMD_MRS);
2738			table->mc_reg_address[j].s1 = MC_PMG_CMD_MRS >> 2;
2739			table->mc_reg_address[j].s0 = MC_SEQ_PMG_CMD_MRS_LP >> 2;
2740			for(k = 0; k < table->num_entries; k++) {
2741				table->mc_reg_table_entry[k].mc_data[j] =
2742					(temp_reg & 0xffff0000) |
2743					(table->mc_reg_table_entry[k].mc_data[i] & 0x0000ffff);
2744				if (!pi->mem_gddr5)
2745					table->mc_reg_table_entry[k].mc_data[j] |= 0x100;
2746			}
2747			j++;
2748			break;
2749		case MC_SEQ_RESERVE_M >> 2:
2750			if (j >= SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE)
2751				return -EINVAL;
2752			temp_reg = RREG32(MC_PMG_CMD_MRS1);
2753			table->mc_reg_address[j].s1 = MC_PMG_CMD_MRS1 >> 2;
2754			table->mc_reg_address[j].s0 = MC_SEQ_PMG_CMD_MRS1_LP >> 2;
2755			for (k = 0; k < table->num_entries; k++)
2756				table->mc_reg_table_entry[k].mc_data[j] =
2757					(temp_reg & 0xffff0000) |
2758					(table->mc_reg_table_entry[k].mc_data[i] & 0x0000ffff);
2759			j++;
2760			break;
2761		default:
2762			break;
2763		}
2764	}
2765
2766	table->last = j;
2767
2768	return 0;
2769}
2770
2771static bool ni_check_s0_mc_reg_index(u16 in_reg, u16 *out_reg)
2772{
2773	bool result = true;
2774
2775	switch (in_reg) {
2776	case  MC_SEQ_RAS_TIMING >> 2:
2777		*out_reg = MC_SEQ_RAS_TIMING_LP >> 2;
2778		break;
2779	case MC_SEQ_CAS_TIMING >> 2:
2780		*out_reg = MC_SEQ_CAS_TIMING_LP >> 2;
2781		break;
2782	case MC_SEQ_MISC_TIMING >> 2:
2783		*out_reg = MC_SEQ_MISC_TIMING_LP >> 2;
2784		break;
2785	case MC_SEQ_MISC_TIMING2 >> 2:
2786		*out_reg = MC_SEQ_MISC_TIMING2_LP >> 2;
2787		break;
2788	case MC_SEQ_RD_CTL_D0 >> 2:
2789		*out_reg = MC_SEQ_RD_CTL_D0_LP >> 2;
2790		break;
2791	case MC_SEQ_RD_CTL_D1 >> 2:
2792		*out_reg = MC_SEQ_RD_CTL_D1_LP >> 2;
2793		break;
2794	case MC_SEQ_WR_CTL_D0 >> 2:
2795		*out_reg = MC_SEQ_WR_CTL_D0_LP >> 2;
2796		break;
2797	case MC_SEQ_WR_CTL_D1 >> 2:
2798		*out_reg = MC_SEQ_WR_CTL_D1_LP >> 2;
2799		break;
2800	case MC_PMG_CMD_EMRS >> 2:
2801		*out_reg = MC_SEQ_PMG_CMD_EMRS_LP >> 2;
2802		break;
2803	case MC_PMG_CMD_MRS >> 2:
2804		*out_reg = MC_SEQ_PMG_CMD_MRS_LP >> 2;
2805		break;
2806	case MC_PMG_CMD_MRS1 >> 2:
2807		*out_reg = MC_SEQ_PMG_CMD_MRS1_LP >> 2;
2808		break;
2809	case MC_SEQ_PMG_TIMING >> 2:
2810		*out_reg = MC_SEQ_PMG_TIMING_LP >> 2;
2811		break;
2812	case MC_PMG_CMD_MRS2 >> 2:
2813		*out_reg = MC_SEQ_PMG_CMD_MRS2_LP >> 2;
2814		break;
2815	default:
2816		result = false;
2817		break;
2818	}
2819
2820	return result;
2821}
2822
2823static void ni_set_valid_flag(struct ni_mc_reg_table *table)
2824{
2825	u8 i, j;
2826
2827	for (i = 0; i < table->last; i++) {
2828		for (j = 1; j < table->num_entries; j++) {
2829			if (table->mc_reg_table_entry[j-1].mc_data[i] != table->mc_reg_table_entry[j].mc_data[i]) {
2830				table->valid_flag |= 1 << i;
2831				break;
2832			}
2833		}
2834	}
2835}
2836
2837static void ni_set_s0_mc_reg_index(struct ni_mc_reg_table *table)
2838{
2839	u32 i;
2840	u16 address;
2841
2842	for (i = 0; i < table->last; i++)
2843		table->mc_reg_address[i].s0 =
2844			ni_check_s0_mc_reg_index(table->mc_reg_address[i].s1, &address) ?
2845			address : table->mc_reg_address[i].s1;
2846}
2847
2848static int ni_copy_vbios_mc_reg_table(struct atom_mc_reg_table *table,
2849				      struct ni_mc_reg_table *ni_table)
2850{
2851	u8 i, j;
2852
2853	if (table->last > SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE)
2854		return -EINVAL;
2855	if (table->num_entries > MAX_AC_TIMING_ENTRIES)
2856		return -EINVAL;
2857
2858	for (i = 0; i < table->last; i++)
2859		ni_table->mc_reg_address[i].s1 = table->mc_reg_address[i].s1;
2860	ni_table->last = table->last;
2861
2862	for (i = 0; i < table->num_entries; i++) {
2863		ni_table->mc_reg_table_entry[i].mclk_max =
2864			table->mc_reg_table_entry[i].mclk_max;
2865		for (j = 0; j < table->last; j++)
2866			ni_table->mc_reg_table_entry[i].mc_data[j] =
2867				table->mc_reg_table_entry[i].mc_data[j];
2868	}
2869	ni_table->num_entries = table->num_entries;
2870
2871	return 0;
2872}
2873
2874static int ni_initialize_mc_reg_table(struct radeon_device *rdev)
2875{
2876	struct ni_power_info *ni_pi = ni_get_pi(rdev);
2877	int ret;
2878	struct atom_mc_reg_table *table;
2879	struct ni_mc_reg_table *ni_table = &ni_pi->mc_reg_table;
2880	u8 module_index = rv770_get_memory_module_index(rdev);
2881
2882	table = kzalloc(sizeof(struct atom_mc_reg_table), GFP_KERNEL);
2883	if (!table)
2884		return -ENOMEM;
2885
2886	WREG32(MC_SEQ_RAS_TIMING_LP, RREG32(MC_SEQ_RAS_TIMING));
2887	WREG32(MC_SEQ_CAS_TIMING_LP, RREG32(MC_SEQ_CAS_TIMING));
2888	WREG32(MC_SEQ_MISC_TIMING_LP, RREG32(MC_SEQ_MISC_TIMING));
2889	WREG32(MC_SEQ_MISC_TIMING2_LP, RREG32(MC_SEQ_MISC_TIMING2));
2890	WREG32(MC_SEQ_PMG_CMD_EMRS_LP, RREG32(MC_PMG_CMD_EMRS));
2891	WREG32(MC_SEQ_PMG_CMD_MRS_LP, RREG32(MC_PMG_CMD_MRS));
2892	WREG32(MC_SEQ_PMG_CMD_MRS1_LP, RREG32(MC_PMG_CMD_MRS1));
2893	WREG32(MC_SEQ_WR_CTL_D0_LP, RREG32(MC_SEQ_WR_CTL_D0));
2894	WREG32(MC_SEQ_WR_CTL_D1_LP, RREG32(MC_SEQ_WR_CTL_D1));
2895	WREG32(MC_SEQ_RD_CTL_D0_LP, RREG32(MC_SEQ_RD_CTL_D0));
2896	WREG32(MC_SEQ_RD_CTL_D1_LP, RREG32(MC_SEQ_RD_CTL_D1));
2897	WREG32(MC_SEQ_PMG_TIMING_LP, RREG32(MC_SEQ_PMG_TIMING));
2898	WREG32(MC_SEQ_PMG_CMD_MRS2_LP, RREG32(MC_PMG_CMD_MRS2));
2899
2900	ret = radeon_atom_init_mc_reg_table(rdev, module_index, table);
2901
2902	if (ret)
2903		goto init_mc_done;
2904
2905	ret = ni_copy_vbios_mc_reg_table(table, ni_table);
2906
2907	if (ret)
2908		goto init_mc_done;
2909
2910	ni_set_s0_mc_reg_index(ni_table);
2911
2912	ret = ni_set_mc_special_registers(rdev, ni_table);
2913
2914	if (ret)
2915		goto init_mc_done;
2916
2917	ni_set_valid_flag(ni_table);
2918
2919init_mc_done:
2920	kfree(table);
2921
2922	return ret;
2923}
2924
2925static void ni_populate_mc_reg_addresses(struct radeon_device *rdev,
2926					 SMC_NIslands_MCRegisters *mc_reg_table)
2927{
2928	struct ni_power_info *ni_pi = ni_get_pi(rdev);
2929	u32 i, j;
2930
2931	for (i = 0, j = 0; j < ni_pi->mc_reg_table.last; j++) {
2932		if (ni_pi->mc_reg_table.valid_flag & (1 << j)) {
2933			if (i >= SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE)
2934				break;
2935			mc_reg_table->address[i].s0 =
2936				cpu_to_be16(ni_pi->mc_reg_table.mc_reg_address[j].s0);
2937			mc_reg_table->address[i].s1 =
2938				cpu_to_be16(ni_pi->mc_reg_table.mc_reg_address[j].s1);
2939			i++;
2940		}
2941	}
2942	mc_reg_table->last = (u8)i;
2943}
2944
2945
2946static void ni_convert_mc_registers(struct ni_mc_reg_entry *entry,
2947				    SMC_NIslands_MCRegisterSet *data,
2948				    u32 num_entries, u32 valid_flag)
2949{
2950	u32 i, j;
2951
2952	for (i = 0, j = 0; j < num_entries; j++) {
2953		if (valid_flag & (1 << j)) {
2954			data->value[i] = cpu_to_be32(entry->mc_data[j]);
2955			i++;
2956		}
2957	}
2958}
2959
2960static void ni_convert_mc_reg_table_entry_to_smc(struct radeon_device *rdev,
2961						 struct rv7xx_pl *pl,
2962						 SMC_NIslands_MCRegisterSet *mc_reg_table_data)
2963{
2964	struct ni_power_info *ni_pi = ni_get_pi(rdev);
2965	u32 i = 0;
2966
2967	for (i = 0; i < ni_pi->mc_reg_table.num_entries; i++) {
2968		if (pl->mclk <= ni_pi->mc_reg_table.mc_reg_table_entry[i].mclk_max)
2969			break;
2970	}
2971
2972	if ((i == ni_pi->mc_reg_table.num_entries) && (i > 0))
2973		--i;
2974
2975	ni_convert_mc_registers(&ni_pi->mc_reg_table.mc_reg_table_entry[i],
2976				mc_reg_table_data,
2977				ni_pi->mc_reg_table.last,
2978				ni_pi->mc_reg_table.valid_flag);
2979}
2980
2981static void ni_convert_mc_reg_table_to_smc(struct radeon_device *rdev,
2982					   struct radeon_ps *radeon_state,
2983					   SMC_NIslands_MCRegisters *mc_reg_table)
2984{
2985	struct ni_ps *state = ni_get_ps(radeon_state);
2986	int i;
2987
2988	for (i = 0; i < state->performance_level_count; i++) {
2989		ni_convert_mc_reg_table_entry_to_smc(rdev,
2990						     &state->performance_levels[i],
2991						     &mc_reg_table->data[NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT + i]);
2992	}
2993}
2994
2995static int ni_populate_mc_reg_table(struct radeon_device *rdev,
2996				    struct radeon_ps *radeon_boot_state)
2997{
2998	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
2999	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3000	struct ni_power_info *ni_pi = ni_get_pi(rdev);
3001	struct ni_ps *boot_state = ni_get_ps(radeon_boot_state);
3002	SMC_NIslands_MCRegisters *mc_reg_table = &ni_pi->smc_mc_reg_table;
3003
3004	memset(mc_reg_table, 0, sizeof(SMC_NIslands_MCRegisters));
3005
3006	rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_seq_index, 1);
3007
3008	ni_populate_mc_reg_addresses(rdev, mc_reg_table);
3009
3010	ni_convert_mc_reg_table_entry_to_smc(rdev, &boot_state->performance_levels[0],
3011					     &mc_reg_table->data[0]);
3012
3013	ni_convert_mc_registers(&ni_pi->mc_reg_table.mc_reg_table_entry[0],
3014				&mc_reg_table->data[1],
3015				ni_pi->mc_reg_table.last,
3016				ni_pi->mc_reg_table.valid_flag);
3017
3018	ni_convert_mc_reg_table_to_smc(rdev, radeon_boot_state, mc_reg_table);
3019
3020	return rv770_copy_bytes_to_smc(rdev, eg_pi->mc_reg_table_start,
3021				       (u8 *)mc_reg_table,
3022				       sizeof(SMC_NIslands_MCRegisters),
3023				       pi->sram_end);
3024}
3025
3026static int ni_upload_mc_reg_table(struct radeon_device *rdev,
3027				  struct radeon_ps *radeon_new_state)
3028{
3029	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3030	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3031	struct ni_power_info *ni_pi = ni_get_pi(rdev);
3032	struct ni_ps *ni_new_state = ni_get_ps(radeon_new_state);
3033	SMC_NIslands_MCRegisters *mc_reg_table = &ni_pi->smc_mc_reg_table;
3034	u16 address;
3035
3036	memset(mc_reg_table, 0, sizeof(SMC_NIslands_MCRegisters));
3037
3038	ni_convert_mc_reg_table_to_smc(rdev, radeon_new_state, mc_reg_table);
3039
3040	address = eg_pi->mc_reg_table_start +
3041		(u16)offsetof(SMC_NIslands_MCRegisters, data[NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT]);
3042
3043	return rv770_copy_bytes_to_smc(rdev, address,
3044				       (u8 *)&mc_reg_table->data[NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT],
3045				       sizeof(SMC_NIslands_MCRegisterSet) * ni_new_state->performance_level_count,
3046				       pi->sram_end);
3047}
3048
3049static int ni_init_driver_calculated_leakage_table(struct radeon_device *rdev,
3050						   PP_NIslands_CACTABLES *cac_tables)
3051{
3052	struct ni_power_info *ni_pi = ni_get_pi(rdev);
3053	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3054	u32 leakage = 0;
3055	unsigned int i, j, table_size;
3056	s32 t;
3057	u32 smc_leakage, max_leakage = 0;
3058	u32 scaling_factor;
3059
3060	table_size = eg_pi->vddc_voltage_table.count;
3061
3062	if (SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES < table_size)
3063		table_size = SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES;
3064
3065	scaling_factor = ni_get_smc_power_scaling_factor(rdev);
3066
3067	for (i = 0; i < SMC_NISLANDS_LKGE_LUT_NUM_OF_TEMP_ENTRIES; i++) {
3068		for (j = 0; j < table_size; j++) {
3069			t = (1000 * ((i + 1) * 8));
3070
3071			if (t < ni_pi->cac_data.leakage_minimum_temperature)
3072				t = ni_pi->cac_data.leakage_minimum_temperature;
3073
3074			ni_calculate_leakage_for_v_and_t(rdev,
3075							 &ni_pi->cac_data.leakage_coefficients,
3076							 eg_pi->vddc_voltage_table.entries[j].value,
3077							 t,
3078							 ni_pi->cac_data.i_leakage,
3079							 &leakage);
3080
3081			smc_leakage = ni_scale_power_for_smc(leakage, scaling_factor) / 1000;
3082			if (smc_leakage > max_leakage)
3083				max_leakage = smc_leakage;
3084
3085			cac_tables->cac_lkge_lut[i][j] = cpu_to_be32(smc_leakage);
3086		}
3087	}
3088
3089	for (j = table_size; j < SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES; j++) {
3090		for (i = 0; i < SMC_NISLANDS_LKGE_LUT_NUM_OF_TEMP_ENTRIES; i++)
3091			cac_tables->cac_lkge_lut[i][j] = cpu_to_be32(max_leakage);
3092	}
3093	return 0;
3094}
3095
3096static int ni_init_simplified_leakage_table(struct radeon_device *rdev,
3097					    PP_NIslands_CACTABLES *cac_tables)
3098{
3099	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3100	struct radeon_cac_leakage_table *leakage_table =
3101		&rdev->pm.dpm.dyn_state.cac_leakage_table;
3102	u32 i, j, table_size;
3103	u32 smc_leakage, max_leakage = 0;
3104	u32 scaling_factor;
3105
3106	table_size = leakage_table->count;
3107
3108	if (eg_pi->vddc_voltage_table.count != table_size)
3109		table_size = (eg_pi->vddc_voltage_table.count < leakage_table->count) ?
3110			eg_pi->vddc_voltage_table.count : leakage_table->count;
3111
3112	if (SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES < table_size)
3113		table_size = SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES;
3114
3115	if (table_size == 0)
3116		return -EINVAL;
3117
3118	scaling_factor = ni_get_smc_power_scaling_factor(rdev);
3119
3120	for (j = 0; j < table_size; j++) {
3121		smc_leakage = leakage_table->entries[j].leakage;
3122
3123		if (smc_leakage > max_leakage)
3124			max_leakage = smc_leakage;
3125
3126		for (i = 0; i < SMC_NISLANDS_LKGE_LUT_NUM_OF_TEMP_ENTRIES; i++)
3127			cac_tables->cac_lkge_lut[i][j] =
3128				cpu_to_be32(ni_scale_power_for_smc(smc_leakage, scaling_factor));
3129	}
3130
3131	for (j = table_size; j < SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES; j++) {
3132		for (i = 0; i < SMC_NISLANDS_LKGE_LUT_NUM_OF_TEMP_ENTRIES; i++)
3133			cac_tables->cac_lkge_lut[i][j] =
3134				cpu_to_be32(ni_scale_power_for_smc(max_leakage, scaling_factor));
3135	}
3136	return 0;
3137}
3138
3139static int ni_initialize_smc_cac_tables(struct radeon_device *rdev)
3140{
3141	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3142	struct ni_power_info *ni_pi = ni_get_pi(rdev);
3143	PP_NIslands_CACTABLES *cac_tables = NULL;
3144	int i, ret;
3145	u32 reg;
3146
3147	if (ni_pi->enable_cac == false)
3148		return 0;
3149
3150	cac_tables = kzalloc(sizeof(PP_NIslands_CACTABLES), GFP_KERNEL);
3151	if (!cac_tables)
3152		return -ENOMEM;
3153
3154	reg = RREG32(CG_CAC_CTRL) & ~(TID_CNT_MASK | TID_UNIT_MASK);
3155	reg |= (TID_CNT(ni_pi->cac_weights->tid_cnt) |
3156		TID_UNIT(ni_pi->cac_weights->tid_unit));
3157	WREG32(CG_CAC_CTRL, reg);
3158
3159	for (i = 0; i < NISLANDS_DCCAC_MAX_LEVELS; i++)
3160		ni_pi->dc_cac_table[i] = ni_pi->cac_weights->dc_cac[i];
3161
3162	for (i = 0; i < SMC_NISLANDS_BIF_LUT_NUM_OF_ENTRIES; i++)
3163		cac_tables->cac_bif_lut[i] = ni_pi->cac_weights->pcie_cac[i];
3164
3165	ni_pi->cac_data.i_leakage = rdev->pm.dpm.cac_leakage;
3166	ni_pi->cac_data.pwr_const = 0;
3167	ni_pi->cac_data.dc_cac_value = ni_pi->dc_cac_table[NISLANDS_DCCAC_LEVEL_0];
3168	ni_pi->cac_data.bif_cac_value = 0;
3169	ni_pi->cac_data.mc_wr_weight = ni_pi->cac_weights->mc_write_weight;
3170	ni_pi->cac_data.mc_rd_weight = ni_pi->cac_weights->mc_read_weight;
3171	ni_pi->cac_data.allow_ovrflw = 0;
3172	ni_pi->cac_data.l2num_win_tdp = ni_pi->lta_window_size;
3173	ni_pi->cac_data.num_win_tdp = 0;
3174	ni_pi->cac_data.lts_truncate_n = ni_pi->lts_truncate;
3175
3176	if (ni_pi->driver_calculate_cac_leakage)
3177		ret = ni_init_driver_calculated_leakage_table(rdev, cac_tables);
3178	else
3179		ret = ni_init_simplified_leakage_table(rdev, cac_tables);
3180
3181	if (ret)
3182		goto done_free;
3183
3184	cac_tables->pwr_const      = cpu_to_be32(ni_pi->cac_data.pwr_const);
3185	cac_tables->dc_cacValue    = cpu_to_be32(ni_pi->cac_data.dc_cac_value);
3186	cac_tables->bif_cacValue   = cpu_to_be32(ni_pi->cac_data.bif_cac_value);
3187	cac_tables->AllowOvrflw    = ni_pi->cac_data.allow_ovrflw;
3188	cac_tables->MCWrWeight     = ni_pi->cac_data.mc_wr_weight;
3189	cac_tables->MCRdWeight     = ni_pi->cac_data.mc_rd_weight;
3190	cac_tables->numWin_TDP     = ni_pi->cac_data.num_win_tdp;
3191	cac_tables->l2numWin_TDP   = ni_pi->cac_data.l2num_win_tdp;
3192	cac_tables->lts_truncate_n = ni_pi->cac_data.lts_truncate_n;
3193
3194	ret = rv770_copy_bytes_to_smc(rdev, ni_pi->cac_table_start, (u8 *)cac_tables,
3195				      sizeof(PP_NIslands_CACTABLES), pi->sram_end);
3196
3197done_free:
3198	if (ret) {
3199		ni_pi->enable_cac = false;
3200		ni_pi->enable_power_containment = false;
3201	}
3202
3203	kfree(cac_tables);
3204
3205	return 0;
3206}
3207
3208static int ni_initialize_hardware_cac_manager(struct radeon_device *rdev)
3209{
3210	struct ni_power_info *ni_pi = ni_get_pi(rdev);
3211	u32 reg;
3212
3213	if (!ni_pi->enable_cac ||
3214	    !ni_pi->cac_configuration_required)
3215		return 0;
3216
3217	if (ni_pi->cac_weights == NULL)
3218		return -EINVAL;
3219
3220	reg = RREG32_CG(CG_CAC_REGION_1_WEIGHT_0) & ~(WEIGHT_TCP_SIG0_MASK |
3221						      WEIGHT_TCP_SIG1_MASK |
3222						      WEIGHT_TA_SIG_MASK);
3223	reg |= (WEIGHT_TCP_SIG0(ni_pi->cac_weights->weight_tcp_sig0) |
3224		WEIGHT_TCP_SIG1(ni_pi->cac_weights->weight_tcp_sig1) |
3225		WEIGHT_TA_SIG(ni_pi->cac_weights->weight_ta_sig));
3226	WREG32_CG(CG_CAC_REGION_1_WEIGHT_0, reg);
3227
3228	reg = RREG32_CG(CG_CAC_REGION_1_WEIGHT_1) & ~(WEIGHT_TCC_EN0_MASK |
3229						      WEIGHT_TCC_EN1_MASK |
3230						      WEIGHT_TCC_EN2_MASK);
3231	reg |= (WEIGHT_TCC_EN0(ni_pi->cac_weights->weight_tcc_en0) |
3232		WEIGHT_TCC_EN1(ni_pi->cac_weights->weight_tcc_en1) |
3233		WEIGHT_TCC_EN2(ni_pi->cac_weights->weight_tcc_en2));
3234	WREG32_CG(CG_CAC_REGION_1_WEIGHT_1, reg);
3235
3236	reg = RREG32_CG(CG_CAC_REGION_2_WEIGHT_0) & ~(WEIGHT_CB_EN0_MASK |
3237						      WEIGHT_CB_EN1_MASK |
3238						      WEIGHT_CB_EN2_MASK |
3239						      WEIGHT_CB_EN3_MASK);
3240	reg |= (WEIGHT_CB_EN0(ni_pi->cac_weights->weight_cb_en0) |
3241		WEIGHT_CB_EN1(ni_pi->cac_weights->weight_cb_en1) |
3242		WEIGHT_CB_EN2(ni_pi->cac_weights->weight_cb_en2) |
3243		WEIGHT_CB_EN3(ni_pi->cac_weights->weight_cb_en3));
3244	WREG32_CG(CG_CAC_REGION_2_WEIGHT_0, reg);
3245
3246	reg = RREG32_CG(CG_CAC_REGION_2_WEIGHT_1) & ~(WEIGHT_DB_SIG0_MASK |
3247						      WEIGHT_DB_SIG1_MASK |
3248						      WEIGHT_DB_SIG2_MASK |
3249						      WEIGHT_DB_SIG3_MASK);
3250	reg |= (WEIGHT_DB_SIG0(ni_pi->cac_weights->weight_db_sig0) |
3251		WEIGHT_DB_SIG1(ni_pi->cac_weights->weight_db_sig1) |
3252		WEIGHT_DB_SIG2(ni_pi->cac_weights->weight_db_sig2) |
3253		WEIGHT_DB_SIG3(ni_pi->cac_weights->weight_db_sig3));
3254	WREG32_CG(CG_CAC_REGION_2_WEIGHT_1, reg);
3255
3256	reg = RREG32_CG(CG_CAC_REGION_2_WEIGHT_2) & ~(WEIGHT_SXM_SIG0_MASK |
3257						      WEIGHT_SXM_SIG1_MASK |
3258						      WEIGHT_SXM_SIG2_MASK |
3259						      WEIGHT_SXS_SIG0_MASK |
3260						      WEIGHT_SXS_SIG1_MASK);
3261	reg |= (WEIGHT_SXM_SIG0(ni_pi->cac_weights->weight_sxm_sig0) |
3262		WEIGHT_SXM_SIG1(ni_pi->cac_weights->weight_sxm_sig1) |
3263		WEIGHT_SXM_SIG2(ni_pi->cac_weights->weight_sxm_sig2) |
3264		WEIGHT_SXS_SIG0(ni_pi->cac_weights->weight_sxs_sig0) |
3265		WEIGHT_SXS_SIG1(ni_pi->cac_weights->weight_sxs_sig1));
3266	WREG32_CG(CG_CAC_REGION_2_WEIGHT_2, reg);
3267
3268	reg = RREG32_CG(CG_CAC_REGION_3_WEIGHT_0) & ~(WEIGHT_XBR_0_MASK |
3269						      WEIGHT_XBR_1_MASK |
3270						      WEIGHT_XBR_2_MASK |
3271						      WEIGHT_SPI_SIG0_MASK);
3272	reg |= (WEIGHT_XBR_0(ni_pi->cac_weights->weight_xbr_0) |
3273		WEIGHT_XBR_1(ni_pi->cac_weights->weight_xbr_1) |
3274		WEIGHT_XBR_2(ni_pi->cac_weights->weight_xbr_2) |
3275		WEIGHT_SPI_SIG0(ni_pi->cac_weights->weight_spi_sig0));
3276	WREG32_CG(CG_CAC_REGION_3_WEIGHT_0, reg);
3277
3278	reg = RREG32_CG(CG_CAC_REGION_3_WEIGHT_1) & ~(WEIGHT_SPI_SIG1_MASK |
3279						      WEIGHT_SPI_SIG2_MASK |
3280						      WEIGHT_SPI_SIG3_MASK |
3281						      WEIGHT_SPI_SIG4_MASK |
3282						      WEIGHT_SPI_SIG5_MASK);
3283	reg |= (WEIGHT_SPI_SIG1(ni_pi->cac_weights->weight_spi_sig1) |
3284		WEIGHT_SPI_SIG2(ni_pi->cac_weights->weight_spi_sig2) |
3285		WEIGHT_SPI_SIG3(ni_pi->cac_weights->weight_spi_sig3) |
3286		WEIGHT_SPI_SIG4(ni_pi->cac_weights->weight_spi_sig4) |
3287		WEIGHT_SPI_SIG5(ni_pi->cac_weights->weight_spi_sig5));
3288	WREG32_CG(CG_CAC_REGION_3_WEIGHT_1, reg);
3289
3290	reg = RREG32_CG(CG_CAC_REGION_4_WEIGHT_0) & ~(WEIGHT_LDS_SIG0_MASK |
3291						      WEIGHT_LDS_SIG1_MASK |
3292						      WEIGHT_SC_MASK);
3293	reg |= (WEIGHT_LDS_SIG0(ni_pi->cac_weights->weight_lds_sig0) |
3294		WEIGHT_LDS_SIG1(ni_pi->cac_weights->weight_lds_sig1) |
3295		WEIGHT_SC(ni_pi->cac_weights->weight_sc));
3296	WREG32_CG(CG_CAC_REGION_4_WEIGHT_0, reg);
3297
3298	reg = RREG32_CG(CG_CAC_REGION_4_WEIGHT_1) & ~(WEIGHT_BIF_MASK |
3299						      WEIGHT_CP_MASK |
3300						      WEIGHT_PA_SIG0_MASK |
3301						      WEIGHT_PA_SIG1_MASK |
3302						      WEIGHT_VGT_SIG0_MASK);
3303	reg |= (WEIGHT_BIF(ni_pi->cac_weights->weight_bif) |
3304		WEIGHT_CP(ni_pi->cac_weights->weight_cp) |
3305		WEIGHT_PA_SIG0(ni_pi->cac_weights->weight_pa_sig0) |
3306		WEIGHT_PA_SIG1(ni_pi->cac_weights->weight_pa_sig1) |
3307		WEIGHT_VGT_SIG0(ni_pi->cac_weights->weight_vgt_sig0));
3308	WREG32_CG(CG_CAC_REGION_4_WEIGHT_1, reg);
3309
3310	reg = RREG32_CG(CG_CAC_REGION_4_WEIGHT_2) & ~(WEIGHT_VGT_SIG1_MASK |
3311						      WEIGHT_VGT_SIG2_MASK |
3312						      WEIGHT_DC_SIG0_MASK |
3313						      WEIGHT_DC_SIG1_MASK |
3314						      WEIGHT_DC_SIG2_MASK);
3315	reg |= (WEIGHT_VGT_SIG1(ni_pi->cac_weights->weight_vgt_sig1) |
3316		WEIGHT_VGT_SIG2(ni_pi->cac_weights->weight_vgt_sig2) |
3317		WEIGHT_DC_SIG0(ni_pi->cac_weights->weight_dc_sig0) |
3318		WEIGHT_DC_SIG1(ni_pi->cac_weights->weight_dc_sig1) |
3319		WEIGHT_DC_SIG2(ni_pi->cac_weights->weight_dc_sig2));
3320	WREG32_CG(CG_CAC_REGION_4_WEIGHT_2, reg);
3321
3322	reg = RREG32_CG(CG_CAC_REGION_4_WEIGHT_3) & ~(WEIGHT_DC_SIG3_MASK |
3323						      WEIGHT_UVD_SIG0_MASK |
3324						      WEIGHT_UVD_SIG1_MASK |
3325						      WEIGHT_SPARE0_MASK |
3326						      WEIGHT_SPARE1_MASK);
3327	reg |= (WEIGHT_DC_SIG3(ni_pi->cac_weights->weight_dc_sig3) |
3328		WEIGHT_UVD_SIG0(ni_pi->cac_weights->weight_uvd_sig0) |
3329		WEIGHT_UVD_SIG1(ni_pi->cac_weights->weight_uvd_sig1) |
3330		WEIGHT_SPARE0(ni_pi->cac_weights->weight_spare0) |
3331		WEIGHT_SPARE1(ni_pi->cac_weights->weight_spare1));
3332	WREG32_CG(CG_CAC_REGION_4_WEIGHT_3, reg);
3333
3334	reg = RREG32_CG(CG_CAC_REGION_5_WEIGHT_0) & ~(WEIGHT_SQ_VSP_MASK |
3335						      WEIGHT_SQ_VSP0_MASK);
3336	reg |= (WEIGHT_SQ_VSP(ni_pi->cac_weights->weight_sq_vsp) |
3337		WEIGHT_SQ_VSP0(ni_pi->cac_weights->weight_sq_vsp0));
3338	WREG32_CG(CG_CAC_REGION_5_WEIGHT_0, reg);
3339
3340	reg = RREG32_CG(CG_CAC_REGION_5_WEIGHT_1) & ~(WEIGHT_SQ_GPR_MASK);
3341	reg |= WEIGHT_SQ_GPR(ni_pi->cac_weights->weight_sq_gpr);
3342	WREG32_CG(CG_CAC_REGION_5_WEIGHT_1, reg);
3343
3344	reg = RREG32_CG(CG_CAC_REGION_4_OVERRIDE_4) & ~(OVR_MODE_SPARE_0_MASK |
3345							OVR_VAL_SPARE_0_MASK |
3346							OVR_MODE_SPARE_1_MASK |
3347							OVR_VAL_SPARE_1_MASK);
3348	reg |= (OVR_MODE_SPARE_0(ni_pi->cac_weights->ovr_mode_spare_0) |
3349		OVR_VAL_SPARE_0(ni_pi->cac_weights->ovr_val_spare_0) |
3350		OVR_MODE_SPARE_1(ni_pi->cac_weights->ovr_mode_spare_1) |
3351		OVR_VAL_SPARE_1(ni_pi->cac_weights->ovr_val_spare_1));
3352	WREG32_CG(CG_CAC_REGION_4_OVERRIDE_4, reg);
3353
3354	reg = RREG32(SQ_CAC_THRESHOLD) & ~(VSP_MASK |
3355					   VSP0_MASK |
3356					   GPR_MASK);
3357	reg |= (VSP(ni_pi->cac_weights->vsp) |
3358		VSP0(ni_pi->cac_weights->vsp0) |
3359		GPR(ni_pi->cac_weights->gpr));
3360	WREG32(SQ_CAC_THRESHOLD, reg);
3361
3362	reg = (MCDW_WR_ENABLE |
3363	       MCDX_WR_ENABLE |
3364	       MCDY_WR_ENABLE |
3365	       MCDZ_WR_ENABLE |
3366	       INDEX(0x09D4));
3367	WREG32(MC_CG_CONFIG, reg);
3368
3369	reg = (READ_WEIGHT(ni_pi->cac_weights->mc_read_weight) |
3370	       WRITE_WEIGHT(ni_pi->cac_weights->mc_write_weight) |
3371	       ALLOW_OVERFLOW);
3372	WREG32(MC_CG_DATAPORT, reg);
3373
3374	return 0;
3375}
3376
3377static int ni_enable_smc_cac(struct radeon_device *rdev,
3378			     struct radeon_ps *radeon_new_state,
3379			     bool enable)
3380{
3381	struct ni_power_info *ni_pi = ni_get_pi(rdev);
3382	int ret = 0;
3383	PPSMC_Result smc_result;
3384
3385	if (ni_pi->enable_cac) {
3386		if (enable) {
3387			if (!r600_is_uvd_state(radeon_new_state->class, radeon_new_state->class2)) {
3388				smc_result = rv770_send_msg_to_smc(rdev, PPSMC_MSG_CollectCAC_PowerCorreln);
3389
3390				if (ni_pi->support_cac_long_term_average) {
3391					smc_result = rv770_send_msg_to_smc(rdev, PPSMC_CACLongTermAvgEnable);
3392					if (PPSMC_Result_OK != smc_result)
3393						ni_pi->support_cac_long_term_average = false;
3394				}
3395
3396				smc_result = rv770_send_msg_to_smc(rdev, PPSMC_MSG_EnableCac);
3397				if (PPSMC_Result_OK != smc_result)
3398					ret = -EINVAL;
3399
3400				ni_pi->cac_enabled = (PPSMC_Result_OK == smc_result) ? true : false;
3401			}
3402		} else if (ni_pi->cac_enabled) {
3403			smc_result = rv770_send_msg_to_smc(rdev, PPSMC_MSG_DisableCac);
3404
3405			ni_pi->cac_enabled = false;
3406
3407			if (ni_pi->support_cac_long_term_average) {
3408				smc_result = rv770_send_msg_to_smc(rdev, PPSMC_CACLongTermAvgDisable);
3409				if (PPSMC_Result_OK != smc_result)
3410					ni_pi->support_cac_long_term_average = false;
3411			}
3412		}
3413	}
3414
3415	return ret;
3416}
3417
3418static int ni_pcie_performance_request(struct radeon_device *rdev,
3419				       u8 perf_req, bool advertise)
3420{
3421#if defined(CONFIG_ACPI)
3422	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3423
3424	if ((perf_req == PCIE_PERF_REQ_PECI_GEN1) ||
3425	    (perf_req == PCIE_PERF_REQ_PECI_GEN2)) {
3426		if (eg_pi->pcie_performance_request_registered == false)
3427			radeon_acpi_pcie_notify_device_ready(rdev);
3428		eg_pi->pcie_performance_request_registered = true;
3429		return radeon_acpi_pcie_performance_request(rdev, perf_req, advertise);
3430	} else if ((perf_req == PCIE_PERF_REQ_REMOVE_REGISTRY) &&
3431		    eg_pi->pcie_performance_request_registered) {
3432		eg_pi->pcie_performance_request_registered = false;
3433		return radeon_acpi_pcie_performance_request(rdev, perf_req, advertise);
3434	}
3435#endif
3436	return 0;
3437}
3438
3439static int ni_advertise_gen2_capability(struct radeon_device *rdev)
3440{
3441	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3442	u32 tmp;
3443
3444	tmp = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL);
3445
3446	if ((tmp & LC_OTHER_SIDE_EVER_SENT_GEN2) &&
3447	    (tmp & LC_OTHER_SIDE_SUPPORTS_GEN2))
3448		pi->pcie_gen2 = true;
3449	else
3450		pi->pcie_gen2 = false;
3451
3452	if (!pi->pcie_gen2)
3453		ni_pcie_performance_request(rdev, PCIE_PERF_REQ_PECI_GEN2, true);
3454
3455	return 0;
3456}
3457
3458static void ni_enable_bif_dynamic_pcie_gen2(struct radeon_device *rdev,
3459					    bool enable)
3460{
3461	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3462	u32 tmp, bif;
3463
3464	tmp = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL);
3465
3466	if ((tmp & LC_OTHER_SIDE_EVER_SENT_GEN2) &&
3467	    (tmp & LC_OTHER_SIDE_SUPPORTS_GEN2)) {
3468		if (enable) {
3469			if (!pi->boot_in_gen2) {
3470				bif = RREG32(CG_BIF_REQ_AND_RSP) & ~CG_CLIENT_REQ_MASK;
3471				bif |= CG_CLIENT_REQ(0xd);
3472				WREG32(CG_BIF_REQ_AND_RSP, bif);
3473			}
3474			tmp &= ~LC_HW_VOLTAGE_IF_CONTROL_MASK;
3475			tmp |= LC_HW_VOLTAGE_IF_CONTROL(1);
3476			tmp |= LC_GEN2_EN_STRAP;
3477
3478			tmp |= LC_CLR_FAILED_SPD_CHANGE_CNT;
3479			WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, tmp);
3480			udelay(10);
3481			tmp &= ~LC_CLR_FAILED_SPD_CHANGE_CNT;
3482			WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, tmp);
3483		} else {
3484			if (!pi->boot_in_gen2) {
3485				bif = RREG32(CG_BIF_REQ_AND_RSP) & ~CG_CLIENT_REQ_MASK;
3486				bif |= CG_CLIENT_REQ(0xd);
3487				WREG32(CG_BIF_REQ_AND_RSP, bif);
3488
3489				tmp &= ~LC_HW_VOLTAGE_IF_CONTROL_MASK;
3490				tmp &= ~LC_GEN2_EN_STRAP;
3491			}
3492			WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, tmp);
3493		}
3494	}
3495}
3496
3497static void ni_enable_dynamic_pcie_gen2(struct radeon_device *rdev,
3498					bool enable)
3499{
3500	ni_enable_bif_dynamic_pcie_gen2(rdev, enable);
3501
3502	if (enable)
3503		WREG32_P(GENERAL_PWRMGT, ENABLE_GEN2PCIE, ~ENABLE_GEN2PCIE);
3504	else
3505		WREG32_P(GENERAL_PWRMGT, 0, ~ENABLE_GEN2PCIE);
3506}
3507
3508void ni_set_uvd_clock_before_set_eng_clock(struct radeon_device *rdev,
3509					   struct radeon_ps *new_ps,
3510					   struct radeon_ps *old_ps)
3511{
3512	struct ni_ps *new_state = ni_get_ps(new_ps);
3513	struct ni_ps *current_state = ni_get_ps(old_ps);
3514
3515	if ((new_ps->vclk == old_ps->vclk) &&
3516	    (new_ps->dclk == old_ps->dclk))
3517		return;
3518
3519	if (new_state->performance_levels[new_state->performance_level_count - 1].sclk >=
3520	    current_state->performance_levels[current_state->performance_level_count - 1].sclk)
3521		return;
3522
3523	radeon_set_uvd_clocks(rdev, new_ps->vclk, new_ps->dclk);
3524}
3525
3526void ni_set_uvd_clock_after_set_eng_clock(struct radeon_device *rdev,
3527					  struct radeon_ps *new_ps,
3528					  struct radeon_ps *old_ps)
3529{
3530	struct ni_ps *new_state = ni_get_ps(new_ps);
3531	struct ni_ps *current_state = ni_get_ps(old_ps);
3532
3533	if ((new_ps->vclk == old_ps->vclk) &&
3534	    (new_ps->dclk == old_ps->dclk))
3535		return;
3536
3537	if (new_state->performance_levels[new_state->performance_level_count - 1].sclk <
3538	    current_state->performance_levels[current_state->performance_level_count - 1].sclk)
3539		return;
3540
3541	radeon_set_uvd_clocks(rdev, new_ps->vclk, new_ps->dclk);
3542}
3543
3544void ni_dpm_setup_asic(struct radeon_device *rdev)
3545{
3546	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3547	int r;
3548
3549	r = ni_mc_load_microcode(rdev);
3550	if (r)
3551		DRM_ERROR("Failed to load MC firmware!\n");
3552	ni_read_clock_registers(rdev);
3553	btc_read_arb_registers(rdev);
3554	rv770_get_memory_type(rdev);
3555	if (eg_pi->pcie_performance_request)
3556		ni_advertise_gen2_capability(rdev);
3557	rv770_get_pcie_gen2_status(rdev);
3558	rv770_enable_acpi_pm(rdev);
3559}
3560
3561void ni_update_current_ps(struct radeon_device *rdev,
3562			  struct radeon_ps *rps)
3563{
3564	struct ni_ps *new_ps = ni_get_ps(rps);
3565	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3566	struct ni_power_info *ni_pi = ni_get_pi(rdev);
3567
3568	eg_pi->current_rps = *rps;
3569	ni_pi->current_ps = *new_ps;
3570	eg_pi->current_rps.ps_priv = &ni_pi->current_ps;
3571}
3572
3573void ni_update_requested_ps(struct radeon_device *rdev,
3574			    struct radeon_ps *rps)
3575{
3576	struct ni_ps *new_ps = ni_get_ps(rps);
3577	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3578	struct ni_power_info *ni_pi = ni_get_pi(rdev);
3579
3580	eg_pi->requested_rps = *rps;
3581	ni_pi->requested_ps = *new_ps;
3582	eg_pi->requested_rps.ps_priv = &ni_pi->requested_ps;
3583}
3584
3585int ni_dpm_enable(struct radeon_device *rdev)
3586{
3587	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3588	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3589	struct radeon_ps *boot_ps = rdev->pm.dpm.boot_ps;
3590	int ret;
3591
3592	if (pi->gfx_clock_gating)
3593		ni_cg_clockgating_default(rdev);
3594	if (btc_dpm_enabled(rdev))
3595		return -EINVAL;
3596	if (pi->mg_clock_gating)
3597		ni_mg_clockgating_default(rdev);
3598	if (eg_pi->ls_clock_gating)
3599		ni_ls_clockgating_default(rdev);
3600	if (pi->voltage_control) {
3601		rv770_enable_voltage_control(rdev, true);
3602		ret = cypress_construct_voltage_tables(rdev);
3603		if (ret) {
3604			DRM_ERROR("cypress_construct_voltage_tables failed\n");
3605			return ret;
3606		}
3607	}
3608	if (eg_pi->dynamic_ac_timing) {
3609		ret = ni_initialize_mc_reg_table(rdev);
3610		if (ret)
3611			eg_pi->dynamic_ac_timing = false;
3612	}
3613	if (pi->dynamic_ss)
3614		cypress_enable_spread_spectrum(rdev, true);
3615	if (pi->thermal_protection)
3616		rv770_enable_thermal_protection(rdev, true);
3617	rv770_setup_bsp(rdev);
3618	rv770_program_git(rdev);
3619	rv770_program_tp(rdev);
3620	rv770_program_tpp(rdev);
3621	rv770_program_sstp(rdev);
3622	cypress_enable_display_gap(rdev);
3623	rv770_program_vc(rdev);
3624	if (pi->dynamic_pcie_gen2)
3625		ni_enable_dynamic_pcie_gen2(rdev, true);
3626	ret = rv770_upload_firmware(rdev);
3627	if (ret) {
3628		DRM_ERROR("rv770_upload_firmware failed\n");
3629		return ret;
3630	}
3631	ret = ni_process_firmware_header(rdev);
3632	if (ret) {
3633		DRM_ERROR("ni_process_firmware_header failed\n");
3634		return ret;
3635	}
3636	ret = ni_initial_switch_from_arb_f0_to_f1(rdev);
3637	if (ret) {
3638		DRM_ERROR("ni_initial_switch_from_arb_f0_to_f1 failed\n");
3639		return ret;
3640	}
3641	ret = ni_init_smc_table(rdev);
3642	if (ret) {
3643		DRM_ERROR("ni_init_smc_table failed\n");
3644		return ret;
3645	}
3646	ret = ni_init_smc_spll_table(rdev);
3647	if (ret) {
3648		DRM_ERROR("ni_init_smc_spll_table failed\n");
3649		return ret;
3650	}
3651	ret = ni_init_arb_table_index(rdev);
3652	if (ret) {
3653		DRM_ERROR("ni_init_arb_table_index failed\n");
3654		return ret;
3655	}
3656	if (eg_pi->dynamic_ac_timing) {
3657		ret = ni_populate_mc_reg_table(rdev, boot_ps);
3658		if (ret) {
3659			DRM_ERROR("ni_populate_mc_reg_table failed\n");
3660			return ret;
3661		}
3662	}
3663	ret = ni_initialize_smc_cac_tables(rdev);
3664	if (ret) {
3665		DRM_ERROR("ni_initialize_smc_cac_tables failed\n");
3666		return ret;
3667	}
3668	ret = ni_initialize_hardware_cac_manager(rdev);
3669	if (ret) {
3670		DRM_ERROR("ni_initialize_hardware_cac_manager failed\n");
3671		return ret;
3672	}
3673	ret = ni_populate_smc_tdp_limits(rdev, boot_ps);
3674	if (ret) {
3675		DRM_ERROR("ni_populate_smc_tdp_limits failed\n");
3676		return ret;
3677	}
3678	ni_program_response_times(rdev);
3679	r7xx_start_smc(rdev);
3680	ret = cypress_notify_smc_display_change(rdev, false);
3681	if (ret) {
3682		DRM_ERROR("cypress_notify_smc_display_change failed\n");
3683		return ret;
3684	}
3685	cypress_enable_sclk_control(rdev, true);
3686	if (eg_pi->memory_transition)
3687		cypress_enable_mclk_control(rdev, true);
3688	cypress_start_dpm(rdev);
3689	if (pi->gfx_clock_gating)
3690		ni_gfx_clockgating_enable(rdev, true);
3691	if (pi->mg_clock_gating)
3692		ni_mg_clockgating_enable(rdev, true);
3693	if (eg_pi->ls_clock_gating)
3694		ni_ls_clockgating_enable(rdev, true);
3695
3696	rv770_enable_auto_throttle_source(rdev, RADEON_DPM_AUTO_THROTTLE_SRC_THERMAL, true);
3697
3698	ni_update_current_ps(rdev, boot_ps);
3699
3700	return 0;
3701}
3702
3703void ni_dpm_disable(struct radeon_device *rdev)
3704{
3705	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3706	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3707	struct radeon_ps *boot_ps = rdev->pm.dpm.boot_ps;
3708
3709	if (!btc_dpm_enabled(rdev))
3710		return;
3711	rv770_clear_vc(rdev);
3712	if (pi->thermal_protection)
3713		rv770_enable_thermal_protection(rdev, false);
3714	ni_enable_power_containment(rdev, boot_ps, false);
3715	ni_enable_smc_cac(rdev, boot_ps, false);
3716	cypress_enable_spread_spectrum(rdev, false);
3717	rv770_enable_auto_throttle_source(rdev, RADEON_DPM_AUTO_THROTTLE_SRC_THERMAL, false);
3718	if (pi->dynamic_pcie_gen2)
3719		ni_enable_dynamic_pcie_gen2(rdev, false);
3720
3721	if (rdev->irq.installed &&
3722	    r600_is_internal_thermal_sensor(rdev->pm.int_thermal_type)) {
3723		rdev->irq.dpm_thermal = false;
3724		radeon_irq_set(rdev);
3725	}
3726
3727	if (pi->gfx_clock_gating)
3728		ni_gfx_clockgating_enable(rdev, false);
3729	if (pi->mg_clock_gating)
3730		ni_mg_clockgating_enable(rdev, false);
3731	if (eg_pi->ls_clock_gating)
3732		ni_ls_clockgating_enable(rdev, false);
3733	ni_stop_dpm(rdev);
3734	btc_reset_to_default(rdev);
3735	ni_stop_smc(rdev);
3736	ni_force_switch_to_arb_f0(rdev);
3737
3738	ni_update_current_ps(rdev, boot_ps);
3739}
3740
3741static int ni_power_control_set_level(struct radeon_device *rdev)
3742{
3743	struct radeon_ps *new_ps = rdev->pm.dpm.requested_ps;
3744	int ret;
3745
3746	ret = ni_restrict_performance_levels_before_switch(rdev);
3747	if (ret)
3748		return ret;
3749	ret = rv770_halt_smc(rdev);
3750	if (ret)
3751		return ret;
3752	ret = ni_populate_smc_tdp_limits(rdev, new_ps);
3753	if (ret)
3754		return ret;
3755	ret = rv770_resume_smc(rdev);
3756	if (ret)
3757		return ret;
3758	ret = rv770_set_sw_state(rdev);
3759	if (ret)
3760		return ret;
3761
3762	return 0;
3763}
3764
3765int ni_dpm_pre_set_power_state(struct radeon_device *rdev)
3766{
3767	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3768	struct radeon_ps requested_ps = *rdev->pm.dpm.requested_ps;
3769	struct radeon_ps *new_ps = &requested_ps;
3770
3771	ni_update_requested_ps(rdev, new_ps);
3772
3773	ni_apply_state_adjust_rules(rdev, &eg_pi->requested_rps);
3774
3775	return 0;
3776}
3777
3778int ni_dpm_set_power_state(struct radeon_device *rdev)
3779{
3780	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3781	struct radeon_ps *new_ps = &eg_pi->requested_rps;
3782	struct radeon_ps *old_ps = &eg_pi->current_rps;
3783	int ret;
3784
3785	ret = ni_restrict_performance_levels_before_switch(rdev);
3786	if (ret) {
3787		DRM_ERROR("ni_restrict_performance_levels_before_switch failed\n");
3788		return ret;
3789	}
3790	ni_set_uvd_clock_before_set_eng_clock(rdev, new_ps, old_ps);
3791	ret = ni_enable_power_containment(rdev, new_ps, false);
3792	if (ret) {
3793		DRM_ERROR("ni_enable_power_containment failed\n");
3794		return ret;
3795	}
3796	ret = ni_enable_smc_cac(rdev, new_ps, false);
3797	if (ret) {
3798		DRM_ERROR("ni_enable_smc_cac failed\n");
3799		return ret;
3800	}
3801	ret = rv770_halt_smc(rdev);
3802	if (ret) {
3803		DRM_ERROR("rv770_halt_smc failed\n");
3804		return ret;
3805	}
3806	if (eg_pi->smu_uvd_hs)
3807		btc_notify_uvd_to_smc(rdev, new_ps);
3808	ret = ni_upload_sw_state(rdev, new_ps);
3809	if (ret) {
3810		DRM_ERROR("ni_upload_sw_state failed\n");
3811		return ret;
3812	}
3813	if (eg_pi->dynamic_ac_timing) {
3814		ret = ni_upload_mc_reg_table(rdev, new_ps);
3815		if (ret) {
3816			DRM_ERROR("ni_upload_mc_reg_table failed\n");
3817			return ret;
3818		}
3819	}
3820	ret = ni_program_memory_timing_parameters(rdev, new_ps);
3821	if (ret) {
3822		DRM_ERROR("ni_program_memory_timing_parameters failed\n");
3823		return ret;
3824	}
3825	ret = rv770_resume_smc(rdev);
3826	if (ret) {
3827		DRM_ERROR("rv770_resume_smc failed\n");
3828		return ret;
3829	}
3830	ret = rv770_set_sw_state(rdev);
3831	if (ret) {
3832		DRM_ERROR("rv770_set_sw_state failed\n");
3833		return ret;
3834	}
3835	ni_set_uvd_clock_after_set_eng_clock(rdev, new_ps, old_ps);
3836	ret = ni_enable_smc_cac(rdev, new_ps, true);
3837	if (ret) {
3838		DRM_ERROR("ni_enable_smc_cac failed\n");
3839		return ret;
3840	}
3841	ret = ni_enable_power_containment(rdev, new_ps, true);
3842	if (ret) {
3843		DRM_ERROR("ni_enable_power_containment failed\n");
3844		return ret;
3845	}
3846
3847	/* update tdp */
3848	ret = ni_power_control_set_level(rdev);
3849	if (ret) {
3850		DRM_ERROR("ni_power_control_set_level failed\n");
3851		return ret;
3852	}
3853
3854	return 0;
3855}
3856
3857void ni_dpm_post_set_power_state(struct radeon_device *rdev)
3858{
3859	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3860	struct radeon_ps *new_ps = &eg_pi->requested_rps;
3861
3862	ni_update_current_ps(rdev, new_ps);
3863}
3864
3865#if 0
3866void ni_dpm_reset_asic(struct radeon_device *rdev)
3867{
3868	ni_restrict_performance_levels_before_switch(rdev);
3869	rv770_set_boot_state(rdev);
3870}
3871#endif
3872
3873union power_info {
3874	struct _ATOM_POWERPLAY_INFO info;
3875	struct _ATOM_POWERPLAY_INFO_V2 info_2;
3876	struct _ATOM_POWERPLAY_INFO_V3 info_3;
3877	struct _ATOM_PPLIB_POWERPLAYTABLE pplib;
3878	struct _ATOM_PPLIB_POWERPLAYTABLE2 pplib2;
3879	struct _ATOM_PPLIB_POWERPLAYTABLE3 pplib3;
3880};
3881
3882union pplib_clock_info {
3883	struct _ATOM_PPLIB_R600_CLOCK_INFO r600;
3884	struct _ATOM_PPLIB_RS780_CLOCK_INFO rs780;
3885	struct _ATOM_PPLIB_EVERGREEN_CLOCK_INFO evergreen;
3886	struct _ATOM_PPLIB_SUMO_CLOCK_INFO sumo;
3887};
3888
3889union pplib_power_state {
3890	struct _ATOM_PPLIB_STATE v1;
3891	struct _ATOM_PPLIB_STATE_V2 v2;
3892};
3893
3894static void ni_parse_pplib_non_clock_info(struct radeon_device *rdev,
3895					  struct radeon_ps *rps,
3896					  struct _ATOM_PPLIB_NONCLOCK_INFO *non_clock_info,
3897					  u8 table_rev)
3898{
3899	rps->caps = le32_to_cpu(non_clock_info->ulCapsAndSettings);
3900	rps->class = le16_to_cpu(non_clock_info->usClassification);
3901	rps->class2 = le16_to_cpu(non_clock_info->usClassification2);
3902
3903	if (ATOM_PPLIB_NONCLOCKINFO_VER1 < table_rev) {
3904		rps->vclk = le32_to_cpu(non_clock_info->ulVCLK);
3905		rps->dclk = le32_to_cpu(non_clock_info->ulDCLK);
3906	} else if (r600_is_uvd_state(rps->class, rps->class2)) {
3907		rps->vclk = RV770_DEFAULT_VCLK_FREQ;
3908		rps->dclk = RV770_DEFAULT_DCLK_FREQ;
3909	} else {
3910		rps->vclk = 0;
3911		rps->dclk = 0;
3912	}
3913
3914	if (rps->class & ATOM_PPLIB_CLASSIFICATION_BOOT)
3915		rdev->pm.dpm.boot_ps = rps;
3916	if (rps->class & ATOM_PPLIB_CLASSIFICATION_UVDSTATE)
3917		rdev->pm.dpm.uvd_ps = rps;
3918}
3919
3920static void ni_parse_pplib_clock_info(struct radeon_device *rdev,
3921				      struct radeon_ps *rps, int index,
3922				      union pplib_clock_info *clock_info)
3923{
3924	struct rv7xx_power_info *pi = rv770_get_pi(rdev);
3925	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
3926	struct ni_ps *ps = ni_get_ps(rps);
3927	struct rv7xx_pl *pl = &ps->performance_levels[index];
3928
3929	ps->performance_level_count = index + 1;
3930
3931	pl->sclk = le16_to_cpu(clock_info->evergreen.usEngineClockLow);
3932	pl->sclk |= clock_info->evergreen.ucEngineClockHigh << 16;
3933	pl->mclk = le16_to_cpu(clock_info->evergreen.usMemoryClockLow);
3934	pl->mclk |= clock_info->evergreen.ucMemoryClockHigh << 16;
3935
3936	pl->vddc = le16_to_cpu(clock_info->evergreen.usVDDC);
3937	pl->vddci = le16_to_cpu(clock_info->evergreen.usVDDCI);
3938	pl->flags = le32_to_cpu(clock_info->evergreen.ulFlags);
3939
3940	/* patch up vddc if necessary */
3941	if (pl->vddc == 0xff01) {
3942		if (pi->max_vddc)
3943			pl->vddc = pi->max_vddc;
3944	}
3945
3946	if (rps->class & ATOM_PPLIB_CLASSIFICATION_ACPI) {
3947		pi->acpi_vddc = pl->vddc;
3948		eg_pi->acpi_vddci = pl->vddci;
3949		if (ps->performance_levels[0].flags & ATOM_PPLIB_R600_FLAGS_PCIEGEN2)
3950			pi->acpi_pcie_gen2 = true;
3951		else
3952			pi->acpi_pcie_gen2 = false;
3953	}
3954
3955	if (rps->class2 & ATOM_PPLIB_CLASSIFICATION2_ULV) {
3956		eg_pi->ulv.supported = true;
3957		eg_pi->ulv.pl = pl;
3958	}
3959
3960	if (pi->min_vddc_in_table > pl->vddc)
3961		pi->min_vddc_in_table = pl->vddc;
3962
3963	if (pi->max_vddc_in_table < pl->vddc)
3964		pi->max_vddc_in_table = pl->vddc;
3965
3966	/* patch up boot state */
3967	if (rps->class & ATOM_PPLIB_CLASSIFICATION_BOOT) {
3968		u16 vddc, vddci, mvdd;
3969		radeon_atombios_get_default_voltages(rdev, &vddc, &vddci, &mvdd);
3970		pl->mclk = rdev->clock.default_mclk;
3971		pl->sclk = rdev->clock.default_sclk;
3972		pl->vddc = vddc;
3973		pl->vddci = vddci;
3974	}
3975
3976	if ((rps->class & ATOM_PPLIB_CLASSIFICATION_UI_MASK) ==
3977	    ATOM_PPLIB_CLASSIFICATION_UI_PERFORMANCE) {
3978		rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac.sclk = pl->sclk;
3979		rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac.mclk = pl->mclk;
3980		rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac.vddc = pl->vddc;
3981		rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac.vddci = pl->vddci;
3982	}
3983}
3984
3985static int ni_parse_power_table(struct radeon_device *rdev)
3986{
3987	struct radeon_mode_info *mode_info = &rdev->mode_info;
3988	struct _ATOM_PPLIB_NONCLOCK_INFO *non_clock_info;
3989	union pplib_power_state *power_state;
3990	int i, j;
3991	union pplib_clock_info *clock_info;
3992	union power_info *power_info;
3993	int index = GetIndexIntoMasterTable(DATA, PowerPlayInfo);
3994	u16 data_offset;
3995	u8 frev, crev;
3996	struct ni_ps *ps;
3997
3998	if (!atom_parse_data_header(mode_info->atom_context, index, NULL,
3999				   &frev, &crev, &data_offset))
4000		return -EINVAL;
4001	power_info = (union power_info *)(mode_info->atom_context->bios + data_offset);
4002
4003	rdev->pm.dpm.ps = kcalloc(power_info->pplib.ucNumStates,
4004				  sizeof(struct radeon_ps),
4005				  GFP_KERNEL);
4006	if (!rdev->pm.dpm.ps)
4007		return -ENOMEM;
4008
4009	for (i = 0; i < power_info->pplib.ucNumStates; i++) {
4010		power_state = (union pplib_power_state *)
4011			(mode_info->atom_context->bios + data_offset +
4012			 le16_to_cpu(power_info->pplib.usStateArrayOffset) +
4013			 i * power_info->pplib.ucStateEntrySize);
4014		non_clock_info = (struct _ATOM_PPLIB_NONCLOCK_INFO *)
4015			(mode_info->atom_context->bios + data_offset +
4016			 le16_to_cpu(power_info->pplib.usNonClockInfoArrayOffset) +
4017			 (power_state->v1.ucNonClockStateIndex *
4018			  power_info->pplib.ucNonClockSize));
4019		if (power_info->pplib.ucStateEntrySize - 1) {
4020			u8 *idx;
4021			ps = kzalloc(sizeof(struct ni_ps), GFP_KERNEL);
4022			if (ps == NULL) {
4023				kfree(rdev->pm.dpm.ps);
4024				return -ENOMEM;
4025			}
4026			rdev->pm.dpm.ps[i].ps_priv = ps;
4027			ni_parse_pplib_non_clock_info(rdev, &rdev->pm.dpm.ps[i],
4028							 non_clock_info,
4029							 power_info->pplib.ucNonClockSize);
4030			idx = (u8 *)&power_state->v1.ucClockStateIndices[0];
4031			for (j = 0; j < (power_info->pplib.ucStateEntrySize - 1); j++) {
4032				clock_info = (union pplib_clock_info *)
4033					(mode_info->atom_context->bios + data_offset +
4034					 le16_to_cpu(power_info->pplib.usClockInfoArrayOffset) +
4035					 (idx[j] * power_info->pplib.ucClockInfoSize));
4036				ni_parse_pplib_clock_info(rdev,
4037							  &rdev->pm.dpm.ps[i], j,
4038							  clock_info);
4039			}
4040		}
4041	}
4042	rdev->pm.dpm.num_ps = power_info->pplib.ucNumStates;
4043	return 0;
4044}
4045
4046int ni_dpm_init(struct radeon_device *rdev)
4047{
4048	struct rv7xx_power_info *pi;
4049	struct evergreen_power_info *eg_pi;
4050	struct ni_power_info *ni_pi;
4051	struct atom_clock_dividers dividers;
4052	int ret;
4053
4054	ni_pi = kzalloc(sizeof(struct ni_power_info), GFP_KERNEL);
4055	if (ni_pi == NULL)
4056		return -ENOMEM;
4057	rdev->pm.dpm.priv = ni_pi;
4058	eg_pi = &ni_pi->eg;
4059	pi = &eg_pi->rv7xx;
4060
4061	rv770_get_max_vddc(rdev);
4062
4063	eg_pi->ulv.supported = false;
4064	pi->acpi_vddc = 0;
4065	eg_pi->acpi_vddci = 0;
4066	pi->min_vddc_in_table = 0;
4067	pi->max_vddc_in_table = 0;
4068
4069	ret = r600_get_platform_caps(rdev);
4070	if (ret)
4071		return ret;
4072
4073	ret = ni_parse_power_table(rdev);
4074	if (ret)
4075		return ret;
4076	ret = r600_parse_extended_power_table(rdev);
4077	if (ret)
4078		return ret;
4079
4080	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries =
4081		kcalloc(4,
4082			sizeof(struct radeon_clock_voltage_dependency_entry),
4083			GFP_KERNEL);
4084	if (!rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries) {
4085		r600_free_extended_power_table(rdev);
4086		return -ENOMEM;
4087	}
4088	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.count = 4;
4089	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[0].clk = 0;
4090	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[0].v = 0;
4091	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[1].clk = 36000;
4092	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[1].v = 720;
4093	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[2].clk = 54000;
4094	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[2].v = 810;
4095	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[3].clk = 72000;
4096	rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[3].v = 900;
4097
4098	ni_patch_dependency_tables_based_on_leakage(rdev);
4099
4100	if (rdev->pm.dpm.voltage_response_time == 0)
4101		rdev->pm.dpm.voltage_response_time = R600_VOLTAGERESPONSETIME_DFLT;
4102	if (rdev->pm.dpm.backbias_response_time == 0)
4103		rdev->pm.dpm.backbias_response_time = R600_BACKBIASRESPONSETIME_DFLT;
4104
4105	ret = radeon_atom_get_clock_dividers(rdev, COMPUTE_ENGINE_PLL_PARAM,
4106					     0, false, &dividers);
4107	if (ret)
4108		pi->ref_div = dividers.ref_div + 1;
4109	else
4110		pi->ref_div = R600_REFERENCEDIVIDER_DFLT;
4111
4112	pi->rlp = RV770_RLP_DFLT;
4113	pi->rmp = RV770_RMP_DFLT;
4114	pi->lhp = RV770_LHP_DFLT;
4115	pi->lmp = RV770_LMP_DFLT;
4116
4117	eg_pi->ats[0].rlp = RV770_RLP_DFLT;
4118	eg_pi->ats[0].rmp = RV770_RMP_DFLT;
4119	eg_pi->ats[0].lhp = RV770_LHP_DFLT;
4120	eg_pi->ats[0].lmp = RV770_LMP_DFLT;
4121
4122	eg_pi->ats[1].rlp = BTC_RLP_UVD_DFLT;
4123	eg_pi->ats[1].rmp = BTC_RMP_UVD_DFLT;
4124	eg_pi->ats[1].lhp = BTC_LHP_UVD_DFLT;
4125	eg_pi->ats[1].lmp = BTC_LMP_UVD_DFLT;
4126
4127	eg_pi->smu_uvd_hs = true;
4128
4129	if (rdev->pdev->device == 0x6707) {
4130		pi->mclk_strobe_mode_threshold = 55000;
4131		pi->mclk_edc_enable_threshold = 55000;
4132		eg_pi->mclk_edc_wr_enable_threshold = 55000;
4133	} else {
4134		pi->mclk_strobe_mode_threshold = 40000;
4135		pi->mclk_edc_enable_threshold = 40000;
4136		eg_pi->mclk_edc_wr_enable_threshold = 40000;
4137	}
4138	ni_pi->mclk_rtt_mode_threshold = eg_pi->mclk_edc_wr_enable_threshold;
4139
4140	pi->voltage_control =
4141		radeon_atom_is_voltage_gpio(rdev, SET_VOLTAGE_TYPE_ASIC_VDDC, 0);
4142
4143	pi->mvdd_control =
4144		radeon_atom_is_voltage_gpio(rdev, SET_VOLTAGE_TYPE_ASIC_MVDDC, 0);
4145
4146	eg_pi->vddci_control =
4147		radeon_atom_is_voltage_gpio(rdev, SET_VOLTAGE_TYPE_ASIC_VDDCI, 0);
4148
4149	rv770_get_engine_memory_ss(rdev);
4150
4151	pi->asi = RV770_ASI_DFLT;
4152	pi->pasi = CYPRESS_HASI_DFLT;
4153	pi->vrc = CYPRESS_VRC_DFLT;
4154
4155	pi->power_gating = false;
4156
4157	pi->gfx_clock_gating = true;
4158
4159	pi->mg_clock_gating = true;
4160	pi->mgcgtssm = true;
4161	eg_pi->ls_clock_gating = false;
4162	eg_pi->sclk_deep_sleep = false;
4163
4164	pi->dynamic_pcie_gen2 = true;
4165
4166	if (rdev->pm.int_thermal_type != THERMAL_TYPE_NONE)
4167		pi->thermal_protection = true;
4168	else
4169		pi->thermal_protection = false;
4170
4171	pi->display_gap = true;
4172
4173	pi->dcodt = true;
4174
4175	pi->ulps = true;
4176
4177	eg_pi->dynamic_ac_timing = true;
4178	eg_pi->abm = true;
4179	eg_pi->mcls = true;
4180	eg_pi->light_sleep = true;
4181	eg_pi->memory_transition = true;
4182#if defined(CONFIG_ACPI)
4183	eg_pi->pcie_performance_request =
4184		radeon_acpi_is_pcie_performance_request_supported(rdev);
4185#else
4186	eg_pi->pcie_performance_request = false;
4187#endif
4188
4189	eg_pi->dll_default_on = false;
4190
4191	eg_pi->sclk_deep_sleep = false;
4192
4193	pi->mclk_stutter_mode_threshold = 0;
4194
4195	pi->sram_end = SMC_RAM_END;
4196
4197	rdev->pm.dpm.dyn_state.mclk_sclk_ratio = 3;
4198	rdev->pm.dpm.dyn_state.vddc_vddci_delta = 200;
4199	rdev->pm.dpm.dyn_state.min_vddc_for_pcie_gen2 = 900;
4200	rdev->pm.dpm.dyn_state.valid_sclk_values.count = ARRAY_SIZE(btc_valid_sclk);
4201	rdev->pm.dpm.dyn_state.valid_sclk_values.values = btc_valid_sclk;
4202	rdev->pm.dpm.dyn_state.valid_mclk_values.count = 0;
4203	rdev->pm.dpm.dyn_state.valid_mclk_values.values = NULL;
4204	rdev->pm.dpm.dyn_state.sclk_mclk_delta = 12500;
4205
4206	ni_pi->cac_data.leakage_coefficients.at = 516;
4207	ni_pi->cac_data.leakage_coefficients.bt = 18;
4208	ni_pi->cac_data.leakage_coefficients.av = 51;
4209	ni_pi->cac_data.leakage_coefficients.bv = 2957;
4210
4211	switch (rdev->pdev->device) {
4212	case 0x6700:
4213	case 0x6701:
4214	case 0x6702:
4215	case 0x6703:
4216	case 0x6718:
4217		ni_pi->cac_weights = &cac_weights_cayman_xt;
4218		break;
4219	case 0x6705:
4220	case 0x6719:
4221	case 0x671D:
4222	case 0x671C:
4223	default:
4224		ni_pi->cac_weights = &cac_weights_cayman_pro;
4225		break;
4226	case 0x6704:
4227	case 0x6706:
4228	case 0x6707:
4229	case 0x6708:
4230	case 0x6709:
4231		ni_pi->cac_weights = &cac_weights_cayman_le;
4232		break;
4233	}
4234
4235	if (ni_pi->cac_weights->enable_power_containment_by_default) {
4236		ni_pi->enable_power_containment = true;
4237		ni_pi->enable_cac = true;
4238		ni_pi->enable_sq_ramping = true;
4239	} else {
4240		ni_pi->enable_power_containment = false;
4241		ni_pi->enable_cac = false;
4242		ni_pi->enable_sq_ramping = false;
4243	}
4244
4245	ni_pi->driver_calculate_cac_leakage = false;
4246	ni_pi->cac_configuration_required = true;
4247
4248	if (ni_pi->cac_configuration_required) {
4249		ni_pi->support_cac_long_term_average = true;
4250		ni_pi->lta_window_size = ni_pi->cac_weights->l2_lta_window_size;
4251		ni_pi->lts_truncate = ni_pi->cac_weights->lts_truncate;
4252	} else {
4253		ni_pi->support_cac_long_term_average = false;
4254		ni_pi->lta_window_size = 0;
4255		ni_pi->lts_truncate = 0;
4256	}
4257
4258	ni_pi->use_power_boost_limit = true;
4259
4260	/* make sure dc limits are valid */
4261	if ((rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc.sclk == 0) ||
4262	    (rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc.mclk == 0))
4263		rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc =
4264			rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac;
4265
4266	return 0;
4267}
4268
4269void ni_dpm_fini(struct radeon_device *rdev)
4270{
4271	int i;
4272
4273	for (i = 0; i < rdev->pm.dpm.num_ps; i++) {
4274		kfree(rdev->pm.dpm.ps[i].ps_priv);
4275	}
4276	kfree(rdev->pm.dpm.ps);
4277	kfree(rdev->pm.dpm.priv);
4278	kfree(rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries);
4279	r600_free_extended_power_table(rdev);
4280}
4281
4282void ni_dpm_print_power_state(struct radeon_device *rdev,
4283			      struct radeon_ps *rps)
4284{
4285	struct ni_ps *ps = ni_get_ps(rps);
4286	struct rv7xx_pl *pl;
4287	int i;
4288
4289	r600_dpm_print_class_info(rps->class, rps->class2);
4290	r600_dpm_print_cap_info(rps->caps);
4291	printk("\tuvd    vclk: %d dclk: %d\n", rps->vclk, rps->dclk);
4292	for (i = 0; i < ps->performance_level_count; i++) {
4293		pl = &ps->performance_levels[i];
4294		if (rdev->family >= CHIP_TAHITI)
4295			printk("\t\tpower level %d    sclk: %u mclk: %u vddc: %u vddci: %u pcie gen: %u\n",
4296			       i, pl->sclk, pl->mclk, pl->vddc, pl->vddci, pl->pcie_gen + 1);
4297		else
4298			printk("\t\tpower level %d    sclk: %u mclk: %u vddc: %u vddci: %u\n",
4299			       i, pl->sclk, pl->mclk, pl->vddc, pl->vddci);
4300	}
4301	r600_dpm_print_ps_status(rdev, rps);
4302}
4303
4304void ni_dpm_debugfs_print_current_performance_level(struct radeon_device *rdev,
4305						    struct seq_file *m)
4306{
4307	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
4308	struct radeon_ps *rps = &eg_pi->current_rps;
4309	struct ni_ps *ps = ni_get_ps(rps);
4310	struct rv7xx_pl *pl;
4311	u32 current_index =
4312		(RREG32(TARGET_AND_CURRENT_PROFILE_INDEX) & CURRENT_STATE_INDEX_MASK) >>
4313		CURRENT_STATE_INDEX_SHIFT;
4314
4315	if (current_index >= ps->performance_level_count) {
4316		seq_printf(m, "invalid dpm profile %d\n", current_index);
4317	} else {
4318		pl = &ps->performance_levels[current_index];
4319		seq_printf(m, "uvd    vclk: %d dclk: %d\n", rps->vclk, rps->dclk);
4320		seq_printf(m, "power level %d    sclk: %u mclk: %u vddc: %u vddci: %u\n",
4321			   current_index, pl->sclk, pl->mclk, pl->vddc, pl->vddci);
4322	}
4323}
4324
4325u32 ni_dpm_get_current_sclk(struct radeon_device *rdev)
4326{
4327	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
4328	struct radeon_ps *rps = &eg_pi->current_rps;
4329	struct ni_ps *ps = ni_get_ps(rps);
4330	struct rv7xx_pl *pl;
4331	u32 current_index =
4332		(RREG32(TARGET_AND_CURRENT_PROFILE_INDEX) & CURRENT_STATE_INDEX_MASK) >>
4333		CURRENT_STATE_INDEX_SHIFT;
4334
4335	if (current_index >= ps->performance_level_count) {
4336		return 0;
4337	} else {
4338		pl = &ps->performance_levels[current_index];
4339		return pl->sclk;
4340	}
4341}
4342
4343u32 ni_dpm_get_current_mclk(struct radeon_device *rdev)
4344{
4345	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
4346	struct radeon_ps *rps = &eg_pi->current_rps;
4347	struct ni_ps *ps = ni_get_ps(rps);
4348	struct rv7xx_pl *pl;
4349	u32 current_index =
4350		(RREG32(TARGET_AND_CURRENT_PROFILE_INDEX) & CURRENT_STATE_INDEX_MASK) >>
4351		CURRENT_STATE_INDEX_SHIFT;
4352
4353	if (current_index >= ps->performance_level_count) {
4354		return 0;
4355	} else {
4356		pl = &ps->performance_levels[current_index];
4357		return pl->mclk;
4358	}
4359}
4360
4361u32 ni_dpm_get_sclk(struct radeon_device *rdev, bool low)
4362{
4363	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
4364	struct ni_ps *requested_state = ni_get_ps(&eg_pi->requested_rps);
4365
4366	if (low)
4367		return requested_state->performance_levels[0].sclk;
4368	else
4369		return requested_state->performance_levels[requested_state->performance_level_count - 1].sclk;
4370}
4371
4372u32 ni_dpm_get_mclk(struct radeon_device *rdev, bool low)
4373{
4374	struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev);
4375	struct ni_ps *requested_state = ni_get_ps(&eg_pi->requested_rps);
4376
4377	if (low)
4378		return requested_state->performance_levels[0].mclk;
4379	else
4380		return requested_state->performance_levels[requested_state->performance_level_count - 1].mclk;
4381}
4382
4383