1 /* 2 * Copyright 2012 Advanced Micro Devices, Inc. 3 * 4 * Permission is hereby granted, free of charge, to any person obtaining a 5 * copy of this software and associated documentation files (the "Software"), 6 * to deal in the Software without restriction, including without limitation 7 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8 * and/or sell copies of the Software, and to permit persons to whom the 9 * Software is furnished to do so, subject to the following conditions: 10 * 11 * The above copyright notice and this permission notice shall be included in 12 * all copies or substantial portions of the Software. 13 * 14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 20 * OTHER DEALINGS IN THE SOFTWARE. 21 * 22 */ 23 24 #include <linux/math64.h> 25 #include <linux/seq_file.h> 26 27 #include <drm/drm_pci.h> 28 29 #include "atom.h" 30 #include "ni_dpm.h" 31 #include "nid.h" 32 #include "r600_dpm.h" 33 #include "radeon.h" 34 #include "radeon_asic.h" 35 36 #define MC_CG_ARB_FREQ_F0 0x0a 37 #define MC_CG_ARB_FREQ_F1 0x0b 38 #define MC_CG_ARB_FREQ_F2 0x0c 39 #define MC_CG_ARB_FREQ_F3 0x0d 40 41 #define SMC_RAM_END 0xC000 42 43 static const struct ni_cac_weights cac_weights_cayman_xt = 44 { 45 0x15, 46 0x2, 47 0x19, 48 0x2, 49 0x8, 50 0x14, 51 0x2, 52 0x16, 53 0xE, 54 0x17, 55 0x13, 56 0x2B, 57 0x10, 58 0x7, 59 0x5, 60 0x5, 61 0x5, 62 0x2, 63 0x3, 64 0x9, 65 0x10, 66 0x10, 67 0x2B, 68 0xA, 69 0x9, 70 0x4, 71 0xD, 72 0xD, 73 0x3E, 74 0x18, 75 0x14, 76 0, 77 0x3, 78 0x3, 79 0x5, 80 0, 81 0x2, 82 0, 83 0, 84 0, 85 0, 86 0, 87 0, 88 0, 89 0, 90 0, 91 0x1CC, 92 0, 93 0x164, 94 1, 95 1, 96 1, 97 1, 98 12, 99 12, 100 12, 101 0x12, 102 0x1F, 103 132, 104 5, 105 7, 106 0, 107 { 0, 0, 0, 0, 0, 0, 0, 0 }, 108 { 0, 0, 0, 0 }, 109 true 110 }; 111 112 static const struct ni_cac_weights cac_weights_cayman_pro = 113 { 114 0x16, 115 0x4, 116 0x10, 117 0x2, 118 0xA, 119 0x16, 120 0x2, 121 0x18, 122 0x10, 123 0x1A, 124 0x16, 125 0x2D, 126 0x12, 127 0xA, 128 0x6, 129 0x6, 130 0x6, 131 0x2, 132 0x4, 133 0xB, 134 0x11, 135 0x11, 136 0x2D, 137 0xC, 138 0xC, 139 0x7, 140 0x10, 141 0x10, 142 0x3F, 143 0x1A, 144 0x16, 145 0, 146 0x7, 147 0x4, 148 0x6, 149 1, 150 0x2, 151 0x1, 152 0, 153 0, 154 0, 155 0, 156 0, 157 0, 158 0x30, 159 0, 160 0x1CF, 161 0, 162 0x166, 163 1, 164 1, 165 1, 166 1, 167 12, 168 12, 169 12, 170 0x15, 171 0x1F, 172 132, 173 6, 174 6, 175 0, 176 { 0, 0, 0, 0, 0, 0, 0, 0 }, 177 { 0, 0, 0, 0 }, 178 true 179 }; 180 181 static const struct ni_cac_weights cac_weights_cayman_le = 182 { 183 0x7, 184 0xE, 185 0x1, 186 0xA, 187 0x1, 188 0x3F, 189 0x2, 190 0x18, 191 0x10, 192 0x1A, 193 0x1, 194 0x3F, 195 0x1, 196 0xE, 197 0x6, 198 0x6, 199 0x6, 200 0x2, 201 0x4, 202 0x9, 203 0x1A, 204 0x1A, 205 0x2C, 206 0xA, 207 0x11, 208 0x8, 209 0x19, 210 0x19, 211 0x1, 212 0x1, 213 0x1A, 214 0, 215 0x8, 216 0x5, 217 0x8, 218 0x1, 219 0x3, 220 0x1, 221 0, 222 0, 223 0, 224 0, 225 0, 226 0, 227 0x38, 228 0x38, 229 0x239, 230 0x3, 231 0x18A, 232 1, 233 1, 234 1, 235 1, 236 12, 237 12, 238 12, 239 0x15, 240 0x22, 241 132, 242 6, 243 6, 244 0, 245 { 0, 0, 0, 0, 0, 0, 0, 0 }, 246 { 0, 0, 0, 0 }, 247 true 248 }; 249 250 #define NISLANDS_MGCG_SEQUENCE 300 251 252 static const u32 cayman_cgcg_cgls_default[] = 253 { 254 0x000008f8, 0x00000010, 0xffffffff, 255 0x000008fc, 0x00000000, 0xffffffff, 256 0x000008f8, 0x00000011, 0xffffffff, 257 0x000008fc, 0x00000000, 0xffffffff, 258 0x000008f8, 0x00000012, 0xffffffff, 259 0x000008fc, 0x00000000, 0xffffffff, 260 0x000008f8, 0x00000013, 0xffffffff, 261 0x000008fc, 0x00000000, 0xffffffff, 262 0x000008f8, 0x00000014, 0xffffffff, 263 0x000008fc, 0x00000000, 0xffffffff, 264 0x000008f8, 0x00000015, 0xffffffff, 265 0x000008fc, 0x00000000, 0xffffffff, 266 0x000008f8, 0x00000016, 0xffffffff, 267 0x000008fc, 0x00000000, 0xffffffff, 268 0x000008f8, 0x00000017, 0xffffffff, 269 0x000008fc, 0x00000000, 0xffffffff, 270 0x000008f8, 0x00000018, 0xffffffff, 271 0x000008fc, 0x00000000, 0xffffffff, 272 0x000008f8, 0x00000019, 0xffffffff, 273 0x000008fc, 0x00000000, 0xffffffff, 274 0x000008f8, 0x0000001a, 0xffffffff, 275 0x000008fc, 0x00000000, 0xffffffff, 276 0x000008f8, 0x0000001b, 0xffffffff, 277 0x000008fc, 0x00000000, 0xffffffff, 278 0x000008f8, 0x00000020, 0xffffffff, 279 0x000008fc, 0x00000000, 0xffffffff, 280 0x000008f8, 0x00000021, 0xffffffff, 281 0x000008fc, 0x00000000, 0xffffffff, 282 0x000008f8, 0x00000022, 0xffffffff, 283 0x000008fc, 0x00000000, 0xffffffff, 284 0x000008f8, 0x00000023, 0xffffffff, 285 0x000008fc, 0x00000000, 0xffffffff, 286 0x000008f8, 0x00000024, 0xffffffff, 287 0x000008fc, 0x00000000, 0xffffffff, 288 0x000008f8, 0x00000025, 0xffffffff, 289 0x000008fc, 0x00000000, 0xffffffff, 290 0x000008f8, 0x00000026, 0xffffffff, 291 0x000008fc, 0x00000000, 0xffffffff, 292 0x000008f8, 0x00000027, 0xffffffff, 293 0x000008fc, 0x00000000, 0xffffffff, 294 0x000008f8, 0x00000028, 0xffffffff, 295 0x000008fc, 0x00000000, 0xffffffff, 296 0x000008f8, 0x00000029, 0xffffffff, 297 0x000008fc, 0x00000000, 0xffffffff, 298 0x000008f8, 0x0000002a, 0xffffffff, 299 0x000008fc, 0x00000000, 0xffffffff, 300 0x000008f8, 0x0000002b, 0xffffffff, 301 0x000008fc, 0x00000000, 0xffffffff 302 }; 303 #define CAYMAN_CGCG_CGLS_DEFAULT_LENGTH sizeof(cayman_cgcg_cgls_default) / (3 * sizeof(u32)) 304 305 static const u32 cayman_cgcg_cgls_disable[] = 306 { 307 0x000008f8, 0x00000010, 0xffffffff, 308 0x000008fc, 0xffffffff, 0xffffffff, 309 0x000008f8, 0x00000011, 0xffffffff, 310 0x000008fc, 0xffffffff, 0xffffffff, 311 0x000008f8, 0x00000012, 0xffffffff, 312 0x000008fc, 0xffffffff, 0xffffffff, 313 0x000008f8, 0x00000013, 0xffffffff, 314 0x000008fc, 0xffffffff, 0xffffffff, 315 0x000008f8, 0x00000014, 0xffffffff, 316 0x000008fc, 0xffffffff, 0xffffffff, 317 0x000008f8, 0x00000015, 0xffffffff, 318 0x000008fc, 0xffffffff, 0xffffffff, 319 0x000008f8, 0x00000016, 0xffffffff, 320 0x000008fc, 0xffffffff, 0xffffffff, 321 0x000008f8, 0x00000017, 0xffffffff, 322 0x000008fc, 0xffffffff, 0xffffffff, 323 0x000008f8, 0x00000018, 0xffffffff, 324 0x000008fc, 0xffffffff, 0xffffffff, 325 0x000008f8, 0x00000019, 0xffffffff, 326 0x000008fc, 0xffffffff, 0xffffffff, 327 0x000008f8, 0x0000001a, 0xffffffff, 328 0x000008fc, 0xffffffff, 0xffffffff, 329 0x000008f8, 0x0000001b, 0xffffffff, 330 0x000008fc, 0xffffffff, 0xffffffff, 331 0x000008f8, 0x00000020, 0xffffffff, 332 0x000008fc, 0x00000000, 0xffffffff, 333 0x000008f8, 0x00000021, 0xffffffff, 334 0x000008fc, 0x00000000, 0xffffffff, 335 0x000008f8, 0x00000022, 0xffffffff, 336 0x000008fc, 0x00000000, 0xffffffff, 337 0x000008f8, 0x00000023, 0xffffffff, 338 0x000008fc, 0x00000000, 0xffffffff, 339 0x000008f8, 0x00000024, 0xffffffff, 340 0x000008fc, 0x00000000, 0xffffffff, 341 0x000008f8, 0x00000025, 0xffffffff, 342 0x000008fc, 0x00000000, 0xffffffff, 343 0x000008f8, 0x00000026, 0xffffffff, 344 0x000008fc, 0x00000000, 0xffffffff, 345 0x000008f8, 0x00000027, 0xffffffff, 346 0x000008fc, 0x00000000, 0xffffffff, 347 0x000008f8, 0x00000028, 0xffffffff, 348 0x000008fc, 0x00000000, 0xffffffff, 349 0x000008f8, 0x00000029, 0xffffffff, 350 0x000008fc, 0x00000000, 0xffffffff, 351 0x000008f8, 0x0000002a, 0xffffffff, 352 0x000008fc, 0x00000000, 0xffffffff, 353 0x000008f8, 0x0000002b, 0xffffffff, 354 0x000008fc, 0x00000000, 0xffffffff, 355 0x00000644, 0x000f7902, 0x001f4180, 356 0x00000644, 0x000f3802, 0x001f4180 357 }; 358 #define CAYMAN_CGCG_CGLS_DISABLE_LENGTH sizeof(cayman_cgcg_cgls_disable) / (3 * sizeof(u32)) 359 360 static const u32 cayman_cgcg_cgls_enable[] = 361 { 362 0x00000644, 0x000f7882, 0x001f4080, 363 0x000008f8, 0x00000010, 0xffffffff, 364 0x000008fc, 0x00000000, 0xffffffff, 365 0x000008f8, 0x00000011, 0xffffffff, 366 0x000008fc, 0x00000000, 0xffffffff, 367 0x000008f8, 0x00000012, 0xffffffff, 368 0x000008fc, 0x00000000, 0xffffffff, 369 0x000008f8, 0x00000013, 0xffffffff, 370 0x000008fc, 0x00000000, 0xffffffff, 371 0x000008f8, 0x00000014, 0xffffffff, 372 0x000008fc, 0x00000000, 0xffffffff, 373 0x000008f8, 0x00000015, 0xffffffff, 374 0x000008fc, 0x00000000, 0xffffffff, 375 0x000008f8, 0x00000016, 0xffffffff, 376 0x000008fc, 0x00000000, 0xffffffff, 377 0x000008f8, 0x00000017, 0xffffffff, 378 0x000008fc, 0x00000000, 0xffffffff, 379 0x000008f8, 0x00000018, 0xffffffff, 380 0x000008fc, 0x00000000, 0xffffffff, 381 0x000008f8, 0x00000019, 0xffffffff, 382 0x000008fc, 0x00000000, 0xffffffff, 383 0x000008f8, 0x0000001a, 0xffffffff, 384 0x000008fc, 0x00000000, 0xffffffff, 385 0x000008f8, 0x0000001b, 0xffffffff, 386 0x000008fc, 0x00000000, 0xffffffff, 387 0x000008f8, 0x00000020, 0xffffffff, 388 0x000008fc, 0xffffffff, 0xffffffff, 389 0x000008f8, 0x00000021, 0xffffffff, 390 0x000008fc, 0xffffffff, 0xffffffff, 391 0x000008f8, 0x00000022, 0xffffffff, 392 0x000008fc, 0xffffffff, 0xffffffff, 393 0x000008f8, 0x00000023, 0xffffffff, 394 0x000008fc, 0xffffffff, 0xffffffff, 395 0x000008f8, 0x00000024, 0xffffffff, 396 0x000008fc, 0xffffffff, 0xffffffff, 397 0x000008f8, 0x00000025, 0xffffffff, 398 0x000008fc, 0xffffffff, 0xffffffff, 399 0x000008f8, 0x00000026, 0xffffffff, 400 0x000008fc, 0xffffffff, 0xffffffff, 401 0x000008f8, 0x00000027, 0xffffffff, 402 0x000008fc, 0xffffffff, 0xffffffff, 403 0x000008f8, 0x00000028, 0xffffffff, 404 0x000008fc, 0xffffffff, 0xffffffff, 405 0x000008f8, 0x00000029, 0xffffffff, 406 0x000008fc, 0xffffffff, 0xffffffff, 407 0x000008f8, 0x0000002a, 0xffffffff, 408 0x000008fc, 0xffffffff, 0xffffffff, 409 0x000008f8, 0x0000002b, 0xffffffff, 410 0x000008fc, 0xffffffff, 0xffffffff 411 }; 412 #define CAYMAN_CGCG_CGLS_ENABLE_LENGTH sizeof(cayman_cgcg_cgls_enable) / (3 * sizeof(u32)) 413 414 static const u32 cayman_mgcg_default[] = 415 { 416 0x0000802c, 0xc0000000, 0xffffffff, 417 0x00003fc4, 0xc0000000, 0xffffffff, 418 0x00005448, 0x00000100, 0xffffffff, 419 0x000055e4, 0x00000100, 0xffffffff, 420 0x0000160c, 0x00000100, 0xffffffff, 421 0x00008984, 0x06000100, 0xffffffff, 422 0x0000c164, 0x00000100, 0xffffffff, 423 0x00008a18, 0x00000100, 0xffffffff, 424 0x0000897c, 0x06000100, 0xffffffff, 425 0x00008b28, 0x00000100, 0xffffffff, 426 0x00009144, 0x00800200, 0xffffffff, 427 0x00009a60, 0x00000100, 0xffffffff, 428 0x00009868, 0x00000100, 0xffffffff, 429 0x00008d58, 0x00000100, 0xffffffff, 430 0x00009510, 0x00000100, 0xffffffff, 431 0x0000949c, 0x00000100, 0xffffffff, 432 0x00009654, 0x00000100, 0xffffffff, 433 0x00009030, 0x00000100, 0xffffffff, 434 0x00009034, 0x00000100, 0xffffffff, 435 0x00009038, 0x00000100, 0xffffffff, 436 0x0000903c, 0x00000100, 0xffffffff, 437 0x00009040, 0x00000100, 0xffffffff, 438 0x0000a200, 0x00000100, 0xffffffff, 439 0x0000a204, 0x00000100, 0xffffffff, 440 0x0000a208, 0x00000100, 0xffffffff, 441 0x0000a20c, 0x00000100, 0xffffffff, 442 0x00009744, 0x00000100, 0xffffffff, 443 0x00003f80, 0x00000100, 0xffffffff, 444 0x0000a210, 0x00000100, 0xffffffff, 445 0x0000a214, 0x00000100, 0xffffffff, 446 0x000004d8, 0x00000100, 0xffffffff, 447 0x00009664, 0x00000100, 0xffffffff, 448 0x00009698, 0x00000100, 0xffffffff, 449 0x000004d4, 0x00000200, 0xffffffff, 450 0x000004d0, 0x00000000, 0xffffffff, 451 0x000030cc, 0x00000104, 0xffffffff, 452 0x0000d0c0, 0x00000100, 0xffffffff, 453 0x0000d8c0, 0x00000100, 0xffffffff, 454 0x0000802c, 0x40000000, 0xffffffff, 455 0x00003fc4, 0x40000000, 0xffffffff, 456 0x0000915c, 0x00010000, 0xffffffff, 457 0x00009160, 0x00030002, 0xffffffff, 458 0x00009164, 0x00050004, 0xffffffff, 459 0x00009168, 0x00070006, 0xffffffff, 460 0x00009178, 0x00070000, 0xffffffff, 461 0x0000917c, 0x00030002, 0xffffffff, 462 0x00009180, 0x00050004, 0xffffffff, 463 0x0000918c, 0x00010006, 0xffffffff, 464 0x00009190, 0x00090008, 0xffffffff, 465 0x00009194, 0x00070000, 0xffffffff, 466 0x00009198, 0x00030002, 0xffffffff, 467 0x0000919c, 0x00050004, 0xffffffff, 468 0x000091a8, 0x00010006, 0xffffffff, 469 0x000091ac, 0x00090008, 0xffffffff, 470 0x000091b0, 0x00070000, 0xffffffff, 471 0x000091b4, 0x00030002, 0xffffffff, 472 0x000091b8, 0x00050004, 0xffffffff, 473 0x000091c4, 0x00010006, 0xffffffff, 474 0x000091c8, 0x00090008, 0xffffffff, 475 0x000091cc, 0x00070000, 0xffffffff, 476 0x000091d0, 0x00030002, 0xffffffff, 477 0x000091d4, 0x00050004, 0xffffffff, 478 0x000091e0, 0x00010006, 0xffffffff, 479 0x000091e4, 0x00090008, 0xffffffff, 480 0x000091e8, 0x00000000, 0xffffffff, 481 0x000091ec, 0x00070000, 0xffffffff, 482 0x000091f0, 0x00030002, 0xffffffff, 483 0x000091f4, 0x00050004, 0xffffffff, 484 0x00009200, 0x00010006, 0xffffffff, 485 0x00009204, 0x00090008, 0xffffffff, 486 0x00009208, 0x00070000, 0xffffffff, 487 0x0000920c, 0x00030002, 0xffffffff, 488 0x00009210, 0x00050004, 0xffffffff, 489 0x0000921c, 0x00010006, 0xffffffff, 490 0x00009220, 0x00090008, 0xffffffff, 491 0x00009224, 0x00070000, 0xffffffff, 492 0x00009228, 0x00030002, 0xffffffff, 493 0x0000922c, 0x00050004, 0xffffffff, 494 0x00009238, 0x00010006, 0xffffffff, 495 0x0000923c, 0x00090008, 0xffffffff, 496 0x00009240, 0x00070000, 0xffffffff, 497 0x00009244, 0x00030002, 0xffffffff, 498 0x00009248, 0x00050004, 0xffffffff, 499 0x00009254, 0x00010006, 0xffffffff, 500 0x00009258, 0x00090008, 0xffffffff, 501 0x0000925c, 0x00070000, 0xffffffff, 502 0x00009260, 0x00030002, 0xffffffff, 503 0x00009264, 0x00050004, 0xffffffff, 504 0x00009270, 0x00010006, 0xffffffff, 505 0x00009274, 0x00090008, 0xffffffff, 506 0x00009278, 0x00070000, 0xffffffff, 507 0x0000927c, 0x00030002, 0xffffffff, 508 0x00009280, 0x00050004, 0xffffffff, 509 0x0000928c, 0x00010006, 0xffffffff, 510 0x00009290, 0x00090008, 0xffffffff, 511 0x000092a8, 0x00070000, 0xffffffff, 512 0x000092ac, 0x00030002, 0xffffffff, 513 0x000092b0, 0x00050004, 0xffffffff, 514 0x000092bc, 0x00010006, 0xffffffff, 515 0x000092c0, 0x00090008, 0xffffffff, 516 0x000092c4, 0x00070000, 0xffffffff, 517 0x000092c8, 0x00030002, 0xffffffff, 518 0x000092cc, 0x00050004, 0xffffffff, 519 0x000092d8, 0x00010006, 0xffffffff, 520 0x000092dc, 0x00090008, 0xffffffff, 521 0x00009294, 0x00000000, 0xffffffff, 522 0x0000802c, 0x40010000, 0xffffffff, 523 0x00003fc4, 0x40010000, 0xffffffff, 524 0x0000915c, 0x00010000, 0xffffffff, 525 0x00009160, 0x00030002, 0xffffffff, 526 0x00009164, 0x00050004, 0xffffffff, 527 0x00009168, 0x00070006, 0xffffffff, 528 0x00009178, 0x00070000, 0xffffffff, 529 0x0000917c, 0x00030002, 0xffffffff, 530 0x00009180, 0x00050004, 0xffffffff, 531 0x0000918c, 0x00010006, 0xffffffff, 532 0x00009190, 0x00090008, 0xffffffff, 533 0x00009194, 0x00070000, 0xffffffff, 534 0x00009198, 0x00030002, 0xffffffff, 535 0x0000919c, 0x00050004, 0xffffffff, 536 0x000091a8, 0x00010006, 0xffffffff, 537 0x000091ac, 0x00090008, 0xffffffff, 538 0x000091b0, 0x00070000, 0xffffffff, 539 0x000091b4, 0x00030002, 0xffffffff, 540 0x000091b8, 0x00050004, 0xffffffff, 541 0x000091c4, 0x00010006, 0xffffffff, 542 0x000091c8, 0x00090008, 0xffffffff, 543 0x000091cc, 0x00070000, 0xffffffff, 544 0x000091d0, 0x00030002, 0xffffffff, 545 0x000091d4, 0x00050004, 0xffffffff, 546 0x000091e0, 0x00010006, 0xffffffff, 547 0x000091e4, 0x00090008, 0xffffffff, 548 0x000091e8, 0x00000000, 0xffffffff, 549 0x000091ec, 0x00070000, 0xffffffff, 550 0x000091f0, 0x00030002, 0xffffffff, 551 0x000091f4, 0x00050004, 0xffffffff, 552 0x00009200, 0x00010006, 0xffffffff, 553 0x00009204, 0x00090008, 0xffffffff, 554 0x00009208, 0x00070000, 0xffffffff, 555 0x0000920c, 0x00030002, 0xffffffff, 556 0x00009210, 0x00050004, 0xffffffff, 557 0x0000921c, 0x00010006, 0xffffffff, 558 0x00009220, 0x00090008, 0xffffffff, 559 0x00009224, 0x00070000, 0xffffffff, 560 0x00009228, 0x00030002, 0xffffffff, 561 0x0000922c, 0x00050004, 0xffffffff, 562 0x00009238, 0x00010006, 0xffffffff, 563 0x0000923c, 0x00090008, 0xffffffff, 564 0x00009240, 0x00070000, 0xffffffff, 565 0x00009244, 0x00030002, 0xffffffff, 566 0x00009248, 0x00050004, 0xffffffff, 567 0x00009254, 0x00010006, 0xffffffff, 568 0x00009258, 0x00090008, 0xffffffff, 569 0x0000925c, 0x00070000, 0xffffffff, 570 0x00009260, 0x00030002, 0xffffffff, 571 0x00009264, 0x00050004, 0xffffffff, 572 0x00009270, 0x00010006, 0xffffffff, 573 0x00009274, 0x00090008, 0xffffffff, 574 0x00009278, 0x00070000, 0xffffffff, 575 0x0000927c, 0x00030002, 0xffffffff, 576 0x00009280, 0x00050004, 0xffffffff, 577 0x0000928c, 0x00010006, 0xffffffff, 578 0x00009290, 0x00090008, 0xffffffff, 579 0x000092a8, 0x00070000, 0xffffffff, 580 0x000092ac, 0x00030002, 0xffffffff, 581 0x000092b0, 0x00050004, 0xffffffff, 582 0x000092bc, 0x00010006, 0xffffffff, 583 0x000092c0, 0x00090008, 0xffffffff, 584 0x000092c4, 0x00070000, 0xffffffff, 585 0x000092c8, 0x00030002, 0xffffffff, 586 0x000092cc, 0x00050004, 0xffffffff, 587 0x000092d8, 0x00010006, 0xffffffff, 588 0x000092dc, 0x00090008, 0xffffffff, 589 0x00009294, 0x00000000, 0xffffffff, 590 0x0000802c, 0xc0000000, 0xffffffff, 591 0x00003fc4, 0xc0000000, 0xffffffff, 592 0x000008f8, 0x00000010, 0xffffffff, 593 0x000008fc, 0x00000000, 0xffffffff, 594 0x000008f8, 0x00000011, 0xffffffff, 595 0x000008fc, 0x00000000, 0xffffffff, 596 0x000008f8, 0x00000012, 0xffffffff, 597 0x000008fc, 0x00000000, 0xffffffff, 598 0x000008f8, 0x00000013, 0xffffffff, 599 0x000008fc, 0x00000000, 0xffffffff, 600 0x000008f8, 0x00000014, 0xffffffff, 601 0x000008fc, 0x00000000, 0xffffffff, 602 0x000008f8, 0x00000015, 0xffffffff, 603 0x000008fc, 0x00000000, 0xffffffff, 604 0x000008f8, 0x00000016, 0xffffffff, 605 0x000008fc, 0x00000000, 0xffffffff, 606 0x000008f8, 0x00000017, 0xffffffff, 607 0x000008fc, 0x00000000, 0xffffffff, 608 0x000008f8, 0x00000018, 0xffffffff, 609 0x000008fc, 0x00000000, 0xffffffff, 610 0x000008f8, 0x00000019, 0xffffffff, 611 0x000008fc, 0x00000000, 0xffffffff, 612 0x000008f8, 0x0000001a, 0xffffffff, 613 0x000008fc, 0x00000000, 0xffffffff, 614 0x000008f8, 0x0000001b, 0xffffffff, 615 0x000008fc, 0x00000000, 0xffffffff 616 }; 617 #define CAYMAN_MGCG_DEFAULT_LENGTH sizeof(cayman_mgcg_default) / (3 * sizeof(u32)) 618 619 static const u32 cayman_mgcg_disable[] = 620 { 621 0x0000802c, 0xc0000000, 0xffffffff, 622 0x000008f8, 0x00000000, 0xffffffff, 623 0x000008fc, 0xffffffff, 0xffffffff, 624 0x000008f8, 0x00000001, 0xffffffff, 625 0x000008fc, 0xffffffff, 0xffffffff, 626 0x000008f8, 0x00000002, 0xffffffff, 627 0x000008fc, 0xffffffff, 0xffffffff, 628 0x000008f8, 0x00000003, 0xffffffff, 629 0x000008fc, 0xffffffff, 0xffffffff, 630 0x00009150, 0x00600000, 0xffffffff 631 }; 632 #define CAYMAN_MGCG_DISABLE_LENGTH sizeof(cayman_mgcg_disable) / (3 * sizeof(u32)) 633 634 static const u32 cayman_mgcg_enable[] = 635 { 636 0x0000802c, 0xc0000000, 0xffffffff, 637 0x000008f8, 0x00000000, 0xffffffff, 638 0x000008fc, 0x00000000, 0xffffffff, 639 0x000008f8, 0x00000001, 0xffffffff, 640 0x000008fc, 0x00000000, 0xffffffff, 641 0x000008f8, 0x00000002, 0xffffffff, 642 0x000008fc, 0x00600000, 0xffffffff, 643 0x000008f8, 0x00000003, 0xffffffff, 644 0x000008fc, 0x00000000, 0xffffffff, 645 0x00009150, 0x96944200, 0xffffffff 646 }; 647 648 #define CAYMAN_MGCG_ENABLE_LENGTH sizeof(cayman_mgcg_enable) / (3 * sizeof(u32)) 649 650 #define NISLANDS_SYSLS_SEQUENCE 100 651 652 static const u32 cayman_sysls_default[] = 653 { 654 /* Register, Value, Mask bits */ 655 0x000055e8, 0x00000000, 0xffffffff, 656 0x0000d0bc, 0x00000000, 0xffffffff, 657 0x0000d8bc, 0x00000000, 0xffffffff, 658 0x000015c0, 0x000c1401, 0xffffffff, 659 0x0000264c, 0x000c0400, 0xffffffff, 660 0x00002648, 0x000c0400, 0xffffffff, 661 0x00002650, 0x000c0400, 0xffffffff, 662 0x000020b8, 0x000c0400, 0xffffffff, 663 0x000020bc, 0x000c0400, 0xffffffff, 664 0x000020c0, 0x000c0c80, 0xffffffff, 665 0x0000f4a0, 0x000000c0, 0xffffffff, 666 0x0000f4a4, 0x00680fff, 0xffffffff, 667 0x00002f50, 0x00000404, 0xffffffff, 668 0x000004c8, 0x00000001, 0xffffffff, 669 0x000064ec, 0x00000000, 0xffffffff, 670 0x00000c7c, 0x00000000, 0xffffffff, 671 0x00008dfc, 0x00000000, 0xffffffff 672 }; 673 #define CAYMAN_SYSLS_DEFAULT_LENGTH sizeof(cayman_sysls_default) / (3 * sizeof(u32)) 674 675 static const u32 cayman_sysls_disable[] = 676 { 677 /* Register, Value, Mask bits */ 678 0x0000d0c0, 0x00000000, 0xffffffff, 679 0x0000d8c0, 0x00000000, 0xffffffff, 680 0x000055e8, 0x00000000, 0xffffffff, 681 0x0000d0bc, 0x00000000, 0xffffffff, 682 0x0000d8bc, 0x00000000, 0xffffffff, 683 0x000015c0, 0x00041401, 0xffffffff, 684 0x0000264c, 0x00040400, 0xffffffff, 685 0x00002648, 0x00040400, 0xffffffff, 686 0x00002650, 0x00040400, 0xffffffff, 687 0x000020b8, 0x00040400, 0xffffffff, 688 0x000020bc, 0x00040400, 0xffffffff, 689 0x000020c0, 0x00040c80, 0xffffffff, 690 0x0000f4a0, 0x000000c0, 0xffffffff, 691 0x0000f4a4, 0x00680000, 0xffffffff, 692 0x00002f50, 0x00000404, 0xffffffff, 693 0x000004c8, 0x00000001, 0xffffffff, 694 0x000064ec, 0x00007ffd, 0xffffffff, 695 0x00000c7c, 0x0000ff00, 0xffffffff, 696 0x00008dfc, 0x0000007f, 0xffffffff 697 }; 698 #define CAYMAN_SYSLS_DISABLE_LENGTH sizeof(cayman_sysls_disable) / (3 * sizeof(u32)) 699 700 static const u32 cayman_sysls_enable[] = 701 { 702 /* Register, Value, Mask bits */ 703 0x000055e8, 0x00000001, 0xffffffff, 704 0x0000d0bc, 0x00000100, 0xffffffff, 705 0x0000d8bc, 0x00000100, 0xffffffff, 706 0x000015c0, 0x000c1401, 0xffffffff, 707 0x0000264c, 0x000c0400, 0xffffffff, 708 0x00002648, 0x000c0400, 0xffffffff, 709 0x00002650, 0x000c0400, 0xffffffff, 710 0x000020b8, 0x000c0400, 0xffffffff, 711 0x000020bc, 0x000c0400, 0xffffffff, 712 0x000020c0, 0x000c0c80, 0xffffffff, 713 0x0000f4a0, 0x000000c0, 0xffffffff, 714 0x0000f4a4, 0x00680fff, 0xffffffff, 715 0x00002f50, 0x00000903, 0xffffffff, 716 0x000004c8, 0x00000000, 0xffffffff, 717 0x000064ec, 0x00000000, 0xffffffff, 718 0x00000c7c, 0x00000000, 0xffffffff, 719 0x00008dfc, 0x00000000, 0xffffffff 720 }; 721 #define CAYMAN_SYSLS_ENABLE_LENGTH sizeof(cayman_sysls_enable) / (3 * sizeof(u32)) 722 723 struct rv7xx_power_info *rv770_get_pi(struct radeon_device *rdev); 724 struct evergreen_power_info *evergreen_get_pi(struct radeon_device *rdev); 725 726 extern int ni_mc_load_microcode(struct radeon_device *rdev); 727 728 struct ni_power_info *ni_get_pi(struct radeon_device *rdev) 729 { 730 struct ni_power_info *pi = rdev->pm.dpm.priv; 731 732 return pi; 733 } 734 735 struct ni_ps *ni_get_ps(struct radeon_ps *rps) 736 { 737 struct ni_ps *ps = rps->ps_priv; 738 739 return ps; 740 } 741 742 static void ni_calculate_leakage_for_v_and_t_formula(const struct ni_leakage_coeffients *coeff, 743 u16 v, s32 t, 744 u32 ileakage, 745 u32 *leakage) 746 { 747 s64 kt, kv, leakage_w, i_leakage, vddc, temperature; 748 749 i_leakage = div64_s64(drm_int2fixp(ileakage), 1000); 750 vddc = div64_s64(drm_int2fixp(v), 1000); 751 temperature = div64_s64(drm_int2fixp(t), 1000); 752 753 kt = drm_fixp_mul(div64_s64(drm_int2fixp(coeff->at), 1000), 754 drm_fixp_exp(drm_fixp_mul(div64_s64(drm_int2fixp(coeff->bt), 1000), temperature))); 755 kv = drm_fixp_mul(div64_s64(drm_int2fixp(coeff->av), 1000), 756 drm_fixp_exp(drm_fixp_mul(div64_s64(drm_int2fixp(coeff->bv), 1000), vddc))); 757 758 leakage_w = drm_fixp_mul(drm_fixp_mul(drm_fixp_mul(i_leakage, kt), kv), vddc); 759 760 *leakage = drm_fixp2int(leakage_w * 1000); 761 } 762 763 static void ni_calculate_leakage_for_v_and_t(struct radeon_device *rdev, 764 const struct ni_leakage_coeffients *coeff, 765 u16 v, 766 s32 t, 767 u32 i_leakage, 768 u32 *leakage) 769 { 770 ni_calculate_leakage_for_v_and_t_formula(coeff, v, t, i_leakage, leakage); 771 } 772 773 bool ni_dpm_vblank_too_short(struct radeon_device *rdev) 774 { 775 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 776 u32 vblank_time = r600_dpm_get_vblank_time(rdev); 777 /* we never hit the non-gddr5 limit so disable it */ 778 u32 switch_limit = pi->mem_gddr5 ? 450 : 0; 779 780 if (vblank_time < switch_limit) 781 return true; 782 else 783 return false; 784 785 } 786 787 static void ni_apply_state_adjust_rules(struct radeon_device *rdev, 788 struct radeon_ps *rps) 789 { 790 struct ni_ps *ps = ni_get_ps(rps); 791 struct radeon_clock_and_voltage_limits *max_limits; 792 bool disable_mclk_switching; 793 u32 mclk; 794 u16 vddci; 795 int i; 796 797 if ((rdev->pm.dpm.new_active_crtc_count > 1) || 798 ni_dpm_vblank_too_short(rdev)) 799 disable_mclk_switching = true; 800 else 801 disable_mclk_switching = false; 802 803 if (rdev->pm.dpm.ac_power) 804 max_limits = &rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac; 805 else 806 max_limits = &rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc; 807 808 if (rdev->pm.dpm.ac_power == false) { 809 for (i = 0; i < ps->performance_level_count; i++) { 810 if (ps->performance_levels[i].mclk > max_limits->mclk) 811 ps->performance_levels[i].mclk = max_limits->mclk; 812 if (ps->performance_levels[i].sclk > max_limits->sclk) 813 ps->performance_levels[i].sclk = max_limits->sclk; 814 if (ps->performance_levels[i].vddc > max_limits->vddc) 815 ps->performance_levels[i].vddc = max_limits->vddc; 816 if (ps->performance_levels[i].vddci > max_limits->vddci) 817 ps->performance_levels[i].vddci = max_limits->vddci; 818 } 819 } 820 821 /* XXX validate the min clocks required for display */ 822 823 /* adjust low state */ 824 if (disable_mclk_switching) { 825 ps->performance_levels[0].mclk = 826 ps->performance_levels[ps->performance_level_count - 1].mclk; 827 ps->performance_levels[0].vddci = 828 ps->performance_levels[ps->performance_level_count - 1].vddci; 829 } 830 831 btc_skip_blacklist_clocks(rdev, max_limits->sclk, max_limits->mclk, 832 &ps->performance_levels[0].sclk, 833 &ps->performance_levels[0].mclk); 834 835 for (i = 1; i < ps->performance_level_count; i++) { 836 if (ps->performance_levels[i].sclk < ps->performance_levels[i - 1].sclk) 837 ps->performance_levels[i].sclk = ps->performance_levels[i - 1].sclk; 838 if (ps->performance_levels[i].vddc < ps->performance_levels[i - 1].vddc) 839 ps->performance_levels[i].vddc = ps->performance_levels[i - 1].vddc; 840 } 841 842 /* adjust remaining states */ 843 if (disable_mclk_switching) { 844 mclk = ps->performance_levels[0].mclk; 845 vddci = ps->performance_levels[0].vddci; 846 for (i = 1; i < ps->performance_level_count; i++) { 847 if (mclk < ps->performance_levels[i].mclk) 848 mclk = ps->performance_levels[i].mclk; 849 if (vddci < ps->performance_levels[i].vddci) 850 vddci = ps->performance_levels[i].vddci; 851 } 852 for (i = 0; i < ps->performance_level_count; i++) { 853 ps->performance_levels[i].mclk = mclk; 854 ps->performance_levels[i].vddci = vddci; 855 } 856 } else { 857 for (i = 1; i < ps->performance_level_count; i++) { 858 if (ps->performance_levels[i].mclk < ps->performance_levels[i - 1].mclk) 859 ps->performance_levels[i].mclk = ps->performance_levels[i - 1].mclk; 860 if (ps->performance_levels[i].vddci < ps->performance_levels[i - 1].vddci) 861 ps->performance_levels[i].vddci = ps->performance_levels[i - 1].vddci; 862 } 863 } 864 865 for (i = 1; i < ps->performance_level_count; i++) 866 btc_skip_blacklist_clocks(rdev, max_limits->sclk, max_limits->mclk, 867 &ps->performance_levels[i].sclk, 868 &ps->performance_levels[i].mclk); 869 870 for (i = 0; i < ps->performance_level_count; i++) 871 btc_adjust_clock_combinations(rdev, max_limits, 872 &ps->performance_levels[i]); 873 874 for (i = 0; i < ps->performance_level_count; i++) { 875 btc_apply_voltage_dependency_rules(&rdev->pm.dpm.dyn_state.vddc_dependency_on_sclk, 876 ps->performance_levels[i].sclk, 877 max_limits->vddc, &ps->performance_levels[i].vddc); 878 btc_apply_voltage_dependency_rules(&rdev->pm.dpm.dyn_state.vddci_dependency_on_mclk, 879 ps->performance_levels[i].mclk, 880 max_limits->vddci, &ps->performance_levels[i].vddci); 881 btc_apply_voltage_dependency_rules(&rdev->pm.dpm.dyn_state.vddc_dependency_on_mclk, 882 ps->performance_levels[i].mclk, 883 max_limits->vddc, &ps->performance_levels[i].vddc); 884 btc_apply_voltage_dependency_rules(&rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk, 885 rdev->clock.current_dispclk, 886 max_limits->vddc, &ps->performance_levels[i].vddc); 887 } 888 889 for (i = 0; i < ps->performance_level_count; i++) { 890 btc_apply_voltage_delta_rules(rdev, 891 max_limits->vddc, max_limits->vddci, 892 &ps->performance_levels[i].vddc, 893 &ps->performance_levels[i].vddci); 894 } 895 896 ps->dc_compatible = true; 897 for (i = 0; i < ps->performance_level_count; i++) { 898 if (ps->performance_levels[i].vddc > rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc.vddc) 899 ps->dc_compatible = false; 900 901 if (ps->performance_levels[i].vddc < rdev->pm.dpm.dyn_state.min_vddc_for_pcie_gen2) 902 ps->performance_levels[i].flags &= ~ATOM_PPLIB_R600_FLAGS_PCIEGEN2; 903 } 904 } 905 906 static void ni_cg_clockgating_default(struct radeon_device *rdev) 907 { 908 u32 count; 909 const u32 *ps = NULL; 910 911 ps = (const u32 *)&cayman_cgcg_cgls_default; 912 count = CAYMAN_CGCG_CGLS_DEFAULT_LENGTH; 913 914 btc_program_mgcg_hw_sequence(rdev, ps, count); 915 } 916 917 static void ni_gfx_clockgating_enable(struct radeon_device *rdev, 918 bool enable) 919 { 920 u32 count; 921 const u32 *ps = NULL; 922 923 if (enable) { 924 ps = (const u32 *)&cayman_cgcg_cgls_enable; 925 count = CAYMAN_CGCG_CGLS_ENABLE_LENGTH; 926 } else { 927 ps = (const u32 *)&cayman_cgcg_cgls_disable; 928 count = CAYMAN_CGCG_CGLS_DISABLE_LENGTH; 929 } 930 931 btc_program_mgcg_hw_sequence(rdev, ps, count); 932 } 933 934 static void ni_mg_clockgating_default(struct radeon_device *rdev) 935 { 936 u32 count; 937 const u32 *ps = NULL; 938 939 ps = (const u32 *)&cayman_mgcg_default; 940 count = CAYMAN_MGCG_DEFAULT_LENGTH; 941 942 btc_program_mgcg_hw_sequence(rdev, ps, count); 943 } 944 945 static void ni_mg_clockgating_enable(struct radeon_device *rdev, 946 bool enable) 947 { 948 u32 count; 949 const u32 *ps = NULL; 950 951 if (enable) { 952 ps = (const u32 *)&cayman_mgcg_enable; 953 count = CAYMAN_MGCG_ENABLE_LENGTH; 954 } else { 955 ps = (const u32 *)&cayman_mgcg_disable; 956 count = CAYMAN_MGCG_DISABLE_LENGTH; 957 } 958 959 btc_program_mgcg_hw_sequence(rdev, ps, count); 960 } 961 962 static void ni_ls_clockgating_default(struct radeon_device *rdev) 963 { 964 u32 count; 965 const u32 *ps = NULL; 966 967 ps = (const u32 *)&cayman_sysls_default; 968 count = CAYMAN_SYSLS_DEFAULT_LENGTH; 969 970 btc_program_mgcg_hw_sequence(rdev, ps, count); 971 } 972 973 static void ni_ls_clockgating_enable(struct radeon_device *rdev, 974 bool enable) 975 { 976 u32 count; 977 const u32 *ps = NULL; 978 979 if (enable) { 980 ps = (const u32 *)&cayman_sysls_enable; 981 count = CAYMAN_SYSLS_ENABLE_LENGTH; 982 } else { 983 ps = (const u32 *)&cayman_sysls_disable; 984 count = CAYMAN_SYSLS_DISABLE_LENGTH; 985 } 986 987 btc_program_mgcg_hw_sequence(rdev, ps, count); 988 989 } 990 991 static int ni_patch_single_dependency_table_based_on_leakage(struct radeon_device *rdev, 992 struct radeon_clock_voltage_dependency_table *table) 993 { 994 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 995 u32 i; 996 997 if (table) { 998 for (i = 0; i < table->count; i++) { 999 if (0xff01 == table->entries[i].v) { 1000 if (pi->max_vddc == 0) 1001 return -EINVAL; 1002 table->entries[i].v = pi->max_vddc; 1003 } 1004 } 1005 } 1006 return 0; 1007 } 1008 1009 static int ni_patch_dependency_tables_based_on_leakage(struct radeon_device *rdev) 1010 { 1011 int ret = 0; 1012 1013 ret = ni_patch_single_dependency_table_based_on_leakage(rdev, 1014 &rdev->pm.dpm.dyn_state.vddc_dependency_on_sclk); 1015 1016 ret = ni_patch_single_dependency_table_based_on_leakage(rdev, 1017 &rdev->pm.dpm.dyn_state.vddc_dependency_on_mclk); 1018 return ret; 1019 } 1020 1021 static void ni_stop_dpm(struct radeon_device *rdev) 1022 { 1023 WREG32_P(GENERAL_PWRMGT, 0, ~GLOBAL_PWRMGT_EN); 1024 } 1025 1026 #if 0 1027 static int ni_notify_hw_of_power_source(struct radeon_device *rdev, 1028 bool ac_power) 1029 { 1030 if (ac_power) 1031 return (rv770_send_msg_to_smc(rdev, PPSMC_MSG_RunningOnAC) == PPSMC_Result_OK) ? 1032 0 : -EINVAL; 1033 1034 return 0; 1035 } 1036 #endif 1037 1038 static PPSMC_Result ni_send_msg_to_smc_with_parameter(struct radeon_device *rdev, 1039 PPSMC_Msg msg, u32 parameter) 1040 { 1041 WREG32(SMC_SCRATCH0, parameter); 1042 return rv770_send_msg_to_smc(rdev, msg); 1043 } 1044 1045 static int ni_restrict_performance_levels_before_switch(struct radeon_device *rdev) 1046 { 1047 if (rv770_send_msg_to_smc(rdev, PPSMC_MSG_NoForcedLevel) != PPSMC_Result_OK) 1048 return -EINVAL; 1049 1050 return (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetEnabledLevels, 1) == PPSMC_Result_OK) ? 1051 0 : -EINVAL; 1052 } 1053 1054 int ni_dpm_force_performance_level(struct radeon_device *rdev, 1055 enum radeon_dpm_forced_level level) 1056 { 1057 if (level == RADEON_DPM_FORCED_LEVEL_HIGH) { 1058 if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetEnabledLevels, 0) != PPSMC_Result_OK) 1059 return -EINVAL; 1060 1061 if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetForcedLevels, 1) != PPSMC_Result_OK) 1062 return -EINVAL; 1063 } else if (level == RADEON_DPM_FORCED_LEVEL_LOW) { 1064 if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetForcedLevels, 0) != PPSMC_Result_OK) 1065 return -EINVAL; 1066 1067 if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetEnabledLevels, 1) != PPSMC_Result_OK) 1068 return -EINVAL; 1069 } else if (level == RADEON_DPM_FORCED_LEVEL_AUTO) { 1070 if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetForcedLevels, 0) != PPSMC_Result_OK) 1071 return -EINVAL; 1072 1073 if (ni_send_msg_to_smc_with_parameter(rdev, PPSMC_MSG_SetEnabledLevels, 0) != PPSMC_Result_OK) 1074 return -EINVAL; 1075 } 1076 1077 rdev->pm.dpm.forced_level = level; 1078 1079 return 0; 1080 } 1081 1082 static void ni_stop_smc(struct radeon_device *rdev) 1083 { 1084 u32 tmp; 1085 int i; 1086 1087 for (i = 0; i < rdev->usec_timeout; i++) { 1088 tmp = RREG32(LB_SYNC_RESET_SEL) & LB_SYNC_RESET_SEL_MASK; 1089 if (tmp != 1) 1090 break; 1091 udelay(1); 1092 } 1093 1094 udelay(100); 1095 1096 r7xx_stop_smc(rdev); 1097 } 1098 1099 static int ni_process_firmware_header(struct radeon_device *rdev) 1100 { 1101 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 1102 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 1103 struct ni_power_info *ni_pi = ni_get_pi(rdev); 1104 u32 tmp; 1105 int ret; 1106 1107 ret = rv770_read_smc_sram_dword(rdev, 1108 NISLANDS_SMC_FIRMWARE_HEADER_LOCATION + 1109 NISLANDS_SMC_FIRMWARE_HEADER_stateTable, 1110 &tmp, pi->sram_end); 1111 1112 if (ret) 1113 return ret; 1114 1115 pi->state_table_start = (u16)tmp; 1116 1117 ret = rv770_read_smc_sram_dword(rdev, 1118 NISLANDS_SMC_FIRMWARE_HEADER_LOCATION + 1119 NISLANDS_SMC_FIRMWARE_HEADER_softRegisters, 1120 &tmp, pi->sram_end); 1121 1122 if (ret) 1123 return ret; 1124 1125 pi->soft_regs_start = (u16)tmp; 1126 1127 ret = rv770_read_smc_sram_dword(rdev, 1128 NISLANDS_SMC_FIRMWARE_HEADER_LOCATION + 1129 NISLANDS_SMC_FIRMWARE_HEADER_mcRegisterTable, 1130 &tmp, pi->sram_end); 1131 1132 if (ret) 1133 return ret; 1134 1135 eg_pi->mc_reg_table_start = (u16)tmp; 1136 1137 ret = rv770_read_smc_sram_dword(rdev, 1138 NISLANDS_SMC_FIRMWARE_HEADER_LOCATION + 1139 NISLANDS_SMC_FIRMWARE_HEADER_fanTable, 1140 &tmp, pi->sram_end); 1141 1142 if (ret) 1143 return ret; 1144 1145 ni_pi->fan_table_start = (u16)tmp; 1146 1147 ret = rv770_read_smc_sram_dword(rdev, 1148 NISLANDS_SMC_FIRMWARE_HEADER_LOCATION + 1149 NISLANDS_SMC_FIRMWARE_HEADER_mcArbDramAutoRefreshTable, 1150 &tmp, pi->sram_end); 1151 1152 if (ret) 1153 return ret; 1154 1155 ni_pi->arb_table_start = (u16)tmp; 1156 1157 ret = rv770_read_smc_sram_dword(rdev, 1158 NISLANDS_SMC_FIRMWARE_HEADER_LOCATION + 1159 NISLANDS_SMC_FIRMWARE_HEADER_cacTable, 1160 &tmp, pi->sram_end); 1161 1162 if (ret) 1163 return ret; 1164 1165 ni_pi->cac_table_start = (u16)tmp; 1166 1167 ret = rv770_read_smc_sram_dword(rdev, 1168 NISLANDS_SMC_FIRMWARE_HEADER_LOCATION + 1169 NISLANDS_SMC_FIRMWARE_HEADER_spllTable, 1170 &tmp, pi->sram_end); 1171 1172 if (ret) 1173 return ret; 1174 1175 ni_pi->spll_table_start = (u16)tmp; 1176 1177 1178 return ret; 1179 } 1180 1181 static void ni_read_clock_registers(struct radeon_device *rdev) 1182 { 1183 struct ni_power_info *ni_pi = ni_get_pi(rdev); 1184 1185 ni_pi->clock_registers.cg_spll_func_cntl = RREG32(CG_SPLL_FUNC_CNTL); 1186 ni_pi->clock_registers.cg_spll_func_cntl_2 = RREG32(CG_SPLL_FUNC_CNTL_2); 1187 ni_pi->clock_registers.cg_spll_func_cntl_3 = RREG32(CG_SPLL_FUNC_CNTL_3); 1188 ni_pi->clock_registers.cg_spll_func_cntl_4 = RREG32(CG_SPLL_FUNC_CNTL_4); 1189 ni_pi->clock_registers.cg_spll_spread_spectrum = RREG32(CG_SPLL_SPREAD_SPECTRUM); 1190 ni_pi->clock_registers.cg_spll_spread_spectrum_2 = RREG32(CG_SPLL_SPREAD_SPECTRUM_2); 1191 ni_pi->clock_registers.mpll_ad_func_cntl = RREG32(MPLL_AD_FUNC_CNTL); 1192 ni_pi->clock_registers.mpll_ad_func_cntl_2 = RREG32(MPLL_AD_FUNC_CNTL_2); 1193 ni_pi->clock_registers.mpll_dq_func_cntl = RREG32(MPLL_DQ_FUNC_CNTL); 1194 ni_pi->clock_registers.mpll_dq_func_cntl_2 = RREG32(MPLL_DQ_FUNC_CNTL_2); 1195 ni_pi->clock_registers.mclk_pwrmgt_cntl = RREG32(MCLK_PWRMGT_CNTL); 1196 ni_pi->clock_registers.dll_cntl = RREG32(DLL_CNTL); 1197 ni_pi->clock_registers.mpll_ss1 = RREG32(MPLL_SS1); 1198 ni_pi->clock_registers.mpll_ss2 = RREG32(MPLL_SS2); 1199 } 1200 1201 #if 0 1202 static int ni_enter_ulp_state(struct radeon_device *rdev) 1203 { 1204 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 1205 1206 if (pi->gfx_clock_gating) { 1207 WREG32_P(SCLK_PWRMGT_CNTL, 0, ~DYN_GFX_CLK_OFF_EN); 1208 WREG32_P(SCLK_PWRMGT_CNTL, GFX_CLK_FORCE_ON, ~GFX_CLK_FORCE_ON); 1209 WREG32_P(SCLK_PWRMGT_CNTL, 0, ~GFX_CLK_FORCE_ON); 1210 RREG32(GB_ADDR_CONFIG); 1211 } 1212 1213 WREG32_P(SMC_MSG, HOST_SMC_MSG(PPSMC_MSG_SwitchToMinimumPower), 1214 ~HOST_SMC_MSG_MASK); 1215 1216 udelay(25000); 1217 1218 return 0; 1219 } 1220 #endif 1221 1222 static void ni_program_response_times(struct radeon_device *rdev) 1223 { 1224 u32 voltage_response_time, backbias_response_time, acpi_delay_time, vbi_time_out; 1225 u32 vddc_dly, bb_dly, acpi_dly, vbi_dly, mclk_switch_limit; 1226 u32 reference_clock; 1227 1228 rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_mvdd_chg_time, 1); 1229 1230 voltage_response_time = (u32)rdev->pm.dpm.voltage_response_time; 1231 backbias_response_time = (u32)rdev->pm.dpm.backbias_response_time; 1232 1233 if (voltage_response_time == 0) 1234 voltage_response_time = 1000; 1235 1236 if (backbias_response_time == 0) 1237 backbias_response_time = 1000; 1238 1239 acpi_delay_time = 15000; 1240 vbi_time_out = 100000; 1241 1242 reference_clock = radeon_get_xclk(rdev); 1243 1244 vddc_dly = (voltage_response_time * reference_clock) / 1600; 1245 bb_dly = (backbias_response_time * reference_clock) / 1600; 1246 acpi_dly = (acpi_delay_time * reference_clock) / 1600; 1247 vbi_dly = (vbi_time_out * reference_clock) / 1600; 1248 1249 mclk_switch_limit = (460 * reference_clock) / 100; 1250 1251 rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_delay_vreg, vddc_dly); 1252 rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_delay_bbias, bb_dly); 1253 rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_delay_acpi, acpi_dly); 1254 rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_mclk_chg_timeout, vbi_dly); 1255 rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_mc_block_delay, 0xAA); 1256 rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_mclk_switch_lim, mclk_switch_limit); 1257 } 1258 1259 static void ni_populate_smc_voltage_table(struct radeon_device *rdev, 1260 struct atom_voltage_table *voltage_table, 1261 NISLANDS_SMC_STATETABLE *table) 1262 { 1263 unsigned int i; 1264 1265 for (i = 0; i < voltage_table->count; i++) { 1266 table->highSMIO[i] = 0; 1267 table->lowSMIO[i] |= cpu_to_be32(voltage_table->entries[i].smio_low); 1268 } 1269 } 1270 1271 static void ni_populate_smc_voltage_tables(struct radeon_device *rdev, 1272 NISLANDS_SMC_STATETABLE *table) 1273 { 1274 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 1275 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 1276 unsigned char i; 1277 1278 if (eg_pi->vddc_voltage_table.count) { 1279 ni_populate_smc_voltage_table(rdev, &eg_pi->vddc_voltage_table, table); 1280 table->voltageMaskTable.highMask[NISLANDS_SMC_VOLTAGEMASK_VDDC] = 0; 1281 table->voltageMaskTable.lowMask[NISLANDS_SMC_VOLTAGEMASK_VDDC] = 1282 cpu_to_be32(eg_pi->vddc_voltage_table.mask_low); 1283 1284 for (i = 0; i < eg_pi->vddc_voltage_table.count; i++) { 1285 if (pi->max_vddc_in_table <= eg_pi->vddc_voltage_table.entries[i].value) { 1286 table->maxVDDCIndexInPPTable = i; 1287 break; 1288 } 1289 } 1290 } 1291 1292 if (eg_pi->vddci_voltage_table.count) { 1293 ni_populate_smc_voltage_table(rdev, &eg_pi->vddci_voltage_table, table); 1294 1295 table->voltageMaskTable.highMask[NISLANDS_SMC_VOLTAGEMASK_VDDCI] = 0; 1296 table->voltageMaskTable.lowMask[NISLANDS_SMC_VOLTAGEMASK_VDDCI] = 1297 cpu_to_be32(eg_pi->vddci_voltage_table.mask_low); 1298 } 1299 } 1300 1301 static int ni_populate_voltage_value(struct radeon_device *rdev, 1302 struct atom_voltage_table *table, 1303 u16 value, 1304 NISLANDS_SMC_VOLTAGE_VALUE *voltage) 1305 { 1306 unsigned int i; 1307 1308 for (i = 0; i < table->count; i++) { 1309 if (value <= table->entries[i].value) { 1310 voltage->index = (u8)i; 1311 voltage->value = cpu_to_be16(table->entries[i].value); 1312 break; 1313 } 1314 } 1315 1316 if (i >= table->count) 1317 return -EINVAL; 1318 1319 return 0; 1320 } 1321 1322 static void ni_populate_mvdd_value(struct radeon_device *rdev, 1323 u32 mclk, 1324 NISLANDS_SMC_VOLTAGE_VALUE *voltage) 1325 { 1326 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 1327 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 1328 1329 if (!pi->mvdd_control) { 1330 voltage->index = eg_pi->mvdd_high_index; 1331 voltage->value = cpu_to_be16(MVDD_HIGH_VALUE); 1332 return; 1333 } 1334 1335 if (mclk <= pi->mvdd_split_frequency) { 1336 voltage->index = eg_pi->mvdd_low_index; 1337 voltage->value = cpu_to_be16(MVDD_LOW_VALUE); 1338 } else { 1339 voltage->index = eg_pi->mvdd_high_index; 1340 voltage->value = cpu_to_be16(MVDD_HIGH_VALUE); 1341 } 1342 } 1343 1344 static int ni_get_std_voltage_value(struct radeon_device *rdev, 1345 NISLANDS_SMC_VOLTAGE_VALUE *voltage, 1346 u16 *std_voltage) 1347 { 1348 if (rdev->pm.dpm.dyn_state.cac_leakage_table.entries && 1349 ((u32)voltage->index < rdev->pm.dpm.dyn_state.cac_leakage_table.count)) 1350 *std_voltage = rdev->pm.dpm.dyn_state.cac_leakage_table.entries[voltage->index].vddc; 1351 else 1352 *std_voltage = be16_to_cpu(voltage->value); 1353 1354 return 0; 1355 } 1356 1357 static void ni_populate_std_voltage_value(struct radeon_device *rdev, 1358 u16 value, u8 index, 1359 NISLANDS_SMC_VOLTAGE_VALUE *voltage) 1360 { 1361 voltage->index = index; 1362 voltage->value = cpu_to_be16(value); 1363 } 1364 1365 static u32 ni_get_smc_power_scaling_factor(struct radeon_device *rdev) 1366 { 1367 u32 xclk_period; 1368 u32 xclk = radeon_get_xclk(rdev); 1369 u32 tmp = RREG32(CG_CAC_CTRL) & TID_CNT_MASK; 1370 1371 xclk_period = (1000000000UL / xclk); 1372 xclk_period /= 10000UL; 1373 1374 return tmp * xclk_period; 1375 } 1376 1377 static u32 ni_scale_power_for_smc(u32 power_in_watts, u32 scaling_factor) 1378 { 1379 return (power_in_watts * scaling_factor) << 2; 1380 } 1381 1382 static u32 ni_calculate_power_boost_limit(struct radeon_device *rdev, 1383 struct radeon_ps *radeon_state, 1384 u32 near_tdp_limit) 1385 { 1386 struct ni_ps *state = ni_get_ps(radeon_state); 1387 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 1388 struct ni_power_info *ni_pi = ni_get_pi(rdev); 1389 u32 power_boost_limit = 0; 1390 int ret; 1391 1392 if (ni_pi->enable_power_containment && 1393 ni_pi->use_power_boost_limit) { 1394 NISLANDS_SMC_VOLTAGE_VALUE vddc; 1395 u16 std_vddc_med; 1396 u16 std_vddc_high; 1397 u64 tmp, n, d; 1398 1399 if (state->performance_level_count < 3) 1400 return 0; 1401 1402 ret = ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table, 1403 state->performance_levels[state->performance_level_count - 2].vddc, 1404 &vddc); 1405 if (ret) 1406 return 0; 1407 1408 ret = ni_get_std_voltage_value(rdev, &vddc, &std_vddc_med); 1409 if (ret) 1410 return 0; 1411 1412 ret = ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table, 1413 state->performance_levels[state->performance_level_count - 1].vddc, 1414 &vddc); 1415 if (ret) 1416 return 0; 1417 1418 ret = ni_get_std_voltage_value(rdev, &vddc, &std_vddc_high); 1419 if (ret) 1420 return 0; 1421 1422 n = ((u64)near_tdp_limit * ((u64)std_vddc_med * (u64)std_vddc_med) * 90); 1423 d = ((u64)std_vddc_high * (u64)std_vddc_high * 100); 1424 tmp = div64_u64(n, d); 1425 1426 if (tmp >> 32) 1427 return 0; 1428 power_boost_limit = (u32)tmp; 1429 } 1430 1431 return power_boost_limit; 1432 } 1433 1434 static int ni_calculate_adjusted_tdp_limits(struct radeon_device *rdev, 1435 bool adjust_polarity, 1436 u32 tdp_adjustment, 1437 u32 *tdp_limit, 1438 u32 *near_tdp_limit) 1439 { 1440 if (tdp_adjustment > (u32)rdev->pm.dpm.tdp_od_limit) 1441 return -EINVAL; 1442 1443 if (adjust_polarity) { 1444 *tdp_limit = ((100 + tdp_adjustment) * rdev->pm.dpm.tdp_limit) / 100; 1445 *near_tdp_limit = rdev->pm.dpm.near_tdp_limit + (*tdp_limit - rdev->pm.dpm.tdp_limit); 1446 } else { 1447 *tdp_limit = ((100 - tdp_adjustment) * rdev->pm.dpm.tdp_limit) / 100; 1448 *near_tdp_limit = rdev->pm.dpm.near_tdp_limit - (rdev->pm.dpm.tdp_limit - *tdp_limit); 1449 } 1450 1451 return 0; 1452 } 1453 1454 static int ni_populate_smc_tdp_limits(struct radeon_device *rdev, 1455 struct radeon_ps *radeon_state) 1456 { 1457 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 1458 struct ni_power_info *ni_pi = ni_get_pi(rdev); 1459 1460 if (ni_pi->enable_power_containment) { 1461 NISLANDS_SMC_STATETABLE *smc_table = &ni_pi->smc_statetable; 1462 u32 scaling_factor = ni_get_smc_power_scaling_factor(rdev); 1463 u32 tdp_limit; 1464 u32 near_tdp_limit; 1465 u32 power_boost_limit; 1466 int ret; 1467 1468 if (scaling_factor == 0) 1469 return -EINVAL; 1470 1471 memset(smc_table, 0, sizeof(NISLANDS_SMC_STATETABLE)); 1472 1473 ret = ni_calculate_adjusted_tdp_limits(rdev, 1474 false, /* ??? */ 1475 rdev->pm.dpm.tdp_adjustment, 1476 &tdp_limit, 1477 &near_tdp_limit); 1478 if (ret) 1479 return ret; 1480 1481 power_boost_limit = ni_calculate_power_boost_limit(rdev, radeon_state, 1482 near_tdp_limit); 1483 1484 smc_table->dpm2Params.TDPLimit = 1485 cpu_to_be32(ni_scale_power_for_smc(tdp_limit, scaling_factor)); 1486 smc_table->dpm2Params.NearTDPLimit = 1487 cpu_to_be32(ni_scale_power_for_smc(near_tdp_limit, scaling_factor)); 1488 smc_table->dpm2Params.SafePowerLimit = 1489 cpu_to_be32(ni_scale_power_for_smc((near_tdp_limit * NISLANDS_DPM2_TDP_SAFE_LIMIT_PERCENT) / 100, 1490 scaling_factor)); 1491 smc_table->dpm2Params.PowerBoostLimit = 1492 cpu_to_be32(ni_scale_power_for_smc(power_boost_limit, scaling_factor)); 1493 1494 ret = rv770_copy_bytes_to_smc(rdev, 1495 (u16)(pi->state_table_start + offsetof(NISLANDS_SMC_STATETABLE, dpm2Params) + 1496 offsetof(PP_NIslands_DPM2Parameters, TDPLimit)), 1497 (u8 *)(&smc_table->dpm2Params.TDPLimit), 1498 sizeof(u32) * 4, pi->sram_end); 1499 if (ret) 1500 return ret; 1501 } 1502 1503 return 0; 1504 } 1505 1506 int ni_copy_and_switch_arb_sets(struct radeon_device *rdev, 1507 u32 arb_freq_src, u32 arb_freq_dest) 1508 { 1509 u32 mc_arb_dram_timing; 1510 u32 mc_arb_dram_timing2; 1511 u32 burst_time; 1512 u32 mc_cg_config; 1513 1514 switch (arb_freq_src) { 1515 case MC_CG_ARB_FREQ_F0: 1516 mc_arb_dram_timing = RREG32(MC_ARB_DRAM_TIMING); 1517 mc_arb_dram_timing2 = RREG32(MC_ARB_DRAM_TIMING2); 1518 burst_time = (RREG32(MC_ARB_BURST_TIME) & STATE0_MASK) >> STATE0_SHIFT; 1519 break; 1520 case MC_CG_ARB_FREQ_F1: 1521 mc_arb_dram_timing = RREG32(MC_ARB_DRAM_TIMING_1); 1522 mc_arb_dram_timing2 = RREG32(MC_ARB_DRAM_TIMING2_1); 1523 burst_time = (RREG32(MC_ARB_BURST_TIME) & STATE1_MASK) >> STATE1_SHIFT; 1524 break; 1525 case MC_CG_ARB_FREQ_F2: 1526 mc_arb_dram_timing = RREG32(MC_ARB_DRAM_TIMING_2); 1527 mc_arb_dram_timing2 = RREG32(MC_ARB_DRAM_TIMING2_2); 1528 burst_time = (RREG32(MC_ARB_BURST_TIME) & STATE2_MASK) >> STATE2_SHIFT; 1529 break; 1530 case MC_CG_ARB_FREQ_F3: 1531 mc_arb_dram_timing = RREG32(MC_ARB_DRAM_TIMING_3); 1532 mc_arb_dram_timing2 = RREG32(MC_ARB_DRAM_TIMING2_3); 1533 burst_time = (RREG32(MC_ARB_BURST_TIME) & STATE3_MASK) >> STATE3_SHIFT; 1534 break; 1535 default: 1536 return -EINVAL; 1537 } 1538 1539 switch (arb_freq_dest) { 1540 case MC_CG_ARB_FREQ_F0: 1541 WREG32(MC_ARB_DRAM_TIMING, mc_arb_dram_timing); 1542 WREG32(MC_ARB_DRAM_TIMING2, mc_arb_dram_timing2); 1543 WREG32_P(MC_ARB_BURST_TIME, STATE0(burst_time), ~STATE0_MASK); 1544 break; 1545 case MC_CG_ARB_FREQ_F1: 1546 WREG32(MC_ARB_DRAM_TIMING_1, mc_arb_dram_timing); 1547 WREG32(MC_ARB_DRAM_TIMING2_1, mc_arb_dram_timing2); 1548 WREG32_P(MC_ARB_BURST_TIME, STATE1(burst_time), ~STATE1_MASK); 1549 break; 1550 case MC_CG_ARB_FREQ_F2: 1551 WREG32(MC_ARB_DRAM_TIMING_2, mc_arb_dram_timing); 1552 WREG32(MC_ARB_DRAM_TIMING2_2, mc_arb_dram_timing2); 1553 WREG32_P(MC_ARB_BURST_TIME, STATE2(burst_time), ~STATE2_MASK); 1554 break; 1555 case MC_CG_ARB_FREQ_F3: 1556 WREG32(MC_ARB_DRAM_TIMING_3, mc_arb_dram_timing); 1557 WREG32(MC_ARB_DRAM_TIMING2_3, mc_arb_dram_timing2); 1558 WREG32_P(MC_ARB_BURST_TIME, STATE3(burst_time), ~STATE3_MASK); 1559 break; 1560 default: 1561 return -EINVAL; 1562 } 1563 1564 mc_cg_config = RREG32(MC_CG_CONFIG) | 0x0000000F; 1565 WREG32(MC_CG_CONFIG, mc_cg_config); 1566 WREG32_P(MC_ARB_CG, CG_ARB_REQ(arb_freq_dest), ~CG_ARB_REQ_MASK); 1567 1568 return 0; 1569 } 1570 1571 static int ni_init_arb_table_index(struct radeon_device *rdev) 1572 { 1573 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 1574 struct ni_power_info *ni_pi = ni_get_pi(rdev); 1575 u32 tmp; 1576 int ret; 1577 1578 ret = rv770_read_smc_sram_dword(rdev, ni_pi->arb_table_start, 1579 &tmp, pi->sram_end); 1580 if (ret) 1581 return ret; 1582 1583 tmp &= 0x00FFFFFF; 1584 tmp |= ((u32)MC_CG_ARB_FREQ_F1) << 24; 1585 1586 return rv770_write_smc_sram_dword(rdev, ni_pi->arb_table_start, 1587 tmp, pi->sram_end); 1588 } 1589 1590 static int ni_initial_switch_from_arb_f0_to_f1(struct radeon_device *rdev) 1591 { 1592 return ni_copy_and_switch_arb_sets(rdev, MC_CG_ARB_FREQ_F0, MC_CG_ARB_FREQ_F1); 1593 } 1594 1595 static int ni_force_switch_to_arb_f0(struct radeon_device *rdev) 1596 { 1597 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 1598 struct ni_power_info *ni_pi = ni_get_pi(rdev); 1599 u32 tmp; 1600 int ret; 1601 1602 ret = rv770_read_smc_sram_dword(rdev, ni_pi->arb_table_start, 1603 &tmp, pi->sram_end); 1604 if (ret) 1605 return ret; 1606 1607 tmp = (tmp >> 24) & 0xff; 1608 1609 if (tmp == MC_CG_ARB_FREQ_F0) 1610 return 0; 1611 1612 return ni_copy_and_switch_arb_sets(rdev, tmp, MC_CG_ARB_FREQ_F0); 1613 } 1614 1615 static int ni_populate_memory_timing_parameters(struct radeon_device *rdev, 1616 struct rv7xx_pl *pl, 1617 SMC_NIslands_MCArbDramTimingRegisterSet *arb_regs) 1618 { 1619 u32 dram_timing; 1620 u32 dram_timing2; 1621 1622 arb_regs->mc_arb_rfsh_rate = 1623 (u8)rv770_calculate_memory_refresh_rate(rdev, pl->sclk); 1624 1625 1626 radeon_atom_set_engine_dram_timings(rdev, pl->sclk, pl->mclk); 1627 1628 dram_timing = RREG32(MC_ARB_DRAM_TIMING); 1629 dram_timing2 = RREG32(MC_ARB_DRAM_TIMING2); 1630 1631 arb_regs->mc_arb_dram_timing = cpu_to_be32(dram_timing); 1632 arb_regs->mc_arb_dram_timing2 = cpu_to_be32(dram_timing2); 1633 1634 return 0; 1635 } 1636 1637 static int ni_do_program_memory_timing_parameters(struct radeon_device *rdev, 1638 struct radeon_ps *radeon_state, 1639 unsigned int first_arb_set) 1640 { 1641 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 1642 struct ni_power_info *ni_pi = ni_get_pi(rdev); 1643 struct ni_ps *state = ni_get_ps(radeon_state); 1644 SMC_NIslands_MCArbDramTimingRegisterSet arb_regs = { 0 }; 1645 int i, ret = 0; 1646 1647 for (i = 0; i < state->performance_level_count; i++) { 1648 ret = ni_populate_memory_timing_parameters(rdev, &state->performance_levels[i], &arb_regs); 1649 if (ret) 1650 break; 1651 1652 ret = rv770_copy_bytes_to_smc(rdev, 1653 (u16)(ni_pi->arb_table_start + 1654 offsetof(SMC_NIslands_MCArbDramTimingRegisters, data) + 1655 sizeof(SMC_NIslands_MCArbDramTimingRegisterSet) * (first_arb_set + i)), 1656 (u8 *)&arb_regs, 1657 (u16)sizeof(SMC_NIslands_MCArbDramTimingRegisterSet), 1658 pi->sram_end); 1659 if (ret) 1660 break; 1661 } 1662 return ret; 1663 } 1664 1665 static int ni_program_memory_timing_parameters(struct radeon_device *rdev, 1666 struct radeon_ps *radeon_new_state) 1667 { 1668 return ni_do_program_memory_timing_parameters(rdev, radeon_new_state, 1669 NISLANDS_DRIVER_STATE_ARB_INDEX); 1670 } 1671 1672 static void ni_populate_initial_mvdd_value(struct radeon_device *rdev, 1673 struct NISLANDS_SMC_VOLTAGE_VALUE *voltage) 1674 { 1675 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 1676 1677 voltage->index = eg_pi->mvdd_high_index; 1678 voltage->value = cpu_to_be16(MVDD_HIGH_VALUE); 1679 } 1680 1681 static int ni_populate_smc_initial_state(struct radeon_device *rdev, 1682 struct radeon_ps *radeon_initial_state, 1683 NISLANDS_SMC_STATETABLE *table) 1684 { 1685 struct ni_ps *initial_state = ni_get_ps(radeon_initial_state); 1686 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 1687 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 1688 struct ni_power_info *ni_pi = ni_get_pi(rdev); 1689 u32 reg; 1690 int ret; 1691 1692 table->initialState.levels[0].mclk.vMPLL_AD_FUNC_CNTL = 1693 cpu_to_be32(ni_pi->clock_registers.mpll_ad_func_cntl); 1694 table->initialState.levels[0].mclk.vMPLL_AD_FUNC_CNTL_2 = 1695 cpu_to_be32(ni_pi->clock_registers.mpll_ad_func_cntl_2); 1696 table->initialState.levels[0].mclk.vMPLL_DQ_FUNC_CNTL = 1697 cpu_to_be32(ni_pi->clock_registers.mpll_dq_func_cntl); 1698 table->initialState.levels[0].mclk.vMPLL_DQ_FUNC_CNTL_2 = 1699 cpu_to_be32(ni_pi->clock_registers.mpll_dq_func_cntl_2); 1700 table->initialState.levels[0].mclk.vMCLK_PWRMGT_CNTL = 1701 cpu_to_be32(ni_pi->clock_registers.mclk_pwrmgt_cntl); 1702 table->initialState.levels[0].mclk.vDLL_CNTL = 1703 cpu_to_be32(ni_pi->clock_registers.dll_cntl); 1704 table->initialState.levels[0].mclk.vMPLL_SS = 1705 cpu_to_be32(ni_pi->clock_registers.mpll_ss1); 1706 table->initialState.levels[0].mclk.vMPLL_SS2 = 1707 cpu_to_be32(ni_pi->clock_registers.mpll_ss2); 1708 table->initialState.levels[0].mclk.mclk_value = 1709 cpu_to_be32(initial_state->performance_levels[0].mclk); 1710 1711 table->initialState.levels[0].sclk.vCG_SPLL_FUNC_CNTL = 1712 cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl); 1713 table->initialState.levels[0].sclk.vCG_SPLL_FUNC_CNTL_2 = 1714 cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl_2); 1715 table->initialState.levels[0].sclk.vCG_SPLL_FUNC_CNTL_3 = 1716 cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl_3); 1717 table->initialState.levels[0].sclk.vCG_SPLL_FUNC_CNTL_4 = 1718 cpu_to_be32(ni_pi->clock_registers.cg_spll_func_cntl_4); 1719 table->initialState.levels[0].sclk.vCG_SPLL_SPREAD_SPECTRUM = 1720 cpu_to_be32(ni_pi->clock_registers.cg_spll_spread_spectrum); 1721 table->initialState.levels[0].sclk.vCG_SPLL_SPREAD_SPECTRUM_2 = 1722 cpu_to_be32(ni_pi->clock_registers.cg_spll_spread_spectrum_2); 1723 table->initialState.levels[0].sclk.sclk_value = 1724 cpu_to_be32(initial_state->performance_levels[0].sclk); 1725 table->initialState.levels[0].arbRefreshState = 1726 NISLANDS_INITIAL_STATE_ARB_INDEX; 1727 1728 table->initialState.levels[0].ACIndex = 0; 1729 1730 ret = ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table, 1731 initial_state->performance_levels[0].vddc, 1732 &table->initialState.levels[0].vddc); 1733 if (!ret) { 1734 u16 std_vddc; 1735 1736 ret = ni_get_std_voltage_value(rdev, 1737 &table->initialState.levels[0].vddc, 1738 &std_vddc); 1739 if (!ret) 1740 ni_populate_std_voltage_value(rdev, std_vddc, 1741 table->initialState.levels[0].vddc.index, 1742 &table->initialState.levels[0].std_vddc); 1743 } 1744 1745 if (eg_pi->vddci_control) 1746 ni_populate_voltage_value(rdev, 1747 &eg_pi->vddci_voltage_table, 1748 initial_state->performance_levels[0].vddci, 1749 &table->initialState.levels[0].vddci); 1750 1751 ni_populate_initial_mvdd_value(rdev, &table->initialState.levels[0].mvdd); 1752 1753 reg = CG_R(0xffff) | CG_L(0); 1754 table->initialState.levels[0].aT = cpu_to_be32(reg); 1755 1756 table->initialState.levels[0].bSP = cpu_to_be32(pi->dsp); 1757 1758 if (pi->boot_in_gen2) 1759 table->initialState.levels[0].gen2PCIE = 1; 1760 else 1761 table->initialState.levels[0].gen2PCIE = 0; 1762 1763 if (pi->mem_gddr5) { 1764 table->initialState.levels[0].strobeMode = 1765 cypress_get_strobe_mode_settings(rdev, 1766 initial_state->performance_levels[0].mclk); 1767 1768 if (initial_state->performance_levels[0].mclk > pi->mclk_edc_enable_threshold) 1769 table->initialState.levels[0].mcFlags = NISLANDS_SMC_MC_EDC_RD_FLAG | NISLANDS_SMC_MC_EDC_WR_FLAG; 1770 else 1771 table->initialState.levels[0].mcFlags = 0; 1772 } 1773 1774 table->initialState.levelCount = 1; 1775 1776 table->initialState.flags |= PPSMC_SWSTATE_FLAG_DC; 1777 1778 table->initialState.levels[0].dpm2.MaxPS = 0; 1779 table->initialState.levels[0].dpm2.NearTDPDec = 0; 1780 table->initialState.levels[0].dpm2.AboveSafeInc = 0; 1781 table->initialState.levels[0].dpm2.BelowSafeInc = 0; 1782 1783 reg = MIN_POWER_MASK | MAX_POWER_MASK; 1784 table->initialState.levels[0].SQPowerThrottle = cpu_to_be32(reg); 1785 1786 reg = MAX_POWER_DELTA_MASK | STI_SIZE_MASK | LTI_RATIO_MASK; 1787 table->initialState.levels[0].SQPowerThrottle_2 = cpu_to_be32(reg); 1788 1789 return 0; 1790 } 1791 1792 static int ni_populate_smc_acpi_state(struct radeon_device *rdev, 1793 NISLANDS_SMC_STATETABLE *table) 1794 { 1795 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 1796 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 1797 struct ni_power_info *ni_pi = ni_get_pi(rdev); 1798 u32 mpll_ad_func_cntl = ni_pi->clock_registers.mpll_ad_func_cntl; 1799 u32 mpll_ad_func_cntl_2 = ni_pi->clock_registers.mpll_ad_func_cntl_2; 1800 u32 mpll_dq_func_cntl = ni_pi->clock_registers.mpll_dq_func_cntl; 1801 u32 mpll_dq_func_cntl_2 = ni_pi->clock_registers.mpll_dq_func_cntl_2; 1802 u32 spll_func_cntl = ni_pi->clock_registers.cg_spll_func_cntl; 1803 u32 spll_func_cntl_2 = ni_pi->clock_registers.cg_spll_func_cntl_2; 1804 u32 spll_func_cntl_3 = ni_pi->clock_registers.cg_spll_func_cntl_3; 1805 u32 spll_func_cntl_4 = ni_pi->clock_registers.cg_spll_func_cntl_4; 1806 u32 mclk_pwrmgt_cntl = ni_pi->clock_registers.mclk_pwrmgt_cntl; 1807 u32 dll_cntl = ni_pi->clock_registers.dll_cntl; 1808 u32 reg; 1809 int ret; 1810 1811 table->ACPIState = table->initialState; 1812 1813 table->ACPIState.flags &= ~PPSMC_SWSTATE_FLAG_DC; 1814 1815 if (pi->acpi_vddc) { 1816 ret = ni_populate_voltage_value(rdev, 1817 &eg_pi->vddc_voltage_table, 1818 pi->acpi_vddc, &table->ACPIState.levels[0].vddc); 1819 if (!ret) { 1820 u16 std_vddc; 1821 1822 ret = ni_get_std_voltage_value(rdev, 1823 &table->ACPIState.levels[0].vddc, &std_vddc); 1824 if (!ret) 1825 ni_populate_std_voltage_value(rdev, std_vddc, 1826 table->ACPIState.levels[0].vddc.index, 1827 &table->ACPIState.levels[0].std_vddc); 1828 } 1829 1830 if (pi->pcie_gen2) { 1831 if (pi->acpi_pcie_gen2) 1832 table->ACPIState.levels[0].gen2PCIE = 1; 1833 else 1834 table->ACPIState.levels[0].gen2PCIE = 0; 1835 } else { 1836 table->ACPIState.levels[0].gen2PCIE = 0; 1837 } 1838 } else { 1839 ret = ni_populate_voltage_value(rdev, 1840 &eg_pi->vddc_voltage_table, 1841 pi->min_vddc_in_table, 1842 &table->ACPIState.levels[0].vddc); 1843 if (!ret) { 1844 u16 std_vddc; 1845 1846 ret = ni_get_std_voltage_value(rdev, 1847 &table->ACPIState.levels[0].vddc, 1848 &std_vddc); 1849 if (!ret) 1850 ni_populate_std_voltage_value(rdev, std_vddc, 1851 table->ACPIState.levels[0].vddc.index, 1852 &table->ACPIState.levels[0].std_vddc); 1853 } 1854 table->ACPIState.levels[0].gen2PCIE = 0; 1855 } 1856 1857 if (eg_pi->acpi_vddci) { 1858 if (eg_pi->vddci_control) 1859 ni_populate_voltage_value(rdev, 1860 &eg_pi->vddci_voltage_table, 1861 eg_pi->acpi_vddci, 1862 &table->ACPIState.levels[0].vddci); 1863 } 1864 1865 1866 mpll_ad_func_cntl &= ~PDNB; 1867 1868 mpll_ad_func_cntl_2 |= BIAS_GEN_PDNB | RESET_EN; 1869 1870 if (pi->mem_gddr5) 1871 mpll_dq_func_cntl &= ~PDNB; 1872 mpll_dq_func_cntl_2 |= BIAS_GEN_PDNB | RESET_EN | BYPASS; 1873 1874 1875 mclk_pwrmgt_cntl |= (MRDCKA0_RESET | 1876 MRDCKA1_RESET | 1877 MRDCKB0_RESET | 1878 MRDCKB1_RESET | 1879 MRDCKC0_RESET | 1880 MRDCKC1_RESET | 1881 MRDCKD0_RESET | 1882 MRDCKD1_RESET); 1883 1884 mclk_pwrmgt_cntl &= ~(MRDCKA0_PDNB | 1885 MRDCKA1_PDNB | 1886 MRDCKB0_PDNB | 1887 MRDCKB1_PDNB | 1888 MRDCKC0_PDNB | 1889 MRDCKC1_PDNB | 1890 MRDCKD0_PDNB | 1891 MRDCKD1_PDNB); 1892 1893 dll_cntl |= (MRDCKA0_BYPASS | 1894 MRDCKA1_BYPASS | 1895 MRDCKB0_BYPASS | 1896 MRDCKB1_BYPASS | 1897 MRDCKC0_BYPASS | 1898 MRDCKC1_BYPASS | 1899 MRDCKD0_BYPASS | 1900 MRDCKD1_BYPASS); 1901 1902 spll_func_cntl_2 &= ~SCLK_MUX_SEL_MASK; 1903 spll_func_cntl_2 |= SCLK_MUX_SEL(4); 1904 1905 table->ACPIState.levels[0].mclk.vMPLL_AD_FUNC_CNTL = cpu_to_be32(mpll_ad_func_cntl); 1906 table->ACPIState.levels[0].mclk.vMPLL_AD_FUNC_CNTL_2 = cpu_to_be32(mpll_ad_func_cntl_2); 1907 table->ACPIState.levels[0].mclk.vMPLL_DQ_FUNC_CNTL = cpu_to_be32(mpll_dq_func_cntl); 1908 table->ACPIState.levels[0].mclk.vMPLL_DQ_FUNC_CNTL_2 = cpu_to_be32(mpll_dq_func_cntl_2); 1909 table->ACPIState.levels[0].mclk.vMCLK_PWRMGT_CNTL = cpu_to_be32(mclk_pwrmgt_cntl); 1910 table->ACPIState.levels[0].mclk.vDLL_CNTL = cpu_to_be32(dll_cntl); 1911 1912 table->ACPIState.levels[0].mclk.mclk_value = 0; 1913 1914 table->ACPIState.levels[0].sclk.vCG_SPLL_FUNC_CNTL = cpu_to_be32(spll_func_cntl); 1915 table->ACPIState.levels[0].sclk.vCG_SPLL_FUNC_CNTL_2 = cpu_to_be32(spll_func_cntl_2); 1916 table->ACPIState.levels[0].sclk.vCG_SPLL_FUNC_CNTL_3 = cpu_to_be32(spll_func_cntl_3); 1917 table->ACPIState.levels[0].sclk.vCG_SPLL_FUNC_CNTL_4 = cpu_to_be32(spll_func_cntl_4); 1918 1919 table->ACPIState.levels[0].sclk.sclk_value = 0; 1920 1921 ni_populate_mvdd_value(rdev, 0, &table->ACPIState.levels[0].mvdd); 1922 1923 if (eg_pi->dynamic_ac_timing) 1924 table->ACPIState.levels[0].ACIndex = 1; 1925 1926 table->ACPIState.levels[0].dpm2.MaxPS = 0; 1927 table->ACPIState.levels[0].dpm2.NearTDPDec = 0; 1928 table->ACPIState.levels[0].dpm2.AboveSafeInc = 0; 1929 table->ACPIState.levels[0].dpm2.BelowSafeInc = 0; 1930 1931 reg = MIN_POWER_MASK | MAX_POWER_MASK; 1932 table->ACPIState.levels[0].SQPowerThrottle = cpu_to_be32(reg); 1933 1934 reg = MAX_POWER_DELTA_MASK | STI_SIZE_MASK | LTI_RATIO_MASK; 1935 table->ACPIState.levels[0].SQPowerThrottle_2 = cpu_to_be32(reg); 1936 1937 return 0; 1938 } 1939 1940 static int ni_init_smc_table(struct radeon_device *rdev) 1941 { 1942 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 1943 struct ni_power_info *ni_pi = ni_get_pi(rdev); 1944 int ret; 1945 struct radeon_ps *radeon_boot_state = rdev->pm.dpm.boot_ps; 1946 NISLANDS_SMC_STATETABLE *table = &ni_pi->smc_statetable; 1947 1948 memset(table, 0, sizeof(NISLANDS_SMC_STATETABLE)); 1949 1950 ni_populate_smc_voltage_tables(rdev, table); 1951 1952 switch (rdev->pm.int_thermal_type) { 1953 case THERMAL_TYPE_NI: 1954 case THERMAL_TYPE_EMC2103_WITH_INTERNAL: 1955 table->thermalProtectType = PPSMC_THERMAL_PROTECT_TYPE_INTERNAL; 1956 break; 1957 case THERMAL_TYPE_NONE: 1958 table->thermalProtectType = PPSMC_THERMAL_PROTECT_TYPE_NONE; 1959 break; 1960 default: 1961 table->thermalProtectType = PPSMC_THERMAL_PROTECT_TYPE_EXTERNAL; 1962 break; 1963 } 1964 1965 if (rdev->pm.dpm.platform_caps & ATOM_PP_PLATFORM_CAP_HARDWAREDC) 1966 table->systemFlags |= PPSMC_SYSTEMFLAG_GPIO_DC; 1967 1968 if (rdev->pm.dpm.platform_caps & ATOM_PP_PLATFORM_CAP_REGULATOR_HOT) 1969 table->systemFlags |= PPSMC_SYSTEMFLAG_REGULATOR_HOT; 1970 1971 if (rdev->pm.dpm.platform_caps & ATOM_PP_PLATFORM_CAP_STEPVDDC) 1972 table->systemFlags |= PPSMC_SYSTEMFLAG_STEPVDDC; 1973 1974 if (pi->mem_gddr5) 1975 table->systemFlags |= PPSMC_SYSTEMFLAG_GDDR5; 1976 1977 ret = ni_populate_smc_initial_state(rdev, radeon_boot_state, table); 1978 if (ret) 1979 return ret; 1980 1981 ret = ni_populate_smc_acpi_state(rdev, table); 1982 if (ret) 1983 return ret; 1984 1985 table->driverState = table->initialState; 1986 1987 table->ULVState = table->initialState; 1988 1989 ret = ni_do_program_memory_timing_parameters(rdev, radeon_boot_state, 1990 NISLANDS_INITIAL_STATE_ARB_INDEX); 1991 if (ret) 1992 return ret; 1993 1994 return rv770_copy_bytes_to_smc(rdev, pi->state_table_start, (u8 *)table, 1995 sizeof(NISLANDS_SMC_STATETABLE), pi->sram_end); 1996 } 1997 1998 static int ni_calculate_sclk_params(struct radeon_device *rdev, 1999 u32 engine_clock, 2000 NISLANDS_SMC_SCLK_VALUE *sclk) 2001 { 2002 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 2003 struct ni_power_info *ni_pi = ni_get_pi(rdev); 2004 struct atom_clock_dividers dividers; 2005 u32 spll_func_cntl = ni_pi->clock_registers.cg_spll_func_cntl; 2006 u32 spll_func_cntl_2 = ni_pi->clock_registers.cg_spll_func_cntl_2; 2007 u32 spll_func_cntl_3 = ni_pi->clock_registers.cg_spll_func_cntl_3; 2008 u32 spll_func_cntl_4 = ni_pi->clock_registers.cg_spll_func_cntl_4; 2009 u32 cg_spll_spread_spectrum = ni_pi->clock_registers.cg_spll_spread_spectrum; 2010 u32 cg_spll_spread_spectrum_2 = ni_pi->clock_registers.cg_spll_spread_spectrum_2; 2011 u64 tmp; 2012 u32 reference_clock = rdev->clock.spll.reference_freq; 2013 u32 reference_divider; 2014 u32 fbdiv; 2015 int ret; 2016 2017 ret = radeon_atom_get_clock_dividers(rdev, COMPUTE_ENGINE_PLL_PARAM, 2018 engine_clock, false, ÷rs); 2019 if (ret) 2020 return ret; 2021 2022 reference_divider = 1 + dividers.ref_div; 2023 2024 2025 tmp = (u64) engine_clock * reference_divider * dividers.post_div * 16834; 2026 do_div(tmp, reference_clock); 2027 fbdiv = (u32) tmp; 2028 2029 spll_func_cntl &= ~(SPLL_PDIV_A_MASK | SPLL_REF_DIV_MASK); 2030 spll_func_cntl |= SPLL_REF_DIV(dividers.ref_div); 2031 spll_func_cntl |= SPLL_PDIV_A(dividers.post_div); 2032 2033 spll_func_cntl_2 &= ~SCLK_MUX_SEL_MASK; 2034 spll_func_cntl_2 |= SCLK_MUX_SEL(2); 2035 2036 spll_func_cntl_3 &= ~SPLL_FB_DIV_MASK; 2037 spll_func_cntl_3 |= SPLL_FB_DIV(fbdiv); 2038 spll_func_cntl_3 |= SPLL_DITHEN; 2039 2040 if (pi->sclk_ss) { 2041 struct radeon_atom_ss ss; 2042 u32 vco_freq = engine_clock * dividers.post_div; 2043 2044 if (radeon_atombios_get_asic_ss_info(rdev, &ss, 2045 ASIC_INTERNAL_ENGINE_SS, vco_freq)) { 2046 u32 clk_s = reference_clock * 5 / (reference_divider * ss.rate); 2047 u32 clk_v = 4 * ss.percentage * fbdiv / (clk_s * 10000); 2048 2049 cg_spll_spread_spectrum &= ~CLK_S_MASK; 2050 cg_spll_spread_spectrum |= CLK_S(clk_s); 2051 cg_spll_spread_spectrum |= SSEN; 2052 2053 cg_spll_spread_spectrum_2 &= ~CLK_V_MASK; 2054 cg_spll_spread_spectrum_2 |= CLK_V(clk_v); 2055 } 2056 } 2057 2058 sclk->sclk_value = engine_clock; 2059 sclk->vCG_SPLL_FUNC_CNTL = spll_func_cntl; 2060 sclk->vCG_SPLL_FUNC_CNTL_2 = spll_func_cntl_2; 2061 sclk->vCG_SPLL_FUNC_CNTL_3 = spll_func_cntl_3; 2062 sclk->vCG_SPLL_FUNC_CNTL_4 = spll_func_cntl_4; 2063 sclk->vCG_SPLL_SPREAD_SPECTRUM = cg_spll_spread_spectrum; 2064 sclk->vCG_SPLL_SPREAD_SPECTRUM_2 = cg_spll_spread_spectrum_2; 2065 2066 return 0; 2067 } 2068 2069 static int ni_populate_sclk_value(struct radeon_device *rdev, 2070 u32 engine_clock, 2071 NISLANDS_SMC_SCLK_VALUE *sclk) 2072 { 2073 NISLANDS_SMC_SCLK_VALUE sclk_tmp; 2074 int ret; 2075 2076 ret = ni_calculate_sclk_params(rdev, engine_clock, &sclk_tmp); 2077 if (!ret) { 2078 sclk->sclk_value = cpu_to_be32(sclk_tmp.sclk_value); 2079 sclk->vCG_SPLL_FUNC_CNTL = cpu_to_be32(sclk_tmp.vCG_SPLL_FUNC_CNTL); 2080 sclk->vCG_SPLL_FUNC_CNTL_2 = cpu_to_be32(sclk_tmp.vCG_SPLL_FUNC_CNTL_2); 2081 sclk->vCG_SPLL_FUNC_CNTL_3 = cpu_to_be32(sclk_tmp.vCG_SPLL_FUNC_CNTL_3); 2082 sclk->vCG_SPLL_FUNC_CNTL_4 = cpu_to_be32(sclk_tmp.vCG_SPLL_FUNC_CNTL_4); 2083 sclk->vCG_SPLL_SPREAD_SPECTRUM = cpu_to_be32(sclk_tmp.vCG_SPLL_SPREAD_SPECTRUM); 2084 sclk->vCG_SPLL_SPREAD_SPECTRUM_2 = cpu_to_be32(sclk_tmp.vCG_SPLL_SPREAD_SPECTRUM_2); 2085 } 2086 2087 return ret; 2088 } 2089 2090 static int ni_init_smc_spll_table(struct radeon_device *rdev) 2091 { 2092 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 2093 struct ni_power_info *ni_pi = ni_get_pi(rdev); 2094 SMC_NISLANDS_SPLL_DIV_TABLE *spll_table; 2095 NISLANDS_SMC_SCLK_VALUE sclk_params; 2096 u32 fb_div; 2097 u32 p_div; 2098 u32 clk_s; 2099 u32 clk_v; 2100 u32 sclk = 0; 2101 int i, ret; 2102 u32 tmp; 2103 2104 if (ni_pi->spll_table_start == 0) 2105 return -EINVAL; 2106 2107 spll_table = kzalloc(sizeof(SMC_NISLANDS_SPLL_DIV_TABLE), GFP_KERNEL); 2108 if (spll_table == NULL) 2109 return -ENOMEM; 2110 2111 for (i = 0; i < 256; i++) { 2112 ret = ni_calculate_sclk_params(rdev, sclk, &sclk_params); 2113 if (ret) 2114 break; 2115 2116 p_div = (sclk_params.vCG_SPLL_FUNC_CNTL & SPLL_PDIV_A_MASK) >> SPLL_PDIV_A_SHIFT; 2117 fb_div = (sclk_params.vCG_SPLL_FUNC_CNTL_3 & SPLL_FB_DIV_MASK) >> SPLL_FB_DIV_SHIFT; 2118 clk_s = (sclk_params.vCG_SPLL_SPREAD_SPECTRUM & CLK_S_MASK) >> CLK_S_SHIFT; 2119 clk_v = (sclk_params.vCG_SPLL_SPREAD_SPECTRUM_2 & CLK_V_MASK) >> CLK_V_SHIFT; 2120 2121 fb_div &= ~0x00001FFF; 2122 fb_div >>= 1; 2123 clk_v >>= 6; 2124 2125 if (p_div & ~(SMC_NISLANDS_SPLL_DIV_TABLE_PDIV_MASK >> SMC_NISLANDS_SPLL_DIV_TABLE_PDIV_SHIFT)) 2126 ret = -EINVAL; 2127 2128 if (clk_s & ~(SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_MASK >> SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_SHIFT)) 2129 ret = -EINVAL; 2130 2131 if (clk_s & ~(SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_MASK >> SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_SHIFT)) 2132 ret = -EINVAL; 2133 2134 if (clk_v & ~(SMC_NISLANDS_SPLL_DIV_TABLE_CLKV_MASK >> SMC_NISLANDS_SPLL_DIV_TABLE_CLKV_SHIFT)) 2135 ret = -EINVAL; 2136 2137 if (ret) 2138 break; 2139 2140 tmp = ((fb_div << SMC_NISLANDS_SPLL_DIV_TABLE_FBDIV_SHIFT) & SMC_NISLANDS_SPLL_DIV_TABLE_FBDIV_MASK) | 2141 ((p_div << SMC_NISLANDS_SPLL_DIV_TABLE_PDIV_SHIFT) & SMC_NISLANDS_SPLL_DIV_TABLE_PDIV_MASK); 2142 spll_table->freq[i] = cpu_to_be32(tmp); 2143 2144 tmp = ((clk_v << SMC_NISLANDS_SPLL_DIV_TABLE_CLKV_SHIFT) & SMC_NISLANDS_SPLL_DIV_TABLE_CLKV_MASK) | 2145 ((clk_s << SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_SHIFT) & SMC_NISLANDS_SPLL_DIV_TABLE_CLKS_MASK); 2146 spll_table->ss[i] = cpu_to_be32(tmp); 2147 2148 sclk += 512; 2149 } 2150 2151 if (!ret) 2152 ret = rv770_copy_bytes_to_smc(rdev, ni_pi->spll_table_start, (u8 *)spll_table, 2153 sizeof(SMC_NISLANDS_SPLL_DIV_TABLE), pi->sram_end); 2154 2155 kfree(spll_table); 2156 2157 return ret; 2158 } 2159 2160 static int ni_populate_mclk_value(struct radeon_device *rdev, 2161 u32 engine_clock, 2162 u32 memory_clock, 2163 NISLANDS_SMC_MCLK_VALUE *mclk, 2164 bool strobe_mode, 2165 bool dll_state_on) 2166 { 2167 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 2168 struct ni_power_info *ni_pi = ni_get_pi(rdev); 2169 u32 mpll_ad_func_cntl = ni_pi->clock_registers.mpll_ad_func_cntl; 2170 u32 mpll_ad_func_cntl_2 = ni_pi->clock_registers.mpll_ad_func_cntl_2; 2171 u32 mpll_dq_func_cntl = ni_pi->clock_registers.mpll_dq_func_cntl; 2172 u32 mpll_dq_func_cntl_2 = ni_pi->clock_registers.mpll_dq_func_cntl_2; 2173 u32 mclk_pwrmgt_cntl = ni_pi->clock_registers.mclk_pwrmgt_cntl; 2174 u32 dll_cntl = ni_pi->clock_registers.dll_cntl; 2175 u32 mpll_ss1 = ni_pi->clock_registers.mpll_ss1; 2176 u32 mpll_ss2 = ni_pi->clock_registers.mpll_ss2; 2177 struct atom_clock_dividers dividers; 2178 u32 ibias; 2179 u32 dll_speed; 2180 int ret; 2181 u32 mc_seq_misc7; 2182 2183 ret = radeon_atom_get_clock_dividers(rdev, COMPUTE_MEMORY_PLL_PARAM, 2184 memory_clock, strobe_mode, ÷rs); 2185 if (ret) 2186 return ret; 2187 2188 if (!strobe_mode) { 2189 mc_seq_misc7 = RREG32(MC_SEQ_MISC7); 2190 2191 if (mc_seq_misc7 & 0x8000000) 2192 dividers.post_div = 1; 2193 } 2194 2195 ibias = cypress_map_clkf_to_ibias(rdev, dividers.whole_fb_div); 2196 2197 mpll_ad_func_cntl &= ~(CLKR_MASK | 2198 YCLK_POST_DIV_MASK | 2199 CLKF_MASK | 2200 CLKFRAC_MASK | 2201 IBIAS_MASK); 2202 mpll_ad_func_cntl |= CLKR(dividers.ref_div); 2203 mpll_ad_func_cntl |= YCLK_POST_DIV(dividers.post_div); 2204 mpll_ad_func_cntl |= CLKF(dividers.whole_fb_div); 2205 mpll_ad_func_cntl |= CLKFRAC(dividers.frac_fb_div); 2206 mpll_ad_func_cntl |= IBIAS(ibias); 2207 2208 if (dividers.vco_mode) 2209 mpll_ad_func_cntl_2 |= VCO_MODE; 2210 else 2211 mpll_ad_func_cntl_2 &= ~VCO_MODE; 2212 2213 if (pi->mem_gddr5) { 2214 mpll_dq_func_cntl &= ~(CLKR_MASK | 2215 YCLK_POST_DIV_MASK | 2216 CLKF_MASK | 2217 CLKFRAC_MASK | 2218 IBIAS_MASK); 2219 mpll_dq_func_cntl |= CLKR(dividers.ref_div); 2220 mpll_dq_func_cntl |= YCLK_POST_DIV(dividers.post_div); 2221 mpll_dq_func_cntl |= CLKF(dividers.whole_fb_div); 2222 mpll_dq_func_cntl |= CLKFRAC(dividers.frac_fb_div); 2223 mpll_dq_func_cntl |= IBIAS(ibias); 2224 2225 if (strobe_mode) 2226 mpll_dq_func_cntl &= ~PDNB; 2227 else 2228 mpll_dq_func_cntl |= PDNB; 2229 2230 if (dividers.vco_mode) 2231 mpll_dq_func_cntl_2 |= VCO_MODE; 2232 else 2233 mpll_dq_func_cntl_2 &= ~VCO_MODE; 2234 } 2235 2236 if (pi->mclk_ss) { 2237 struct radeon_atom_ss ss; 2238 u32 vco_freq = memory_clock * dividers.post_div; 2239 2240 if (radeon_atombios_get_asic_ss_info(rdev, &ss, 2241 ASIC_INTERNAL_MEMORY_SS, vco_freq)) { 2242 u32 reference_clock = rdev->clock.mpll.reference_freq; 2243 u32 decoded_ref = rv740_get_decoded_reference_divider(dividers.ref_div); 2244 u32 clk_s = reference_clock * 5 / (decoded_ref * ss.rate); 2245 u32 clk_v = ss.percentage * 2246 (0x4000 * dividers.whole_fb_div + 0x800 * dividers.frac_fb_div) / (clk_s * 625); 2247 2248 mpll_ss1 &= ~CLKV_MASK; 2249 mpll_ss1 |= CLKV(clk_v); 2250 2251 mpll_ss2 &= ~CLKS_MASK; 2252 mpll_ss2 |= CLKS(clk_s); 2253 } 2254 } 2255 2256 dll_speed = rv740_get_dll_speed(pi->mem_gddr5, 2257 memory_clock); 2258 2259 mclk_pwrmgt_cntl &= ~DLL_SPEED_MASK; 2260 mclk_pwrmgt_cntl |= DLL_SPEED(dll_speed); 2261 if (dll_state_on) 2262 mclk_pwrmgt_cntl |= (MRDCKA0_PDNB | 2263 MRDCKA1_PDNB | 2264 MRDCKB0_PDNB | 2265 MRDCKB1_PDNB | 2266 MRDCKC0_PDNB | 2267 MRDCKC1_PDNB | 2268 MRDCKD0_PDNB | 2269 MRDCKD1_PDNB); 2270 else 2271 mclk_pwrmgt_cntl &= ~(MRDCKA0_PDNB | 2272 MRDCKA1_PDNB | 2273 MRDCKB0_PDNB | 2274 MRDCKB1_PDNB | 2275 MRDCKC0_PDNB | 2276 MRDCKC1_PDNB | 2277 MRDCKD0_PDNB | 2278 MRDCKD1_PDNB); 2279 2280 2281 mclk->mclk_value = cpu_to_be32(memory_clock); 2282 mclk->vMPLL_AD_FUNC_CNTL = cpu_to_be32(mpll_ad_func_cntl); 2283 mclk->vMPLL_AD_FUNC_CNTL_2 = cpu_to_be32(mpll_ad_func_cntl_2); 2284 mclk->vMPLL_DQ_FUNC_CNTL = cpu_to_be32(mpll_dq_func_cntl); 2285 mclk->vMPLL_DQ_FUNC_CNTL_2 = cpu_to_be32(mpll_dq_func_cntl_2); 2286 mclk->vMCLK_PWRMGT_CNTL = cpu_to_be32(mclk_pwrmgt_cntl); 2287 mclk->vDLL_CNTL = cpu_to_be32(dll_cntl); 2288 mclk->vMPLL_SS = cpu_to_be32(mpll_ss1); 2289 mclk->vMPLL_SS2 = cpu_to_be32(mpll_ss2); 2290 2291 return 0; 2292 } 2293 2294 static void ni_populate_smc_sp(struct radeon_device *rdev, 2295 struct radeon_ps *radeon_state, 2296 NISLANDS_SMC_SWSTATE *smc_state) 2297 { 2298 struct ni_ps *ps = ni_get_ps(radeon_state); 2299 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 2300 int i; 2301 2302 for (i = 0; i < ps->performance_level_count - 1; i++) 2303 smc_state->levels[i].bSP = cpu_to_be32(pi->dsp); 2304 2305 smc_state->levels[ps->performance_level_count - 1].bSP = 2306 cpu_to_be32(pi->psp); 2307 } 2308 2309 static int ni_convert_power_level_to_smc(struct radeon_device *rdev, 2310 struct rv7xx_pl *pl, 2311 NISLANDS_SMC_HW_PERFORMANCE_LEVEL *level) 2312 { 2313 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 2314 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 2315 struct ni_power_info *ni_pi = ni_get_pi(rdev); 2316 int ret; 2317 bool dll_state_on; 2318 u16 std_vddc; 2319 u32 tmp = RREG32(DC_STUTTER_CNTL); 2320 2321 level->gen2PCIE = pi->pcie_gen2 ? 2322 ((pl->flags & ATOM_PPLIB_R600_FLAGS_PCIEGEN2) ? 1 : 0) : 0; 2323 2324 ret = ni_populate_sclk_value(rdev, pl->sclk, &level->sclk); 2325 if (ret) 2326 return ret; 2327 2328 level->mcFlags = 0; 2329 if (pi->mclk_stutter_mode_threshold && 2330 (pl->mclk <= pi->mclk_stutter_mode_threshold) && 2331 !eg_pi->uvd_enabled && 2332 (tmp & DC_STUTTER_ENABLE_A) && 2333 (tmp & DC_STUTTER_ENABLE_B)) 2334 level->mcFlags |= NISLANDS_SMC_MC_STUTTER_EN; 2335 2336 if (pi->mem_gddr5) { 2337 if (pl->mclk > pi->mclk_edc_enable_threshold) 2338 level->mcFlags |= NISLANDS_SMC_MC_EDC_RD_FLAG; 2339 if (pl->mclk > eg_pi->mclk_edc_wr_enable_threshold) 2340 level->mcFlags |= NISLANDS_SMC_MC_EDC_WR_FLAG; 2341 2342 level->strobeMode = cypress_get_strobe_mode_settings(rdev, pl->mclk); 2343 2344 if (level->strobeMode & NISLANDS_SMC_STROBE_ENABLE) { 2345 if (cypress_get_mclk_frequency_ratio(rdev, pl->mclk, true) >= 2346 ((RREG32(MC_SEQ_MISC7) >> 16) & 0xf)) 2347 dll_state_on = ((RREG32(MC_SEQ_MISC5) >> 1) & 0x1) ? true : false; 2348 else 2349 dll_state_on = ((RREG32(MC_SEQ_MISC6) >> 1) & 0x1) ? true : false; 2350 } else { 2351 dll_state_on = false; 2352 if (pl->mclk > ni_pi->mclk_rtt_mode_threshold) 2353 level->mcFlags |= NISLANDS_SMC_MC_RTT_ENABLE; 2354 } 2355 2356 ret = ni_populate_mclk_value(rdev, pl->sclk, pl->mclk, 2357 &level->mclk, 2358 (level->strobeMode & NISLANDS_SMC_STROBE_ENABLE) != 0, 2359 dll_state_on); 2360 } else 2361 ret = ni_populate_mclk_value(rdev, pl->sclk, pl->mclk, &level->mclk, 1, 1); 2362 2363 if (ret) 2364 return ret; 2365 2366 ret = ni_populate_voltage_value(rdev, &eg_pi->vddc_voltage_table, 2367 pl->vddc, &level->vddc); 2368 if (ret) 2369 return ret; 2370 2371 ret = ni_get_std_voltage_value(rdev, &level->vddc, &std_vddc); 2372 if (ret) 2373 return ret; 2374 2375 ni_populate_std_voltage_value(rdev, std_vddc, 2376 level->vddc.index, &level->std_vddc); 2377 2378 if (eg_pi->vddci_control) { 2379 ret = ni_populate_voltage_value(rdev, &eg_pi->vddci_voltage_table, 2380 pl->vddci, &level->vddci); 2381 if (ret) 2382 return ret; 2383 } 2384 2385 ni_populate_mvdd_value(rdev, pl->mclk, &level->mvdd); 2386 2387 return ret; 2388 } 2389 2390 static int ni_populate_smc_t(struct radeon_device *rdev, 2391 struct radeon_ps *radeon_state, 2392 NISLANDS_SMC_SWSTATE *smc_state) 2393 { 2394 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 2395 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 2396 struct ni_ps *state = ni_get_ps(radeon_state); 2397 u32 a_t; 2398 u32 t_l, t_h; 2399 u32 high_bsp; 2400 int i, ret; 2401 2402 if (state->performance_level_count >= 9) 2403 return -EINVAL; 2404 2405 if (state->performance_level_count < 2) { 2406 a_t = CG_R(0xffff) | CG_L(0); 2407 smc_state->levels[0].aT = cpu_to_be32(a_t); 2408 return 0; 2409 } 2410 2411 smc_state->levels[0].aT = cpu_to_be32(0); 2412 2413 for (i = 0; i <= state->performance_level_count - 2; i++) { 2414 if (eg_pi->uvd_enabled) 2415 ret = r600_calculate_at( 2416 1000 * (i * (eg_pi->smu_uvd_hs ? 2 : 8) + 2), 2417 100 * R600_AH_DFLT, 2418 state->performance_levels[i + 1].sclk, 2419 state->performance_levels[i].sclk, 2420 &t_l, 2421 &t_h); 2422 else 2423 ret = r600_calculate_at( 2424 1000 * (i + 1), 2425 100 * R600_AH_DFLT, 2426 state->performance_levels[i + 1].sclk, 2427 state->performance_levels[i].sclk, 2428 &t_l, 2429 &t_h); 2430 2431 if (ret) { 2432 t_h = (i + 1) * 1000 - 50 * R600_AH_DFLT; 2433 t_l = (i + 1) * 1000 + 50 * R600_AH_DFLT; 2434 } 2435 2436 a_t = be32_to_cpu(smc_state->levels[i].aT) & ~CG_R_MASK; 2437 a_t |= CG_R(t_l * pi->bsp / 20000); 2438 smc_state->levels[i].aT = cpu_to_be32(a_t); 2439 2440 high_bsp = (i == state->performance_level_count - 2) ? 2441 pi->pbsp : pi->bsp; 2442 2443 a_t = CG_R(0xffff) | CG_L(t_h * high_bsp / 20000); 2444 smc_state->levels[i + 1].aT = cpu_to_be32(a_t); 2445 } 2446 2447 return 0; 2448 } 2449 2450 static int ni_populate_power_containment_values(struct radeon_device *rdev, 2451 struct radeon_ps *radeon_state, 2452 NISLANDS_SMC_SWSTATE *smc_state) 2453 { 2454 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 2455 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 2456 struct ni_power_info *ni_pi = ni_get_pi(rdev); 2457 struct ni_ps *state = ni_get_ps(radeon_state); 2458 u32 prev_sclk; 2459 u32 max_sclk; 2460 u32 min_sclk; 2461 int i, ret; 2462 u32 tdp_limit; 2463 u32 near_tdp_limit; 2464 u32 power_boost_limit; 2465 u8 max_ps_percent; 2466 2467 if (ni_pi->enable_power_containment == false) 2468 return 0; 2469 2470 if (state->performance_level_count == 0) 2471 return -EINVAL; 2472 2473 if (smc_state->levelCount != state->performance_level_count) 2474 return -EINVAL; 2475 2476 ret = ni_calculate_adjusted_tdp_limits(rdev, 2477 false, /* ??? */ 2478 rdev->pm.dpm.tdp_adjustment, 2479 &tdp_limit, 2480 &near_tdp_limit); 2481 if (ret) 2482 return ret; 2483 2484 power_boost_limit = ni_calculate_power_boost_limit(rdev, radeon_state, near_tdp_limit); 2485 2486 ret = rv770_write_smc_sram_dword(rdev, 2487 pi->state_table_start + 2488 offsetof(NISLANDS_SMC_STATETABLE, dpm2Params) + 2489 offsetof(PP_NIslands_DPM2Parameters, PowerBoostLimit), 2490 ni_scale_power_for_smc(power_boost_limit, ni_get_smc_power_scaling_factor(rdev)), 2491 pi->sram_end); 2492 if (ret) 2493 power_boost_limit = 0; 2494 2495 smc_state->levels[0].dpm2.MaxPS = 0; 2496 smc_state->levels[0].dpm2.NearTDPDec = 0; 2497 smc_state->levels[0].dpm2.AboveSafeInc = 0; 2498 smc_state->levels[0].dpm2.BelowSafeInc = 0; 2499 smc_state->levels[0].stateFlags |= power_boost_limit ? PPSMC_STATEFLAG_POWERBOOST : 0; 2500 2501 for (i = 1; i < state->performance_level_count; i++) { 2502 prev_sclk = state->performance_levels[i-1].sclk; 2503 max_sclk = state->performance_levels[i].sclk; 2504 max_ps_percent = (i != (state->performance_level_count - 1)) ? 2505 NISLANDS_DPM2_MAXPS_PERCENT_M : NISLANDS_DPM2_MAXPS_PERCENT_H; 2506 2507 if (max_sclk < prev_sclk) 2508 return -EINVAL; 2509 2510 if ((max_ps_percent == 0) || (prev_sclk == max_sclk) || eg_pi->uvd_enabled) 2511 min_sclk = max_sclk; 2512 else if (1 == i) 2513 min_sclk = prev_sclk; 2514 else 2515 min_sclk = (prev_sclk * (u32)max_ps_percent) / 100; 2516 2517 if (min_sclk < state->performance_levels[0].sclk) 2518 min_sclk = state->performance_levels[0].sclk; 2519 2520 if (min_sclk == 0) 2521 return -EINVAL; 2522 2523 smc_state->levels[i].dpm2.MaxPS = 2524 (u8)((NISLANDS_DPM2_MAX_PULSE_SKIP * (max_sclk - min_sclk)) / max_sclk); 2525 smc_state->levels[i].dpm2.NearTDPDec = NISLANDS_DPM2_NEAR_TDP_DEC; 2526 smc_state->levels[i].dpm2.AboveSafeInc = NISLANDS_DPM2_ABOVE_SAFE_INC; 2527 smc_state->levels[i].dpm2.BelowSafeInc = NISLANDS_DPM2_BELOW_SAFE_INC; 2528 smc_state->levels[i].stateFlags |= 2529 ((i != (state->performance_level_count - 1)) && power_boost_limit) ? 2530 PPSMC_STATEFLAG_POWERBOOST : 0; 2531 } 2532 2533 return 0; 2534 } 2535 2536 static int ni_populate_sq_ramping_values(struct radeon_device *rdev, 2537 struct radeon_ps *radeon_state, 2538 NISLANDS_SMC_SWSTATE *smc_state) 2539 { 2540 struct ni_power_info *ni_pi = ni_get_pi(rdev); 2541 struct ni_ps *state = ni_get_ps(radeon_state); 2542 u32 sq_power_throttle; 2543 u32 sq_power_throttle2; 2544 bool enable_sq_ramping = ni_pi->enable_sq_ramping; 2545 int i; 2546 2547 if (state->performance_level_count == 0) 2548 return -EINVAL; 2549 2550 if (smc_state->levelCount != state->performance_level_count) 2551 return -EINVAL; 2552 2553 if (rdev->pm.dpm.sq_ramping_threshold == 0) 2554 return -EINVAL; 2555 2556 if (NISLANDS_DPM2_SQ_RAMP_MAX_POWER > (MAX_POWER_MASK >> MAX_POWER_SHIFT)) 2557 enable_sq_ramping = false; 2558 2559 if (NISLANDS_DPM2_SQ_RAMP_MIN_POWER > (MIN_POWER_MASK >> MIN_POWER_SHIFT)) 2560 enable_sq_ramping = false; 2561 2562 if (NISLANDS_DPM2_SQ_RAMP_MAX_POWER_DELTA > (MAX_POWER_DELTA_MASK >> MAX_POWER_DELTA_SHIFT)) 2563 enable_sq_ramping = false; 2564 2565 if (NISLANDS_DPM2_SQ_RAMP_STI_SIZE > (STI_SIZE_MASK >> STI_SIZE_SHIFT)) 2566 enable_sq_ramping = false; 2567 2568 if (NISLANDS_DPM2_SQ_RAMP_LTI_RATIO > (LTI_RATIO_MASK >> LTI_RATIO_SHIFT)) 2569 enable_sq_ramping = false; 2570 2571 for (i = 0; i < state->performance_level_count; i++) { 2572 sq_power_throttle = 0; 2573 sq_power_throttle2 = 0; 2574 2575 if ((state->performance_levels[i].sclk >= rdev->pm.dpm.sq_ramping_threshold) && 2576 enable_sq_ramping) { 2577 sq_power_throttle |= MAX_POWER(NISLANDS_DPM2_SQ_RAMP_MAX_POWER); 2578 sq_power_throttle |= MIN_POWER(NISLANDS_DPM2_SQ_RAMP_MIN_POWER); 2579 sq_power_throttle2 |= MAX_POWER_DELTA(NISLANDS_DPM2_SQ_RAMP_MAX_POWER_DELTA); 2580 sq_power_throttle2 |= STI_SIZE(NISLANDS_DPM2_SQ_RAMP_STI_SIZE); 2581 sq_power_throttle2 |= LTI_RATIO(NISLANDS_DPM2_SQ_RAMP_LTI_RATIO); 2582 } else { 2583 sq_power_throttle |= MAX_POWER_MASK | MIN_POWER_MASK; 2584 sq_power_throttle2 |= MAX_POWER_DELTA_MASK | STI_SIZE_MASK | LTI_RATIO_MASK; 2585 } 2586 2587 smc_state->levels[i].SQPowerThrottle = cpu_to_be32(sq_power_throttle); 2588 smc_state->levels[i].SQPowerThrottle_2 = cpu_to_be32(sq_power_throttle2); 2589 } 2590 2591 return 0; 2592 } 2593 2594 static int ni_enable_power_containment(struct radeon_device *rdev, 2595 struct radeon_ps *radeon_new_state, 2596 bool enable) 2597 { 2598 struct ni_power_info *ni_pi = ni_get_pi(rdev); 2599 PPSMC_Result smc_result; 2600 int ret = 0; 2601 2602 if (ni_pi->enable_power_containment) { 2603 if (enable) { 2604 if (!r600_is_uvd_state(radeon_new_state->class, radeon_new_state->class2)) { 2605 smc_result = rv770_send_msg_to_smc(rdev, PPSMC_TDPClampingActive); 2606 if (smc_result != PPSMC_Result_OK) { 2607 ret = -EINVAL; 2608 ni_pi->pc_enabled = false; 2609 } else { 2610 ni_pi->pc_enabled = true; 2611 } 2612 } 2613 } else { 2614 smc_result = rv770_send_msg_to_smc(rdev, PPSMC_TDPClampingInactive); 2615 if (smc_result != PPSMC_Result_OK) 2616 ret = -EINVAL; 2617 ni_pi->pc_enabled = false; 2618 } 2619 } 2620 2621 return ret; 2622 } 2623 2624 static int ni_convert_power_state_to_smc(struct radeon_device *rdev, 2625 struct radeon_ps *radeon_state, 2626 NISLANDS_SMC_SWSTATE *smc_state) 2627 { 2628 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 2629 struct ni_power_info *ni_pi = ni_get_pi(rdev); 2630 struct ni_ps *state = ni_get_ps(radeon_state); 2631 int i, ret; 2632 u32 threshold = state->performance_levels[state->performance_level_count - 1].sclk * 100 / 100; 2633 2634 if (!(radeon_state->caps & ATOM_PPLIB_DISALLOW_ON_DC)) 2635 smc_state->flags |= PPSMC_SWSTATE_FLAG_DC; 2636 2637 smc_state->levelCount = 0; 2638 2639 if (state->performance_level_count > NISLANDS_MAX_SMC_PERFORMANCE_LEVELS_PER_SWSTATE) 2640 return -EINVAL; 2641 2642 for (i = 0; i < state->performance_level_count; i++) { 2643 ret = ni_convert_power_level_to_smc(rdev, &state->performance_levels[i], 2644 &smc_state->levels[i]); 2645 smc_state->levels[i].arbRefreshState = 2646 (u8)(NISLANDS_DRIVER_STATE_ARB_INDEX + i); 2647 2648 if (ret) 2649 return ret; 2650 2651 if (ni_pi->enable_power_containment) 2652 smc_state->levels[i].displayWatermark = 2653 (state->performance_levels[i].sclk < threshold) ? 2654 PPSMC_DISPLAY_WATERMARK_LOW : PPSMC_DISPLAY_WATERMARK_HIGH; 2655 else 2656 smc_state->levels[i].displayWatermark = (i < 2) ? 2657 PPSMC_DISPLAY_WATERMARK_LOW : PPSMC_DISPLAY_WATERMARK_HIGH; 2658 2659 if (eg_pi->dynamic_ac_timing) 2660 smc_state->levels[i].ACIndex = NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT + i; 2661 else 2662 smc_state->levels[i].ACIndex = 0; 2663 2664 smc_state->levelCount++; 2665 } 2666 2667 rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_watermark_threshold, 2668 cpu_to_be32(threshold / 512)); 2669 2670 ni_populate_smc_sp(rdev, radeon_state, smc_state); 2671 2672 ret = ni_populate_power_containment_values(rdev, radeon_state, smc_state); 2673 if (ret) 2674 ni_pi->enable_power_containment = false; 2675 2676 ret = ni_populate_sq_ramping_values(rdev, radeon_state, smc_state); 2677 if (ret) 2678 ni_pi->enable_sq_ramping = false; 2679 2680 return ni_populate_smc_t(rdev, radeon_state, smc_state); 2681 } 2682 2683 static int ni_upload_sw_state(struct radeon_device *rdev, 2684 struct radeon_ps *radeon_new_state) 2685 { 2686 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 2687 u16 address = pi->state_table_start + 2688 offsetof(NISLANDS_SMC_STATETABLE, driverState); 2689 u16 state_size = sizeof(NISLANDS_SMC_SWSTATE) + 2690 ((NISLANDS_MAX_SMC_PERFORMANCE_LEVELS_PER_SWSTATE - 1) * sizeof(NISLANDS_SMC_HW_PERFORMANCE_LEVEL)); 2691 int ret; 2692 NISLANDS_SMC_SWSTATE *smc_state = kzalloc(state_size, GFP_KERNEL); 2693 2694 if (smc_state == NULL) 2695 return -ENOMEM; 2696 2697 ret = ni_convert_power_state_to_smc(rdev, radeon_new_state, smc_state); 2698 if (ret) 2699 goto done; 2700 2701 ret = rv770_copy_bytes_to_smc(rdev, address, (u8 *)smc_state, state_size, pi->sram_end); 2702 2703 done: 2704 kfree(smc_state); 2705 2706 return ret; 2707 } 2708 2709 static int ni_set_mc_special_registers(struct radeon_device *rdev, 2710 struct ni_mc_reg_table *table) 2711 { 2712 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 2713 u8 i, j, k; 2714 u32 temp_reg; 2715 2716 for (i = 0, j = table->last; i < table->last; i++) { 2717 switch (table->mc_reg_address[i].s1) { 2718 case MC_SEQ_MISC1 >> 2: 2719 if (j >= SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE) 2720 return -EINVAL; 2721 temp_reg = RREG32(MC_PMG_CMD_EMRS); 2722 table->mc_reg_address[j].s1 = MC_PMG_CMD_EMRS >> 2; 2723 table->mc_reg_address[j].s0 = MC_SEQ_PMG_CMD_EMRS_LP >> 2; 2724 for (k = 0; k < table->num_entries; k++) 2725 table->mc_reg_table_entry[k].mc_data[j] = 2726 ((temp_reg & 0xffff0000)) | 2727 ((table->mc_reg_table_entry[k].mc_data[i] & 0xffff0000) >> 16); 2728 j++; 2729 if (j >= SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE) 2730 return -EINVAL; 2731 2732 temp_reg = RREG32(MC_PMG_CMD_MRS); 2733 table->mc_reg_address[j].s1 = MC_PMG_CMD_MRS >> 2; 2734 table->mc_reg_address[j].s0 = MC_SEQ_PMG_CMD_MRS_LP >> 2; 2735 for(k = 0; k < table->num_entries; k++) { 2736 table->mc_reg_table_entry[k].mc_data[j] = 2737 (temp_reg & 0xffff0000) | 2738 (table->mc_reg_table_entry[k].mc_data[i] & 0x0000ffff); 2739 if (!pi->mem_gddr5) 2740 table->mc_reg_table_entry[k].mc_data[j] |= 0x100; 2741 } 2742 j++; 2743 if (j > SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE) 2744 return -EINVAL; 2745 break; 2746 case MC_SEQ_RESERVE_M >> 2: 2747 temp_reg = RREG32(MC_PMG_CMD_MRS1); 2748 table->mc_reg_address[j].s1 = MC_PMG_CMD_MRS1 >> 2; 2749 table->mc_reg_address[j].s0 = MC_SEQ_PMG_CMD_MRS1_LP >> 2; 2750 for (k = 0; k < table->num_entries; k++) 2751 table->mc_reg_table_entry[k].mc_data[j] = 2752 (temp_reg & 0xffff0000) | 2753 (table->mc_reg_table_entry[k].mc_data[i] & 0x0000ffff); 2754 j++; 2755 if (j > SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE) 2756 return -EINVAL; 2757 break; 2758 default: 2759 break; 2760 } 2761 } 2762 2763 table->last = j; 2764 2765 return 0; 2766 } 2767 2768 static bool ni_check_s0_mc_reg_index(u16 in_reg, u16 *out_reg) 2769 { 2770 bool result = true; 2771 2772 switch (in_reg) { 2773 case MC_SEQ_RAS_TIMING >> 2: 2774 *out_reg = MC_SEQ_RAS_TIMING_LP >> 2; 2775 break; 2776 case MC_SEQ_CAS_TIMING >> 2: 2777 *out_reg = MC_SEQ_CAS_TIMING_LP >> 2; 2778 break; 2779 case MC_SEQ_MISC_TIMING >> 2: 2780 *out_reg = MC_SEQ_MISC_TIMING_LP >> 2; 2781 break; 2782 case MC_SEQ_MISC_TIMING2 >> 2: 2783 *out_reg = MC_SEQ_MISC_TIMING2_LP >> 2; 2784 break; 2785 case MC_SEQ_RD_CTL_D0 >> 2: 2786 *out_reg = MC_SEQ_RD_CTL_D0_LP >> 2; 2787 break; 2788 case MC_SEQ_RD_CTL_D1 >> 2: 2789 *out_reg = MC_SEQ_RD_CTL_D1_LP >> 2; 2790 break; 2791 case MC_SEQ_WR_CTL_D0 >> 2: 2792 *out_reg = MC_SEQ_WR_CTL_D0_LP >> 2; 2793 break; 2794 case MC_SEQ_WR_CTL_D1 >> 2: 2795 *out_reg = MC_SEQ_WR_CTL_D1_LP >> 2; 2796 break; 2797 case MC_PMG_CMD_EMRS >> 2: 2798 *out_reg = MC_SEQ_PMG_CMD_EMRS_LP >> 2; 2799 break; 2800 case MC_PMG_CMD_MRS >> 2: 2801 *out_reg = MC_SEQ_PMG_CMD_MRS_LP >> 2; 2802 break; 2803 case MC_PMG_CMD_MRS1 >> 2: 2804 *out_reg = MC_SEQ_PMG_CMD_MRS1_LP >> 2; 2805 break; 2806 case MC_SEQ_PMG_TIMING >> 2: 2807 *out_reg = MC_SEQ_PMG_TIMING_LP >> 2; 2808 break; 2809 case MC_PMG_CMD_MRS2 >> 2: 2810 *out_reg = MC_SEQ_PMG_CMD_MRS2_LP >> 2; 2811 break; 2812 default: 2813 result = false; 2814 break; 2815 } 2816 2817 return result; 2818 } 2819 2820 static void ni_set_valid_flag(struct ni_mc_reg_table *table) 2821 { 2822 u8 i, j; 2823 2824 for (i = 0; i < table->last; i++) { 2825 for (j = 1; j < table->num_entries; j++) { 2826 if (table->mc_reg_table_entry[j-1].mc_data[i] != table->mc_reg_table_entry[j].mc_data[i]) { 2827 table->valid_flag |= 1 << i; 2828 break; 2829 } 2830 } 2831 } 2832 } 2833 2834 static void ni_set_s0_mc_reg_index(struct ni_mc_reg_table *table) 2835 { 2836 u32 i; 2837 u16 address; 2838 2839 for (i = 0; i < table->last; i++) 2840 table->mc_reg_address[i].s0 = 2841 ni_check_s0_mc_reg_index(table->mc_reg_address[i].s1, &address) ? 2842 address : table->mc_reg_address[i].s1; 2843 } 2844 2845 static int ni_copy_vbios_mc_reg_table(struct atom_mc_reg_table *table, 2846 struct ni_mc_reg_table *ni_table) 2847 { 2848 u8 i, j; 2849 2850 if (table->last > SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE) 2851 return -EINVAL; 2852 if (table->num_entries > MAX_AC_TIMING_ENTRIES) 2853 return -EINVAL; 2854 2855 for (i = 0; i < table->last; i++) 2856 ni_table->mc_reg_address[i].s1 = table->mc_reg_address[i].s1; 2857 ni_table->last = table->last; 2858 2859 for (i = 0; i < table->num_entries; i++) { 2860 ni_table->mc_reg_table_entry[i].mclk_max = 2861 table->mc_reg_table_entry[i].mclk_max; 2862 for (j = 0; j < table->last; j++) 2863 ni_table->mc_reg_table_entry[i].mc_data[j] = 2864 table->mc_reg_table_entry[i].mc_data[j]; 2865 } 2866 ni_table->num_entries = table->num_entries; 2867 2868 return 0; 2869 } 2870 2871 static int ni_initialize_mc_reg_table(struct radeon_device *rdev) 2872 { 2873 struct ni_power_info *ni_pi = ni_get_pi(rdev); 2874 int ret; 2875 struct atom_mc_reg_table *table; 2876 struct ni_mc_reg_table *ni_table = &ni_pi->mc_reg_table; 2877 u8 module_index = rv770_get_memory_module_index(rdev); 2878 2879 table = kzalloc(sizeof(struct atom_mc_reg_table), GFP_KERNEL); 2880 if (!table) 2881 return -ENOMEM; 2882 2883 WREG32(MC_SEQ_RAS_TIMING_LP, RREG32(MC_SEQ_RAS_TIMING)); 2884 WREG32(MC_SEQ_CAS_TIMING_LP, RREG32(MC_SEQ_CAS_TIMING)); 2885 WREG32(MC_SEQ_MISC_TIMING_LP, RREG32(MC_SEQ_MISC_TIMING)); 2886 WREG32(MC_SEQ_MISC_TIMING2_LP, RREG32(MC_SEQ_MISC_TIMING2)); 2887 WREG32(MC_SEQ_PMG_CMD_EMRS_LP, RREG32(MC_PMG_CMD_EMRS)); 2888 WREG32(MC_SEQ_PMG_CMD_MRS_LP, RREG32(MC_PMG_CMD_MRS)); 2889 WREG32(MC_SEQ_PMG_CMD_MRS1_LP, RREG32(MC_PMG_CMD_MRS1)); 2890 WREG32(MC_SEQ_WR_CTL_D0_LP, RREG32(MC_SEQ_WR_CTL_D0)); 2891 WREG32(MC_SEQ_WR_CTL_D1_LP, RREG32(MC_SEQ_WR_CTL_D1)); 2892 WREG32(MC_SEQ_RD_CTL_D0_LP, RREG32(MC_SEQ_RD_CTL_D0)); 2893 WREG32(MC_SEQ_RD_CTL_D1_LP, RREG32(MC_SEQ_RD_CTL_D1)); 2894 WREG32(MC_SEQ_PMG_TIMING_LP, RREG32(MC_SEQ_PMG_TIMING)); 2895 WREG32(MC_SEQ_PMG_CMD_MRS2_LP, RREG32(MC_PMG_CMD_MRS2)); 2896 2897 ret = radeon_atom_init_mc_reg_table(rdev, module_index, table); 2898 2899 if (ret) 2900 goto init_mc_done; 2901 2902 ret = ni_copy_vbios_mc_reg_table(table, ni_table); 2903 2904 if (ret) 2905 goto init_mc_done; 2906 2907 ni_set_s0_mc_reg_index(ni_table); 2908 2909 ret = ni_set_mc_special_registers(rdev, ni_table); 2910 2911 if (ret) 2912 goto init_mc_done; 2913 2914 ni_set_valid_flag(ni_table); 2915 2916 init_mc_done: 2917 kfree(table); 2918 2919 return ret; 2920 } 2921 2922 static void ni_populate_mc_reg_addresses(struct radeon_device *rdev, 2923 SMC_NIslands_MCRegisters *mc_reg_table) 2924 { 2925 struct ni_power_info *ni_pi = ni_get_pi(rdev); 2926 u32 i, j; 2927 2928 for (i = 0, j = 0; j < ni_pi->mc_reg_table.last; j++) { 2929 if (ni_pi->mc_reg_table.valid_flag & (1 << j)) { 2930 if (i >= SMC_NISLANDS_MC_REGISTER_ARRAY_SIZE) 2931 break; 2932 mc_reg_table->address[i].s0 = 2933 cpu_to_be16(ni_pi->mc_reg_table.mc_reg_address[j].s0); 2934 mc_reg_table->address[i].s1 = 2935 cpu_to_be16(ni_pi->mc_reg_table.mc_reg_address[j].s1); 2936 i++; 2937 } 2938 } 2939 mc_reg_table->last = (u8)i; 2940 } 2941 2942 2943 static void ni_convert_mc_registers(struct ni_mc_reg_entry *entry, 2944 SMC_NIslands_MCRegisterSet *data, 2945 u32 num_entries, u32 valid_flag) 2946 { 2947 u32 i, j; 2948 2949 for (i = 0, j = 0; j < num_entries; j++) { 2950 if (valid_flag & (1 << j)) { 2951 data->value[i] = cpu_to_be32(entry->mc_data[j]); 2952 i++; 2953 } 2954 } 2955 } 2956 2957 static void ni_convert_mc_reg_table_entry_to_smc(struct radeon_device *rdev, 2958 struct rv7xx_pl *pl, 2959 SMC_NIslands_MCRegisterSet *mc_reg_table_data) 2960 { 2961 struct ni_power_info *ni_pi = ni_get_pi(rdev); 2962 u32 i = 0; 2963 2964 for (i = 0; i < ni_pi->mc_reg_table.num_entries; i++) { 2965 if (pl->mclk <= ni_pi->mc_reg_table.mc_reg_table_entry[i].mclk_max) 2966 break; 2967 } 2968 2969 if ((i == ni_pi->mc_reg_table.num_entries) && (i > 0)) 2970 --i; 2971 2972 ni_convert_mc_registers(&ni_pi->mc_reg_table.mc_reg_table_entry[i], 2973 mc_reg_table_data, 2974 ni_pi->mc_reg_table.last, 2975 ni_pi->mc_reg_table.valid_flag); 2976 } 2977 2978 static void ni_convert_mc_reg_table_to_smc(struct radeon_device *rdev, 2979 struct radeon_ps *radeon_state, 2980 SMC_NIslands_MCRegisters *mc_reg_table) 2981 { 2982 struct ni_ps *state = ni_get_ps(radeon_state); 2983 int i; 2984 2985 for (i = 0; i < state->performance_level_count; i++) { 2986 ni_convert_mc_reg_table_entry_to_smc(rdev, 2987 &state->performance_levels[i], 2988 &mc_reg_table->data[NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT + i]); 2989 } 2990 } 2991 2992 static int ni_populate_mc_reg_table(struct radeon_device *rdev, 2993 struct radeon_ps *radeon_boot_state) 2994 { 2995 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 2996 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 2997 struct ni_power_info *ni_pi = ni_get_pi(rdev); 2998 struct ni_ps *boot_state = ni_get_ps(radeon_boot_state); 2999 SMC_NIslands_MCRegisters *mc_reg_table = &ni_pi->smc_mc_reg_table; 3000 3001 memset(mc_reg_table, 0, sizeof(SMC_NIslands_MCRegisters)); 3002 3003 rv770_write_smc_soft_register(rdev, NI_SMC_SOFT_REGISTER_seq_index, 1); 3004 3005 ni_populate_mc_reg_addresses(rdev, mc_reg_table); 3006 3007 ni_convert_mc_reg_table_entry_to_smc(rdev, &boot_state->performance_levels[0], 3008 &mc_reg_table->data[0]); 3009 3010 ni_convert_mc_registers(&ni_pi->mc_reg_table.mc_reg_table_entry[0], 3011 &mc_reg_table->data[1], 3012 ni_pi->mc_reg_table.last, 3013 ni_pi->mc_reg_table.valid_flag); 3014 3015 ni_convert_mc_reg_table_to_smc(rdev, radeon_boot_state, mc_reg_table); 3016 3017 return rv770_copy_bytes_to_smc(rdev, eg_pi->mc_reg_table_start, 3018 (u8 *)mc_reg_table, 3019 sizeof(SMC_NIslands_MCRegisters), 3020 pi->sram_end); 3021 } 3022 3023 static int ni_upload_mc_reg_table(struct radeon_device *rdev, 3024 struct radeon_ps *radeon_new_state) 3025 { 3026 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 3027 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 3028 struct ni_power_info *ni_pi = ni_get_pi(rdev); 3029 struct ni_ps *ni_new_state = ni_get_ps(radeon_new_state); 3030 SMC_NIslands_MCRegisters *mc_reg_table = &ni_pi->smc_mc_reg_table; 3031 u16 address; 3032 3033 memset(mc_reg_table, 0, sizeof(SMC_NIslands_MCRegisters)); 3034 3035 ni_convert_mc_reg_table_to_smc(rdev, radeon_new_state, mc_reg_table); 3036 3037 address = eg_pi->mc_reg_table_start + 3038 (u16)offsetof(SMC_NIslands_MCRegisters, data[NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT]); 3039 3040 return rv770_copy_bytes_to_smc(rdev, address, 3041 (u8 *)&mc_reg_table->data[NISLANDS_MCREGISTERTABLE_FIRST_DRIVERSTATE_SLOT], 3042 sizeof(SMC_NIslands_MCRegisterSet) * ni_new_state->performance_level_count, 3043 pi->sram_end); 3044 } 3045 3046 static int ni_init_driver_calculated_leakage_table(struct radeon_device *rdev, 3047 PP_NIslands_CACTABLES *cac_tables) 3048 { 3049 struct ni_power_info *ni_pi = ni_get_pi(rdev); 3050 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 3051 u32 leakage = 0; 3052 unsigned int i, j, table_size; 3053 s32 t; 3054 u32 smc_leakage, max_leakage = 0; 3055 u32 scaling_factor; 3056 3057 table_size = eg_pi->vddc_voltage_table.count; 3058 3059 if (SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES < table_size) 3060 table_size = SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES; 3061 3062 scaling_factor = ni_get_smc_power_scaling_factor(rdev); 3063 3064 for (i = 0; i < SMC_NISLANDS_LKGE_LUT_NUM_OF_TEMP_ENTRIES; i++) { 3065 for (j = 0; j < table_size; j++) { 3066 t = (1000 * ((i + 1) * 8)); 3067 3068 if (t < ni_pi->cac_data.leakage_minimum_temperature) 3069 t = ni_pi->cac_data.leakage_minimum_temperature; 3070 3071 ni_calculate_leakage_for_v_and_t(rdev, 3072 &ni_pi->cac_data.leakage_coefficients, 3073 eg_pi->vddc_voltage_table.entries[j].value, 3074 t, 3075 ni_pi->cac_data.i_leakage, 3076 &leakage); 3077 3078 smc_leakage = ni_scale_power_for_smc(leakage, scaling_factor) / 1000; 3079 if (smc_leakage > max_leakage) 3080 max_leakage = smc_leakage; 3081 3082 cac_tables->cac_lkge_lut[i][j] = cpu_to_be32(smc_leakage); 3083 } 3084 } 3085 3086 for (j = table_size; j < SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES; j++) { 3087 for (i = 0; i < SMC_NISLANDS_LKGE_LUT_NUM_OF_TEMP_ENTRIES; i++) 3088 cac_tables->cac_lkge_lut[i][j] = cpu_to_be32(max_leakage); 3089 } 3090 return 0; 3091 } 3092 3093 static int ni_init_simplified_leakage_table(struct radeon_device *rdev, 3094 PP_NIslands_CACTABLES *cac_tables) 3095 { 3096 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 3097 struct radeon_cac_leakage_table *leakage_table = 3098 &rdev->pm.dpm.dyn_state.cac_leakage_table; 3099 u32 i, j, table_size; 3100 u32 smc_leakage, max_leakage = 0; 3101 u32 scaling_factor; 3102 3103 if (!leakage_table) 3104 return -EINVAL; 3105 3106 table_size = leakage_table->count; 3107 3108 if (eg_pi->vddc_voltage_table.count != table_size) 3109 table_size = (eg_pi->vddc_voltage_table.count < leakage_table->count) ? 3110 eg_pi->vddc_voltage_table.count : leakage_table->count; 3111 3112 if (SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES < table_size) 3113 table_size = SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES; 3114 3115 if (table_size == 0) 3116 return -EINVAL; 3117 3118 scaling_factor = ni_get_smc_power_scaling_factor(rdev); 3119 3120 for (j = 0; j < table_size; j++) { 3121 smc_leakage = leakage_table->entries[j].leakage; 3122 3123 if (smc_leakage > max_leakage) 3124 max_leakage = smc_leakage; 3125 3126 for (i = 0; i < SMC_NISLANDS_LKGE_LUT_NUM_OF_TEMP_ENTRIES; i++) 3127 cac_tables->cac_lkge_lut[i][j] = 3128 cpu_to_be32(ni_scale_power_for_smc(smc_leakage, scaling_factor)); 3129 } 3130 3131 for (j = table_size; j < SMC_NISLANDS_LKGE_LUT_NUM_OF_VOLT_ENTRIES; j++) { 3132 for (i = 0; i < SMC_NISLANDS_LKGE_LUT_NUM_OF_TEMP_ENTRIES; i++) 3133 cac_tables->cac_lkge_lut[i][j] = 3134 cpu_to_be32(ni_scale_power_for_smc(max_leakage, scaling_factor)); 3135 } 3136 return 0; 3137 } 3138 3139 static int ni_initialize_smc_cac_tables(struct radeon_device *rdev) 3140 { 3141 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 3142 struct ni_power_info *ni_pi = ni_get_pi(rdev); 3143 PP_NIslands_CACTABLES *cac_tables = NULL; 3144 int i, ret; 3145 u32 reg; 3146 3147 if (ni_pi->enable_cac == false) 3148 return 0; 3149 3150 cac_tables = kzalloc(sizeof(PP_NIslands_CACTABLES), GFP_KERNEL); 3151 if (!cac_tables) 3152 return -ENOMEM; 3153 3154 reg = RREG32(CG_CAC_CTRL) & ~(TID_CNT_MASK | TID_UNIT_MASK); 3155 reg |= (TID_CNT(ni_pi->cac_weights->tid_cnt) | 3156 TID_UNIT(ni_pi->cac_weights->tid_unit)); 3157 WREG32(CG_CAC_CTRL, reg); 3158 3159 for (i = 0; i < NISLANDS_DCCAC_MAX_LEVELS; i++) 3160 ni_pi->dc_cac_table[i] = ni_pi->cac_weights->dc_cac[i]; 3161 3162 for (i = 0; i < SMC_NISLANDS_BIF_LUT_NUM_OF_ENTRIES; i++) 3163 cac_tables->cac_bif_lut[i] = ni_pi->cac_weights->pcie_cac[i]; 3164 3165 ni_pi->cac_data.i_leakage = rdev->pm.dpm.cac_leakage; 3166 ni_pi->cac_data.pwr_const = 0; 3167 ni_pi->cac_data.dc_cac_value = ni_pi->dc_cac_table[NISLANDS_DCCAC_LEVEL_0]; 3168 ni_pi->cac_data.bif_cac_value = 0; 3169 ni_pi->cac_data.mc_wr_weight = ni_pi->cac_weights->mc_write_weight; 3170 ni_pi->cac_data.mc_rd_weight = ni_pi->cac_weights->mc_read_weight; 3171 ni_pi->cac_data.allow_ovrflw = 0; 3172 ni_pi->cac_data.l2num_win_tdp = ni_pi->lta_window_size; 3173 ni_pi->cac_data.num_win_tdp = 0; 3174 ni_pi->cac_data.lts_truncate_n = ni_pi->lts_truncate; 3175 3176 if (ni_pi->driver_calculate_cac_leakage) 3177 ret = ni_init_driver_calculated_leakage_table(rdev, cac_tables); 3178 else 3179 ret = ni_init_simplified_leakage_table(rdev, cac_tables); 3180 3181 if (ret) 3182 goto done_free; 3183 3184 cac_tables->pwr_const = cpu_to_be32(ni_pi->cac_data.pwr_const); 3185 cac_tables->dc_cacValue = cpu_to_be32(ni_pi->cac_data.dc_cac_value); 3186 cac_tables->bif_cacValue = cpu_to_be32(ni_pi->cac_data.bif_cac_value); 3187 cac_tables->AllowOvrflw = ni_pi->cac_data.allow_ovrflw; 3188 cac_tables->MCWrWeight = ni_pi->cac_data.mc_wr_weight; 3189 cac_tables->MCRdWeight = ni_pi->cac_data.mc_rd_weight; 3190 cac_tables->numWin_TDP = ni_pi->cac_data.num_win_tdp; 3191 cac_tables->l2numWin_TDP = ni_pi->cac_data.l2num_win_tdp; 3192 cac_tables->lts_truncate_n = ni_pi->cac_data.lts_truncate_n; 3193 3194 ret = rv770_copy_bytes_to_smc(rdev, ni_pi->cac_table_start, (u8 *)cac_tables, 3195 sizeof(PP_NIslands_CACTABLES), pi->sram_end); 3196 3197 done_free: 3198 if (ret) { 3199 ni_pi->enable_cac = false; 3200 ni_pi->enable_power_containment = false; 3201 } 3202 3203 kfree(cac_tables); 3204 3205 return 0; 3206 } 3207 3208 static int ni_initialize_hardware_cac_manager(struct radeon_device *rdev) 3209 { 3210 struct ni_power_info *ni_pi = ni_get_pi(rdev); 3211 u32 reg; 3212 3213 if (!ni_pi->enable_cac || 3214 !ni_pi->cac_configuration_required) 3215 return 0; 3216 3217 if (ni_pi->cac_weights == NULL) 3218 return -EINVAL; 3219 3220 reg = RREG32_CG(CG_CAC_REGION_1_WEIGHT_0) & ~(WEIGHT_TCP_SIG0_MASK | 3221 WEIGHT_TCP_SIG1_MASK | 3222 WEIGHT_TA_SIG_MASK); 3223 reg |= (WEIGHT_TCP_SIG0(ni_pi->cac_weights->weight_tcp_sig0) | 3224 WEIGHT_TCP_SIG1(ni_pi->cac_weights->weight_tcp_sig1) | 3225 WEIGHT_TA_SIG(ni_pi->cac_weights->weight_ta_sig)); 3226 WREG32_CG(CG_CAC_REGION_1_WEIGHT_0, reg); 3227 3228 reg = RREG32_CG(CG_CAC_REGION_1_WEIGHT_1) & ~(WEIGHT_TCC_EN0_MASK | 3229 WEIGHT_TCC_EN1_MASK | 3230 WEIGHT_TCC_EN2_MASK); 3231 reg |= (WEIGHT_TCC_EN0(ni_pi->cac_weights->weight_tcc_en0) | 3232 WEIGHT_TCC_EN1(ni_pi->cac_weights->weight_tcc_en1) | 3233 WEIGHT_TCC_EN2(ni_pi->cac_weights->weight_tcc_en2)); 3234 WREG32_CG(CG_CAC_REGION_1_WEIGHT_1, reg); 3235 3236 reg = RREG32_CG(CG_CAC_REGION_2_WEIGHT_0) & ~(WEIGHT_CB_EN0_MASK | 3237 WEIGHT_CB_EN1_MASK | 3238 WEIGHT_CB_EN2_MASK | 3239 WEIGHT_CB_EN3_MASK); 3240 reg |= (WEIGHT_CB_EN0(ni_pi->cac_weights->weight_cb_en0) | 3241 WEIGHT_CB_EN1(ni_pi->cac_weights->weight_cb_en1) | 3242 WEIGHT_CB_EN2(ni_pi->cac_weights->weight_cb_en2) | 3243 WEIGHT_CB_EN3(ni_pi->cac_weights->weight_cb_en3)); 3244 WREG32_CG(CG_CAC_REGION_2_WEIGHT_0, reg); 3245 3246 reg = RREG32_CG(CG_CAC_REGION_2_WEIGHT_1) & ~(WEIGHT_DB_SIG0_MASK | 3247 WEIGHT_DB_SIG1_MASK | 3248 WEIGHT_DB_SIG2_MASK | 3249 WEIGHT_DB_SIG3_MASK); 3250 reg |= (WEIGHT_DB_SIG0(ni_pi->cac_weights->weight_db_sig0) | 3251 WEIGHT_DB_SIG1(ni_pi->cac_weights->weight_db_sig1) | 3252 WEIGHT_DB_SIG2(ni_pi->cac_weights->weight_db_sig2) | 3253 WEIGHT_DB_SIG3(ni_pi->cac_weights->weight_db_sig3)); 3254 WREG32_CG(CG_CAC_REGION_2_WEIGHT_1, reg); 3255 3256 reg = RREG32_CG(CG_CAC_REGION_2_WEIGHT_2) & ~(WEIGHT_SXM_SIG0_MASK | 3257 WEIGHT_SXM_SIG1_MASK | 3258 WEIGHT_SXM_SIG2_MASK | 3259 WEIGHT_SXS_SIG0_MASK | 3260 WEIGHT_SXS_SIG1_MASK); 3261 reg |= (WEIGHT_SXM_SIG0(ni_pi->cac_weights->weight_sxm_sig0) | 3262 WEIGHT_SXM_SIG1(ni_pi->cac_weights->weight_sxm_sig1) | 3263 WEIGHT_SXM_SIG2(ni_pi->cac_weights->weight_sxm_sig2) | 3264 WEIGHT_SXS_SIG0(ni_pi->cac_weights->weight_sxs_sig0) | 3265 WEIGHT_SXS_SIG1(ni_pi->cac_weights->weight_sxs_sig1)); 3266 WREG32_CG(CG_CAC_REGION_2_WEIGHT_2, reg); 3267 3268 reg = RREG32_CG(CG_CAC_REGION_3_WEIGHT_0) & ~(WEIGHT_XBR_0_MASK | 3269 WEIGHT_XBR_1_MASK | 3270 WEIGHT_XBR_2_MASK | 3271 WEIGHT_SPI_SIG0_MASK); 3272 reg |= (WEIGHT_XBR_0(ni_pi->cac_weights->weight_xbr_0) | 3273 WEIGHT_XBR_1(ni_pi->cac_weights->weight_xbr_1) | 3274 WEIGHT_XBR_2(ni_pi->cac_weights->weight_xbr_2) | 3275 WEIGHT_SPI_SIG0(ni_pi->cac_weights->weight_spi_sig0)); 3276 WREG32_CG(CG_CAC_REGION_3_WEIGHT_0, reg); 3277 3278 reg = RREG32_CG(CG_CAC_REGION_3_WEIGHT_1) & ~(WEIGHT_SPI_SIG1_MASK | 3279 WEIGHT_SPI_SIG2_MASK | 3280 WEIGHT_SPI_SIG3_MASK | 3281 WEIGHT_SPI_SIG4_MASK | 3282 WEIGHT_SPI_SIG5_MASK); 3283 reg |= (WEIGHT_SPI_SIG1(ni_pi->cac_weights->weight_spi_sig1) | 3284 WEIGHT_SPI_SIG2(ni_pi->cac_weights->weight_spi_sig2) | 3285 WEIGHT_SPI_SIG3(ni_pi->cac_weights->weight_spi_sig3) | 3286 WEIGHT_SPI_SIG4(ni_pi->cac_weights->weight_spi_sig4) | 3287 WEIGHT_SPI_SIG5(ni_pi->cac_weights->weight_spi_sig5)); 3288 WREG32_CG(CG_CAC_REGION_3_WEIGHT_1, reg); 3289 3290 reg = RREG32_CG(CG_CAC_REGION_4_WEIGHT_0) & ~(WEIGHT_LDS_SIG0_MASK | 3291 WEIGHT_LDS_SIG1_MASK | 3292 WEIGHT_SC_MASK); 3293 reg |= (WEIGHT_LDS_SIG0(ni_pi->cac_weights->weight_lds_sig0) | 3294 WEIGHT_LDS_SIG1(ni_pi->cac_weights->weight_lds_sig1) | 3295 WEIGHT_SC(ni_pi->cac_weights->weight_sc)); 3296 WREG32_CG(CG_CAC_REGION_4_WEIGHT_0, reg); 3297 3298 reg = RREG32_CG(CG_CAC_REGION_4_WEIGHT_1) & ~(WEIGHT_BIF_MASK | 3299 WEIGHT_CP_MASK | 3300 WEIGHT_PA_SIG0_MASK | 3301 WEIGHT_PA_SIG1_MASK | 3302 WEIGHT_VGT_SIG0_MASK); 3303 reg |= (WEIGHT_BIF(ni_pi->cac_weights->weight_bif) | 3304 WEIGHT_CP(ni_pi->cac_weights->weight_cp) | 3305 WEIGHT_PA_SIG0(ni_pi->cac_weights->weight_pa_sig0) | 3306 WEIGHT_PA_SIG1(ni_pi->cac_weights->weight_pa_sig1) | 3307 WEIGHT_VGT_SIG0(ni_pi->cac_weights->weight_vgt_sig0)); 3308 WREG32_CG(CG_CAC_REGION_4_WEIGHT_1, reg); 3309 3310 reg = RREG32_CG(CG_CAC_REGION_4_WEIGHT_2) & ~(WEIGHT_VGT_SIG1_MASK | 3311 WEIGHT_VGT_SIG2_MASK | 3312 WEIGHT_DC_SIG0_MASK | 3313 WEIGHT_DC_SIG1_MASK | 3314 WEIGHT_DC_SIG2_MASK); 3315 reg |= (WEIGHT_VGT_SIG1(ni_pi->cac_weights->weight_vgt_sig1) | 3316 WEIGHT_VGT_SIG2(ni_pi->cac_weights->weight_vgt_sig2) | 3317 WEIGHT_DC_SIG0(ni_pi->cac_weights->weight_dc_sig0) | 3318 WEIGHT_DC_SIG1(ni_pi->cac_weights->weight_dc_sig1) | 3319 WEIGHT_DC_SIG2(ni_pi->cac_weights->weight_dc_sig2)); 3320 WREG32_CG(CG_CAC_REGION_4_WEIGHT_2, reg); 3321 3322 reg = RREG32_CG(CG_CAC_REGION_4_WEIGHT_3) & ~(WEIGHT_DC_SIG3_MASK | 3323 WEIGHT_UVD_SIG0_MASK | 3324 WEIGHT_UVD_SIG1_MASK | 3325 WEIGHT_SPARE0_MASK | 3326 WEIGHT_SPARE1_MASK); 3327 reg |= (WEIGHT_DC_SIG3(ni_pi->cac_weights->weight_dc_sig3) | 3328 WEIGHT_UVD_SIG0(ni_pi->cac_weights->weight_uvd_sig0) | 3329 WEIGHT_UVD_SIG1(ni_pi->cac_weights->weight_uvd_sig1) | 3330 WEIGHT_SPARE0(ni_pi->cac_weights->weight_spare0) | 3331 WEIGHT_SPARE1(ni_pi->cac_weights->weight_spare1)); 3332 WREG32_CG(CG_CAC_REGION_4_WEIGHT_3, reg); 3333 3334 reg = RREG32_CG(CG_CAC_REGION_5_WEIGHT_0) & ~(WEIGHT_SQ_VSP_MASK | 3335 WEIGHT_SQ_VSP0_MASK); 3336 reg |= (WEIGHT_SQ_VSP(ni_pi->cac_weights->weight_sq_vsp) | 3337 WEIGHT_SQ_VSP0(ni_pi->cac_weights->weight_sq_vsp0)); 3338 WREG32_CG(CG_CAC_REGION_5_WEIGHT_0, reg); 3339 3340 reg = RREG32_CG(CG_CAC_REGION_5_WEIGHT_1) & ~(WEIGHT_SQ_GPR_MASK); 3341 reg |= WEIGHT_SQ_GPR(ni_pi->cac_weights->weight_sq_gpr); 3342 WREG32_CG(CG_CAC_REGION_5_WEIGHT_1, reg); 3343 3344 reg = RREG32_CG(CG_CAC_REGION_4_OVERRIDE_4) & ~(OVR_MODE_SPARE_0_MASK | 3345 OVR_VAL_SPARE_0_MASK | 3346 OVR_MODE_SPARE_1_MASK | 3347 OVR_VAL_SPARE_1_MASK); 3348 reg |= (OVR_MODE_SPARE_0(ni_pi->cac_weights->ovr_mode_spare_0) | 3349 OVR_VAL_SPARE_0(ni_pi->cac_weights->ovr_val_spare_0) | 3350 OVR_MODE_SPARE_1(ni_pi->cac_weights->ovr_mode_spare_1) | 3351 OVR_VAL_SPARE_1(ni_pi->cac_weights->ovr_val_spare_1)); 3352 WREG32_CG(CG_CAC_REGION_4_OVERRIDE_4, reg); 3353 3354 reg = RREG32(SQ_CAC_THRESHOLD) & ~(VSP_MASK | 3355 VSP0_MASK | 3356 GPR_MASK); 3357 reg |= (VSP(ni_pi->cac_weights->vsp) | 3358 VSP0(ni_pi->cac_weights->vsp0) | 3359 GPR(ni_pi->cac_weights->gpr)); 3360 WREG32(SQ_CAC_THRESHOLD, reg); 3361 3362 reg = (MCDW_WR_ENABLE | 3363 MCDX_WR_ENABLE | 3364 MCDY_WR_ENABLE | 3365 MCDZ_WR_ENABLE | 3366 INDEX(0x09D4)); 3367 WREG32(MC_CG_CONFIG, reg); 3368 3369 reg = (READ_WEIGHT(ni_pi->cac_weights->mc_read_weight) | 3370 WRITE_WEIGHT(ni_pi->cac_weights->mc_write_weight) | 3371 ALLOW_OVERFLOW); 3372 WREG32(MC_CG_DATAPORT, reg); 3373 3374 return 0; 3375 } 3376 3377 static int ni_enable_smc_cac(struct radeon_device *rdev, 3378 struct radeon_ps *radeon_new_state, 3379 bool enable) 3380 { 3381 struct ni_power_info *ni_pi = ni_get_pi(rdev); 3382 int ret = 0; 3383 PPSMC_Result smc_result; 3384 3385 if (ni_pi->enable_cac) { 3386 if (enable) { 3387 if (!r600_is_uvd_state(radeon_new_state->class, radeon_new_state->class2)) { 3388 smc_result = rv770_send_msg_to_smc(rdev, PPSMC_MSG_CollectCAC_PowerCorreln); 3389 3390 if (ni_pi->support_cac_long_term_average) { 3391 smc_result = rv770_send_msg_to_smc(rdev, PPSMC_CACLongTermAvgEnable); 3392 if (PPSMC_Result_OK != smc_result) 3393 ni_pi->support_cac_long_term_average = false; 3394 } 3395 3396 smc_result = rv770_send_msg_to_smc(rdev, PPSMC_MSG_EnableCac); 3397 if (PPSMC_Result_OK != smc_result) 3398 ret = -EINVAL; 3399 3400 ni_pi->cac_enabled = (PPSMC_Result_OK == smc_result) ? true : false; 3401 } 3402 } else if (ni_pi->cac_enabled) { 3403 smc_result = rv770_send_msg_to_smc(rdev, PPSMC_MSG_DisableCac); 3404 3405 ni_pi->cac_enabled = false; 3406 3407 if (ni_pi->support_cac_long_term_average) { 3408 smc_result = rv770_send_msg_to_smc(rdev, PPSMC_CACLongTermAvgDisable); 3409 if (PPSMC_Result_OK != smc_result) 3410 ni_pi->support_cac_long_term_average = false; 3411 } 3412 } 3413 } 3414 3415 return ret; 3416 } 3417 3418 static int ni_pcie_performance_request(struct radeon_device *rdev, 3419 u8 perf_req, bool advertise) 3420 { 3421 #if defined(CONFIG_ACPI) 3422 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 3423 3424 if ((perf_req == PCIE_PERF_REQ_PECI_GEN1) || 3425 (perf_req == PCIE_PERF_REQ_PECI_GEN2)) { 3426 if (eg_pi->pcie_performance_request_registered == false) 3427 radeon_acpi_pcie_notify_device_ready(rdev); 3428 eg_pi->pcie_performance_request_registered = true; 3429 return radeon_acpi_pcie_performance_request(rdev, perf_req, advertise); 3430 } else if ((perf_req == PCIE_PERF_REQ_REMOVE_REGISTRY) && 3431 eg_pi->pcie_performance_request_registered) { 3432 eg_pi->pcie_performance_request_registered = false; 3433 return radeon_acpi_pcie_performance_request(rdev, perf_req, advertise); 3434 } 3435 #endif 3436 return 0; 3437 } 3438 3439 static int ni_advertise_gen2_capability(struct radeon_device *rdev) 3440 { 3441 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 3442 u32 tmp; 3443 3444 tmp = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL); 3445 3446 if ((tmp & LC_OTHER_SIDE_EVER_SENT_GEN2) && 3447 (tmp & LC_OTHER_SIDE_SUPPORTS_GEN2)) 3448 pi->pcie_gen2 = true; 3449 else 3450 pi->pcie_gen2 = false; 3451 3452 if (!pi->pcie_gen2) 3453 ni_pcie_performance_request(rdev, PCIE_PERF_REQ_PECI_GEN2, true); 3454 3455 return 0; 3456 } 3457 3458 static void ni_enable_bif_dynamic_pcie_gen2(struct radeon_device *rdev, 3459 bool enable) 3460 { 3461 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 3462 u32 tmp, bif; 3463 3464 tmp = RREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL); 3465 3466 if ((tmp & LC_OTHER_SIDE_EVER_SENT_GEN2) && 3467 (tmp & LC_OTHER_SIDE_SUPPORTS_GEN2)) { 3468 if (enable) { 3469 if (!pi->boot_in_gen2) { 3470 bif = RREG32(CG_BIF_REQ_AND_RSP) & ~CG_CLIENT_REQ_MASK; 3471 bif |= CG_CLIENT_REQ(0xd); 3472 WREG32(CG_BIF_REQ_AND_RSP, bif); 3473 } 3474 tmp &= ~LC_HW_VOLTAGE_IF_CONTROL_MASK; 3475 tmp |= LC_HW_VOLTAGE_IF_CONTROL(1); 3476 tmp |= LC_GEN2_EN_STRAP; 3477 3478 tmp |= LC_CLR_FAILED_SPD_CHANGE_CNT; 3479 WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, tmp); 3480 udelay(10); 3481 tmp &= ~LC_CLR_FAILED_SPD_CHANGE_CNT; 3482 WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, tmp); 3483 } else { 3484 if (!pi->boot_in_gen2) { 3485 bif = RREG32(CG_BIF_REQ_AND_RSP) & ~CG_CLIENT_REQ_MASK; 3486 bif |= CG_CLIENT_REQ(0xd); 3487 WREG32(CG_BIF_REQ_AND_RSP, bif); 3488 3489 tmp &= ~LC_HW_VOLTAGE_IF_CONTROL_MASK; 3490 tmp &= ~LC_GEN2_EN_STRAP; 3491 } 3492 WREG32_PCIE_PORT(PCIE_LC_SPEED_CNTL, tmp); 3493 } 3494 } 3495 } 3496 3497 static void ni_enable_dynamic_pcie_gen2(struct radeon_device *rdev, 3498 bool enable) 3499 { 3500 ni_enable_bif_dynamic_pcie_gen2(rdev, enable); 3501 3502 if (enable) 3503 WREG32_P(GENERAL_PWRMGT, ENABLE_GEN2PCIE, ~ENABLE_GEN2PCIE); 3504 else 3505 WREG32_P(GENERAL_PWRMGT, 0, ~ENABLE_GEN2PCIE); 3506 } 3507 3508 void ni_set_uvd_clock_before_set_eng_clock(struct radeon_device *rdev, 3509 struct radeon_ps *new_ps, 3510 struct radeon_ps *old_ps) 3511 { 3512 struct ni_ps *new_state = ni_get_ps(new_ps); 3513 struct ni_ps *current_state = ni_get_ps(old_ps); 3514 3515 if ((new_ps->vclk == old_ps->vclk) && 3516 (new_ps->dclk == old_ps->dclk)) 3517 return; 3518 3519 if (new_state->performance_levels[new_state->performance_level_count - 1].sclk >= 3520 current_state->performance_levels[current_state->performance_level_count - 1].sclk) 3521 return; 3522 3523 radeon_set_uvd_clocks(rdev, new_ps->vclk, new_ps->dclk); 3524 } 3525 3526 void ni_set_uvd_clock_after_set_eng_clock(struct radeon_device *rdev, 3527 struct radeon_ps *new_ps, 3528 struct radeon_ps *old_ps) 3529 { 3530 struct ni_ps *new_state = ni_get_ps(new_ps); 3531 struct ni_ps *current_state = ni_get_ps(old_ps); 3532 3533 if ((new_ps->vclk == old_ps->vclk) && 3534 (new_ps->dclk == old_ps->dclk)) 3535 return; 3536 3537 if (new_state->performance_levels[new_state->performance_level_count - 1].sclk < 3538 current_state->performance_levels[current_state->performance_level_count - 1].sclk) 3539 return; 3540 3541 radeon_set_uvd_clocks(rdev, new_ps->vclk, new_ps->dclk); 3542 } 3543 3544 void ni_dpm_setup_asic(struct radeon_device *rdev) 3545 { 3546 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 3547 int r; 3548 3549 r = ni_mc_load_microcode(rdev); 3550 if (r) 3551 DRM_ERROR("Failed to load MC firmware!\n"); 3552 ni_read_clock_registers(rdev); 3553 btc_read_arb_registers(rdev); 3554 rv770_get_memory_type(rdev); 3555 if (eg_pi->pcie_performance_request) 3556 ni_advertise_gen2_capability(rdev); 3557 rv770_get_pcie_gen2_status(rdev); 3558 rv770_enable_acpi_pm(rdev); 3559 } 3560 3561 void ni_update_current_ps(struct radeon_device *rdev, 3562 struct radeon_ps *rps) 3563 { 3564 struct ni_ps *new_ps = ni_get_ps(rps); 3565 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 3566 struct ni_power_info *ni_pi = ni_get_pi(rdev); 3567 3568 eg_pi->current_rps = *rps; 3569 ni_pi->current_ps = *new_ps; 3570 eg_pi->current_rps.ps_priv = &ni_pi->current_ps; 3571 } 3572 3573 void ni_update_requested_ps(struct radeon_device *rdev, 3574 struct radeon_ps *rps) 3575 { 3576 struct ni_ps *new_ps = ni_get_ps(rps); 3577 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 3578 struct ni_power_info *ni_pi = ni_get_pi(rdev); 3579 3580 eg_pi->requested_rps = *rps; 3581 ni_pi->requested_ps = *new_ps; 3582 eg_pi->requested_rps.ps_priv = &ni_pi->requested_ps; 3583 } 3584 3585 int ni_dpm_enable(struct radeon_device *rdev) 3586 { 3587 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 3588 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 3589 struct radeon_ps *boot_ps = rdev->pm.dpm.boot_ps; 3590 int ret; 3591 3592 if (pi->gfx_clock_gating) 3593 ni_cg_clockgating_default(rdev); 3594 if (btc_dpm_enabled(rdev)) 3595 return -EINVAL; 3596 if (pi->mg_clock_gating) 3597 ni_mg_clockgating_default(rdev); 3598 if (eg_pi->ls_clock_gating) 3599 ni_ls_clockgating_default(rdev); 3600 if (pi->voltage_control) { 3601 rv770_enable_voltage_control(rdev, true); 3602 ret = cypress_construct_voltage_tables(rdev); 3603 if (ret) { 3604 DRM_ERROR("cypress_construct_voltage_tables failed\n"); 3605 return ret; 3606 } 3607 } 3608 if (eg_pi->dynamic_ac_timing) { 3609 ret = ni_initialize_mc_reg_table(rdev); 3610 if (ret) 3611 eg_pi->dynamic_ac_timing = false; 3612 } 3613 if (pi->dynamic_ss) 3614 cypress_enable_spread_spectrum(rdev, true); 3615 if (pi->thermal_protection) 3616 rv770_enable_thermal_protection(rdev, true); 3617 rv770_setup_bsp(rdev); 3618 rv770_program_git(rdev); 3619 rv770_program_tp(rdev); 3620 rv770_program_tpp(rdev); 3621 rv770_program_sstp(rdev); 3622 cypress_enable_display_gap(rdev); 3623 rv770_program_vc(rdev); 3624 if (pi->dynamic_pcie_gen2) 3625 ni_enable_dynamic_pcie_gen2(rdev, true); 3626 ret = rv770_upload_firmware(rdev); 3627 if (ret) { 3628 DRM_ERROR("rv770_upload_firmware failed\n"); 3629 return ret; 3630 } 3631 ret = ni_process_firmware_header(rdev); 3632 if (ret) { 3633 DRM_ERROR("ni_process_firmware_header failed\n"); 3634 return ret; 3635 } 3636 ret = ni_initial_switch_from_arb_f0_to_f1(rdev); 3637 if (ret) { 3638 DRM_ERROR("ni_initial_switch_from_arb_f0_to_f1 failed\n"); 3639 return ret; 3640 } 3641 ret = ni_init_smc_table(rdev); 3642 if (ret) { 3643 DRM_ERROR("ni_init_smc_table failed\n"); 3644 return ret; 3645 } 3646 ret = ni_init_smc_spll_table(rdev); 3647 if (ret) { 3648 DRM_ERROR("ni_init_smc_spll_table failed\n"); 3649 return ret; 3650 } 3651 ret = ni_init_arb_table_index(rdev); 3652 if (ret) { 3653 DRM_ERROR("ni_init_arb_table_index failed\n"); 3654 return ret; 3655 } 3656 if (eg_pi->dynamic_ac_timing) { 3657 ret = ni_populate_mc_reg_table(rdev, boot_ps); 3658 if (ret) { 3659 DRM_ERROR("ni_populate_mc_reg_table failed\n"); 3660 return ret; 3661 } 3662 } 3663 ret = ni_initialize_smc_cac_tables(rdev); 3664 if (ret) { 3665 DRM_ERROR("ni_initialize_smc_cac_tables failed\n"); 3666 return ret; 3667 } 3668 ret = ni_initialize_hardware_cac_manager(rdev); 3669 if (ret) { 3670 DRM_ERROR("ni_initialize_hardware_cac_manager failed\n"); 3671 return ret; 3672 } 3673 ret = ni_populate_smc_tdp_limits(rdev, boot_ps); 3674 if (ret) { 3675 DRM_ERROR("ni_populate_smc_tdp_limits failed\n"); 3676 return ret; 3677 } 3678 ni_program_response_times(rdev); 3679 r7xx_start_smc(rdev); 3680 ret = cypress_notify_smc_display_change(rdev, false); 3681 if (ret) { 3682 DRM_ERROR("cypress_notify_smc_display_change failed\n"); 3683 return ret; 3684 } 3685 cypress_enable_sclk_control(rdev, true); 3686 if (eg_pi->memory_transition) 3687 cypress_enable_mclk_control(rdev, true); 3688 cypress_start_dpm(rdev); 3689 if (pi->gfx_clock_gating) 3690 ni_gfx_clockgating_enable(rdev, true); 3691 if (pi->mg_clock_gating) 3692 ni_mg_clockgating_enable(rdev, true); 3693 if (eg_pi->ls_clock_gating) 3694 ni_ls_clockgating_enable(rdev, true); 3695 3696 rv770_enable_auto_throttle_source(rdev, RADEON_DPM_AUTO_THROTTLE_SRC_THERMAL, true); 3697 3698 ni_update_current_ps(rdev, boot_ps); 3699 3700 return 0; 3701 } 3702 3703 void ni_dpm_disable(struct radeon_device *rdev) 3704 { 3705 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 3706 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 3707 struct radeon_ps *boot_ps = rdev->pm.dpm.boot_ps; 3708 3709 if (!btc_dpm_enabled(rdev)) 3710 return; 3711 rv770_clear_vc(rdev); 3712 if (pi->thermal_protection) 3713 rv770_enable_thermal_protection(rdev, false); 3714 ni_enable_power_containment(rdev, boot_ps, false); 3715 ni_enable_smc_cac(rdev, boot_ps, false); 3716 cypress_enable_spread_spectrum(rdev, false); 3717 rv770_enable_auto_throttle_source(rdev, RADEON_DPM_AUTO_THROTTLE_SRC_THERMAL, false); 3718 if (pi->dynamic_pcie_gen2) 3719 ni_enable_dynamic_pcie_gen2(rdev, false); 3720 3721 if (rdev->irq.installed && 3722 r600_is_internal_thermal_sensor(rdev->pm.int_thermal_type)) { 3723 rdev->irq.dpm_thermal = false; 3724 radeon_irq_set(rdev); 3725 } 3726 3727 if (pi->gfx_clock_gating) 3728 ni_gfx_clockgating_enable(rdev, false); 3729 if (pi->mg_clock_gating) 3730 ni_mg_clockgating_enable(rdev, false); 3731 if (eg_pi->ls_clock_gating) 3732 ni_ls_clockgating_enable(rdev, false); 3733 ni_stop_dpm(rdev); 3734 btc_reset_to_default(rdev); 3735 ni_stop_smc(rdev); 3736 ni_force_switch_to_arb_f0(rdev); 3737 3738 ni_update_current_ps(rdev, boot_ps); 3739 } 3740 3741 static int ni_power_control_set_level(struct radeon_device *rdev) 3742 { 3743 struct radeon_ps *new_ps = rdev->pm.dpm.requested_ps; 3744 int ret; 3745 3746 ret = ni_restrict_performance_levels_before_switch(rdev); 3747 if (ret) 3748 return ret; 3749 ret = rv770_halt_smc(rdev); 3750 if (ret) 3751 return ret; 3752 ret = ni_populate_smc_tdp_limits(rdev, new_ps); 3753 if (ret) 3754 return ret; 3755 ret = rv770_resume_smc(rdev); 3756 if (ret) 3757 return ret; 3758 ret = rv770_set_sw_state(rdev); 3759 if (ret) 3760 return ret; 3761 3762 return 0; 3763 } 3764 3765 int ni_dpm_pre_set_power_state(struct radeon_device *rdev) 3766 { 3767 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 3768 struct radeon_ps requested_ps = *rdev->pm.dpm.requested_ps; 3769 struct radeon_ps *new_ps = &requested_ps; 3770 3771 ni_update_requested_ps(rdev, new_ps); 3772 3773 ni_apply_state_adjust_rules(rdev, &eg_pi->requested_rps); 3774 3775 return 0; 3776 } 3777 3778 int ni_dpm_set_power_state(struct radeon_device *rdev) 3779 { 3780 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 3781 struct radeon_ps *new_ps = &eg_pi->requested_rps; 3782 struct radeon_ps *old_ps = &eg_pi->current_rps; 3783 int ret; 3784 3785 ret = ni_restrict_performance_levels_before_switch(rdev); 3786 if (ret) { 3787 DRM_ERROR("ni_restrict_performance_levels_before_switch failed\n"); 3788 return ret; 3789 } 3790 ni_set_uvd_clock_before_set_eng_clock(rdev, new_ps, old_ps); 3791 ret = ni_enable_power_containment(rdev, new_ps, false); 3792 if (ret) { 3793 DRM_ERROR("ni_enable_power_containment failed\n"); 3794 return ret; 3795 } 3796 ret = ni_enable_smc_cac(rdev, new_ps, false); 3797 if (ret) { 3798 DRM_ERROR("ni_enable_smc_cac failed\n"); 3799 return ret; 3800 } 3801 ret = rv770_halt_smc(rdev); 3802 if (ret) { 3803 DRM_ERROR("rv770_halt_smc failed\n"); 3804 return ret; 3805 } 3806 if (eg_pi->smu_uvd_hs) 3807 btc_notify_uvd_to_smc(rdev, new_ps); 3808 ret = ni_upload_sw_state(rdev, new_ps); 3809 if (ret) { 3810 DRM_ERROR("ni_upload_sw_state failed\n"); 3811 return ret; 3812 } 3813 if (eg_pi->dynamic_ac_timing) { 3814 ret = ni_upload_mc_reg_table(rdev, new_ps); 3815 if (ret) { 3816 DRM_ERROR("ni_upload_mc_reg_table failed\n"); 3817 return ret; 3818 } 3819 } 3820 ret = ni_program_memory_timing_parameters(rdev, new_ps); 3821 if (ret) { 3822 DRM_ERROR("ni_program_memory_timing_parameters failed\n"); 3823 return ret; 3824 } 3825 ret = rv770_resume_smc(rdev); 3826 if (ret) { 3827 DRM_ERROR("rv770_resume_smc failed\n"); 3828 return ret; 3829 } 3830 ret = rv770_set_sw_state(rdev); 3831 if (ret) { 3832 DRM_ERROR("rv770_set_sw_state failed\n"); 3833 return ret; 3834 } 3835 ni_set_uvd_clock_after_set_eng_clock(rdev, new_ps, old_ps); 3836 ret = ni_enable_smc_cac(rdev, new_ps, true); 3837 if (ret) { 3838 DRM_ERROR("ni_enable_smc_cac failed\n"); 3839 return ret; 3840 } 3841 ret = ni_enable_power_containment(rdev, new_ps, true); 3842 if (ret) { 3843 DRM_ERROR("ni_enable_power_containment failed\n"); 3844 return ret; 3845 } 3846 3847 /* update tdp */ 3848 ret = ni_power_control_set_level(rdev); 3849 if (ret) { 3850 DRM_ERROR("ni_power_control_set_level failed\n"); 3851 return ret; 3852 } 3853 3854 return 0; 3855 } 3856 3857 void ni_dpm_post_set_power_state(struct radeon_device *rdev) 3858 { 3859 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 3860 struct radeon_ps *new_ps = &eg_pi->requested_rps; 3861 3862 ni_update_current_ps(rdev, new_ps); 3863 } 3864 3865 #if 0 3866 void ni_dpm_reset_asic(struct radeon_device *rdev) 3867 { 3868 ni_restrict_performance_levels_before_switch(rdev); 3869 rv770_set_boot_state(rdev); 3870 } 3871 #endif 3872 3873 union power_info { 3874 struct _ATOM_POWERPLAY_INFO info; 3875 struct _ATOM_POWERPLAY_INFO_V2 info_2; 3876 struct _ATOM_POWERPLAY_INFO_V3 info_3; 3877 struct _ATOM_PPLIB_POWERPLAYTABLE pplib; 3878 struct _ATOM_PPLIB_POWERPLAYTABLE2 pplib2; 3879 struct _ATOM_PPLIB_POWERPLAYTABLE3 pplib3; 3880 }; 3881 3882 union pplib_clock_info { 3883 struct _ATOM_PPLIB_R600_CLOCK_INFO r600; 3884 struct _ATOM_PPLIB_RS780_CLOCK_INFO rs780; 3885 struct _ATOM_PPLIB_EVERGREEN_CLOCK_INFO evergreen; 3886 struct _ATOM_PPLIB_SUMO_CLOCK_INFO sumo; 3887 }; 3888 3889 union pplib_power_state { 3890 struct _ATOM_PPLIB_STATE v1; 3891 struct _ATOM_PPLIB_STATE_V2 v2; 3892 }; 3893 3894 static void ni_parse_pplib_non_clock_info(struct radeon_device *rdev, 3895 struct radeon_ps *rps, 3896 struct _ATOM_PPLIB_NONCLOCK_INFO *non_clock_info, 3897 u8 table_rev) 3898 { 3899 rps->caps = le32_to_cpu(non_clock_info->ulCapsAndSettings); 3900 rps->class = le16_to_cpu(non_clock_info->usClassification); 3901 rps->class2 = le16_to_cpu(non_clock_info->usClassification2); 3902 3903 if (ATOM_PPLIB_NONCLOCKINFO_VER1 < table_rev) { 3904 rps->vclk = le32_to_cpu(non_clock_info->ulVCLK); 3905 rps->dclk = le32_to_cpu(non_clock_info->ulDCLK); 3906 } else if (r600_is_uvd_state(rps->class, rps->class2)) { 3907 rps->vclk = RV770_DEFAULT_VCLK_FREQ; 3908 rps->dclk = RV770_DEFAULT_DCLK_FREQ; 3909 } else { 3910 rps->vclk = 0; 3911 rps->dclk = 0; 3912 } 3913 3914 if (rps->class & ATOM_PPLIB_CLASSIFICATION_BOOT) 3915 rdev->pm.dpm.boot_ps = rps; 3916 if (rps->class & ATOM_PPLIB_CLASSIFICATION_UVDSTATE) 3917 rdev->pm.dpm.uvd_ps = rps; 3918 } 3919 3920 static void ni_parse_pplib_clock_info(struct radeon_device *rdev, 3921 struct radeon_ps *rps, int index, 3922 union pplib_clock_info *clock_info) 3923 { 3924 struct rv7xx_power_info *pi = rv770_get_pi(rdev); 3925 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 3926 struct ni_ps *ps = ni_get_ps(rps); 3927 struct rv7xx_pl *pl = &ps->performance_levels[index]; 3928 3929 ps->performance_level_count = index + 1; 3930 3931 pl->sclk = le16_to_cpu(clock_info->evergreen.usEngineClockLow); 3932 pl->sclk |= clock_info->evergreen.ucEngineClockHigh << 16; 3933 pl->mclk = le16_to_cpu(clock_info->evergreen.usMemoryClockLow); 3934 pl->mclk |= clock_info->evergreen.ucMemoryClockHigh << 16; 3935 3936 pl->vddc = le16_to_cpu(clock_info->evergreen.usVDDC); 3937 pl->vddci = le16_to_cpu(clock_info->evergreen.usVDDCI); 3938 pl->flags = le32_to_cpu(clock_info->evergreen.ulFlags); 3939 3940 /* patch up vddc if necessary */ 3941 if (pl->vddc == 0xff01) { 3942 if (pi->max_vddc) 3943 pl->vddc = pi->max_vddc; 3944 } 3945 3946 if (rps->class & ATOM_PPLIB_CLASSIFICATION_ACPI) { 3947 pi->acpi_vddc = pl->vddc; 3948 eg_pi->acpi_vddci = pl->vddci; 3949 if (ps->performance_levels[0].flags & ATOM_PPLIB_R600_FLAGS_PCIEGEN2) 3950 pi->acpi_pcie_gen2 = true; 3951 else 3952 pi->acpi_pcie_gen2 = false; 3953 } 3954 3955 if (rps->class2 & ATOM_PPLIB_CLASSIFICATION2_ULV) { 3956 eg_pi->ulv.supported = true; 3957 eg_pi->ulv.pl = pl; 3958 } 3959 3960 if (pi->min_vddc_in_table > pl->vddc) 3961 pi->min_vddc_in_table = pl->vddc; 3962 3963 if (pi->max_vddc_in_table < pl->vddc) 3964 pi->max_vddc_in_table = pl->vddc; 3965 3966 /* patch up boot state */ 3967 if (rps->class & ATOM_PPLIB_CLASSIFICATION_BOOT) { 3968 u16 vddc, vddci, mvdd; 3969 radeon_atombios_get_default_voltages(rdev, &vddc, &vddci, &mvdd); 3970 pl->mclk = rdev->clock.default_mclk; 3971 pl->sclk = rdev->clock.default_sclk; 3972 pl->vddc = vddc; 3973 pl->vddci = vddci; 3974 } 3975 3976 if ((rps->class & ATOM_PPLIB_CLASSIFICATION_UI_MASK) == 3977 ATOM_PPLIB_CLASSIFICATION_UI_PERFORMANCE) { 3978 rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac.sclk = pl->sclk; 3979 rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac.mclk = pl->mclk; 3980 rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac.vddc = pl->vddc; 3981 rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac.vddci = pl->vddci; 3982 } 3983 } 3984 3985 static int ni_parse_power_table(struct radeon_device *rdev) 3986 { 3987 struct radeon_mode_info *mode_info = &rdev->mode_info; 3988 struct _ATOM_PPLIB_NONCLOCK_INFO *non_clock_info; 3989 union pplib_power_state *power_state; 3990 int i, j; 3991 union pplib_clock_info *clock_info; 3992 union power_info *power_info; 3993 int index = GetIndexIntoMasterTable(DATA, PowerPlayInfo); 3994 u16 data_offset; 3995 u8 frev, crev; 3996 struct ni_ps *ps; 3997 3998 if (!atom_parse_data_header(mode_info->atom_context, index, NULL, 3999 &frev, &crev, &data_offset)) 4000 return -EINVAL; 4001 power_info = (union power_info *)(mode_info->atom_context->bios + data_offset); 4002 4003 rdev->pm.dpm.ps = kcalloc(power_info->pplib.ucNumStates, 4004 sizeof(struct radeon_ps), 4005 GFP_KERNEL); 4006 if (!rdev->pm.dpm.ps) 4007 return -ENOMEM; 4008 4009 for (i = 0; i < power_info->pplib.ucNumStates; i++) { 4010 power_state = (union pplib_power_state *) 4011 (mode_info->atom_context->bios + data_offset + 4012 le16_to_cpu(power_info->pplib.usStateArrayOffset) + 4013 i * power_info->pplib.ucStateEntrySize); 4014 non_clock_info = (struct _ATOM_PPLIB_NONCLOCK_INFO *) 4015 (mode_info->atom_context->bios + data_offset + 4016 le16_to_cpu(power_info->pplib.usNonClockInfoArrayOffset) + 4017 (power_state->v1.ucNonClockStateIndex * 4018 power_info->pplib.ucNonClockSize)); 4019 if (power_info->pplib.ucStateEntrySize - 1) { 4020 u8 *idx; 4021 ps = kzalloc(sizeof(struct ni_ps), GFP_KERNEL); 4022 if (ps == NULL) { 4023 kfree(rdev->pm.dpm.ps); 4024 return -ENOMEM; 4025 } 4026 rdev->pm.dpm.ps[i].ps_priv = ps; 4027 ni_parse_pplib_non_clock_info(rdev, &rdev->pm.dpm.ps[i], 4028 non_clock_info, 4029 power_info->pplib.ucNonClockSize); 4030 idx = (u8 *)&power_state->v1.ucClockStateIndices[0]; 4031 for (j = 0; j < (power_info->pplib.ucStateEntrySize - 1); j++) { 4032 clock_info = (union pplib_clock_info *) 4033 (mode_info->atom_context->bios + data_offset + 4034 le16_to_cpu(power_info->pplib.usClockInfoArrayOffset) + 4035 (idx[j] * power_info->pplib.ucClockInfoSize)); 4036 ni_parse_pplib_clock_info(rdev, 4037 &rdev->pm.dpm.ps[i], j, 4038 clock_info); 4039 } 4040 } 4041 } 4042 rdev->pm.dpm.num_ps = power_info->pplib.ucNumStates; 4043 return 0; 4044 } 4045 4046 int ni_dpm_init(struct radeon_device *rdev) 4047 { 4048 struct rv7xx_power_info *pi; 4049 struct evergreen_power_info *eg_pi; 4050 struct ni_power_info *ni_pi; 4051 struct atom_clock_dividers dividers; 4052 int ret; 4053 4054 ni_pi = kzalloc(sizeof(struct ni_power_info), GFP_KERNEL); 4055 if (ni_pi == NULL) 4056 return -ENOMEM; 4057 rdev->pm.dpm.priv = ni_pi; 4058 eg_pi = &ni_pi->eg; 4059 pi = &eg_pi->rv7xx; 4060 4061 rv770_get_max_vddc(rdev); 4062 4063 eg_pi->ulv.supported = false; 4064 pi->acpi_vddc = 0; 4065 eg_pi->acpi_vddci = 0; 4066 pi->min_vddc_in_table = 0; 4067 pi->max_vddc_in_table = 0; 4068 4069 ret = r600_get_platform_caps(rdev); 4070 if (ret) 4071 return ret; 4072 4073 ret = ni_parse_power_table(rdev); 4074 if (ret) 4075 return ret; 4076 ret = r600_parse_extended_power_table(rdev); 4077 if (ret) 4078 return ret; 4079 4080 rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries = 4081 kcalloc(4, 4082 sizeof(struct radeon_clock_voltage_dependency_entry), 4083 GFP_KERNEL); 4084 if (!rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries) { 4085 r600_free_extended_power_table(rdev); 4086 return -ENOMEM; 4087 } 4088 rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.count = 4; 4089 rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[0].clk = 0; 4090 rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[0].v = 0; 4091 rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[1].clk = 36000; 4092 rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[1].v = 720; 4093 rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[2].clk = 54000; 4094 rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[2].v = 810; 4095 rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[3].clk = 72000; 4096 rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries[3].v = 900; 4097 4098 ni_patch_dependency_tables_based_on_leakage(rdev); 4099 4100 if (rdev->pm.dpm.voltage_response_time == 0) 4101 rdev->pm.dpm.voltage_response_time = R600_VOLTAGERESPONSETIME_DFLT; 4102 if (rdev->pm.dpm.backbias_response_time == 0) 4103 rdev->pm.dpm.backbias_response_time = R600_BACKBIASRESPONSETIME_DFLT; 4104 4105 ret = radeon_atom_get_clock_dividers(rdev, COMPUTE_ENGINE_PLL_PARAM, 4106 0, false, ÷rs); 4107 if (ret) 4108 pi->ref_div = dividers.ref_div + 1; 4109 else 4110 pi->ref_div = R600_REFERENCEDIVIDER_DFLT; 4111 4112 pi->rlp = RV770_RLP_DFLT; 4113 pi->rmp = RV770_RMP_DFLT; 4114 pi->lhp = RV770_LHP_DFLT; 4115 pi->lmp = RV770_LMP_DFLT; 4116 4117 eg_pi->ats[0].rlp = RV770_RLP_DFLT; 4118 eg_pi->ats[0].rmp = RV770_RMP_DFLT; 4119 eg_pi->ats[0].lhp = RV770_LHP_DFLT; 4120 eg_pi->ats[0].lmp = RV770_LMP_DFLT; 4121 4122 eg_pi->ats[1].rlp = BTC_RLP_UVD_DFLT; 4123 eg_pi->ats[1].rmp = BTC_RMP_UVD_DFLT; 4124 eg_pi->ats[1].lhp = BTC_LHP_UVD_DFLT; 4125 eg_pi->ats[1].lmp = BTC_LMP_UVD_DFLT; 4126 4127 eg_pi->smu_uvd_hs = true; 4128 4129 if (rdev->pdev->device == 0x6707) { 4130 pi->mclk_strobe_mode_threshold = 55000; 4131 pi->mclk_edc_enable_threshold = 55000; 4132 eg_pi->mclk_edc_wr_enable_threshold = 55000; 4133 } else { 4134 pi->mclk_strobe_mode_threshold = 40000; 4135 pi->mclk_edc_enable_threshold = 40000; 4136 eg_pi->mclk_edc_wr_enable_threshold = 40000; 4137 } 4138 ni_pi->mclk_rtt_mode_threshold = eg_pi->mclk_edc_wr_enable_threshold; 4139 4140 pi->voltage_control = 4141 radeon_atom_is_voltage_gpio(rdev, SET_VOLTAGE_TYPE_ASIC_VDDC, 0); 4142 4143 pi->mvdd_control = 4144 radeon_atom_is_voltage_gpio(rdev, SET_VOLTAGE_TYPE_ASIC_MVDDC, 0); 4145 4146 eg_pi->vddci_control = 4147 radeon_atom_is_voltage_gpio(rdev, SET_VOLTAGE_TYPE_ASIC_VDDCI, 0); 4148 4149 rv770_get_engine_memory_ss(rdev); 4150 4151 pi->asi = RV770_ASI_DFLT; 4152 pi->pasi = CYPRESS_HASI_DFLT; 4153 pi->vrc = CYPRESS_VRC_DFLT; 4154 4155 pi->power_gating = false; 4156 4157 pi->gfx_clock_gating = true; 4158 4159 pi->mg_clock_gating = true; 4160 pi->mgcgtssm = true; 4161 eg_pi->ls_clock_gating = false; 4162 eg_pi->sclk_deep_sleep = false; 4163 4164 pi->dynamic_pcie_gen2 = true; 4165 4166 if (rdev->pm.int_thermal_type != THERMAL_TYPE_NONE) 4167 pi->thermal_protection = true; 4168 else 4169 pi->thermal_protection = false; 4170 4171 pi->display_gap = true; 4172 4173 pi->dcodt = true; 4174 4175 pi->ulps = true; 4176 4177 eg_pi->dynamic_ac_timing = true; 4178 eg_pi->abm = true; 4179 eg_pi->mcls = true; 4180 eg_pi->light_sleep = true; 4181 eg_pi->memory_transition = true; 4182 #if defined(CONFIG_ACPI) 4183 eg_pi->pcie_performance_request = 4184 radeon_acpi_is_pcie_performance_request_supported(rdev); 4185 #else 4186 eg_pi->pcie_performance_request = false; 4187 #endif 4188 4189 eg_pi->dll_default_on = false; 4190 4191 eg_pi->sclk_deep_sleep = false; 4192 4193 pi->mclk_stutter_mode_threshold = 0; 4194 4195 pi->sram_end = SMC_RAM_END; 4196 4197 rdev->pm.dpm.dyn_state.mclk_sclk_ratio = 3; 4198 rdev->pm.dpm.dyn_state.vddc_vddci_delta = 200; 4199 rdev->pm.dpm.dyn_state.min_vddc_for_pcie_gen2 = 900; 4200 rdev->pm.dpm.dyn_state.valid_sclk_values.count = ARRAY_SIZE(btc_valid_sclk); 4201 rdev->pm.dpm.dyn_state.valid_sclk_values.values = btc_valid_sclk; 4202 rdev->pm.dpm.dyn_state.valid_mclk_values.count = 0; 4203 rdev->pm.dpm.dyn_state.valid_mclk_values.values = NULL; 4204 rdev->pm.dpm.dyn_state.sclk_mclk_delta = 12500; 4205 4206 ni_pi->cac_data.leakage_coefficients.at = 516; 4207 ni_pi->cac_data.leakage_coefficients.bt = 18; 4208 ni_pi->cac_data.leakage_coefficients.av = 51; 4209 ni_pi->cac_data.leakage_coefficients.bv = 2957; 4210 4211 switch (rdev->pdev->device) { 4212 case 0x6700: 4213 case 0x6701: 4214 case 0x6702: 4215 case 0x6703: 4216 case 0x6718: 4217 ni_pi->cac_weights = &cac_weights_cayman_xt; 4218 break; 4219 case 0x6705: 4220 case 0x6719: 4221 case 0x671D: 4222 case 0x671C: 4223 default: 4224 ni_pi->cac_weights = &cac_weights_cayman_pro; 4225 break; 4226 case 0x6704: 4227 case 0x6706: 4228 case 0x6707: 4229 case 0x6708: 4230 case 0x6709: 4231 ni_pi->cac_weights = &cac_weights_cayman_le; 4232 break; 4233 } 4234 4235 if (ni_pi->cac_weights->enable_power_containment_by_default) { 4236 ni_pi->enable_power_containment = true; 4237 ni_pi->enable_cac = true; 4238 ni_pi->enable_sq_ramping = true; 4239 } else { 4240 ni_pi->enable_power_containment = false; 4241 ni_pi->enable_cac = false; 4242 ni_pi->enable_sq_ramping = false; 4243 } 4244 4245 ni_pi->driver_calculate_cac_leakage = false; 4246 ni_pi->cac_configuration_required = true; 4247 4248 if (ni_pi->cac_configuration_required) { 4249 ni_pi->support_cac_long_term_average = true; 4250 ni_pi->lta_window_size = ni_pi->cac_weights->l2_lta_window_size; 4251 ni_pi->lts_truncate = ni_pi->cac_weights->lts_truncate; 4252 } else { 4253 ni_pi->support_cac_long_term_average = false; 4254 ni_pi->lta_window_size = 0; 4255 ni_pi->lts_truncate = 0; 4256 } 4257 4258 ni_pi->use_power_boost_limit = true; 4259 4260 /* make sure dc limits are valid */ 4261 if ((rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc.sclk == 0) || 4262 (rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc.mclk == 0)) 4263 rdev->pm.dpm.dyn_state.max_clock_voltage_on_dc = 4264 rdev->pm.dpm.dyn_state.max_clock_voltage_on_ac; 4265 4266 return 0; 4267 } 4268 4269 void ni_dpm_fini(struct radeon_device *rdev) 4270 { 4271 int i; 4272 4273 for (i = 0; i < rdev->pm.dpm.num_ps; i++) { 4274 kfree(rdev->pm.dpm.ps[i].ps_priv); 4275 } 4276 kfree(rdev->pm.dpm.ps); 4277 kfree(rdev->pm.dpm.priv); 4278 kfree(rdev->pm.dpm.dyn_state.vddc_dependency_on_dispclk.entries); 4279 r600_free_extended_power_table(rdev); 4280 } 4281 4282 void ni_dpm_print_power_state(struct radeon_device *rdev, 4283 struct radeon_ps *rps) 4284 { 4285 struct ni_ps *ps = ni_get_ps(rps); 4286 struct rv7xx_pl *pl; 4287 int i; 4288 4289 r600_dpm_print_class_info(rps->class, rps->class2); 4290 r600_dpm_print_cap_info(rps->caps); 4291 printk("\tuvd vclk: %d dclk: %d\n", rps->vclk, rps->dclk); 4292 for (i = 0; i < ps->performance_level_count; i++) { 4293 pl = &ps->performance_levels[i]; 4294 if (rdev->family >= CHIP_TAHITI) 4295 printk("\t\tpower level %d sclk: %u mclk: %u vddc: %u vddci: %u pcie gen: %u\n", 4296 i, pl->sclk, pl->mclk, pl->vddc, pl->vddci, pl->pcie_gen + 1); 4297 else 4298 printk("\t\tpower level %d sclk: %u mclk: %u vddc: %u vddci: %u\n", 4299 i, pl->sclk, pl->mclk, pl->vddc, pl->vddci); 4300 } 4301 r600_dpm_print_ps_status(rdev, rps); 4302 } 4303 4304 void ni_dpm_debugfs_print_current_performance_level(struct radeon_device *rdev, 4305 struct seq_file *m) 4306 { 4307 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 4308 struct radeon_ps *rps = &eg_pi->current_rps; 4309 struct ni_ps *ps = ni_get_ps(rps); 4310 struct rv7xx_pl *pl; 4311 u32 current_index = 4312 (RREG32(TARGET_AND_CURRENT_PROFILE_INDEX) & CURRENT_STATE_INDEX_MASK) >> 4313 CURRENT_STATE_INDEX_SHIFT; 4314 4315 if (current_index >= ps->performance_level_count) { 4316 seq_printf(m, "invalid dpm profile %d\n", current_index); 4317 } else { 4318 pl = &ps->performance_levels[current_index]; 4319 seq_printf(m, "uvd vclk: %d dclk: %d\n", rps->vclk, rps->dclk); 4320 seq_printf(m, "power level %d sclk: %u mclk: %u vddc: %u vddci: %u\n", 4321 current_index, pl->sclk, pl->mclk, pl->vddc, pl->vddci); 4322 } 4323 } 4324 4325 u32 ni_dpm_get_current_sclk(struct radeon_device *rdev) 4326 { 4327 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 4328 struct radeon_ps *rps = &eg_pi->current_rps; 4329 struct ni_ps *ps = ni_get_ps(rps); 4330 struct rv7xx_pl *pl; 4331 u32 current_index = 4332 (RREG32(TARGET_AND_CURRENT_PROFILE_INDEX) & CURRENT_STATE_INDEX_MASK) >> 4333 CURRENT_STATE_INDEX_SHIFT; 4334 4335 if (current_index >= ps->performance_level_count) { 4336 return 0; 4337 } else { 4338 pl = &ps->performance_levels[current_index]; 4339 return pl->sclk; 4340 } 4341 } 4342 4343 u32 ni_dpm_get_current_mclk(struct radeon_device *rdev) 4344 { 4345 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 4346 struct radeon_ps *rps = &eg_pi->current_rps; 4347 struct ni_ps *ps = ni_get_ps(rps); 4348 struct rv7xx_pl *pl; 4349 u32 current_index = 4350 (RREG32(TARGET_AND_CURRENT_PROFILE_INDEX) & CURRENT_STATE_INDEX_MASK) >> 4351 CURRENT_STATE_INDEX_SHIFT; 4352 4353 if (current_index >= ps->performance_level_count) { 4354 return 0; 4355 } else { 4356 pl = &ps->performance_levels[current_index]; 4357 return pl->mclk; 4358 } 4359 } 4360 4361 u32 ni_dpm_get_sclk(struct radeon_device *rdev, bool low) 4362 { 4363 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 4364 struct ni_ps *requested_state = ni_get_ps(&eg_pi->requested_rps); 4365 4366 if (low) 4367 return requested_state->performance_levels[0].sclk; 4368 else 4369 return requested_state->performance_levels[requested_state->performance_level_count - 1].sclk; 4370 } 4371 4372 u32 ni_dpm_get_mclk(struct radeon_device *rdev, bool low) 4373 { 4374 struct evergreen_power_info *eg_pi = evergreen_get_pi(rdev); 4375 struct ni_ps *requested_state = ni_get_ps(&eg_pi->requested_rps); 4376 4377 if (low) 4378 return requested_state->performance_levels[0].mclk; 4379 else 4380 return requested_state->performance_levels[requested_state->performance_level_count - 1].mclk; 4381 } 4382 4383