1 // SPDX-License-Identifier: GPL-2.0-only 2 /* 3 * Copied from arch/arm64/kernel/cpufeature.c 4 * 5 * Copyright (C) 2015 ARM Ltd. 6 * Copyright (C) 2017 SiFive 7 */ 8 9 #include <linux/acpi.h> 10 #include <linux/bitmap.h> 11 #include <linux/ctype.h> 12 #include <linux/log2.h> 13 #include <linux/memory.h> 14 #include <linux/module.h> 15 #include <linux/of.h> 16 #include <asm/acpi.h> 17 #include <asm/alternative.h> 18 #include <asm/cacheflush.h> 19 #include <asm/cpufeature.h> 20 #include <asm/hwcap.h> 21 #include <asm/hwprobe.h> 22 #include <asm/patch.h> 23 #include <asm/processor.h> 24 #include <asm/sbi.h> 25 #include <asm/vector.h> 26 27 #include "copy-unaligned.h" 28 29 #define NUM_ALPHA_EXTS ('z' - 'a' + 1) 30 31 #define MISALIGNED_ACCESS_JIFFIES_LG2 1 32 #define MISALIGNED_BUFFER_SIZE 0x4000 33 #define MISALIGNED_COPY_SIZE ((MISALIGNED_BUFFER_SIZE / 2) - 0x80) 34 35 unsigned long elf_hwcap __read_mostly; 36 37 /* Host ISA bitmap */ 38 static DECLARE_BITMAP(riscv_isa, RISCV_ISA_EXT_MAX) __read_mostly; 39 40 /* Per-cpu ISA extensions. */ 41 struct riscv_isainfo hart_isa[NR_CPUS]; 42 43 /* Performance information */ 44 DEFINE_PER_CPU(long, misaligned_access_speed); 45 46 /** 47 * riscv_isa_extension_base() - Get base extension word 48 * 49 * @isa_bitmap: ISA bitmap to use 50 * Return: base extension word as unsigned long value 51 * 52 * NOTE: If isa_bitmap is NULL then Host ISA bitmap will be used. 53 */ 54 unsigned long riscv_isa_extension_base(const unsigned long *isa_bitmap) 55 { 56 if (!isa_bitmap) 57 return riscv_isa[0]; 58 return isa_bitmap[0]; 59 } 60 EXPORT_SYMBOL_GPL(riscv_isa_extension_base); 61 62 /** 63 * __riscv_isa_extension_available() - Check whether given extension 64 * is available or not 65 * 66 * @isa_bitmap: ISA bitmap to use 67 * @bit: bit position of the desired extension 68 * Return: true or false 69 * 70 * NOTE: If isa_bitmap is NULL then Host ISA bitmap will be used. 71 */ 72 bool __riscv_isa_extension_available(const unsigned long *isa_bitmap, int bit) 73 { 74 const unsigned long *bmap = (isa_bitmap) ? isa_bitmap : riscv_isa; 75 76 if (bit >= RISCV_ISA_EXT_MAX) 77 return false; 78 79 return test_bit(bit, bmap) ? true : false; 80 } 81 EXPORT_SYMBOL_GPL(__riscv_isa_extension_available); 82 83 static bool riscv_isa_extension_check(int id) 84 { 85 switch (id) { 86 case RISCV_ISA_EXT_ZICBOM: 87 if (!riscv_cbom_block_size) { 88 pr_err("Zicbom detected in ISA string, disabling as no cbom-block-size found\n"); 89 return false; 90 } else if (!is_power_of_2(riscv_cbom_block_size)) { 91 pr_err("Zicbom disabled as cbom-block-size present, but is not a power-of-2\n"); 92 return false; 93 } 94 return true; 95 case RISCV_ISA_EXT_ZICBOZ: 96 if (!riscv_cboz_block_size) { 97 pr_err("Zicboz detected in ISA string, but no cboz-block-size found\n"); 98 return false; 99 } else if (!is_power_of_2(riscv_cboz_block_size)) { 100 pr_err("cboz-block-size present, but is not a power-of-2\n"); 101 return false; 102 } 103 return true; 104 } 105 106 return true; 107 } 108 109 #define __RISCV_ISA_EXT_DATA(_name, _id) { \ 110 .name = #_name, \ 111 .property = #_name, \ 112 .id = _id, \ 113 } 114 115 /* 116 * The canonical order of ISA extension names in the ISA string is defined in 117 * chapter 27 of the unprivileged specification. 118 * 119 * Ordinarily, for in-kernel data structures, this order is unimportant but 120 * isa_ext_arr defines the order of the ISA string in /proc/cpuinfo. 121 * 122 * The specification uses vague wording, such as should, when it comes to 123 * ordering, so for our purposes the following rules apply: 124 * 125 * 1. All multi-letter extensions must be separated from other extensions by an 126 * underscore. 127 * 128 * 2. Additional standard extensions (starting with 'Z') must be sorted after 129 * single-letter extensions and before any higher-privileged extensions. 130 * 131 * 3. The first letter following the 'Z' conventionally indicates the most 132 * closely related alphabetical extension category, IMAFDQLCBKJTPVH. 133 * If multiple 'Z' extensions are named, they must be ordered first by 134 * category, then alphabetically within a category. 135 * 136 * 3. Standard supervisor-level extensions (starting with 'S') must be listed 137 * after standard unprivileged extensions. If multiple supervisor-level 138 * extensions are listed, they must be ordered alphabetically. 139 * 140 * 4. Standard machine-level extensions (starting with 'Zxm') must be listed 141 * after any lower-privileged, standard extensions. If multiple 142 * machine-level extensions are listed, they must be ordered 143 * alphabetically. 144 * 145 * 5. Non-standard extensions (starting with 'X') must be listed after all 146 * standard extensions. If multiple non-standard extensions are listed, they 147 * must be ordered alphabetically. 148 * 149 * An example string following the order is: 150 * rv64imadc_zifoo_zigoo_zafoo_sbar_scar_zxmbaz_xqux_xrux 151 * 152 * New entries to this struct should follow the ordering rules described above. 153 */ 154 const struct riscv_isa_ext_data riscv_isa_ext[] = { 155 __RISCV_ISA_EXT_DATA(i, RISCV_ISA_EXT_i), 156 __RISCV_ISA_EXT_DATA(m, RISCV_ISA_EXT_m), 157 __RISCV_ISA_EXT_DATA(a, RISCV_ISA_EXT_a), 158 __RISCV_ISA_EXT_DATA(f, RISCV_ISA_EXT_f), 159 __RISCV_ISA_EXT_DATA(d, RISCV_ISA_EXT_d), 160 __RISCV_ISA_EXT_DATA(q, RISCV_ISA_EXT_q), 161 __RISCV_ISA_EXT_DATA(c, RISCV_ISA_EXT_c), 162 __RISCV_ISA_EXT_DATA(b, RISCV_ISA_EXT_b), 163 __RISCV_ISA_EXT_DATA(k, RISCV_ISA_EXT_k), 164 __RISCV_ISA_EXT_DATA(j, RISCV_ISA_EXT_j), 165 __RISCV_ISA_EXT_DATA(p, RISCV_ISA_EXT_p), 166 __RISCV_ISA_EXT_DATA(v, RISCV_ISA_EXT_v), 167 __RISCV_ISA_EXT_DATA(h, RISCV_ISA_EXT_h), 168 __RISCV_ISA_EXT_DATA(zicbom, RISCV_ISA_EXT_ZICBOM), 169 __RISCV_ISA_EXT_DATA(zicboz, RISCV_ISA_EXT_ZICBOZ), 170 __RISCV_ISA_EXT_DATA(zicntr, RISCV_ISA_EXT_ZICNTR), 171 __RISCV_ISA_EXT_DATA(zicsr, RISCV_ISA_EXT_ZICSR), 172 __RISCV_ISA_EXT_DATA(zifencei, RISCV_ISA_EXT_ZIFENCEI), 173 __RISCV_ISA_EXT_DATA(zihintpause, RISCV_ISA_EXT_ZIHINTPAUSE), 174 __RISCV_ISA_EXT_DATA(zihpm, RISCV_ISA_EXT_ZIHPM), 175 __RISCV_ISA_EXT_DATA(zba, RISCV_ISA_EXT_ZBA), 176 __RISCV_ISA_EXT_DATA(zbb, RISCV_ISA_EXT_ZBB), 177 __RISCV_ISA_EXT_DATA(zbs, RISCV_ISA_EXT_ZBS), 178 __RISCV_ISA_EXT_DATA(smaia, RISCV_ISA_EXT_SMAIA), 179 __RISCV_ISA_EXT_DATA(ssaia, RISCV_ISA_EXT_SSAIA), 180 __RISCV_ISA_EXT_DATA(sscofpmf, RISCV_ISA_EXT_SSCOFPMF), 181 __RISCV_ISA_EXT_DATA(sstc, RISCV_ISA_EXT_SSTC), 182 __RISCV_ISA_EXT_DATA(svinval, RISCV_ISA_EXT_SVINVAL), 183 __RISCV_ISA_EXT_DATA(svnapot, RISCV_ISA_EXT_SVNAPOT), 184 __RISCV_ISA_EXT_DATA(svpbmt, RISCV_ISA_EXT_SVPBMT), 185 }; 186 187 const size_t riscv_isa_ext_count = ARRAY_SIZE(riscv_isa_ext); 188 189 static void __init riscv_parse_isa_string(unsigned long *this_hwcap, struct riscv_isainfo *isainfo, 190 unsigned long *isa2hwcap, const char *isa) 191 { 192 /* 193 * For all possible cpus, we have already validated in 194 * the boot process that they at least contain "rv" and 195 * whichever of "32"/"64" this kernel supports, and so this 196 * section can be skipped. 197 */ 198 isa += 4; 199 200 while (*isa) { 201 const char *ext = isa++; 202 const char *ext_end = isa; 203 bool ext_long = false, ext_err = false; 204 205 switch (*ext) { 206 case 's': 207 /* 208 * Workaround for invalid single-letter 's' & 'u'(QEMU). 209 * No need to set the bit in riscv_isa as 's' & 'u' are 210 * not valid ISA extensions. It works until multi-letter 211 * extension starting with "Su" appears. 212 */ 213 if (ext[-1] != '_' && ext[1] == 'u') { 214 ++isa; 215 ext_err = true; 216 break; 217 } 218 fallthrough; 219 case 'S': 220 case 'x': 221 case 'X': 222 case 'z': 223 case 'Z': 224 /* 225 * Before attempting to parse the extension itself, we find its end. 226 * As multi-letter extensions must be split from other multi-letter 227 * extensions with an "_", the end of a multi-letter extension will 228 * either be the null character or the "_" at the start of the next 229 * multi-letter extension. 230 * 231 * Next, as the extensions version is currently ignored, we 232 * eliminate that portion. This is done by parsing backwards from 233 * the end of the extension, removing any numbers. This may be a 234 * major or minor number however, so the process is repeated if a 235 * minor number was found. 236 * 237 * ext_end is intended to represent the first character *after* the 238 * name portion of an extension, but will be decremented to the last 239 * character itself while eliminating the extensions version number. 240 * A simple re-increment solves this problem. 241 */ 242 ext_long = true; 243 for (; *isa && *isa != '_'; ++isa) 244 if (unlikely(!isalnum(*isa))) 245 ext_err = true; 246 247 ext_end = isa; 248 if (unlikely(ext_err)) 249 break; 250 251 if (!isdigit(ext_end[-1])) 252 break; 253 254 while (isdigit(*--ext_end)) 255 ; 256 257 if (tolower(ext_end[0]) != 'p' || !isdigit(ext_end[-1])) { 258 ++ext_end; 259 break; 260 } 261 262 while (isdigit(*--ext_end)) 263 ; 264 265 ++ext_end; 266 break; 267 default: 268 /* 269 * Things are a little easier for single-letter extensions, as they 270 * are parsed forwards. 271 * 272 * After checking that our starting position is valid, we need to 273 * ensure that, when isa was incremented at the start of the loop, 274 * that it arrived at the start of the next extension. 275 * 276 * If we are already on a non-digit, there is nothing to do. Either 277 * we have a multi-letter extension's _, or the start of an 278 * extension. 279 * 280 * Otherwise we have found the current extension's major version 281 * number. Parse past it, and a subsequent p/minor version number 282 * if present. The `p` extension must not appear immediately after 283 * a number, so there is no fear of missing it. 284 * 285 */ 286 if (unlikely(!isalpha(*ext))) { 287 ext_err = true; 288 break; 289 } 290 291 if (!isdigit(*isa)) 292 break; 293 294 while (isdigit(*++isa)) 295 ; 296 297 if (tolower(*isa) != 'p') 298 break; 299 300 if (!isdigit(*++isa)) { 301 --isa; 302 break; 303 } 304 305 while (isdigit(*++isa)) 306 ; 307 308 break; 309 } 310 311 /* 312 * The parser expects that at the start of an iteration isa points to the 313 * first character of the next extension. As we stop parsing an extension 314 * on meeting a non-alphanumeric character, an extra increment is needed 315 * where the succeeding extension is a multi-letter prefixed with an "_". 316 */ 317 if (*isa == '_') 318 ++isa; 319 320 #define SET_ISA_EXT_MAP(name, bit) \ 321 do { \ 322 if ((ext_end - ext == strlen(name)) && \ 323 !strncasecmp(ext, name, strlen(name)) && \ 324 riscv_isa_extension_check(bit)) \ 325 set_bit(bit, isainfo->isa); \ 326 } while (false) \ 327 328 if (unlikely(ext_err)) 329 continue; 330 if (!ext_long) { 331 int nr = tolower(*ext) - 'a'; 332 333 if (riscv_isa_extension_check(nr)) { 334 *this_hwcap |= isa2hwcap[nr]; 335 set_bit(nr, isainfo->isa); 336 } 337 } else { 338 for (int i = 0; i < riscv_isa_ext_count; i++) 339 SET_ISA_EXT_MAP(riscv_isa_ext[i].name, 340 riscv_isa_ext[i].id); 341 } 342 #undef SET_ISA_EXT_MAP 343 } 344 } 345 346 static void __init riscv_fill_hwcap_from_isa_string(unsigned long *isa2hwcap) 347 { 348 struct device_node *node; 349 const char *isa; 350 int rc; 351 struct acpi_table_header *rhct; 352 acpi_status status; 353 unsigned int cpu; 354 355 if (!acpi_disabled) { 356 status = acpi_get_table(ACPI_SIG_RHCT, 0, &rhct); 357 if (ACPI_FAILURE(status)) 358 return; 359 } 360 361 for_each_possible_cpu(cpu) { 362 struct riscv_isainfo *isainfo = &hart_isa[cpu]; 363 unsigned long this_hwcap = 0; 364 365 if (acpi_disabled) { 366 node = of_cpu_device_node_get(cpu); 367 if (!node) { 368 pr_warn("Unable to find cpu node\n"); 369 continue; 370 } 371 372 rc = of_property_read_string(node, "riscv,isa", &isa); 373 of_node_put(node); 374 if (rc) { 375 pr_warn("Unable to find \"riscv,isa\" devicetree entry\n"); 376 continue; 377 } 378 } else { 379 rc = acpi_get_riscv_isa(rhct, cpu, &isa); 380 if (rc < 0) { 381 pr_warn("Unable to get ISA for the hart - %d\n", cpu); 382 continue; 383 } 384 } 385 386 riscv_parse_isa_string(&this_hwcap, isainfo, isa2hwcap, isa); 387 388 /* 389 * These ones were as they were part of the base ISA when the 390 * port & dt-bindings were upstreamed, and so can be set 391 * unconditionally where `i` is in riscv,isa on DT systems. 392 */ 393 if (acpi_disabled) { 394 set_bit(RISCV_ISA_EXT_ZICSR, isainfo->isa); 395 set_bit(RISCV_ISA_EXT_ZIFENCEI, isainfo->isa); 396 set_bit(RISCV_ISA_EXT_ZICNTR, isainfo->isa); 397 set_bit(RISCV_ISA_EXT_ZIHPM, isainfo->isa); 398 } 399 400 /* 401 * "V" in ISA strings is ambiguous in practice: it should mean 402 * just the standard V-1.0 but vendors aren't well behaved. 403 * Many vendors with T-Head CPU cores which implement the 0.7.1 404 * version of the vector specification put "v" into their DTs. 405 * CPU cores with the ratified spec will contain non-zero 406 * marchid. 407 */ 408 if (acpi_disabled && riscv_cached_mvendorid(cpu) == THEAD_VENDOR_ID && 409 riscv_cached_marchid(cpu) == 0x0) { 410 this_hwcap &= ~isa2hwcap[RISCV_ISA_EXT_v]; 411 clear_bit(RISCV_ISA_EXT_v, isainfo->isa); 412 } 413 414 /* 415 * All "okay" hart should have same isa. Set HWCAP based on 416 * common capabilities of every "okay" hart, in case they don't 417 * have. 418 */ 419 if (elf_hwcap) 420 elf_hwcap &= this_hwcap; 421 else 422 elf_hwcap = this_hwcap; 423 424 if (bitmap_empty(riscv_isa, RISCV_ISA_EXT_MAX)) 425 bitmap_copy(riscv_isa, isainfo->isa, RISCV_ISA_EXT_MAX); 426 else 427 bitmap_and(riscv_isa, riscv_isa, isainfo->isa, RISCV_ISA_EXT_MAX); 428 } 429 430 if (!acpi_disabled && rhct) 431 acpi_put_table((struct acpi_table_header *)rhct); 432 } 433 434 static int __init riscv_fill_hwcap_from_ext_list(unsigned long *isa2hwcap) 435 { 436 unsigned int cpu; 437 438 for_each_possible_cpu(cpu) { 439 unsigned long this_hwcap = 0; 440 struct device_node *cpu_node; 441 struct riscv_isainfo *isainfo = &hart_isa[cpu]; 442 443 cpu_node = of_cpu_device_node_get(cpu); 444 if (!cpu_node) { 445 pr_warn("Unable to find cpu node\n"); 446 continue; 447 } 448 449 if (!of_property_present(cpu_node, "riscv,isa-extensions")) { 450 of_node_put(cpu_node); 451 continue; 452 } 453 454 for (int i = 0; i < riscv_isa_ext_count; i++) { 455 if (of_property_match_string(cpu_node, "riscv,isa-extensions", 456 riscv_isa_ext[i].property) < 0) 457 continue; 458 459 if (!riscv_isa_extension_check(riscv_isa_ext[i].id)) 460 continue; 461 462 /* Only single letter extensions get set in hwcap */ 463 if (strnlen(riscv_isa_ext[i].name, 2) == 1) 464 this_hwcap |= isa2hwcap[riscv_isa_ext[i].id]; 465 466 set_bit(riscv_isa_ext[i].id, isainfo->isa); 467 } 468 469 of_node_put(cpu_node); 470 471 /* 472 * All "okay" harts should have same isa. Set HWCAP based on 473 * common capabilities of every "okay" hart, in case they don't. 474 */ 475 if (elf_hwcap) 476 elf_hwcap &= this_hwcap; 477 else 478 elf_hwcap = this_hwcap; 479 480 if (bitmap_empty(riscv_isa, RISCV_ISA_EXT_MAX)) 481 bitmap_copy(riscv_isa, isainfo->isa, RISCV_ISA_EXT_MAX); 482 else 483 bitmap_and(riscv_isa, riscv_isa, isainfo->isa, RISCV_ISA_EXT_MAX); 484 } 485 486 if (bitmap_empty(riscv_isa, RISCV_ISA_EXT_MAX)) 487 return -ENOENT; 488 489 return 0; 490 } 491 492 #ifdef CONFIG_RISCV_ISA_FALLBACK 493 bool __initdata riscv_isa_fallback = true; 494 #else 495 bool __initdata riscv_isa_fallback; 496 static int __init riscv_isa_fallback_setup(char *__unused) 497 { 498 riscv_isa_fallback = true; 499 return 1; 500 } 501 early_param("riscv_isa_fallback", riscv_isa_fallback_setup); 502 #endif 503 504 void __init riscv_fill_hwcap(void) 505 { 506 char print_str[NUM_ALPHA_EXTS + 1]; 507 unsigned long isa2hwcap[26] = {0}; 508 int i, j; 509 510 isa2hwcap['i' - 'a'] = COMPAT_HWCAP_ISA_I; 511 isa2hwcap['m' - 'a'] = COMPAT_HWCAP_ISA_M; 512 isa2hwcap['a' - 'a'] = COMPAT_HWCAP_ISA_A; 513 isa2hwcap['f' - 'a'] = COMPAT_HWCAP_ISA_F; 514 isa2hwcap['d' - 'a'] = COMPAT_HWCAP_ISA_D; 515 isa2hwcap['c' - 'a'] = COMPAT_HWCAP_ISA_C; 516 isa2hwcap['v' - 'a'] = COMPAT_HWCAP_ISA_V; 517 518 if (!acpi_disabled) { 519 riscv_fill_hwcap_from_isa_string(isa2hwcap); 520 } else { 521 int ret = riscv_fill_hwcap_from_ext_list(isa2hwcap); 522 523 if (ret && riscv_isa_fallback) { 524 pr_info("Falling back to deprecated \"riscv,isa\"\n"); 525 riscv_fill_hwcap_from_isa_string(isa2hwcap); 526 } 527 } 528 529 /* 530 * We don't support systems with F but without D, so mask those out 531 * here. 532 */ 533 if ((elf_hwcap & COMPAT_HWCAP_ISA_F) && !(elf_hwcap & COMPAT_HWCAP_ISA_D)) { 534 pr_info("This kernel does not support systems with F but not D\n"); 535 elf_hwcap &= ~COMPAT_HWCAP_ISA_F; 536 } 537 538 if (elf_hwcap & COMPAT_HWCAP_ISA_V) { 539 riscv_v_setup_vsize(); 540 /* 541 * ISA string in device tree might have 'v' flag, but 542 * CONFIG_RISCV_ISA_V is disabled in kernel. 543 * Clear V flag in elf_hwcap if CONFIG_RISCV_ISA_V is disabled. 544 */ 545 if (!IS_ENABLED(CONFIG_RISCV_ISA_V)) 546 elf_hwcap &= ~COMPAT_HWCAP_ISA_V; 547 } 548 549 memset(print_str, 0, sizeof(print_str)); 550 for (i = 0, j = 0; i < NUM_ALPHA_EXTS; i++) 551 if (riscv_isa[0] & BIT_MASK(i)) 552 print_str[j++] = (char)('a' + i); 553 pr_info("riscv: base ISA extensions %s\n", print_str); 554 555 memset(print_str, 0, sizeof(print_str)); 556 for (i = 0, j = 0; i < NUM_ALPHA_EXTS; i++) 557 if (elf_hwcap & BIT_MASK(i)) 558 print_str[j++] = (char)('a' + i); 559 pr_info("riscv: ELF capabilities %s\n", print_str); 560 } 561 562 unsigned long riscv_get_elf_hwcap(void) 563 { 564 unsigned long hwcap; 565 566 hwcap = (elf_hwcap & ((1UL << RISCV_ISA_EXT_BASE) - 1)); 567 568 if (!riscv_v_vstate_ctrl_user_allowed()) 569 hwcap &= ~COMPAT_HWCAP_ISA_V; 570 571 return hwcap; 572 } 573 574 void check_unaligned_access(int cpu) 575 { 576 u64 start_cycles, end_cycles; 577 u64 word_cycles; 578 u64 byte_cycles; 579 int ratio; 580 unsigned long start_jiffies, now; 581 struct page *page; 582 void *dst; 583 void *src; 584 long speed = RISCV_HWPROBE_MISALIGNED_SLOW; 585 586 /* We are already set since the last check */ 587 if (per_cpu(misaligned_access_speed, cpu) != RISCV_HWPROBE_MISALIGNED_UNKNOWN) 588 return; 589 590 page = alloc_pages(GFP_NOWAIT, get_order(MISALIGNED_BUFFER_SIZE)); 591 if (!page) { 592 pr_warn("Can't alloc pages to measure memcpy performance"); 593 return; 594 } 595 596 /* Make an unaligned destination buffer. */ 597 dst = (void *)((unsigned long)page_address(page) | 0x1); 598 /* Unalign src as well, but differently (off by 1 + 2 = 3). */ 599 src = dst + (MISALIGNED_BUFFER_SIZE / 2); 600 src += 2; 601 word_cycles = -1ULL; 602 /* Do a warmup. */ 603 __riscv_copy_words_unaligned(dst, src, MISALIGNED_COPY_SIZE); 604 preempt_disable(); 605 start_jiffies = jiffies; 606 while ((now = jiffies) == start_jiffies) 607 cpu_relax(); 608 609 /* 610 * For a fixed amount of time, repeatedly try the function, and take 611 * the best time in cycles as the measurement. 612 */ 613 while (time_before(jiffies, now + (1 << MISALIGNED_ACCESS_JIFFIES_LG2))) { 614 start_cycles = get_cycles64(); 615 /* Ensure the CSR read can't reorder WRT to the copy. */ 616 mb(); 617 __riscv_copy_words_unaligned(dst, src, MISALIGNED_COPY_SIZE); 618 /* Ensure the copy ends before the end time is snapped. */ 619 mb(); 620 end_cycles = get_cycles64(); 621 if ((end_cycles - start_cycles) < word_cycles) 622 word_cycles = end_cycles - start_cycles; 623 } 624 625 byte_cycles = -1ULL; 626 __riscv_copy_bytes_unaligned(dst, src, MISALIGNED_COPY_SIZE); 627 start_jiffies = jiffies; 628 while ((now = jiffies) == start_jiffies) 629 cpu_relax(); 630 631 while (time_before(jiffies, now + (1 << MISALIGNED_ACCESS_JIFFIES_LG2))) { 632 start_cycles = get_cycles64(); 633 mb(); 634 __riscv_copy_bytes_unaligned(dst, src, MISALIGNED_COPY_SIZE); 635 mb(); 636 end_cycles = get_cycles64(); 637 if ((end_cycles - start_cycles) < byte_cycles) 638 byte_cycles = end_cycles - start_cycles; 639 } 640 641 preempt_enable(); 642 643 /* Don't divide by zero. */ 644 if (!word_cycles || !byte_cycles) { 645 pr_warn("cpu%d: rdtime lacks granularity needed to measure unaligned access speed\n", 646 cpu); 647 648 goto out; 649 } 650 651 if (word_cycles < byte_cycles) 652 speed = RISCV_HWPROBE_MISALIGNED_FAST; 653 654 ratio = div_u64((byte_cycles * 100), word_cycles); 655 pr_info("cpu%d: Ratio of byte access time to unaligned word access is %d.%02d, unaligned accesses are %s\n", 656 cpu, 657 ratio / 100, 658 ratio % 100, 659 (speed == RISCV_HWPROBE_MISALIGNED_FAST) ? "fast" : "slow"); 660 661 per_cpu(misaligned_access_speed, cpu) = speed; 662 663 out: 664 __free_pages(page, get_order(MISALIGNED_BUFFER_SIZE)); 665 } 666 667 static int check_unaligned_access_boot_cpu(void) 668 { 669 check_unaligned_access(0); 670 return 0; 671 } 672 673 arch_initcall(check_unaligned_access_boot_cpu); 674 675 #ifdef CONFIG_RISCV_ALTERNATIVE 676 /* 677 * Alternative patch sites consider 48 bits when determining when to patch 678 * the old instruction sequence with the new. These bits are broken into a 679 * 16-bit vendor ID and a 32-bit patch ID. A non-zero vendor ID means the 680 * patch site is for an erratum, identified by the 32-bit patch ID. When 681 * the vendor ID is zero, the patch site is for a cpufeature. cpufeatures 682 * further break down patch ID into two 16-bit numbers. The lower 16 bits 683 * are the cpufeature ID and the upper 16 bits are used for a value specific 684 * to the cpufeature and patch site. If the upper 16 bits are zero, then it 685 * implies no specific value is specified. cpufeatures that want to control 686 * patching on a per-site basis will provide non-zero values and implement 687 * checks here. The checks return true when patching should be done, and 688 * false otherwise. 689 */ 690 static bool riscv_cpufeature_patch_check(u16 id, u16 value) 691 { 692 if (!value) 693 return true; 694 695 switch (id) { 696 case RISCV_ISA_EXT_ZICBOZ: 697 /* 698 * Zicboz alternative applications provide the maximum 699 * supported block size order, or zero when it doesn't 700 * matter. If the current block size exceeds the maximum, 701 * then the alternative cannot be applied. 702 */ 703 return riscv_cboz_block_size <= (1U << value); 704 } 705 706 return false; 707 } 708 709 void __init_or_module riscv_cpufeature_patch_func(struct alt_entry *begin, 710 struct alt_entry *end, 711 unsigned int stage) 712 { 713 struct alt_entry *alt; 714 void *oldptr, *altptr; 715 u16 id, value; 716 717 if (stage == RISCV_ALTERNATIVES_EARLY_BOOT) 718 return; 719 720 for (alt = begin; alt < end; alt++) { 721 if (alt->vendor_id != 0) 722 continue; 723 724 id = PATCH_ID_CPUFEATURE_ID(alt->patch_id); 725 726 if (id >= RISCV_ISA_EXT_MAX) { 727 WARN(1, "This extension id:%d is not in ISA extension list", id); 728 continue; 729 } 730 731 if (!__riscv_isa_extension_available(NULL, id)) 732 continue; 733 734 value = PATCH_ID_CPUFEATURE_VALUE(alt->patch_id); 735 if (!riscv_cpufeature_patch_check(id, value)) 736 continue; 737 738 oldptr = ALT_OLD_PTR(alt); 739 altptr = ALT_ALT_PTR(alt); 740 741 mutex_lock(&text_mutex); 742 patch_text_nosync(oldptr, altptr, alt->alt_len); 743 riscv_alternative_fix_offsets(oldptr, alt->alt_len, oldptr - altptr); 744 mutex_unlock(&text_mutex); 745 } 746 } 747 #endif 748