1*20c8ccb1SThomas Gleixner // SPDX-License-Identifier: GPL-2.0-only 2ff53604bSXiao Guangrong /* 3ff53604bSXiao Guangrong * vMTRR implementation 4ff53604bSXiao Guangrong * 5ff53604bSXiao Guangrong * Copyright (C) 2006 Qumranet, Inc. 6ff53604bSXiao Guangrong * Copyright 2010 Red Hat, Inc. and/or its affiliates. 7ff53604bSXiao Guangrong * Copyright(C) 2015 Intel Corporation. 8ff53604bSXiao Guangrong * 9ff53604bSXiao Guangrong * Authors: 10ff53604bSXiao Guangrong * Yaniv Kamay <yaniv@qumranet.com> 11ff53604bSXiao Guangrong * Avi Kivity <avi@qumranet.com> 12ff53604bSXiao Guangrong * Marcelo Tosatti <mtosatti@redhat.com> 13ff53604bSXiao Guangrong * Paolo Bonzini <pbonzini@redhat.com> 14ff53604bSXiao Guangrong * Xiao Guangrong <guangrong.xiao@linux.intel.com> 15ff53604bSXiao Guangrong */ 16ff53604bSXiao Guangrong 17ff53604bSXiao Guangrong #include <linux/kvm_host.h> 18ff53604bSXiao Guangrong #include <asm/mtrr.h> 19ff53604bSXiao Guangrong 20ff53604bSXiao Guangrong #include "cpuid.h" 21ff53604bSXiao Guangrong #include "mmu.h" 22ff53604bSXiao Guangrong 2310fac2dcSXiao Guangrong #define IA32_MTRR_DEF_TYPE_E (1ULL << 11) 2410fac2dcSXiao Guangrong #define IA32_MTRR_DEF_TYPE_FE (1ULL << 10) 2510fac2dcSXiao Guangrong #define IA32_MTRR_DEF_TYPE_TYPE_MASK (0xff) 2610fac2dcSXiao Guangrong 27ff53604bSXiao Guangrong static bool msr_mtrr_valid(unsigned msr) 28ff53604bSXiao Guangrong { 29ff53604bSXiao Guangrong switch (msr) { 30ff53604bSXiao Guangrong case 0x200 ... 0x200 + 2 * KVM_NR_VAR_MTRR - 1: 31ff53604bSXiao Guangrong case MSR_MTRRfix64K_00000: 32ff53604bSXiao Guangrong case MSR_MTRRfix16K_80000: 33ff53604bSXiao Guangrong case MSR_MTRRfix16K_A0000: 34ff53604bSXiao Guangrong case MSR_MTRRfix4K_C0000: 35ff53604bSXiao Guangrong case MSR_MTRRfix4K_C8000: 36ff53604bSXiao Guangrong case MSR_MTRRfix4K_D0000: 37ff53604bSXiao Guangrong case MSR_MTRRfix4K_D8000: 38ff53604bSXiao Guangrong case MSR_MTRRfix4K_E0000: 39ff53604bSXiao Guangrong case MSR_MTRRfix4K_E8000: 40ff53604bSXiao Guangrong case MSR_MTRRfix4K_F0000: 41ff53604bSXiao Guangrong case MSR_MTRRfix4K_F8000: 42ff53604bSXiao Guangrong case MSR_MTRRdefType: 43ff53604bSXiao Guangrong case MSR_IA32_CR_PAT: 44ff53604bSXiao Guangrong return true; 45ff53604bSXiao Guangrong } 46ff53604bSXiao Guangrong return false; 47ff53604bSXiao Guangrong } 48ff53604bSXiao Guangrong 49ff53604bSXiao Guangrong static bool valid_mtrr_type(unsigned t) 50ff53604bSXiao Guangrong { 51ff53604bSXiao Guangrong return t < 8 && (1 << t) & 0x73; /* 0, 1, 4, 5, 6 */ 52ff53604bSXiao Guangrong } 53ff53604bSXiao Guangrong 54ff53604bSXiao Guangrong bool kvm_mtrr_valid(struct kvm_vcpu *vcpu, u32 msr, u64 data) 55ff53604bSXiao Guangrong { 56ff53604bSXiao Guangrong int i; 57ff53604bSXiao Guangrong u64 mask; 58ff53604bSXiao Guangrong 59ff53604bSXiao Guangrong if (!msr_mtrr_valid(msr)) 60ff53604bSXiao Guangrong return false; 61ff53604bSXiao Guangrong 62ff53604bSXiao Guangrong if (msr == MSR_IA32_CR_PAT) { 63674ea351SPaolo Bonzini return kvm_pat_valid(data); 64ff53604bSXiao Guangrong } else if (msr == MSR_MTRRdefType) { 65ff53604bSXiao Guangrong if (data & ~0xcff) 66ff53604bSXiao Guangrong return false; 67ff53604bSXiao Guangrong return valid_mtrr_type(data & 0xff); 68ff53604bSXiao Guangrong } else if (msr >= MSR_MTRRfix64K_00000 && msr <= MSR_MTRRfix4K_F8000) { 69ff53604bSXiao Guangrong for (i = 0; i < 8 ; i++) 70ff53604bSXiao Guangrong if (!valid_mtrr_type((data >> (i * 8)) & 0xff)) 71ff53604bSXiao Guangrong return false; 72ff53604bSXiao Guangrong return true; 73ff53604bSXiao Guangrong } 74ff53604bSXiao Guangrong 75ff53604bSXiao Guangrong /* variable MTRRs */ 76ff53604bSXiao Guangrong WARN_ON(!(msr >= 0x200 && msr < 0x200 + 2 * KVM_NR_VAR_MTRR)); 77ff53604bSXiao Guangrong 78ff53604bSXiao Guangrong mask = (~0ULL) << cpuid_maxphyaddr(vcpu); 79ff53604bSXiao Guangrong if ((msr & 1) == 0) { 80ff53604bSXiao Guangrong /* MTRR base */ 81ff53604bSXiao Guangrong if (!valid_mtrr_type(data & 0xff)) 82ff53604bSXiao Guangrong return false; 83ff53604bSXiao Guangrong mask |= 0xf00; 84ff53604bSXiao Guangrong } else 85ff53604bSXiao Guangrong /* MTRR mask */ 86ff53604bSXiao Guangrong mask |= 0x7ff; 87ff53604bSXiao Guangrong if (data & mask) { 88ff53604bSXiao Guangrong kvm_inject_gp(vcpu, 0); 89ff53604bSXiao Guangrong return false; 90ff53604bSXiao Guangrong } 91ff53604bSXiao Guangrong 92ff53604bSXiao Guangrong return true; 93ff53604bSXiao Guangrong } 94ff53604bSXiao Guangrong EXPORT_SYMBOL_GPL(kvm_mtrr_valid); 95ff53604bSXiao Guangrong 9610fac2dcSXiao Guangrong static bool mtrr_is_enabled(struct kvm_mtrr *mtrr_state) 9710fac2dcSXiao Guangrong { 9810fac2dcSXiao Guangrong return !!(mtrr_state->deftype & IA32_MTRR_DEF_TYPE_E); 9910fac2dcSXiao Guangrong } 10010fac2dcSXiao Guangrong 10110fac2dcSXiao Guangrong static bool fixed_mtrr_is_enabled(struct kvm_mtrr *mtrr_state) 10210fac2dcSXiao Guangrong { 10310fac2dcSXiao Guangrong return !!(mtrr_state->deftype & IA32_MTRR_DEF_TYPE_FE); 10410fac2dcSXiao Guangrong } 10510fac2dcSXiao Guangrong 10610fac2dcSXiao Guangrong static u8 mtrr_default_type(struct kvm_mtrr *mtrr_state) 10710fac2dcSXiao Guangrong { 10810fac2dcSXiao Guangrong return mtrr_state->deftype & IA32_MTRR_DEF_TYPE_TYPE_MASK; 10910fac2dcSXiao Guangrong } 11010fac2dcSXiao Guangrong 111e24dea2aSPaolo Bonzini static u8 mtrr_disabled_type(struct kvm_vcpu *vcpu) 11210dc331fSXiao Guangrong { 11310dc331fSXiao Guangrong /* 11410dc331fSXiao Guangrong * Intel SDM 11.11.2.2: all MTRRs are disabled when 11510dc331fSXiao Guangrong * IA32_MTRR_DEF_TYPE.E bit is cleared, and the UC 11610dc331fSXiao Guangrong * memory type is applied to all of physical memory. 117e24dea2aSPaolo Bonzini * 118e24dea2aSPaolo Bonzini * However, virtual machines can be run with CPUID such that 119e24dea2aSPaolo Bonzini * there are no MTRRs. In that case, the firmware will never 120e24dea2aSPaolo Bonzini * enable MTRRs and it is obviously undesirable to run the 121e24dea2aSPaolo Bonzini * guest entirely with UC memory and we use WB. 12210dc331fSXiao Guangrong */ 123d6321d49SRadim Krčmář if (guest_cpuid_has(vcpu, X86_FEATURE_MTRR)) 12410dc331fSXiao Guangrong return MTRR_TYPE_UNCACHABLE; 125e24dea2aSPaolo Bonzini else 126e24dea2aSPaolo Bonzini return MTRR_TYPE_WRBACK; 12710dc331fSXiao Guangrong } 12810dc331fSXiao Guangrong 129de9aef5eSXiao Guangrong /* 130de9aef5eSXiao Guangrong * Three terms are used in the following code: 131de9aef5eSXiao Guangrong * - segment, it indicates the address segments covered by fixed MTRRs. 132de9aef5eSXiao Guangrong * - unit, it corresponds to the MSR entry in the segment. 133de9aef5eSXiao Guangrong * - range, a range is covered in one memory cache type. 134de9aef5eSXiao Guangrong */ 135de9aef5eSXiao Guangrong struct fixed_mtrr_segment { 136de9aef5eSXiao Guangrong u64 start; 137de9aef5eSXiao Guangrong u64 end; 138de9aef5eSXiao Guangrong 139de9aef5eSXiao Guangrong int range_shift; 140de9aef5eSXiao Guangrong 141de9aef5eSXiao Guangrong /* the start position in kvm_mtrr.fixed_ranges[]. */ 142de9aef5eSXiao Guangrong int range_start; 143de9aef5eSXiao Guangrong }; 144de9aef5eSXiao Guangrong 145de9aef5eSXiao Guangrong static struct fixed_mtrr_segment fixed_seg_table[] = { 146de9aef5eSXiao Guangrong /* MSR_MTRRfix64K_00000, 1 unit. 64K fixed mtrr. */ 147de9aef5eSXiao Guangrong { 148de9aef5eSXiao Guangrong .start = 0x0, 149de9aef5eSXiao Guangrong .end = 0x80000, 150de9aef5eSXiao Guangrong .range_shift = 16, /* 64K */ 151de9aef5eSXiao Guangrong .range_start = 0, 152de9aef5eSXiao Guangrong }, 153de9aef5eSXiao Guangrong 154de9aef5eSXiao Guangrong /* 155de9aef5eSXiao Guangrong * MSR_MTRRfix16K_80000 ... MSR_MTRRfix16K_A0000, 2 units, 156de9aef5eSXiao Guangrong * 16K fixed mtrr. 157de9aef5eSXiao Guangrong */ 158de9aef5eSXiao Guangrong { 159de9aef5eSXiao Guangrong .start = 0x80000, 160de9aef5eSXiao Guangrong .end = 0xc0000, 161de9aef5eSXiao Guangrong .range_shift = 14, /* 16K */ 162de9aef5eSXiao Guangrong .range_start = 8, 163de9aef5eSXiao Guangrong }, 164de9aef5eSXiao Guangrong 165de9aef5eSXiao Guangrong /* 166de9aef5eSXiao Guangrong * MSR_MTRRfix4K_C0000 ... MSR_MTRRfix4K_F8000, 8 units, 167de9aef5eSXiao Guangrong * 4K fixed mtrr. 168de9aef5eSXiao Guangrong */ 169de9aef5eSXiao Guangrong { 170de9aef5eSXiao Guangrong .start = 0xc0000, 171de9aef5eSXiao Guangrong .end = 0x100000, 172de9aef5eSXiao Guangrong .range_shift = 12, /* 12K */ 173de9aef5eSXiao Guangrong .range_start = 24, 174de9aef5eSXiao Guangrong } 175de9aef5eSXiao Guangrong }; 176de9aef5eSXiao Guangrong 177de9aef5eSXiao Guangrong /* 178de9aef5eSXiao Guangrong * The size of unit is covered in one MSR, one MSR entry contains 179de9aef5eSXiao Guangrong * 8 ranges so that unit size is always 8 * 2^range_shift. 180de9aef5eSXiao Guangrong */ 181de9aef5eSXiao Guangrong static u64 fixed_mtrr_seg_unit_size(int seg) 182de9aef5eSXiao Guangrong { 183de9aef5eSXiao Guangrong return 8 << fixed_seg_table[seg].range_shift; 184de9aef5eSXiao Guangrong } 185de9aef5eSXiao Guangrong 186de9aef5eSXiao Guangrong static bool fixed_msr_to_seg_unit(u32 msr, int *seg, int *unit) 187de9aef5eSXiao Guangrong { 188de9aef5eSXiao Guangrong switch (msr) { 189de9aef5eSXiao Guangrong case MSR_MTRRfix64K_00000: 190de9aef5eSXiao Guangrong *seg = 0; 191de9aef5eSXiao Guangrong *unit = 0; 192de9aef5eSXiao Guangrong break; 193de9aef5eSXiao Guangrong case MSR_MTRRfix16K_80000 ... MSR_MTRRfix16K_A0000: 194de9aef5eSXiao Guangrong *seg = 1; 195de9aef5eSXiao Guangrong *unit = msr - MSR_MTRRfix16K_80000; 196de9aef5eSXiao Guangrong break; 197de9aef5eSXiao Guangrong case MSR_MTRRfix4K_C0000 ... MSR_MTRRfix4K_F8000: 198de9aef5eSXiao Guangrong *seg = 2; 199de9aef5eSXiao Guangrong *unit = msr - MSR_MTRRfix4K_C0000; 200de9aef5eSXiao Guangrong break; 201de9aef5eSXiao Guangrong default: 202de9aef5eSXiao Guangrong return false; 203de9aef5eSXiao Guangrong } 204de9aef5eSXiao Guangrong 205de9aef5eSXiao Guangrong return true; 206de9aef5eSXiao Guangrong } 207de9aef5eSXiao Guangrong 208de9aef5eSXiao Guangrong static void fixed_mtrr_seg_unit_range(int seg, int unit, u64 *start, u64 *end) 209de9aef5eSXiao Guangrong { 210de9aef5eSXiao Guangrong struct fixed_mtrr_segment *mtrr_seg = &fixed_seg_table[seg]; 211de9aef5eSXiao Guangrong u64 unit_size = fixed_mtrr_seg_unit_size(seg); 212de9aef5eSXiao Guangrong 213de9aef5eSXiao Guangrong *start = mtrr_seg->start + unit * unit_size; 214de9aef5eSXiao Guangrong *end = *start + unit_size; 215de9aef5eSXiao Guangrong WARN_ON(*end > mtrr_seg->end); 216de9aef5eSXiao Guangrong } 217de9aef5eSXiao Guangrong 218de9aef5eSXiao Guangrong static int fixed_mtrr_seg_unit_range_index(int seg, int unit) 219de9aef5eSXiao Guangrong { 220de9aef5eSXiao Guangrong struct fixed_mtrr_segment *mtrr_seg = &fixed_seg_table[seg]; 221de9aef5eSXiao Guangrong 222de9aef5eSXiao Guangrong WARN_ON(mtrr_seg->start + unit * fixed_mtrr_seg_unit_size(seg) 223de9aef5eSXiao Guangrong > mtrr_seg->end); 224de9aef5eSXiao Guangrong 225de9aef5eSXiao Guangrong /* each unit has 8 ranges. */ 226de9aef5eSXiao Guangrong return mtrr_seg->range_start + 8 * unit; 227de9aef5eSXiao Guangrong } 228de9aef5eSXiao Guangrong 229f571c097SXiao Guangrong static int fixed_mtrr_seg_end_range_index(int seg) 230f571c097SXiao Guangrong { 231f571c097SXiao Guangrong struct fixed_mtrr_segment *mtrr_seg = &fixed_seg_table[seg]; 232f571c097SXiao Guangrong int n; 233f571c097SXiao Guangrong 234f571c097SXiao Guangrong n = (mtrr_seg->end - mtrr_seg->start) >> mtrr_seg->range_shift; 235f571c097SXiao Guangrong return mtrr_seg->range_start + n - 1; 236f571c097SXiao Guangrong } 237f571c097SXiao Guangrong 238de9aef5eSXiao Guangrong static bool fixed_msr_to_range(u32 msr, u64 *start, u64 *end) 239de9aef5eSXiao Guangrong { 240de9aef5eSXiao Guangrong int seg, unit; 241de9aef5eSXiao Guangrong 242de9aef5eSXiao Guangrong if (!fixed_msr_to_seg_unit(msr, &seg, &unit)) 243de9aef5eSXiao Guangrong return false; 244de9aef5eSXiao Guangrong 245de9aef5eSXiao Guangrong fixed_mtrr_seg_unit_range(seg, unit, start, end); 246de9aef5eSXiao Guangrong return true; 247de9aef5eSXiao Guangrong } 248de9aef5eSXiao Guangrong 249de9aef5eSXiao Guangrong static int fixed_msr_to_range_index(u32 msr) 250de9aef5eSXiao Guangrong { 251de9aef5eSXiao Guangrong int seg, unit; 252de9aef5eSXiao Guangrong 253de9aef5eSXiao Guangrong if (!fixed_msr_to_seg_unit(msr, &seg, &unit)) 254de9aef5eSXiao Guangrong return -1; 255de9aef5eSXiao Guangrong 256de9aef5eSXiao Guangrong return fixed_mtrr_seg_unit_range_index(seg, unit); 257de9aef5eSXiao Guangrong } 258de9aef5eSXiao Guangrong 259f7bfb57bSXiao Guangrong static int fixed_mtrr_addr_to_seg(u64 addr) 260f7bfb57bSXiao Guangrong { 261f7bfb57bSXiao Guangrong struct fixed_mtrr_segment *mtrr_seg; 262f7bfb57bSXiao Guangrong int seg, seg_num = ARRAY_SIZE(fixed_seg_table); 263f7bfb57bSXiao Guangrong 264f7bfb57bSXiao Guangrong for (seg = 0; seg < seg_num; seg++) { 265f7bfb57bSXiao Guangrong mtrr_seg = &fixed_seg_table[seg]; 266a7f2d786SAlexis Dambricourt if (mtrr_seg->start <= addr && addr < mtrr_seg->end) 267f7bfb57bSXiao Guangrong return seg; 268f7bfb57bSXiao Guangrong } 269f7bfb57bSXiao Guangrong 270f7bfb57bSXiao Guangrong return -1; 271f7bfb57bSXiao Guangrong } 272f7bfb57bSXiao Guangrong 273f7bfb57bSXiao Guangrong static int fixed_mtrr_addr_seg_to_range_index(u64 addr, int seg) 274f7bfb57bSXiao Guangrong { 275f7bfb57bSXiao Guangrong struct fixed_mtrr_segment *mtrr_seg; 276f7bfb57bSXiao Guangrong int index; 277f7bfb57bSXiao Guangrong 278f7bfb57bSXiao Guangrong mtrr_seg = &fixed_seg_table[seg]; 279f7bfb57bSXiao Guangrong index = mtrr_seg->range_start; 280f7bfb57bSXiao Guangrong index += (addr - mtrr_seg->start) >> mtrr_seg->range_shift; 281f7bfb57bSXiao Guangrong return index; 282f7bfb57bSXiao Guangrong } 283f7bfb57bSXiao Guangrong 284f571c097SXiao Guangrong static u64 fixed_mtrr_range_end_addr(int seg, int index) 285f571c097SXiao Guangrong { 286f571c097SXiao Guangrong struct fixed_mtrr_segment *mtrr_seg = &fixed_seg_table[seg]; 287f571c097SXiao Guangrong int pos = index - mtrr_seg->range_start; 288f571c097SXiao Guangrong 289f571c097SXiao Guangrong return mtrr_seg->start + ((pos + 1) << mtrr_seg->range_shift); 290f571c097SXiao Guangrong } 291f571c097SXiao Guangrong 292a13842dcSXiao Guangrong static void var_mtrr_range(struct kvm_mtrr_range *range, u64 *start, u64 *end) 293a13842dcSXiao Guangrong { 294a13842dcSXiao Guangrong u64 mask; 295a13842dcSXiao Guangrong 296a13842dcSXiao Guangrong *start = range->base & PAGE_MASK; 297a13842dcSXiao Guangrong 298a13842dcSXiao Guangrong mask = range->mask & PAGE_MASK; 299a13842dcSXiao Guangrong 300a13842dcSXiao Guangrong /* This cannot overflow because writing to the reserved bits of 301a13842dcSXiao Guangrong * variable MTRRs causes a #GP. 302a13842dcSXiao Guangrong */ 303a13842dcSXiao Guangrong *end = (*start | ~mask) + 1; 304a13842dcSXiao Guangrong } 305a13842dcSXiao Guangrong 306ff53604bSXiao Guangrong static void update_mtrr(struct kvm_vcpu *vcpu, u32 msr) 307ff53604bSXiao Guangrong { 30870109e7dSXiao Guangrong struct kvm_mtrr *mtrr_state = &vcpu->arch.mtrr_state; 309a13842dcSXiao Guangrong gfn_t start, end; 310ff53604bSXiao Guangrong int index; 311ff53604bSXiao Guangrong 312ff53604bSXiao Guangrong if (msr == MSR_IA32_CR_PAT || !tdp_enabled || 313ff53604bSXiao Guangrong !kvm_arch_has_noncoherent_dma(vcpu->kvm)) 314ff53604bSXiao Guangrong return; 315ff53604bSXiao Guangrong 31610fac2dcSXiao Guangrong if (!mtrr_is_enabled(mtrr_state) && msr != MSR_MTRRdefType) 317ff53604bSXiao Guangrong return; 318ff53604bSXiao Guangrong 319de9aef5eSXiao Guangrong /* fixed MTRRs. */ 320de9aef5eSXiao Guangrong if (fixed_msr_to_range(msr, &start, &end)) { 321de9aef5eSXiao Guangrong if (!fixed_mtrr_is_enabled(mtrr_state)) 322de9aef5eSXiao Guangrong return; 323de9aef5eSXiao Guangrong } else if (msr == MSR_MTRRdefType) { 324ff53604bSXiao Guangrong start = 0x0; 325ff53604bSXiao Guangrong end = ~0ULL; 326de9aef5eSXiao Guangrong } else { 327ff53604bSXiao Guangrong /* variable range MTRRs. */ 328ff53604bSXiao Guangrong index = (msr - 0x200) / 2; 329a13842dcSXiao Guangrong var_mtrr_range(&mtrr_state->var_ranges[index], &start, &end); 330ff53604bSXiao Guangrong } 331ff53604bSXiao Guangrong 332ff53604bSXiao Guangrong kvm_zap_gfn_range(vcpu->kvm, gpa_to_gfn(start), gpa_to_gfn(end)); 333ff53604bSXiao Guangrong } 334ff53604bSXiao Guangrong 33519efffa2SXiao Guangrong static bool var_mtrr_range_is_valid(struct kvm_mtrr_range *range) 33619efffa2SXiao Guangrong { 33719efffa2SXiao Guangrong return (range->mask & (1 << 11)) != 0; 33819efffa2SXiao Guangrong } 33919efffa2SXiao Guangrong 34019efffa2SXiao Guangrong static void set_var_mtrr_msr(struct kvm_vcpu *vcpu, u32 msr, u64 data) 34119efffa2SXiao Guangrong { 34219efffa2SXiao Guangrong struct kvm_mtrr *mtrr_state = &vcpu->arch.mtrr_state; 34319efffa2SXiao Guangrong struct kvm_mtrr_range *tmp, *cur; 34419efffa2SXiao Guangrong int index, is_mtrr_mask; 34519efffa2SXiao Guangrong 34619efffa2SXiao Guangrong index = (msr - 0x200) / 2; 34719efffa2SXiao Guangrong is_mtrr_mask = msr - 0x200 - 2 * index; 34819efffa2SXiao Guangrong cur = &mtrr_state->var_ranges[index]; 34919efffa2SXiao Guangrong 35019efffa2SXiao Guangrong /* remove the entry if it's in the list. */ 35119efffa2SXiao Guangrong if (var_mtrr_range_is_valid(cur)) 35219efffa2SXiao Guangrong list_del(&mtrr_state->var_ranges[index].node); 35319efffa2SXiao Guangrong 354fa7c4ebdSPaolo Bonzini /* Extend the mask with all 1 bits to the left, since those 355fa7c4ebdSPaolo Bonzini * bits must implicitly be 0. The bits are then cleared 356fa7c4ebdSPaolo Bonzini * when reading them. 357fa7c4ebdSPaolo Bonzini */ 35819efffa2SXiao Guangrong if (!is_mtrr_mask) 35919efffa2SXiao Guangrong cur->base = data; 36019efffa2SXiao Guangrong else 361fa7c4ebdSPaolo Bonzini cur->mask = data | (-1LL << cpuid_maxphyaddr(vcpu)); 36219efffa2SXiao Guangrong 36319efffa2SXiao Guangrong /* add it to the list if it's enabled. */ 36419efffa2SXiao Guangrong if (var_mtrr_range_is_valid(cur)) { 36519efffa2SXiao Guangrong list_for_each_entry(tmp, &mtrr_state->head, node) 36619efffa2SXiao Guangrong if (cur->base >= tmp->base) 36719efffa2SXiao Guangrong break; 36819efffa2SXiao Guangrong list_add_tail(&cur->node, &tmp->node); 36919efffa2SXiao Guangrong } 37019efffa2SXiao Guangrong } 37119efffa2SXiao Guangrong 372ff53604bSXiao Guangrong int kvm_mtrr_set_msr(struct kvm_vcpu *vcpu, u32 msr, u64 data) 373ff53604bSXiao Guangrong { 374de9aef5eSXiao Guangrong int index; 375ff53604bSXiao Guangrong 376ff53604bSXiao Guangrong if (!kvm_mtrr_valid(vcpu, msr, data)) 377ff53604bSXiao Guangrong return 1; 378ff53604bSXiao Guangrong 379de9aef5eSXiao Guangrong index = fixed_msr_to_range_index(msr); 380de9aef5eSXiao Guangrong if (index >= 0) 381de9aef5eSXiao Guangrong *(u64 *)&vcpu->arch.mtrr_state.fixed_ranges[index] = data; 382de9aef5eSXiao Guangrong else if (msr == MSR_MTRRdefType) 38310fac2dcSXiao Guangrong vcpu->arch.mtrr_state.deftype = data; 384ff53604bSXiao Guangrong else if (msr == MSR_IA32_CR_PAT) 385ff53604bSXiao Guangrong vcpu->arch.pat = data; 386ff53604bSXiao Guangrong else 38719efffa2SXiao Guangrong set_var_mtrr_msr(vcpu, msr, data); 388ff53604bSXiao Guangrong 389ff53604bSXiao Guangrong update_mtrr(vcpu, msr); 390ff53604bSXiao Guangrong return 0; 391ff53604bSXiao Guangrong } 392ff53604bSXiao Guangrong 393ff53604bSXiao Guangrong int kvm_mtrr_get_msr(struct kvm_vcpu *vcpu, u32 msr, u64 *pdata) 394ff53604bSXiao Guangrong { 395de9aef5eSXiao Guangrong int index; 396ff53604bSXiao Guangrong 397eb839917SXiao Guangrong /* MSR_MTRRcap is a readonly MSR. */ 398eb839917SXiao Guangrong if (msr == MSR_MTRRcap) { 399eb839917SXiao Guangrong /* 400eb839917SXiao Guangrong * SMRR = 0 401eb839917SXiao Guangrong * WC = 1 402eb839917SXiao Guangrong * FIX = 1 403eb839917SXiao Guangrong * VCNT = KVM_NR_VAR_MTRR 404eb839917SXiao Guangrong */ 405eb839917SXiao Guangrong *pdata = 0x500 | KVM_NR_VAR_MTRR; 406eb839917SXiao Guangrong return 0; 407eb839917SXiao Guangrong } 408eb839917SXiao Guangrong 409ff53604bSXiao Guangrong if (!msr_mtrr_valid(msr)) 410ff53604bSXiao Guangrong return 1; 411ff53604bSXiao Guangrong 412de9aef5eSXiao Guangrong index = fixed_msr_to_range_index(msr); 413de9aef5eSXiao Guangrong if (index >= 0) 414de9aef5eSXiao Guangrong *pdata = *(u64 *)&vcpu->arch.mtrr_state.fixed_ranges[index]; 415de9aef5eSXiao Guangrong else if (msr == MSR_MTRRdefType) 41610fac2dcSXiao Guangrong *pdata = vcpu->arch.mtrr_state.deftype; 417ff53604bSXiao Guangrong else if (msr == MSR_IA32_CR_PAT) 418ff53604bSXiao Guangrong *pdata = vcpu->arch.pat; 419ff53604bSXiao Guangrong else { /* Variable MTRRs */ 420de9aef5eSXiao Guangrong int is_mtrr_mask; 421ff53604bSXiao Guangrong 422de9aef5eSXiao Guangrong index = (msr - 0x200) / 2; 423de9aef5eSXiao Guangrong is_mtrr_mask = msr - 0x200 - 2 * index; 424ff53604bSXiao Guangrong if (!is_mtrr_mask) 425de9aef5eSXiao Guangrong *pdata = vcpu->arch.mtrr_state.var_ranges[index].base; 426ff53604bSXiao Guangrong else 427de9aef5eSXiao Guangrong *pdata = vcpu->arch.mtrr_state.var_ranges[index].mask; 428fa7c4ebdSPaolo Bonzini 429fa7c4ebdSPaolo Bonzini *pdata &= (1ULL << cpuid_maxphyaddr(vcpu)) - 1; 430ff53604bSXiao Guangrong } 431ff53604bSXiao Guangrong 432ff53604bSXiao Guangrong return 0; 433ff53604bSXiao Guangrong } 434ff53604bSXiao Guangrong 43519efffa2SXiao Guangrong void kvm_vcpu_mtrr_init(struct kvm_vcpu *vcpu) 43619efffa2SXiao Guangrong { 43719efffa2SXiao Guangrong INIT_LIST_HEAD(&vcpu->arch.mtrr_state.head); 43819efffa2SXiao Guangrong } 43919efffa2SXiao Guangrong 440f571c097SXiao Guangrong struct mtrr_iter { 441f571c097SXiao Guangrong /* input fields. */ 442f571c097SXiao Guangrong struct kvm_mtrr *mtrr_state; 443f571c097SXiao Guangrong u64 start; 444f571c097SXiao Guangrong u64 end; 445f571c097SXiao Guangrong 446f571c097SXiao Guangrong /* output fields. */ 447f571c097SXiao Guangrong int mem_type; 44810dc331fSXiao Guangrong /* mtrr is completely disabled? */ 44910dc331fSXiao Guangrong bool mtrr_disabled; 450f571c097SXiao Guangrong /* [start, end) is not fully covered in MTRRs? */ 451f571c097SXiao Guangrong bool partial_map; 452f571c097SXiao Guangrong 453f571c097SXiao Guangrong /* private fields. */ 454f571c097SXiao Guangrong union { 455f571c097SXiao Guangrong /* used for fixed MTRRs. */ 456f571c097SXiao Guangrong struct { 457f571c097SXiao Guangrong int index; 458f571c097SXiao Guangrong int seg; 459f571c097SXiao Guangrong }; 460f571c097SXiao Guangrong 461f571c097SXiao Guangrong /* used for var MTRRs. */ 462f571c097SXiao Guangrong struct { 463f571c097SXiao Guangrong struct kvm_mtrr_range *range; 464f571c097SXiao Guangrong /* max address has been covered in var MTRRs. */ 465f571c097SXiao Guangrong u64 start_max; 466f571c097SXiao Guangrong }; 467f571c097SXiao Guangrong }; 468f571c097SXiao Guangrong 469f571c097SXiao Guangrong bool fixed; 470f571c097SXiao Guangrong }; 471f571c097SXiao Guangrong 472f571c097SXiao Guangrong static bool mtrr_lookup_fixed_start(struct mtrr_iter *iter) 473f571c097SXiao Guangrong { 474f571c097SXiao Guangrong int seg, index; 475f571c097SXiao Guangrong 476f571c097SXiao Guangrong if (!fixed_mtrr_is_enabled(iter->mtrr_state)) 477f571c097SXiao Guangrong return false; 478f571c097SXiao Guangrong 479f571c097SXiao Guangrong seg = fixed_mtrr_addr_to_seg(iter->start); 480f571c097SXiao Guangrong if (seg < 0) 481f571c097SXiao Guangrong return false; 482f571c097SXiao Guangrong 483f571c097SXiao Guangrong iter->fixed = true; 484f571c097SXiao Guangrong index = fixed_mtrr_addr_seg_to_range_index(iter->start, seg); 485f571c097SXiao Guangrong iter->index = index; 486f571c097SXiao Guangrong iter->seg = seg; 487f571c097SXiao Guangrong return true; 488f571c097SXiao Guangrong } 489f571c097SXiao Guangrong 490f571c097SXiao Guangrong static bool match_var_range(struct mtrr_iter *iter, 491f571c097SXiao Guangrong struct kvm_mtrr_range *range) 492f571c097SXiao Guangrong { 493f571c097SXiao Guangrong u64 start, end; 494f571c097SXiao Guangrong 495f571c097SXiao Guangrong var_mtrr_range(range, &start, &end); 496f571c097SXiao Guangrong if (!(start >= iter->end || end <= iter->start)) { 497f571c097SXiao Guangrong iter->range = range; 498f571c097SXiao Guangrong 499f571c097SXiao Guangrong /* 500f571c097SXiao Guangrong * the function is called when we do kvm_mtrr.head walking. 501f571c097SXiao Guangrong * Range has the minimum base address which interleaves 502f571c097SXiao Guangrong * [looker->start_max, looker->end). 503f571c097SXiao Guangrong */ 504f571c097SXiao Guangrong iter->partial_map |= iter->start_max < start; 505f571c097SXiao Guangrong 506f571c097SXiao Guangrong /* update the max address has been covered. */ 507f571c097SXiao Guangrong iter->start_max = max(iter->start_max, end); 508f571c097SXiao Guangrong return true; 509f571c097SXiao Guangrong } 510f571c097SXiao Guangrong 511f571c097SXiao Guangrong return false; 512f571c097SXiao Guangrong } 513f571c097SXiao Guangrong 514f571c097SXiao Guangrong static void __mtrr_lookup_var_next(struct mtrr_iter *iter) 515f571c097SXiao Guangrong { 516f571c097SXiao Guangrong struct kvm_mtrr *mtrr_state = iter->mtrr_state; 517f571c097SXiao Guangrong 518f571c097SXiao Guangrong list_for_each_entry_continue(iter->range, &mtrr_state->head, node) 519f571c097SXiao Guangrong if (match_var_range(iter, iter->range)) 520f571c097SXiao Guangrong return; 521f571c097SXiao Guangrong 522f571c097SXiao Guangrong iter->range = NULL; 523f571c097SXiao Guangrong iter->partial_map |= iter->start_max < iter->end; 524f571c097SXiao Guangrong } 525f571c097SXiao Guangrong 526f571c097SXiao Guangrong static void mtrr_lookup_var_start(struct mtrr_iter *iter) 527f571c097SXiao Guangrong { 528f571c097SXiao Guangrong struct kvm_mtrr *mtrr_state = iter->mtrr_state; 529f571c097SXiao Guangrong 530f571c097SXiao Guangrong iter->fixed = false; 531f571c097SXiao Guangrong iter->start_max = iter->start; 53230b072ceSAlexis Dambricourt iter->range = NULL; 533f571c097SXiao Guangrong iter->range = list_prepare_entry(iter->range, &mtrr_state->head, node); 534f571c097SXiao Guangrong 535f571c097SXiao Guangrong __mtrr_lookup_var_next(iter); 536f571c097SXiao Guangrong } 537f571c097SXiao Guangrong 538f571c097SXiao Guangrong static void mtrr_lookup_fixed_next(struct mtrr_iter *iter) 539f571c097SXiao Guangrong { 540f571c097SXiao Guangrong /* terminate the lookup. */ 541f571c097SXiao Guangrong if (fixed_mtrr_range_end_addr(iter->seg, iter->index) >= iter->end) { 542f571c097SXiao Guangrong iter->fixed = false; 543f571c097SXiao Guangrong iter->range = NULL; 544f571c097SXiao Guangrong return; 545f571c097SXiao Guangrong } 546f571c097SXiao Guangrong 547f571c097SXiao Guangrong iter->index++; 548f571c097SXiao Guangrong 549f571c097SXiao Guangrong /* have looked up for all fixed MTRRs. */ 550f571c097SXiao Guangrong if (iter->index >= ARRAY_SIZE(iter->mtrr_state->fixed_ranges)) 551f571c097SXiao Guangrong return mtrr_lookup_var_start(iter); 552f571c097SXiao Guangrong 553f571c097SXiao Guangrong /* switch to next segment. */ 554f571c097SXiao Guangrong if (iter->index > fixed_mtrr_seg_end_range_index(iter->seg)) 555f571c097SXiao Guangrong iter->seg++; 556f571c097SXiao Guangrong } 557f571c097SXiao Guangrong 558f571c097SXiao Guangrong static void mtrr_lookup_var_next(struct mtrr_iter *iter) 559f571c097SXiao Guangrong { 560f571c097SXiao Guangrong __mtrr_lookup_var_next(iter); 561f571c097SXiao Guangrong } 562f571c097SXiao Guangrong 563f571c097SXiao Guangrong static void mtrr_lookup_start(struct mtrr_iter *iter) 564f571c097SXiao Guangrong { 565f571c097SXiao Guangrong if (!mtrr_is_enabled(iter->mtrr_state)) { 56610dc331fSXiao Guangrong iter->mtrr_disabled = true; 567f571c097SXiao Guangrong return; 568f571c097SXiao Guangrong } 569f571c097SXiao Guangrong 570f571c097SXiao Guangrong if (!mtrr_lookup_fixed_start(iter)) 571f571c097SXiao Guangrong mtrr_lookup_var_start(iter); 572f571c097SXiao Guangrong } 573f571c097SXiao Guangrong 574f571c097SXiao Guangrong static void mtrr_lookup_init(struct mtrr_iter *iter, 575f571c097SXiao Guangrong struct kvm_mtrr *mtrr_state, u64 start, u64 end) 576f571c097SXiao Guangrong { 577f571c097SXiao Guangrong iter->mtrr_state = mtrr_state; 578f571c097SXiao Guangrong iter->start = start; 579f571c097SXiao Guangrong iter->end = end; 58010dc331fSXiao Guangrong iter->mtrr_disabled = false; 581f571c097SXiao Guangrong iter->partial_map = false; 582f571c097SXiao Guangrong iter->fixed = false; 583f571c097SXiao Guangrong iter->range = NULL; 584f571c097SXiao Guangrong 585f571c097SXiao Guangrong mtrr_lookup_start(iter); 586f571c097SXiao Guangrong } 587f571c097SXiao Guangrong 588f571c097SXiao Guangrong static bool mtrr_lookup_okay(struct mtrr_iter *iter) 589f571c097SXiao Guangrong { 590f571c097SXiao Guangrong if (iter->fixed) { 591f571c097SXiao Guangrong iter->mem_type = iter->mtrr_state->fixed_ranges[iter->index]; 592f571c097SXiao Guangrong return true; 593f571c097SXiao Guangrong } 594f571c097SXiao Guangrong 595f571c097SXiao Guangrong if (iter->range) { 596f571c097SXiao Guangrong iter->mem_type = iter->range->base & 0xff; 597f571c097SXiao Guangrong return true; 598f571c097SXiao Guangrong } 599f571c097SXiao Guangrong 600f571c097SXiao Guangrong return false; 601f571c097SXiao Guangrong } 602f571c097SXiao Guangrong 603f571c097SXiao Guangrong static void mtrr_lookup_next(struct mtrr_iter *iter) 604f571c097SXiao Guangrong { 605f571c097SXiao Guangrong if (iter->fixed) 606f571c097SXiao Guangrong mtrr_lookup_fixed_next(iter); 607f571c097SXiao Guangrong else 608f571c097SXiao Guangrong mtrr_lookup_var_next(iter); 609f571c097SXiao Guangrong } 610f571c097SXiao Guangrong 611f571c097SXiao Guangrong #define mtrr_for_each_mem_type(_iter_, _mtrr_, _gpa_start_, _gpa_end_) \ 612f571c097SXiao Guangrong for (mtrr_lookup_init(_iter_, _mtrr_, _gpa_start_, _gpa_end_); \ 613f571c097SXiao Guangrong mtrr_lookup_okay(_iter_); mtrr_lookup_next(_iter_)) 614f571c097SXiao Guangrong 6153f3f78b6SXiao Guangrong u8 kvm_mtrr_get_guest_memory_type(struct kvm_vcpu *vcpu, gfn_t gfn) 616ff53604bSXiao Guangrong { 6173f3f78b6SXiao Guangrong struct kvm_mtrr *mtrr_state = &vcpu->arch.mtrr_state; 618fa612137SXiao Guangrong struct mtrr_iter iter; 619fa612137SXiao Guangrong u64 start, end; 620fa612137SXiao Guangrong int type = -1; 6213f3f78b6SXiao Guangrong const int wt_wb_mask = (1 << MTRR_TYPE_WRBACK) 6223f3f78b6SXiao Guangrong | (1 << MTRR_TYPE_WRTHROUGH); 6233f3f78b6SXiao Guangrong 6243f3f78b6SXiao Guangrong start = gfn_to_gpa(gfn); 625fa612137SXiao Guangrong end = start + PAGE_SIZE; 626ff53604bSXiao Guangrong 627fa612137SXiao Guangrong mtrr_for_each_mem_type(&iter, mtrr_state, start, end) { 628fa612137SXiao Guangrong int curr_type = iter.mem_type; 629ff53604bSXiao Guangrong 6303f3f78b6SXiao Guangrong /* 6313f3f78b6SXiao Guangrong * Please refer to Intel SDM Volume 3: 11.11.4.1 MTRR 6323f3f78b6SXiao Guangrong * Precedences. 6333f3f78b6SXiao Guangrong */ 6343f3f78b6SXiao Guangrong 6353f3f78b6SXiao Guangrong if (type == -1) { 6363f3f78b6SXiao Guangrong type = curr_type; 637ff53604bSXiao Guangrong continue; 638ff53604bSXiao Guangrong } 639ff53604bSXiao Guangrong 6403f3f78b6SXiao Guangrong /* 6413f3f78b6SXiao Guangrong * If two or more variable memory ranges match and the 6423f3f78b6SXiao Guangrong * memory types are identical, then that memory type is 6433f3f78b6SXiao Guangrong * used. 6443f3f78b6SXiao Guangrong */ 6453f3f78b6SXiao Guangrong if (type == curr_type) 6463f3f78b6SXiao Guangrong continue; 6473f3f78b6SXiao Guangrong 6483f3f78b6SXiao Guangrong /* 6493f3f78b6SXiao Guangrong * If two or more variable memory ranges match and one of 6503f3f78b6SXiao Guangrong * the memory types is UC, the UC memory type used. 6513f3f78b6SXiao Guangrong */ 6523f3f78b6SXiao Guangrong if (curr_type == MTRR_TYPE_UNCACHABLE) 653ff53604bSXiao Guangrong return MTRR_TYPE_UNCACHABLE; 654ff53604bSXiao Guangrong 6553f3f78b6SXiao Guangrong /* 6563f3f78b6SXiao Guangrong * If two or more variable memory ranges match and the 6573f3f78b6SXiao Guangrong * memory types are WT and WB, the WT memory type is used. 6583f3f78b6SXiao Guangrong */ 6593f3f78b6SXiao Guangrong if (((1 << type) & wt_wb_mask) && 6603f3f78b6SXiao Guangrong ((1 << curr_type) & wt_wb_mask)) { 6613f3f78b6SXiao Guangrong type = MTRR_TYPE_WRTHROUGH; 6623f3f78b6SXiao Guangrong continue; 663ff53604bSXiao Guangrong } 664ff53604bSXiao Guangrong 6653f3f78b6SXiao Guangrong /* 6663f3f78b6SXiao Guangrong * For overlaps not defined by the above rules, processor 6673f3f78b6SXiao Guangrong * behavior is undefined. 6683f3f78b6SXiao Guangrong */ 6693f3f78b6SXiao Guangrong 6703f3f78b6SXiao Guangrong /* We use WB for this undefined behavior. :( */ 6713f3f78b6SXiao Guangrong return MTRR_TYPE_WRBACK; 672ff53604bSXiao Guangrong } 673ff53604bSXiao Guangrong 67410dc331fSXiao Guangrong if (iter.mtrr_disabled) 675e24dea2aSPaolo Bonzini return mtrr_disabled_type(vcpu); 67610dc331fSXiao Guangrong 677fc1a8126SAlex Williamson /* not contained in any MTRRs. */ 678fc1a8126SAlex Williamson if (type == -1) 679fc1a8126SAlex Williamson return mtrr_default_type(mtrr_state); 680fc1a8126SAlex Williamson 681fa612137SXiao Guangrong /* 682fa612137SXiao Guangrong * We just check one page, partially covered by MTRRs is 683fa612137SXiao Guangrong * impossible. 684fa612137SXiao Guangrong */ 6853e5d2fdcSXiao Guangrong WARN_ON(iter.partial_map); 6863e5d2fdcSXiao Guangrong 6873f3f78b6SXiao Guangrong return type; 688ff53604bSXiao Guangrong } 689ff53604bSXiao Guangrong EXPORT_SYMBOL_GPL(kvm_mtrr_get_guest_memory_type); 6906a39bbc5SXiao Guangrong 6916a39bbc5SXiao Guangrong bool kvm_mtrr_check_gfn_range_consistency(struct kvm_vcpu *vcpu, gfn_t gfn, 6926a39bbc5SXiao Guangrong int page_num) 6936a39bbc5SXiao Guangrong { 6946a39bbc5SXiao Guangrong struct kvm_mtrr *mtrr_state = &vcpu->arch.mtrr_state; 6956a39bbc5SXiao Guangrong struct mtrr_iter iter; 6966a39bbc5SXiao Guangrong u64 start, end; 6976a39bbc5SXiao Guangrong int type = -1; 6986a39bbc5SXiao Guangrong 6996a39bbc5SXiao Guangrong start = gfn_to_gpa(gfn); 7006a39bbc5SXiao Guangrong end = gfn_to_gpa(gfn + page_num); 7016a39bbc5SXiao Guangrong mtrr_for_each_mem_type(&iter, mtrr_state, start, end) { 7026a39bbc5SXiao Guangrong if (type == -1) { 7036a39bbc5SXiao Guangrong type = iter.mem_type; 7046a39bbc5SXiao Guangrong continue; 7056a39bbc5SXiao Guangrong } 7066a39bbc5SXiao Guangrong 7076a39bbc5SXiao Guangrong if (type != iter.mem_type) 7086a39bbc5SXiao Guangrong return false; 7096a39bbc5SXiao Guangrong } 7106a39bbc5SXiao Guangrong 71110dc331fSXiao Guangrong if (iter.mtrr_disabled) 71210dc331fSXiao Guangrong return true; 71310dc331fSXiao Guangrong 7146a39bbc5SXiao Guangrong if (!iter.partial_map) 7156a39bbc5SXiao Guangrong return true; 7166a39bbc5SXiao Guangrong 7176a39bbc5SXiao Guangrong if (type == -1) 7186a39bbc5SXiao Guangrong return true; 7196a39bbc5SXiao Guangrong 7206a39bbc5SXiao Guangrong return type == mtrr_default_type(mtrr_state); 7216a39bbc5SXiao Guangrong } 722