Loading...
1// SPDX-License-Identifier: GPL-2.0-only
2/*
3 * This only handles 32bit MTRR on 32bit hosts. This is strictly wrong
4 * because MTRRs can span up to 40 bits (36bits on most modern x86)
5 */
6#define DEBUG
7
8#include <linux/export.h>
9#include <linux/init.h>
10#include <linux/io.h>
11#include <linux/mm.h>
12
13#include <asm/processor-flags.h>
14#include <asm/cpufeature.h>
15#include <asm/tlbflush.h>
16#include <asm/mtrr.h>
17#include <asm/msr.h>
18#include <asm/pat.h>
19
20#include "mtrr.h"
21
/* Describes one run of consecutive fixed-range MTRR MSRs. */
struct fixed_range_block {
	int base_msr;	/* MSR address of the first MTRR in the block */
	int ranges;	/* how many consecutive MTRR MSRs the block holds */
};
26
27static struct fixed_range_block fixed_range_blocks[] = {
28 { MSR_MTRRfix64K_00000, 1 }, /* one 64k MTRR */
29 { MSR_MTRRfix16K_80000, 2 }, /* two 16k MTRRs */
30 { MSR_MTRRfix4K_C0000, 8 }, /* eight 4k MTRRs */
31 {}
32};
33
/*
 * Accumulated MTRR_CHANGE_MASK_* bits: generic_set_all() sets the bits
 * returned by set_mtrr_state(), mtrr_state_warn() reports them.
 */
34static unsigned long smp_changes_mask;
/* Set to 1 at the end of get_mtrr_state(); mtrr_type_lookup() bails out while it is 0. */
35static int mtrr_state_set;
/* Value of MSR_K8_TOP_MEM2 as read by get_mtrr_state(); stays 0 if that read is skipped. */
36u64 mtrr_tom2;
37
/* Saved MTRR state: variable ranges, fixed ranges, default type and enable bits. */
38struct mtrr_state_type mtrr_state;
39EXPORT_SYMBOL_GPL(mtrr_state);
40
41/*
42 * BIOS is expected to clear MtrrFixDramModEn bit, see for example
43 * "BIOS and Kernel Developer's Guide for the AMD Athlon 64 and AMD
44 * Opteron Processors" (26094 Rev. 3.30 February 2006), section
45 * "13.2.1.2 SYSCFG Register": "The MtrrFixDramModEn bit should be set
46 * to 1 during BIOS initialization of the fixed MTRRs, then cleared to
47 * 0 for operation."
48 */
49static inline void k8_check_syscfg_dram_mod_en(void)
50{
51 u32 lo, hi;
52
53 if (!((boot_cpu_data.x86_vendor == X86_VENDOR_AMD) &&
54 (boot_cpu_data.x86 >= 0x0f)))
55 return;
56
57 rdmsr(MSR_K8_SYSCFG, lo, hi);
58 if (lo & K8_MTRRFIXRANGE_DRAM_MODIFY) {
59 pr_err(FW_WARN "MTRR: CPU %u: SYSCFG[MtrrFixDramModEn]"
60 " not cleared by BIOS, clearing this bit\n",
61 smp_processor_id());
62 lo &= ~K8_MTRRFIXRANGE_DRAM_MODIFY;
63 mtrr_wrmsr(MSR_K8_SYSCFG, lo, hi);
64 }
65}
66
67/* Get the size of contiguous MTRR range */
68static u64 get_mtrr_size(u64 mask)
69{
70 u64 size;
71
72 mask >>= PAGE_SHIFT;
73 mask |= size_or_mask;
74 size = -mask;
75 size <<= PAGE_SHIFT;
76 return size;
77}
78
79/*
80 * Check and return the effective type for MTRR-MTRR type overlap.
81 * Returns 1 if the effective type is UNCACHEABLE, else returns 0
82 */
83static int check_type_overlap(u8 *prev, u8 *curr)
84{
85 if (*prev == MTRR_TYPE_UNCACHABLE || *curr == MTRR_TYPE_UNCACHABLE) {
86 *prev = MTRR_TYPE_UNCACHABLE;
87 *curr = MTRR_TYPE_UNCACHABLE;
88 return 1;
89 }
90
91 if ((*prev == MTRR_TYPE_WRBACK && *curr == MTRR_TYPE_WRTHROUGH) ||
92 (*prev == MTRR_TYPE_WRTHROUGH && *curr == MTRR_TYPE_WRBACK)) {
93 *prev = MTRR_TYPE_WRTHROUGH;
94 *curr = MTRR_TYPE_WRTHROUGH;
95 }
96
97 if (*prev != *curr) {
98 *prev = MTRR_TYPE_UNCACHABLE;
99 *curr = MTRR_TYPE_UNCACHABLE;
100 return 1;
101 }
102
103 return 0;
104}
105
106/**
107 * mtrr_type_lookup_fixed - look up memory type in MTRR fixed entries
108 *
109 * Return the MTRR fixed memory type of 'start'.
110 *
111 * MTRR fixed entries are divided into the following ways:
112 * 0x00000 - 0x7FFFF : This range is divided into eight 64KB sub-ranges
113 * 0x80000 - 0xBFFFF : This range is divided into sixteen 16KB sub-ranges
114 * 0xC0000 - 0xFFFFF : This range is divided into sixty-four 4KB sub-ranges
115 *
116 * Return Values:
117 * MTRR_TYPE_(type) - Matched memory type
118 * MTRR_TYPE_INVALID - Unmatched
119 */
120static u8 mtrr_type_lookup_fixed(u64 start, u64 end)
121{
122 int idx;
123
124 if (start >= 0x100000)
125 return MTRR_TYPE_INVALID;
126
127 /* 0x0 - 0x7FFFF */
128 if (start < 0x80000) {
129 idx = 0;
130 idx += (start >> 16);
131 return mtrr_state.fixed_ranges[idx];
132 /* 0x80000 - 0xBFFFF */
133 } else if (start < 0xC0000) {
134 idx = 1 * 8;
135 idx += ((start - 0x80000) >> 14);
136 return mtrr_state.fixed_ranges[idx];
137 }
138
139 /* 0xC0000 - 0xFFFFF */
140 idx = 3 * 8;
141 idx += ((start - 0xC0000) >> 12);
142 return mtrr_state.fixed_ranges[idx];
143}
144
145/**
146 * mtrr_type_lookup_variable - look up memory type in MTRR variable entries
147 *
148 * Return Value:
149 * MTRR_TYPE_(type) - Matched memory type or default memory type (unmatched)
150 *
151 * Output Arguments:
152 * repeat - Set to 1 when [start:end] spanned across MTRR range and type
153 * returned corresponds only to [start:*partial_end]. Caller has
154 * to lookup again for [*partial_end:end].
155 *
156 * uniform - Set to 1 when an MTRR covers the region uniformly, i.e. the
157 * region is fully covered by a single MTRR entry or the default
158 * type.
159 */
160static u8 mtrr_type_lookup_variable(u64 start, u64 end, u64 *partial_end,
161 int *repeat, u8 *uniform)
162{
163 int i;
164 u64 base, mask;
165 u8 prev_match, curr_match;
166
167 *repeat = 0;
168 *uniform = 1;
169
170 /* Make end inclusive instead of exclusive */
171 end--;
172
173 prev_match = MTRR_TYPE_INVALID;
174 for (i = 0; i < num_var_ranges; ++i) {
175 unsigned short start_state, end_state, inclusive;
176
177 if (!(mtrr_state.var_ranges[i].mask_lo & (1 << 11)))
178 continue;
179
180 base = (((u64)mtrr_state.var_ranges[i].base_hi) << 32) +
181 (mtrr_state.var_ranges[i].base_lo & PAGE_MASK);
182 mask = (((u64)mtrr_state.var_ranges[i].mask_hi) << 32) +
183 (mtrr_state.var_ranges[i].mask_lo & PAGE_MASK);
184
185 start_state = ((start & mask) == (base & mask));
186 end_state = ((end & mask) == (base & mask));
187 inclusive = ((start < base) && (end > base));
188
189 if ((start_state != end_state) || inclusive) {
190 /*
191 * We have start:end spanning across an MTRR.
192 * We split the region into either
193 *
194 * - start_state:1
195 * (start:mtrr_end)(mtrr_end:end)
196 * - end_state:1
197 * (start:mtrr_start)(mtrr_start:end)
198 * - inclusive:1
199 * (start:mtrr_start)(mtrr_start:mtrr_end)(mtrr_end:end)
200 *
201 * depending on kind of overlap.
202 *
203 * Return the type of the first region and a pointer
204 * to the start of next region so that caller will be
205 * advised to lookup again after having adjusted start
206 * and end.
207 *
208 * Note: This way we handle overlaps with multiple
209 * entries and the default type properly.
210 */
211 if (start_state)
212 *partial_end = base + get_mtrr_size(mask);
213 else
214 *partial_end = base;
215
216 if (unlikely(*partial_end <= start)) {
217 WARN_ON(1);
218 *partial_end = start + PAGE_SIZE;
219 }
220
221 end = *partial_end - 1; /* end is inclusive */
222 *repeat = 1;
223 *uniform = 0;
224 }
225
226 if ((start & mask) != (base & mask))
227 continue;
228
229 curr_match = mtrr_state.var_ranges[i].base_lo & 0xff;
230 if (prev_match == MTRR_TYPE_INVALID) {
231 prev_match = curr_match;
232 continue;
233 }
234
235 *uniform = 0;
236 if (check_type_overlap(&prev_match, &curr_match))
237 return curr_match;
238 }
239
240 if (prev_match != MTRR_TYPE_INVALID)
241 return prev_match;
242
243 return mtrr_state.def_type;
244}
245
246/**
247 * mtrr_type_lookup - look up memory type in MTRR
248 *
249 * Return Values:
250 * MTRR_TYPE_(type) - The effective MTRR type for the region
251 * MTRR_TYPE_INVALID - MTRR is disabled
252 *
253 * Output Argument:
254 * uniform - Set to 1 when an MTRR covers the region uniformly, i.e. the
255 * region is fully covered by a single MTRR entry or the default
256 * type.
257 */
258u8 mtrr_type_lookup(u64 start, u64 end, u8 *uniform)
259{
260 u8 type, prev_type, is_uniform = 1, dummy;
261 int repeat;
262 u64 partial_end;
263
264 if (!mtrr_state_set)
265 return MTRR_TYPE_INVALID;
266
267 if (!(mtrr_state.enabled & MTRR_STATE_MTRR_ENABLED))
268 return MTRR_TYPE_INVALID;
269
270 /*
271 * Look up the fixed ranges first, which take priority over
272 * the variable ranges.
273 */
274 if ((start < 0x100000) &&
275 (mtrr_state.have_fixed) &&
276 (mtrr_state.enabled & MTRR_STATE_MTRR_FIXED_ENABLED)) {
277 is_uniform = 0;
278 type = mtrr_type_lookup_fixed(start, end);
279 goto out;
280 }
281
282 /*
283 * Look up the variable ranges. Look of multiple ranges matching
284 * this address and pick type as per MTRR precedence.
285 */
286 type = mtrr_type_lookup_variable(start, end, &partial_end,
287 &repeat, &is_uniform);
288
289 /*
290 * Common path is with repeat = 0.
291 * However, we can have cases where [start:end] spans across some
292 * MTRR ranges and/or the default type. Do repeated lookups for
293 * that case here.
294 */
295 while (repeat) {
296 prev_type = type;
297 start = partial_end;
298 is_uniform = 0;
299 type = mtrr_type_lookup_variable(start, end, &partial_end,
300 &repeat, &dummy);
301
302 if (check_type_overlap(&prev_type, &type))
303 goto out;
304 }
305
306 if (mtrr_tom2 && (start >= (1ULL<<32)) && (end < mtrr_tom2))
307 type = MTRR_TYPE_WRBACK;
308
309out:
310 *uniform = is_uniform;
311 return type;
312}
313
314/* Get the MSR pair relating to a var range */
315static void
316get_mtrr_var_range(unsigned int index, struct mtrr_var_range *vr)
317{
318 rdmsr(MTRRphysBase_MSR(index), vr->base_lo, vr->base_hi);
319 rdmsr(MTRRphysMask_MSR(index), vr->mask_lo, vr->mask_hi);
320}
321
322/* Fill the MSR pair relating to a var range */
323void fill_mtrr_var_range(unsigned int index,
324 u32 base_lo, u32 base_hi, u32 mask_lo, u32 mask_hi)
325{
326 struct mtrr_var_range *vr;
327
328 vr = mtrr_state.var_ranges;
329
330 vr[index].base_lo = base_lo;
331 vr[index].base_hi = base_hi;
332 vr[index].mask_lo = mask_lo;
333 vr[index].mask_hi = mask_hi;
334}
335
336static void get_fixed_ranges(mtrr_type *frs)
337{
338 unsigned int *p = (unsigned int *)frs;
339 int i;
340
341 k8_check_syscfg_dram_mod_en();
342
343 rdmsr(MSR_MTRRfix64K_00000, p[0], p[1]);
344
345 for (i = 0; i < 2; i++)
346 rdmsr(MSR_MTRRfix16K_80000 + i, p[2 + i * 2], p[3 + i * 2]);
347 for (i = 0; i < 8; i++)
348 rdmsr(MSR_MTRRfix4K_C0000 + i, p[6 + i * 2], p[7 + i * 2]);
349}
350
351void mtrr_save_fixed_ranges(void *info)
352{
353 if (boot_cpu_has(X86_FEATURE_MTRR))
354 get_fixed_ranges(mtrr_state.fixed_ranges);
355}
356
/*
 * Pending fixed-range segment collected by print_fixed() and not yet
 * printed: [last_fixed_start, last_fixed_end) with type last_fixed_type.
 * last_fixed_end == 0 means no segment is pending.
 */
357static unsigned __initdata last_fixed_start;
358static unsigned __initdata last_fixed_end;
359static mtrr_type __initdata last_fixed_type;
360
361static void __init print_fixed_last(void)
362{
363 if (!last_fixed_end)
364 return;
365
366 pr_debug(" %05X-%05X %s\n", last_fixed_start,
367 last_fixed_end - 1, mtrr_attrib_to_str(last_fixed_type));
368
369 last_fixed_end = 0;
370}
371
372static void __init update_fixed_last(unsigned base, unsigned end,
373 mtrr_type type)
374{
375 last_fixed_start = base;
376 last_fixed_end = end;
377 last_fixed_type = type;
378}
379
380static void __init
381print_fixed(unsigned base, unsigned step, const mtrr_type *types)
382{
383 unsigned i;
384
385 for (i = 0; i < 8; ++i, ++types, base += step) {
386 if (last_fixed_end == 0) {
387 update_fixed_last(base, base + step, *types);
388 continue;
389 }
390 if (last_fixed_end == base && last_fixed_type == *types) {
391 last_fixed_end = base + step;
392 continue;
393 }
394 /* new segments: gap or different type */
395 print_fixed_last();
396 update_fixed_last(base, base + step, *types);
397 }
398}
399
/* Forward declarations: both are defined further down but used by mtrr_bp_pat_init() */
400static void prepare_set(void);
401static void post_set(void);
402
403static void __init print_mtrr_state(void)
404{
405 unsigned int i;
406 int high_width;
407
408 pr_debug("MTRR default type: %s\n",
409 mtrr_attrib_to_str(mtrr_state.def_type));
410 if (mtrr_state.have_fixed) {
411 pr_debug("MTRR fixed ranges %sabled:\n",
412 ((mtrr_state.enabled & MTRR_STATE_MTRR_ENABLED) &&
413 (mtrr_state.enabled & MTRR_STATE_MTRR_FIXED_ENABLED)) ?
414 "en" : "dis");
415 print_fixed(0x00000, 0x10000, mtrr_state.fixed_ranges + 0);
416 for (i = 0; i < 2; ++i)
417 print_fixed(0x80000 + i * 0x20000, 0x04000,
418 mtrr_state.fixed_ranges + (i + 1) * 8);
419 for (i = 0; i < 8; ++i)
420 print_fixed(0xC0000 + i * 0x08000, 0x01000,
421 mtrr_state.fixed_ranges + (i + 3) * 8);
422
423 /* tail */
424 print_fixed_last();
425 }
426 pr_debug("MTRR variable ranges %sabled:\n",
427 mtrr_state.enabled & MTRR_STATE_MTRR_ENABLED ? "en" : "dis");
428 high_width = (__ffs64(size_or_mask) - (32 - PAGE_SHIFT) + 3) / 4;
429
430 for (i = 0; i < num_var_ranges; ++i) {
431 if (mtrr_state.var_ranges[i].mask_lo & (1 << 11))
432 pr_debug(" %u base %0*X%05X000 mask %0*X%05X000 %s\n",
433 i,
434 high_width,
435 mtrr_state.var_ranges[i].base_hi,
436 mtrr_state.var_ranges[i].base_lo >> 12,
437 high_width,
438 mtrr_state.var_ranges[i].mask_hi,
439 mtrr_state.var_ranges[i].mask_lo >> 12,
440 mtrr_attrib_to_str(mtrr_state.var_ranges[i].base_lo & 0xff));
441 else
442 pr_debug(" %u disabled\n", i);
443 }
444 if (mtrr_tom2)
445 pr_debug("TOM2: %016llx aka %lldM\n", mtrr_tom2, mtrr_tom2>>20);
446}
447
448/* PAT setup for BP. We need to go through sync steps here */
449void __init mtrr_bp_pat_init(void)
450{
451 unsigned long flags;
452
453 local_irq_save(flags);
454 prepare_set();
455
456 pat_init();
457
458 post_set();
459 local_irq_restore(flags);
460}
461
462/* Grab all of the MTRR state for this CPU into *state */
463bool __init get_mtrr_state(void)
464{
465 struct mtrr_var_range *vrs;
466 unsigned lo, dummy;
467 unsigned int i;
468
469 vrs = mtrr_state.var_ranges;
470
471 rdmsr(MSR_MTRRcap, lo, dummy);
472 mtrr_state.have_fixed = (lo >> 8) & 1;
473
474 for (i = 0; i < num_var_ranges; i++)
475 get_mtrr_var_range(i, &vrs[i]);
476 if (mtrr_state.have_fixed)
477 get_fixed_ranges(mtrr_state.fixed_ranges);
478
479 rdmsr(MSR_MTRRdefType, lo, dummy);
480 mtrr_state.def_type = (lo & 0xff);
481 mtrr_state.enabled = (lo & 0xc00) >> 10;
482
483 if (amd_special_default_mtrr()) {
484 unsigned low, high;
485
486 /* TOP_MEM2 */
487 rdmsr(MSR_K8_TOP_MEM2, low, high);
488 mtrr_tom2 = high;
489 mtrr_tom2 <<= 32;
490 mtrr_tom2 |= low;
491 mtrr_tom2 &= 0xffffff800000ULL;
492 }
493
494 print_mtrr_state();
495
496 mtrr_state_set = 1;
497
498 return !!(mtrr_state.enabled & MTRR_STATE_MTRR_ENABLED);
499}
500
501/* Some BIOS's are messed up and don't set all MTRRs the same! */
502void __init mtrr_state_warn(void)
503{
504 unsigned long mask = smp_changes_mask;
505
506 if (!mask)
507 return;
508 if (mask & MTRR_CHANGE_MASK_FIXED)
509 pr_warn("mtrr: your CPUs had inconsistent fixed MTRR settings\n");
510 if (mask & MTRR_CHANGE_MASK_VARIABLE)
511 pr_warn("mtrr: your CPUs had inconsistent variable MTRR settings\n");
512 if (mask & MTRR_CHANGE_MASK_DEFTYPE)
513 pr_warn("mtrr: your CPUs had inconsistent MTRRdefType settings\n");
514
515 pr_info("mtrr: probably your BIOS does not setup all CPUs.\n");
516 pr_info("mtrr: corrected configuration.\n");
517}
518
/*
 * Write MSR @msr with low word @a and high word @b. A failing write is
 * only logged.
 *
 * Doesn't attempt to pass an error out to MTRR users
 * because it's quite complicated in some cases and probably not
 * worth it because the best error handling is to ignore it.
 */
void mtrr_wrmsr(unsigned msr, unsigned a, unsigned b)
{
	if (wrmsr_safe(msr, a, b) >= 0)
		return;

	pr_err("MTRR: CPU %u: Writing MSR %x to %x:%x failed\n",
	       smp_processor_id(), msr, a, b);
}
531
532/**
533 * set_fixed_range - checks & updates a fixed-range MTRR if it
534 * differs from the value it should have
535 * @msr: MSR address of the MTTR which should be checked and updated
536 * @changed: pointer which indicates whether the MTRR needed to be changed
537 * @msrwords: pointer to the MSR values which the MSR should have
538 */
539static void set_fixed_range(int msr, bool *changed, unsigned int *msrwords)
540{
541 unsigned lo, hi;
542
543 rdmsr(msr, lo, hi);
544
545 if (lo != msrwords[0] || hi != msrwords[1]) {
546 mtrr_wrmsr(msr, msrwords[0], msrwords[1]);
547 *changed = true;
548 }
549}
550
551/**
552 * generic_get_free_region - Get a free MTRR.
553 * @base: The starting (base) address of the region.
554 * @size: The size (in bytes) of the region.
555 * @replace_reg: mtrr index to be replaced; set to invalid value if none.
556 *
557 * Returns: The index of the region on success, else negative on error.
558 */
559int
560generic_get_free_region(unsigned long base, unsigned long size, int replace_reg)
561{
562 unsigned long lbase, lsize;
563 mtrr_type ltype;
564 int i, max;
565
566 max = num_var_ranges;
567 if (replace_reg >= 0 && replace_reg < max)
568 return replace_reg;
569
570 for (i = 0; i < max; ++i) {
571 mtrr_if->get(i, &lbase, &lsize, <ype);
572 if (lsize == 0)
573 return i;
574 }
575
576 return -ENOSPC;
577}
578
579static void generic_get_mtrr(unsigned int reg, unsigned long *base,
580 unsigned long *size, mtrr_type *type)
581{
582 u32 mask_lo, mask_hi, base_lo, base_hi;
583 unsigned int hi;
584 u64 tmp, mask;
585
586 /*
587 * get_mtrr doesn't need to update mtrr_state, also it could be called
588 * from any cpu, so try to print it out directly.
589 */
590 get_cpu();
591
592 rdmsr(MTRRphysMask_MSR(reg), mask_lo, mask_hi);
593
594 if ((mask_lo & 0x800) == 0) {
595 /* Invalid (i.e. free) range */
596 *base = 0;
597 *size = 0;
598 *type = 0;
599 goto out_put_cpu;
600 }
601
602 rdmsr(MTRRphysBase_MSR(reg), base_lo, base_hi);
603
604 /* Work out the shifted address mask: */
605 tmp = (u64)mask_hi << (32 - PAGE_SHIFT) | mask_lo >> PAGE_SHIFT;
606 mask = size_or_mask | tmp;
607
608 /* Expand tmp with high bits to all 1s: */
609 hi = fls64(tmp);
610 if (hi > 0) {
611 tmp |= ~((1ULL<<(hi - 1)) - 1);
612
613 if (tmp != mask) {
614 pr_warn("mtrr: your BIOS has configured an incorrect mask, fixing it.\n");
615 add_taint(TAINT_FIRMWARE_WORKAROUND, LOCKDEP_STILL_OK);
616 mask = tmp;
617 }
618 }
619
620 /*
621 * This works correctly if size is a power of two, i.e. a
622 * contiguous range:
623 */
624 *size = -mask;
625 *base = (u64)base_hi << (32 - PAGE_SHIFT) | base_lo >> PAGE_SHIFT;
626 *type = base_lo & 0xff;
627
628out_put_cpu:
629 put_cpu();
630}
631
632/**
633 * set_fixed_ranges - checks & updates the fixed-range MTRRs if they
634 * differ from the saved set
635 * @frs: pointer to fixed-range MTRR values, saved by get_fixed_ranges()
636 */
637static int set_fixed_ranges(mtrr_type *frs)
638{
639 unsigned long long *saved = (unsigned long long *)frs;
640 bool changed = false;
641 int block = -1, range;
642
643 k8_check_syscfg_dram_mod_en();
644
645 while (fixed_range_blocks[++block].ranges) {
646 for (range = 0; range < fixed_range_blocks[block].ranges; range++)
647 set_fixed_range(fixed_range_blocks[block].base_msr + range,
648 &changed, (unsigned int *)saved++);
649 }
650
651 return changed;
652}
653
654/*
655 * Set the MSR pair relating to a var range.
656 * Returns true if changes are made.
657 */
658static bool set_mtrr_var_ranges(unsigned int index, struct mtrr_var_range *vr)
659{
660 unsigned int lo, hi;
661 bool changed = false;
662
663 rdmsr(MTRRphysBase_MSR(index), lo, hi);
664 if ((vr->base_lo & 0xfffff0ffUL) != (lo & 0xfffff0ffUL)
665 || (vr->base_hi & (size_and_mask >> (32 - PAGE_SHIFT))) !=
666 (hi & (size_and_mask >> (32 - PAGE_SHIFT)))) {
667
668 mtrr_wrmsr(MTRRphysBase_MSR(index), vr->base_lo, vr->base_hi);
669 changed = true;
670 }
671
672 rdmsr(MTRRphysMask_MSR(index), lo, hi);
673
674 if ((vr->mask_lo & 0xfffff800UL) != (lo & 0xfffff800UL)
675 || (vr->mask_hi & (size_and_mask >> (32 - PAGE_SHIFT))) !=
676 (hi & (size_and_mask >> (32 - PAGE_SHIFT)))) {
677 mtrr_wrmsr(MTRRphysMask_MSR(index), vr->mask_lo, vr->mask_hi);
678 changed = true;
679 }
680 return changed;
681}
682
/*
 * MTRRdefType MSR value saved by prepare_set() and written back by
 * post_set(); set_mtrr_state() edits deftype_lo in between.
 */
683static u32 deftype_lo, deftype_hi;
684
685/**
686 * set_mtrr_state - Set the MTRR state for this CPU.
687 *
688 * NOTE: The CPU must already be in a safe state for MTRR changes.
689 * RETURNS: 0 if no changes made, else a mask indicating what was changed.
690 */
691static unsigned long set_mtrr_state(void)
692{
693 unsigned long change_mask = 0;
694 unsigned int i;
695
696 for (i = 0; i < num_var_ranges; i++) {
697 if (set_mtrr_var_ranges(i, &mtrr_state.var_ranges[i]))
698 change_mask |= MTRR_CHANGE_MASK_VARIABLE;
699 }
700
701 if (mtrr_state.have_fixed && set_fixed_ranges(mtrr_state.fixed_ranges))
702 change_mask |= MTRR_CHANGE_MASK_FIXED;
703
704 /*
705 * Set_mtrr_restore restores the old value of MTRRdefType,
706 * so to set it we fiddle with the saved value:
707 */
708 if ((deftype_lo & 0xff) != mtrr_state.def_type
709 || ((deftype_lo & 0xc00) >> 10) != mtrr_state.enabled) {
710
711 deftype_lo = (deftype_lo & ~0xcff) | mtrr_state.def_type |
712 (mtrr_state.enabled << 10);
713 change_mask |= MTRR_CHANGE_MASK_DEFTYPE;
714 }
715
716 return change_mask;
717}
718
719
/* CR4 value saved by prepare_set() (when PGE is available) and restored by post_set() */
720static unsigned long cr4;
/* Taken in prepare_set() and released in post_set() */
721static DEFINE_RAW_SPINLOCK(set_atomicity_lock);
722
723/*
724 * Since we are disabling the cache don't allow any interrupts,
725 * they would run extremely slow and would only increase the pain.
726 *
727 * The caller must ensure that local interrupts are disabled and
728 * are reenabled after post_set() has been called.
729 */
730static void prepare_set(void) __acquires(set_atomicity_lock)
731{
732 unsigned long cr0;
733
734 /*
735 * Note that this is not ideal
736 * since the cache is only flushed/disabled for this CPU while the
737 * MTRRs are changed, but changing this requires more invasive
738 * changes to the way the kernel boots
739 */
740
741 raw_spin_lock(&set_atomicity_lock);
742
743 /* Enter the no-fill (CD=1, NW=0) cache mode and flush caches. */
744 cr0 = read_cr0() | X86_CR0_CD;
745 write_cr0(cr0);
746
747 /*
748 * Cache flushing is the most time-consuming step when programming
749 * the MTRRs. Fortunately, as per the Intel Software Development
750 * Manual, we can skip it if the processor supports cache self-
751 * snooping.
752 */
753 if (!static_cpu_has(X86_FEATURE_SELFSNOOP))
754 wbinvd();
755
756 /* Save value of CR4 and clear Page Global Enable (bit 7) */
757 if (boot_cpu_has(X86_FEATURE_PGE)) {
758 cr4 = __read_cr4();
759 __write_cr4(cr4 & ~X86_CR4_PGE);
760 }
761
762 /* Flush all TLBs via a mov %cr3, %reg; mov %reg, %cr3 */
763 count_vm_tlb_event(NR_TLB_LOCAL_FLUSH_ALL);
764 __flush_tlb();
765
766 /* Save MTRR state */
767 rdmsr(MSR_MTRRdefType, deftype_lo, deftype_hi);
768
769 /* Disable MTRRs, and set the default type to uncached */
770 mtrr_wrmsr(MSR_MTRRdefType, deftype_lo & ~0xcff, deftype_hi);
771
772 /* Again, only flush caches if we have to. */
773 if (!static_cpu_has(X86_FEATURE_SELFSNOOP))
774 wbinvd();
775}
776
777static void post_set(void) __releases(set_atomicity_lock)
778{
779 /* Flush TLBs (no need to flush caches - they are disabled) */
780 count_vm_tlb_event(NR_TLB_LOCAL_FLUSH_ALL);
781 __flush_tlb();
782
783 /* Intel (P6) standard MTRRs */
784 mtrr_wrmsr(MSR_MTRRdefType, deftype_lo, deftype_hi);
785
786 /* Enable caches */
787 write_cr0(read_cr0() & ~X86_CR0_CD);
788
789 /* Restore value of CR4 */
790 if (boot_cpu_has(X86_FEATURE_PGE))
791 __write_cr4(cr4);
792 raw_spin_unlock(&set_atomicity_lock);
793}
794
795static void generic_set_all(void)
796{
797 unsigned long mask, count;
798 unsigned long flags;
799
800 local_irq_save(flags);
801 prepare_set();
802
803 /* Actually set the state */
804 mask = set_mtrr_state();
805
806 /* also set PAT */
807 pat_init();
808
809 post_set();
810 local_irq_restore(flags);
811
812 /* Use the atomic bitops to update the global mask */
813 for (count = 0; count < sizeof(mask) * 8; ++count) {
814 if (mask & 0x01)
815 set_bit(count, &smp_changes_mask);
816 mask >>= 1;
817 }
818
819}
820
821/**
822 * generic_set_mtrr - set variable MTRR register on the local CPU.
823 *
824 * @reg: The register to set.
825 * @base: The base address of the region.
826 * @size: The size of the region. If this is 0 the region is disabled.
827 * @type: The type of the region.
828 *
829 * Returns nothing.
830 */
831static void generic_set_mtrr(unsigned int reg, unsigned long base,
832 unsigned long size, mtrr_type type)
833{
834 unsigned long flags;
835 struct mtrr_var_range *vr;
836
837 vr = &mtrr_state.var_ranges[reg];
838
839 local_irq_save(flags);
840 prepare_set();
841
842 if (size == 0) {
843 /*
844 * The invalid bit is kept in the mask, so we simply
845 * clear the relevant mask register to disable a range.
846 */
847 mtrr_wrmsr(MTRRphysMask_MSR(reg), 0, 0);
848 memset(vr, 0, sizeof(struct mtrr_var_range));
849 } else {
850 vr->base_lo = base << PAGE_SHIFT | type;
851 vr->base_hi = (base & size_and_mask) >> (32 - PAGE_SHIFT);
852 vr->mask_lo = -size << PAGE_SHIFT | 0x800;
853 vr->mask_hi = (-size & size_and_mask) >> (32 - PAGE_SHIFT);
854
855 mtrr_wrmsr(MTRRphysBase_MSR(reg), vr->base_lo, vr->base_hi);
856 mtrr_wrmsr(MTRRphysMask_MSR(reg), vr->mask_lo, vr->mask_hi);
857 }
858
859 post_set();
860 local_irq_restore(flags);
861}
862
863int generic_validate_add_page(unsigned long base, unsigned long size,
864 unsigned int type)
865{
866 unsigned long lbase, last;
867
868 /*
869 * For Intel PPro stepping <= 7
870 * must be 4 MiB aligned and not touch 0x70000000 -> 0x7003FFFF
871 */
872 if (is_cpu(INTEL) && boot_cpu_data.x86 == 6 &&
873 boot_cpu_data.x86_model == 1 &&
874 boot_cpu_data.x86_stepping <= 7) {
875 if (base & ((1 << (22 - PAGE_SHIFT)) - 1)) {
876 pr_warn("mtrr: base(0x%lx000) is not 4 MiB aligned\n", base);
877 return -EINVAL;
878 }
879 if (!(base + size < 0x70000 || base > 0x7003F) &&
880 (type == MTRR_TYPE_WRCOMB
881 || type == MTRR_TYPE_WRBACK)) {
882 pr_warn("mtrr: writable mtrr between 0x70000000 and 0x7003FFFF may hang the CPU.\n");
883 return -EINVAL;
884 }
885 }
886
887 /*
888 * Check upper bits of base and last are equal and lower bits are 0
889 * for base and 1 for last
890 */
891 last = base + size - 1;
892 for (lbase = base; !(lbase & 1) && (last & 1);
893 lbase = lbase >> 1, last = last >> 1)
894 ;
895 if (lbase != last) {
896 pr_warn("mtrr: base(0x%lx000) is not aligned on a size(0x%lx000) boundary\n", base, size);
897 return -EINVAL;
898 }
899 return 0;
900}
901
902static int generic_have_wrcomb(void)
903{
904 unsigned long config, dummy;
905 rdmsr(MSR_MTRRcap, config, dummy);
906 return config & (1 << 10);
907}
908
/* have_wrcomb implementation that unconditionally answers yes */
int positive_have_wrcomb(void)
{
	return 1;
}
913
914/*
915 * Generic structure...
916 */
917const struct mtrr_ops generic_mtrr_ops = {
918 .use_intel_if = 1,
919 .set_all = generic_set_all,
920 .get = generic_get_mtrr,
921 .get_free_region = generic_get_free_region,
922 .set = generic_set_mtrr,
923 .validate_add_page = generic_validate_add_page,
924 .have_wrcomb = generic_have_wrcomb,
925};
1// SPDX-License-Identifier: GPL-2.0-only
2/*
3 * This only handles 32bit MTRR on 32bit hosts. This is strictly wrong
4 * because MTRRs can span up to 40 bits (36bits on most modern x86)
5 */
6
7#include <linux/export.h>
8#include <linux/init.h>
9#include <linux/io.h>
10#include <linux/mm.h>
11#include <linux/cc_platform.h>
12#include <asm/processor-flags.h>
13#include <asm/cacheinfo.h>
14#include <asm/cpufeature.h>
15#include <asm/hypervisor.h>
16#include <asm/mshyperv.h>
17#include <asm/tlbflush.h>
18#include <asm/mtrr.h>
19#include <asm/msr.h>
20#include <asm/memtype.h>
21
22#include "mtrr.h"
23
/* Describes one run of consecutive fixed-range MTRR MSRs. */
struct fixed_range_block {
	int base_msr;	/* MSR address of the first MTRR in the block */
	int ranges;	/* how many consecutive MTRR MSRs the block holds */
};
28
29static struct fixed_range_block fixed_range_blocks[] = {
30 { MSR_MTRRfix64K_00000, 1 }, /* one 64k MTRR */
31 { MSR_MTRRfix16K_80000, 2 }, /* two 16k MTRRs */
32 { MSR_MTRRfix4K_C0000, 8 }, /* eight 4k MTRRs */
33 {}
34};
35
36struct cache_map {
37 u64 start;
38 u64 end;
39 u64 flags;
40 u64 type:8;
41 u64 fixed:1;
42};
43
44bool mtrr_debug;
45
46static int __init mtrr_param_setup(char *str)
47{
48 int rc = 0;
49
50 if (!str)
51 return -EINVAL;
52 if (!strcmp(str, "debug"))
53 mtrr_debug = true;
54 else
55 rc = -EINVAL;
56
57 return rc;
58}
59early_param("mtrr", mtrr_param_setup);
60
61/*
62 * CACHE_MAP_MAX is the maximum number of memory ranges in cache_map, where
63 * no 2 adjacent ranges have the same cache mode (those would be merged).
64 * The number is based on the worst case:
65 * - no two adjacent fixed MTRRs share the same cache mode
66 * - one variable MTRR is spanning a huge area with mode WB
67 * - 255 variable MTRRs with mode UC all overlap with the WB MTRR, creating 2
68 * additional ranges each (result like "ababababa...aba" with a = WB, b = UC),
69 * accounting for MTRR_MAX_VAR_RANGES * 2 - 1 range entries
70 * - a TOP_MEM2 area (even with overlapping an UC MTRR can't add 2 range entries
71 * to the possible maximum, as it always starts at 4GB, thus it can't be in
72 * the middle of that MTRR, unless that MTRR starts at 0, which would remove
73 * the initial "a" from the "abababa" pattern above)
74 * The map won't contain ranges with no matching MTRR (those fall back to the
75 * default cache mode).
76 */
77#define CACHE_MAP_MAX (MTRR_NUM_FIXED_RANGES + MTRR_MAX_VAR_RANGES * 2)
78
/* Statically sized map used initially; lives in __initdata */
79static struct cache_map init_cache_map[CACHE_MAP_MAX] __initdata;
/* The map currently in use; starts out pointing at init_cache_map */
80static struct cache_map *cache_map __refdata = init_cache_map;
/* Capacity of cache_map; add_map_entry_at() refuses to grow beyond it */
81static unsigned int cache_map_size = CACHE_MAP_MAX;
/* Number of entries currently in cache_map */
82static unsigned int cache_map_n;
/*
 * add_map_entry_at() resets cache_map_n to this value when the map is
 * exhausted - presumably the number of leading fixed entries; TODO confirm.
 */
83static unsigned int cache_map_fixed;
84
/* NOTE(review): the users of the next three variables are outside the visible part of the file */
85static unsigned long smp_changes_mask;
86static int mtrr_state_set;
87u64 mtrr_tom2;
88
/* Saved MTRR state; get_var_mtrr_state() reads its var_ranges[] */
89struct mtrr_state_type mtrr_state;
90EXPORT_SYMBOL_GPL(mtrr_state);
91
92/* Reserved bits in the high portion of the MTRRphysBaseN MSR. */
/* get_mtrr_size() ORs these bits, shifted up by 32, into the mask before negating it */
93u32 phys_hi_rsvd;
94
95/*
96 * BIOS is expected to clear MtrrFixDramModEn bit, see for example
97 * "BIOS and Kernel Developer's Guide for the AMD Athlon 64 and AMD
98 * Opteron Processors" (26094 Rev. 3.30 February 2006), section
99 * "13.2.1.2 SYSCFG Register": "The MtrrFixDramModEn bit should be set
100 * to 1 during BIOS initialization of the fixed MTRRs, then cleared to
101 * 0 for operation."
102 */
103static inline void k8_check_syscfg_dram_mod_en(void)
104{
105 u32 lo, hi;
106
107 if (!((boot_cpu_data.x86_vendor == X86_VENDOR_AMD) &&
108 (boot_cpu_data.x86 >= 0x0f)))
109 return;
110
111 if (cc_platform_has(CC_ATTR_HOST_SEV_SNP))
112 return;
113
114 rdmsr(MSR_AMD64_SYSCFG, lo, hi);
115 if (lo & K8_MTRRFIXRANGE_DRAM_MODIFY) {
116 pr_err(FW_WARN "MTRR: CPU %u: SYSCFG[MtrrFixDramModEn]"
117 " not cleared by BIOS, clearing this bit\n",
118 smp_processor_id());
119 lo &= ~K8_MTRRFIXRANGE_DRAM_MODIFY;
120 mtrr_wrmsr(MSR_AMD64_SYSCFG, lo, hi);
121 }
122}
123
124/* Get the size of contiguous MTRR range */
125static u64 get_mtrr_size(u64 mask)
126{
127 u64 size;
128
129 mask |= (u64)phys_hi_rsvd << 32;
130 size = -mask;
131
132 return size;
133}
134
135static u8 get_var_mtrr_state(unsigned int reg, u64 *start, u64 *size)
136{
137 struct mtrr_var_range *mtrr = mtrr_state.var_ranges + reg;
138
139 if (!(mtrr->mask_lo & MTRR_PHYSMASK_V))
140 return MTRR_TYPE_INVALID;
141
142 *start = (((u64)mtrr->base_hi) << 32) + (mtrr->base_lo & PAGE_MASK);
143 *size = get_mtrr_size((((u64)mtrr->mask_hi) << 32) +
144 (mtrr->mask_lo & PAGE_MASK));
145
146 return mtrr->base_lo & MTRR_PHYSBASE_TYPE;
147}
148
149static u8 get_effective_type(u8 type1, u8 type2)
150{
151 if (type1 == MTRR_TYPE_UNCACHABLE || type2 == MTRR_TYPE_UNCACHABLE)
152 return MTRR_TYPE_UNCACHABLE;
153
154 if ((type1 == MTRR_TYPE_WRBACK && type2 == MTRR_TYPE_WRTHROUGH) ||
155 (type1 == MTRR_TYPE_WRTHROUGH && type2 == MTRR_TYPE_WRBACK))
156 return MTRR_TYPE_WRTHROUGH;
157
158 if (type1 != type2)
159 return MTRR_TYPE_UNCACHABLE;
160
161 return type1;
162}
163
164static void rm_map_entry_at(int idx)
165{
166 cache_map_n--;
167 if (cache_map_n > idx) {
168 memmove(cache_map + idx, cache_map + idx + 1,
169 sizeof(*cache_map) * (cache_map_n - idx));
170 }
171}
172
173/*
174 * Add an entry into cache_map at a specific index. Merges adjacent entries if
175 * appropriate. Return the number of merges for correcting the scan index
176 * (this is needed as merging will reduce the number of entries, which will
177 * result in skipping entries in future iterations if the scan index isn't
178 * corrected).
179 * Note that the corrected index can never go below -1 (resulting in being 0 in
180 * the next scan iteration), as "2" is returned only if the current index is
181 * larger than zero.
182 */
183static int add_map_entry_at(u64 start, u64 end, u8 type, int idx)
184{
185 bool merge_prev = false, merge_next = false;
186
187 if (start >= end)
188 return 0;
189
190 if (idx > 0) {
191 struct cache_map *prev = cache_map + idx - 1;
192
193 if (!prev->fixed && start == prev->end && type == prev->type)
194 merge_prev = true;
195 }
196
197 if (idx < cache_map_n) {
198 struct cache_map *next = cache_map + idx;
199
200 if (!next->fixed && end == next->start && type == next->type)
201 merge_next = true;
202 }
203
204 if (merge_prev && merge_next) {
205 cache_map[idx - 1].end = cache_map[idx].end;
206 rm_map_entry_at(idx);
207 return 2;
208 }
209 if (merge_prev) {
210 cache_map[idx - 1].end = end;
211 return 1;
212 }
213 if (merge_next) {
214 cache_map[idx].start = start;
215 return 1;
216 }
217
218 /* Sanity check: the array should NEVER be too small! */
219 if (cache_map_n == cache_map_size) {
220 WARN(1, "MTRR cache mode memory map exhausted!\n");
221 cache_map_n = cache_map_fixed;
222 return 0;
223 }
224
225 if (cache_map_n > idx) {
226 memmove(cache_map + idx + 1, cache_map + idx,
227 sizeof(*cache_map) * (cache_map_n - idx));
228 }
229
230 cache_map[idx].start = start;
231 cache_map[idx].end = end;
232 cache_map[idx].type = type;
233 cache_map[idx].fixed = 0;
234 cache_map_n++;
235
236 return 0;
237}
238
239/* Clear a part of an entry. Return 1 if start of entry is still valid. */
240static int clr_map_range_at(u64 start, u64 end, int idx)
241{
242 int ret = start != cache_map[idx].start;
243 u64 tmp;
244
245 if (start == cache_map[idx].start && end == cache_map[idx].end) {
246 rm_map_entry_at(idx);
247 } else if (start == cache_map[idx].start) {
248 cache_map[idx].start = end;
249 } else if (end == cache_map[idx].end) {
250 cache_map[idx].end = start;
251 } else {
252 tmp = cache_map[idx].end;
253 cache_map[idx].end = start;
254 add_map_entry_at(end, tmp, cache_map[idx].type, idx + 1);
255 }
256
257 return ret;
258}
259
260/*
261 * Add MTRR to the map. The current map is scanned and each part of the MTRR
262 * either overlapping with an existing entry or with a hole in the map is
263 * handled separately.
264 */
265static void add_map_entry(u64 start, u64 end, u8 type)
266{
267 u8 new_type, old_type;
268 u64 tmp;
269 int i;
270
271 for (i = 0; i < cache_map_n && start < end; i++) {
272 if (start >= cache_map[i].end)
273 continue;
274
275 if (start < cache_map[i].start) {
276 /* Region start has no overlap. */
277 tmp = min(end, cache_map[i].start);
278 i -= add_map_entry_at(start, tmp, type, i);
279 start = tmp;
280 continue;
281 }
282
283 new_type = get_effective_type(type, cache_map[i].type);
284 old_type = cache_map[i].type;
285
286 if (cache_map[i].fixed || new_type == old_type) {
287 /* Cut off start of new entry. */
288 start = cache_map[i].end;
289 continue;
290 }
291
292 /* Handle only overlapping part of region. */
293 tmp = min(end, cache_map[i].end);
294 i += clr_map_range_at(start, tmp, i);
295 i -= add_map_entry_at(start, tmp, new_type, i);
296 start = tmp;
297 }
298
299 /* Add rest of region after last map entry (rest might be empty). */
300 add_map_entry_at(start, end, type, i);
301}
302
303/* Add variable MTRRs to cache map. */
304static void map_add_var(void)
305{
306 u64 start, size;
307 unsigned int i;
308 u8 type;
309
310 /*
311 * Add AMD TOP_MEM2 area. Can't be added in mtrr_build_map(), as it
312 * needs to be added again when rebuilding the map due to potentially
313 * having moved as a result of variable MTRRs for memory below 4GB.
314 */
315 if (mtrr_tom2) {
316 add_map_entry(BIT_ULL(32), mtrr_tom2, MTRR_TYPE_WRBACK);
317 cache_map[cache_map_n - 1].fixed = 1;
318 }
319
320 for (i = 0; i < num_var_ranges; i++) {
321 type = get_var_mtrr_state(i, &start, &size);
322 if (type != MTRR_TYPE_INVALID)
323 add_map_entry(start, start + size, type);
324 }
325}
326
327/*
328 * Rebuild map by replacing variable entries. Needs to be called when MTRR
329 * registers are being changed after boot, as such changes could include
330 * removals of registers, which are complicated to handle without rebuild of
331 * the map.
332 */
333void generic_rebuild_map(void)
334{
335 if (mtrr_if != &generic_mtrr_ops)
336 return;
337
338 cache_map_n = cache_map_fixed;
339
340 map_add_var();
341}
342
343static unsigned int __init get_cache_map_size(void)
344{
345 return cache_map_fixed + 2 * num_var_ranges + (mtrr_tom2 != 0);
346}
347
348/* Build the cache_map containing the cache modes per memory range. */
349void __init mtrr_build_map(void)
350{
351 u64 start, end, size;
352 unsigned int i;
353 u8 type;
354
355 /* Add fixed MTRRs, optimize for adjacent entries with same type. */
356 if (mtrr_state.enabled & MTRR_STATE_MTRR_FIXED_ENABLED) {
357 /*
358 * Start with 64k size fixed entries, preset 1st one (hence the
359 * loop below is starting with index 1).
360 */
361 start = 0;
362 end = size = 0x10000;
363 type = mtrr_state.fixed_ranges[0];
364
365 for (i = 1; i < MTRR_NUM_FIXED_RANGES; i++) {
366 /* 8 64k entries, then 16 16k ones, rest 4k. */
367 if (i == 8 || i == 24)
368 size >>= 2;
369
370 if (mtrr_state.fixed_ranges[i] != type) {
371 add_map_entry(start, end, type);
372 start = end;
373 type = mtrr_state.fixed_ranges[i];
374 }
375 end += size;
376 }
377 add_map_entry(start, end, type);
378 }
379
380 /* Mark fixed, they take precedence. */
381 for (i = 0; i < cache_map_n; i++)
382 cache_map[i].fixed = 1;
383 cache_map_fixed = cache_map_n;
384
385 map_add_var();
386
387 pr_info("MTRR map: %u entries (%u fixed + %u variable; max %u), built from %u variable MTRRs\n",
388 cache_map_n, cache_map_fixed, cache_map_n - cache_map_fixed,
389 get_cache_map_size(), num_var_ranges + (mtrr_tom2 != 0));
390
391 if (mtrr_debug) {
392 for (i = 0; i < cache_map_n; i++) {
393 pr_info("%3u: %016llx-%016llx %s\n", i,
394 cache_map[i].start, cache_map[i].end - 1,
395 mtrr_attrib_to_str(cache_map[i].type));
396 }
397 }
398}
399
400/* Copy the cache_map from __initdata memory to dynamically allocated one. */
401void __init mtrr_copy_map(void)
402{
403 unsigned int new_size = get_cache_map_size();
404
405 if (!mtrr_state.enabled || !new_size) {
406 cache_map = NULL;
407 return;
408 }
409
410 mutex_lock(&mtrr_mutex);
411
412 cache_map = kcalloc(new_size, sizeof(*cache_map), GFP_KERNEL);
413 if (cache_map) {
414 memmove(cache_map, init_cache_map,
415 cache_map_n * sizeof(*cache_map));
416 cache_map_size = new_size;
417 } else {
418 mtrr_state.enabled = 0;
419 pr_err("MTRRs disabled due to allocation failure for lookup map.\n");
420 }
421
422 mutex_unlock(&mtrr_mutex);
423}
424
425/**
426 * mtrr_overwrite_state - set static MTRR state
427 *
428 * Used to set MTRR state via different means (e.g. with data obtained from
429 * a hypervisor).
430 * Is allowed only for special cases when running virtualized. Must be called
431 * from the x86_init.hyper.init_platform() hook. It can be called only once.
432 * The MTRR state can't be changed afterwards. To ensure that, X86_FEATURE_MTRR
433 * is cleared.
434 *
435 * @var: MTRR variable range array to use
436 * @num_var: length of the @var array
437 * @def_type: default caching type
438 */
439void mtrr_overwrite_state(struct mtrr_var_range *var, unsigned int num_var,
440 mtrr_type def_type)
441{
442 unsigned int i;
443
444 /* Only allowed to be called once before mtrr_bp_init(). */
445 if (WARN_ON_ONCE(mtrr_state_set))
446 return;
447
448 /* Only allowed when running virtualized. */
449 if (!cpu_feature_enabled(X86_FEATURE_HYPERVISOR))
450 return;
451
452 /*
453 * Only allowed for special virtualization cases:
454 * - when running as Hyper-V, SEV-SNP guest using vTOM
455 * - when running as Xen PV guest
456 * - when running as SEV-SNP or TDX guest to avoid unnecessary
457 * VMM communication/Virtualization exceptions (#VC, #VE)
458 */
459 if (!cc_platform_has(CC_ATTR_GUEST_SEV_SNP) &&
460 !hv_is_isolation_supported() &&
461 !cpu_feature_enabled(X86_FEATURE_XENPV) &&
462 !cpu_feature_enabled(X86_FEATURE_TDX_GUEST))
463 return;
464
465 /* Disable MTRR in order to disable MTRR modifications. */
466 setup_clear_cpu_cap(X86_FEATURE_MTRR);
467
468 if (var) {
469 if (num_var > MTRR_MAX_VAR_RANGES) {
470 pr_warn("Trying to overwrite MTRR state with %u variable entries\n",
471 num_var);
472 num_var = MTRR_MAX_VAR_RANGES;
473 }
474 for (i = 0; i < num_var; i++)
475 mtrr_state.var_ranges[i] = var[i];
476 num_var_ranges = num_var;
477 }
478
479 mtrr_state.def_type = def_type;
480 mtrr_state.enabled |= MTRR_STATE_MTRR_ENABLED;
481
482 mtrr_state_set = 1;
483}
484
485static u8 type_merge(u8 type, u8 new_type, u8 *uniform)
486{
487 u8 effective_type;
488
489 if (type == MTRR_TYPE_INVALID)
490 return new_type;
491
492 effective_type = get_effective_type(type, new_type);
493 if (type != effective_type)
494 *uniform = 0;
495
496 return effective_type;
497}
498
499/**
500 * mtrr_type_lookup - look up memory type in MTRR
501 *
502 * @start: Begin of the physical address range
503 * @end: End of the physical address range
504 * @uniform: output argument:
505 * - 1: the returned MTRR type is valid for the whole region
506 * - 0: otherwise
507 *
508 * Return Values:
509 * MTRR_TYPE_(type) - The effective MTRR type for the region
510 * MTRR_TYPE_INVALID - MTRR is disabled
511 */
512u8 mtrr_type_lookup(u64 start, u64 end, u8 *uniform)
513{
514 u8 type = MTRR_TYPE_INVALID;
515 unsigned int i;
516
517 if (!mtrr_state_set) {
518 /* Uniformity is unknown. */
519 *uniform = 0;
520 return MTRR_TYPE_UNCACHABLE;
521 }
522
523 *uniform = 1;
524
525 if (!(mtrr_state.enabled & MTRR_STATE_MTRR_ENABLED))
526 return MTRR_TYPE_UNCACHABLE;
527
528 for (i = 0; i < cache_map_n && start < end; i++) {
529 /* Region after current map entry? -> continue with next one. */
530 if (start >= cache_map[i].end)
531 continue;
532
533 /* Start of region not covered by current map entry? */
534 if (start < cache_map[i].start) {
535 /* At least some part of region has default type. */
536 type = type_merge(type, mtrr_state.def_type, uniform);
537 /* End of region not covered, too? -> lookup done. */
538 if (end <= cache_map[i].start)
539 return type;
540 }
541
542 /* At least part of region covered by map entry. */
543 type = type_merge(type, cache_map[i].type, uniform);
544
545 start = cache_map[i].end;
546 }
547
548 /* End of region past last entry in map? -> use default type. */
549 if (start < end)
550 type = type_merge(type, mtrr_state.def_type, uniform);
551
552 return type;
553}
554
555/* Get the MSR pair relating to a var range */
556static void
557get_mtrr_var_range(unsigned int index, struct mtrr_var_range *vr)
558{
559 rdmsr(MTRRphysBase_MSR(index), vr->base_lo, vr->base_hi);
560 rdmsr(MTRRphysMask_MSR(index), vr->mask_lo, vr->mask_hi);
561}
562
563/* Fill the MSR pair relating to a var range */
564void fill_mtrr_var_range(unsigned int index,
565 u32 base_lo, u32 base_hi, u32 mask_lo, u32 mask_hi)
566{
567 struct mtrr_var_range *vr;
568
569 vr = mtrr_state.var_ranges;
570
571 vr[index].base_lo = base_lo;
572 vr[index].base_hi = base_hi;
573 vr[index].mask_lo = mask_lo;
574 vr[index].mask_hi = mask_hi;
575}
576
577static void get_fixed_ranges(mtrr_type *frs)
578{
579 unsigned int *p = (unsigned int *)frs;
580 int i;
581
582 k8_check_syscfg_dram_mod_en();
583
584 rdmsr(MSR_MTRRfix64K_00000, p[0], p[1]);
585
586 for (i = 0; i < 2; i++)
587 rdmsr(MSR_MTRRfix16K_80000 + i, p[2 + i * 2], p[3 + i * 2]);
588 for (i = 0; i < 8; i++)
589 rdmsr(MSR_MTRRfix4K_C0000 + i, p[6 + i * 2], p[7 + i * 2]);
590}
591
592void mtrr_save_fixed_ranges(void *info)
593{
594 if (boot_cpu_has(X86_FEATURE_MTRR))
595 get_fixed_ranges(mtrr_state.fixed_ranges);
596}
597
598static unsigned __initdata last_fixed_start;
599static unsigned __initdata last_fixed_end;
600static mtrr_type __initdata last_fixed_type;
601
602static void __init print_fixed_last(void)
603{
604 if (!last_fixed_end)
605 return;
606
607 pr_info(" %05X-%05X %s\n", last_fixed_start,
608 last_fixed_end - 1, mtrr_attrib_to_str(last_fixed_type));
609
610 last_fixed_end = 0;
611}
612
613static void __init update_fixed_last(unsigned base, unsigned end,
614 mtrr_type type)
615{
616 last_fixed_start = base;
617 last_fixed_end = end;
618 last_fixed_type = type;
619}
620
621static void __init
622print_fixed(unsigned base, unsigned step, const mtrr_type *types)
623{
624 unsigned i;
625
626 for (i = 0; i < 8; ++i, ++types, base += step) {
627 if (last_fixed_end == 0) {
628 update_fixed_last(base, base + step, *types);
629 continue;
630 }
631 if (last_fixed_end == base && last_fixed_type == *types) {
632 last_fixed_end = base + step;
633 continue;
634 }
635 /* new segments: gap or different type */
636 print_fixed_last();
637 update_fixed_last(base, base + step, *types);
638 }
639}
640
641static void __init print_mtrr_state(void)
642{
643 unsigned int i;
644 int high_width;
645
646 pr_info("MTRR default type: %s\n",
647 mtrr_attrib_to_str(mtrr_state.def_type));
648 if (mtrr_state.have_fixed) {
649 pr_info("MTRR fixed ranges %sabled:\n",
650 ((mtrr_state.enabled & MTRR_STATE_MTRR_ENABLED) &&
651 (mtrr_state.enabled & MTRR_STATE_MTRR_FIXED_ENABLED)) ?
652 "en" : "dis");
653 print_fixed(0x00000, 0x10000, mtrr_state.fixed_ranges + 0);
654 for (i = 0; i < 2; ++i)
655 print_fixed(0x80000 + i * 0x20000, 0x04000,
656 mtrr_state.fixed_ranges + (i + 1) * 8);
657 for (i = 0; i < 8; ++i)
658 print_fixed(0xC0000 + i * 0x08000, 0x01000,
659 mtrr_state.fixed_ranges + (i + 3) * 8);
660
661 /* tail */
662 print_fixed_last();
663 }
664 pr_info("MTRR variable ranges %sabled:\n",
665 mtrr_state.enabled & MTRR_STATE_MTRR_ENABLED ? "en" : "dis");
666 high_width = (boot_cpu_data.x86_phys_bits - (32 - PAGE_SHIFT) + 3) / 4;
667
668 for (i = 0; i < num_var_ranges; ++i) {
669 if (mtrr_state.var_ranges[i].mask_lo & MTRR_PHYSMASK_V)
670 pr_info(" %u base %0*X%05X000 mask %0*X%05X000 %s\n",
671 i,
672 high_width,
673 mtrr_state.var_ranges[i].base_hi,
674 mtrr_state.var_ranges[i].base_lo >> 12,
675 high_width,
676 mtrr_state.var_ranges[i].mask_hi,
677 mtrr_state.var_ranges[i].mask_lo >> 12,
678 mtrr_attrib_to_str(mtrr_state.var_ranges[i].base_lo &
679 MTRR_PHYSBASE_TYPE));
680 else
681 pr_info(" %u disabled\n", i);
682 }
683 if (mtrr_tom2)
684 pr_info("TOM2: %016llx aka %lldM\n", mtrr_tom2, mtrr_tom2>>20);
685}
686
687/* Grab all of the MTRR state for this CPU into *state */
688bool __init get_mtrr_state(void)
689{
690 struct mtrr_var_range *vrs;
691 unsigned lo, dummy;
692 unsigned int i;
693
694 vrs = mtrr_state.var_ranges;
695
696 rdmsr(MSR_MTRRcap, lo, dummy);
697 mtrr_state.have_fixed = lo & MTRR_CAP_FIX;
698
699 for (i = 0; i < num_var_ranges; i++)
700 get_mtrr_var_range(i, &vrs[i]);
701 if (mtrr_state.have_fixed)
702 get_fixed_ranges(mtrr_state.fixed_ranges);
703
704 rdmsr(MSR_MTRRdefType, lo, dummy);
705 mtrr_state.def_type = lo & MTRR_DEF_TYPE_TYPE;
706 mtrr_state.enabled = (lo & MTRR_DEF_TYPE_ENABLE) >> MTRR_STATE_SHIFT;
707
708 if (amd_special_default_mtrr()) {
709 unsigned low, high;
710
711 /* TOP_MEM2 */
712 rdmsr(MSR_K8_TOP_MEM2, low, high);
713 mtrr_tom2 = high;
714 mtrr_tom2 <<= 32;
715 mtrr_tom2 |= low;
716 mtrr_tom2 &= 0xffffff800000ULL;
717 }
718
719 if (mtrr_debug)
720 print_mtrr_state();
721
722 mtrr_state_set = 1;
723
724 return !!(mtrr_state.enabled & MTRR_STATE_MTRR_ENABLED);
725}
726
727/* Some BIOS's are messed up and don't set all MTRRs the same! */
728void __init mtrr_state_warn(void)
729{
730 unsigned long mask = smp_changes_mask;
731
732 if (!mask)
733 return;
734 if (mask & MTRR_CHANGE_MASK_FIXED)
735 pr_warn("mtrr: your CPUs had inconsistent fixed MTRR settings\n");
736 if (mask & MTRR_CHANGE_MASK_VARIABLE)
737 pr_warn("mtrr: your CPUs had inconsistent variable MTRR settings\n");
738 if (mask & MTRR_CHANGE_MASK_DEFTYPE)
739 pr_warn("mtrr: your CPUs had inconsistent MTRRdefType settings\n");
740
741 pr_info("mtrr: probably your BIOS does not setup all CPUs.\n");
742 pr_info("mtrr: corrected configuration.\n");
743}
744
/*
 * Write an MSR and log a failure instead of reporting it to the caller.
 *
 * Errors are deliberately not passed on to MTRR users: doing so is quite
 * complicated in some cases and probably not worth it, as the best error
 * handling is to ignore the failure.
 */
void mtrr_wrmsr(unsigned msr, unsigned a, unsigned b)
{
	if (wrmsr_safe(msr, a, b) >= 0)
		return;

	pr_err("MTRR: CPU %u: Writing MSR %x to %x:%x failed\n",
	       smp_processor_id(), msr, a, b);
}
757
758/**
759 * set_fixed_range - checks & updates a fixed-range MTRR if it
760 * differs from the value it should have
761 * @msr: MSR address of the MTTR which should be checked and updated
762 * @changed: pointer which indicates whether the MTRR needed to be changed
763 * @msrwords: pointer to the MSR values which the MSR should have
764 */
765static void set_fixed_range(int msr, bool *changed, unsigned int *msrwords)
766{
767 unsigned lo, hi;
768
769 rdmsr(msr, lo, hi);
770
771 if (lo != msrwords[0] || hi != msrwords[1]) {
772 mtrr_wrmsr(msr, msrwords[0], msrwords[1]);
773 *changed = true;
774 }
775}
776
777/**
778 * generic_get_free_region - Get a free MTRR.
779 * @base: The starting (base) address of the region.
780 * @size: The size (in bytes) of the region.
781 * @replace_reg: mtrr index to be replaced; set to invalid value if none.
782 *
783 * Returns: The index of the region on success, else negative on error.
784 */
785int
786generic_get_free_region(unsigned long base, unsigned long size, int replace_reg)
787{
788 unsigned long lbase, lsize;
789 mtrr_type ltype;
790 int i, max;
791
792 max = num_var_ranges;
793 if (replace_reg >= 0 && replace_reg < max)
794 return replace_reg;
795
796 for (i = 0; i < max; ++i) {
797 mtrr_if->get(i, &lbase, &lsize, <ype);
798 if (lsize == 0)
799 return i;
800 }
801
802 return -ENOSPC;
803}
804
805static void generic_get_mtrr(unsigned int reg, unsigned long *base,
806 unsigned long *size, mtrr_type *type)
807{
808 u32 mask_lo, mask_hi, base_lo, base_hi;
809 unsigned int hi;
810 u64 tmp, mask;
811
812 /*
813 * get_mtrr doesn't need to update mtrr_state, also it could be called
814 * from any cpu, so try to print it out directly.
815 */
816 get_cpu();
817
818 rdmsr(MTRRphysMask_MSR(reg), mask_lo, mask_hi);
819
820 if (!(mask_lo & MTRR_PHYSMASK_V)) {
821 /* Invalid (i.e. free) range */
822 *base = 0;
823 *size = 0;
824 *type = 0;
825 goto out_put_cpu;
826 }
827
828 rdmsr(MTRRphysBase_MSR(reg), base_lo, base_hi);
829
830 /* Work out the shifted address mask: */
831 tmp = (u64)mask_hi << 32 | (mask_lo & PAGE_MASK);
832 mask = (u64)phys_hi_rsvd << 32 | tmp;
833
834 /* Expand tmp with high bits to all 1s: */
835 hi = fls64(tmp);
836 if (hi > 0) {
837 tmp |= ~((1ULL<<(hi - 1)) - 1);
838
839 if (tmp != mask) {
840 pr_warn("mtrr: your BIOS has configured an incorrect mask, fixing it.\n");
841 add_taint(TAINT_FIRMWARE_WORKAROUND, LOCKDEP_STILL_OK);
842 mask = tmp;
843 }
844 }
845
846 /*
847 * This works correctly if size is a power of two, i.e. a
848 * contiguous range:
849 */
850 *size = -mask >> PAGE_SHIFT;
851 *base = (u64)base_hi << (32 - PAGE_SHIFT) | base_lo >> PAGE_SHIFT;
852 *type = base_lo & MTRR_PHYSBASE_TYPE;
853
854out_put_cpu:
855 put_cpu();
856}
857
858/**
859 * set_fixed_ranges - checks & updates the fixed-range MTRRs if they
860 * differ from the saved set
861 * @frs: pointer to fixed-range MTRR values, saved by get_fixed_ranges()
862 */
863static int set_fixed_ranges(mtrr_type *frs)
864{
865 unsigned long long *saved = (unsigned long long *)frs;
866 bool changed = false;
867 int block = -1, range;
868
869 k8_check_syscfg_dram_mod_en();
870
871 while (fixed_range_blocks[++block].ranges) {
872 for (range = 0; range < fixed_range_blocks[block].ranges; range++)
873 set_fixed_range(fixed_range_blocks[block].base_msr + range,
874 &changed, (unsigned int *)saved++);
875 }
876
877 return changed;
878}
879
880/*
881 * Set the MSR pair relating to a var range.
882 * Returns true if changes are made.
883 */
884static bool set_mtrr_var_ranges(unsigned int index, struct mtrr_var_range *vr)
885{
886 unsigned int lo, hi;
887 bool changed = false;
888
889 rdmsr(MTRRphysBase_MSR(index), lo, hi);
890 if ((vr->base_lo & ~MTRR_PHYSBASE_RSVD) != (lo & ~MTRR_PHYSBASE_RSVD)
891 || (vr->base_hi & ~phys_hi_rsvd) != (hi & ~phys_hi_rsvd)) {
892
893 mtrr_wrmsr(MTRRphysBase_MSR(index), vr->base_lo, vr->base_hi);
894 changed = true;
895 }
896
897 rdmsr(MTRRphysMask_MSR(index), lo, hi);
898
899 if ((vr->mask_lo & ~MTRR_PHYSMASK_RSVD) != (lo & ~MTRR_PHYSMASK_RSVD)
900 || (vr->mask_hi & ~phys_hi_rsvd) != (hi & ~phys_hi_rsvd)) {
901 mtrr_wrmsr(MTRRphysMask_MSR(index), vr->mask_lo, vr->mask_hi);
902 changed = true;
903 }
904 return changed;
905}
906
907static u32 deftype_lo, deftype_hi;
908
909/**
910 * set_mtrr_state - Set the MTRR state for this CPU.
911 *
912 * NOTE: The CPU must already be in a safe state for MTRR changes, including
913 * measures that only a single CPU can be active in set_mtrr_state() in
914 * order to not be subject to races for usage of deftype_lo. This is
915 * accomplished by taking cache_disable_lock.
916 * RETURNS: 0 if no changes made, else a mask indicating what was changed.
917 */
918static unsigned long set_mtrr_state(void)
919{
920 unsigned long change_mask = 0;
921 unsigned int i;
922
923 for (i = 0; i < num_var_ranges; i++) {
924 if (set_mtrr_var_ranges(i, &mtrr_state.var_ranges[i]))
925 change_mask |= MTRR_CHANGE_MASK_VARIABLE;
926 }
927
928 if (mtrr_state.have_fixed && set_fixed_ranges(mtrr_state.fixed_ranges))
929 change_mask |= MTRR_CHANGE_MASK_FIXED;
930
931 /*
932 * Set_mtrr_restore restores the old value of MTRRdefType,
933 * so to set it we fiddle with the saved value:
934 */
935 if ((deftype_lo & MTRR_DEF_TYPE_TYPE) != mtrr_state.def_type ||
936 ((deftype_lo & MTRR_DEF_TYPE_ENABLE) >> MTRR_STATE_SHIFT) != mtrr_state.enabled) {
937
938 deftype_lo = (deftype_lo & MTRR_DEF_TYPE_DISABLE) |
939 mtrr_state.def_type |
940 (mtrr_state.enabled << MTRR_STATE_SHIFT);
941 change_mask |= MTRR_CHANGE_MASK_DEFTYPE;
942 }
943
944 return change_mask;
945}
946
947void mtrr_disable(void)
948{
949 /* Save MTRR state */
950 rdmsr(MSR_MTRRdefType, deftype_lo, deftype_hi);
951
952 /* Disable MTRRs, and set the default type to uncached */
953 mtrr_wrmsr(MSR_MTRRdefType, deftype_lo & MTRR_DEF_TYPE_DISABLE, deftype_hi);
954}
955
956void mtrr_enable(void)
957{
958 /* Intel (P6) standard MTRRs */
959 mtrr_wrmsr(MSR_MTRRdefType, deftype_lo, deftype_hi);
960}
961
962void mtrr_generic_set_state(void)
963{
964 unsigned long mask, count;
965
966 /* Actually set the state */
967 mask = set_mtrr_state();
968
969 /* Use the atomic bitops to update the global mask */
970 for (count = 0; count < sizeof(mask) * 8; ++count) {
971 if (mask & 0x01)
972 set_bit(count, &smp_changes_mask);
973 mask >>= 1;
974 }
975}
976
977/**
978 * generic_set_mtrr - set variable MTRR register on the local CPU.
979 *
980 * @reg: The register to set.
981 * @base: The base address of the region.
982 * @size: The size of the region. If this is 0 the region is disabled.
983 * @type: The type of the region.
984 *
985 * Returns nothing.
986 */
987static void generic_set_mtrr(unsigned int reg, unsigned long base,
988 unsigned long size, mtrr_type type)
989{
990 unsigned long flags;
991 struct mtrr_var_range *vr;
992
993 vr = &mtrr_state.var_ranges[reg];
994
995 local_irq_save(flags);
996 cache_disable();
997
998 if (size == 0) {
999 /*
1000 * The invalid bit is kept in the mask, so we simply
1001 * clear the relevant mask register to disable a range.
1002 */
1003 mtrr_wrmsr(MTRRphysMask_MSR(reg), 0, 0);
1004 memset(vr, 0, sizeof(struct mtrr_var_range));
1005 } else {
1006 vr->base_lo = base << PAGE_SHIFT | type;
1007 vr->base_hi = (base >> (32 - PAGE_SHIFT)) & ~phys_hi_rsvd;
1008 vr->mask_lo = -size << PAGE_SHIFT | MTRR_PHYSMASK_V;
1009 vr->mask_hi = (-size >> (32 - PAGE_SHIFT)) & ~phys_hi_rsvd;
1010
1011 mtrr_wrmsr(MTRRphysBase_MSR(reg), vr->base_lo, vr->base_hi);
1012 mtrr_wrmsr(MTRRphysMask_MSR(reg), vr->mask_lo, vr->mask_hi);
1013 }
1014
1015 cache_enable();
1016 local_irq_restore(flags);
1017}
1018
1019int generic_validate_add_page(unsigned long base, unsigned long size,
1020 unsigned int type)
1021{
1022 unsigned long lbase, last;
1023
1024 /*
1025 * For Intel PPro stepping <= 7
1026 * must be 4 MiB aligned and not touch 0x70000000 -> 0x7003FFFF
1027 */
1028 if (mtrr_if == &generic_mtrr_ops && boot_cpu_data.x86 == 6 &&
1029 boot_cpu_data.x86_model == 1 &&
1030 boot_cpu_data.x86_stepping <= 7) {
1031 if (base & ((1 << (22 - PAGE_SHIFT)) - 1)) {
1032 pr_warn("mtrr: base(0x%lx000) is not 4 MiB aligned\n", base);
1033 return -EINVAL;
1034 }
1035 if (!(base + size < 0x70000 || base > 0x7003F) &&
1036 (type == MTRR_TYPE_WRCOMB
1037 || type == MTRR_TYPE_WRBACK)) {
1038 pr_warn("mtrr: writable mtrr between 0x70000000 and 0x7003FFFF may hang the CPU.\n");
1039 return -EINVAL;
1040 }
1041 }
1042
1043 /*
1044 * Check upper bits of base and last are equal and lower bits are 0
1045 * for base and 1 for last
1046 */
1047 last = base + size - 1;
1048 for (lbase = base; !(lbase & 1) && (last & 1);
1049 lbase = lbase >> 1, last = last >> 1)
1050 ;
1051 if (lbase != last) {
1052 pr_warn("mtrr: base(0x%lx000) is not aligned on a size(0x%lx000) boundary\n", base, size);
1053 return -EINVAL;
1054 }
1055 return 0;
1056}
1057
1058static int generic_have_wrcomb(void)
1059{
1060 unsigned long config, dummy;
1061 rdmsr(MSR_MTRRcap, config, dummy);
1062 return config & MTRR_CAP_WC;
1063}
1064
/* have_wrcomb implementation that unconditionally answers yes (1). */
int positive_have_wrcomb(void)
{
	return 1;
}
1069
1070/*
1071 * Generic structure...
1072 */
1073const struct mtrr_ops generic_mtrr_ops = {
1074 .get = generic_get_mtrr,
1075 .get_free_region = generic_get_free_region,
1076 .set = generic_set_mtrr,
1077 .validate_add_page = generic_validate_add_page,
1078 .have_wrcomb = generic_have_wrcomb,
1079};