Loading...
1// SPDX-License-Identifier: GPL-2.0-or-later
2/* ----------------------------------------------------------------------- *
3 *
4 * Copyright 2000-2008 H. Peter Anvin - All Rights Reserved
5 * Copyright 2009 Intel Corporation; author: H. Peter Anvin
6 *
7 * ----------------------------------------------------------------------- */
8
9/*
10 * x86 MSR access device
11 *
12 * This device is accessed by lseek() to the appropriate register number
13 * and then read/write in chunks of 8 bytes. A larger size means multiple
14 * reads or writes of the same register.
15 *
16 * This driver uses /dev/cpu/%d/msr where %d is the minor number, and on
17 * an SMP box will direct the access to CPU %d.
18 */
19
20#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
21
22#include <linux/module.h>
23
24#include <linux/types.h>
25#include <linux/errno.h>
26#include <linux/fcntl.h>
27#include <linux/init.h>
28#include <linux/poll.h>
29#include <linux/smp.h>
30#include <linux/major.h>
31#include <linux/fs.h>
32#include <linux/device.h>
33#include <linux/cpu.h>
34#include <linux/notifier.h>
35#include <linux/uaccess.h>
36#include <linux/gfp.h>
37#include <linux/security.h>
38
39#include <asm/cpufeature.h>
40#include <asm/msr.h>
41
42static enum cpuhp_state cpuhp_msr_state;
43
44enum allow_write_msrs {
45 MSR_WRITES_ON,
46 MSR_WRITES_OFF,
47 MSR_WRITES_DEFAULT,
48};
49
50static enum allow_write_msrs allow_writes = MSR_WRITES_DEFAULT;
51
52static ssize_t msr_read(struct file *file, char __user *buf,
53 size_t count, loff_t *ppos)
54{
55 u32 __user *tmp = (u32 __user *) buf;
56 u32 data[2];
57 u32 reg = *ppos;
58 int cpu = iminor(file_inode(file));
59 int err = 0;
60 ssize_t bytes = 0;
61
62 if (count % 8)
63 return -EINVAL; /* Invalid chunk size */
64
65 for (; count; count -= 8) {
66 err = rdmsr_safe_on_cpu(cpu, reg, &data[0], &data[1]);
67 if (err)
68 break;
69 if (copy_to_user(tmp, &data, 8)) {
70 err = -EFAULT;
71 break;
72 }
73 tmp += 2;
74 bytes += 8;
75 }
76
77 return bytes ? bytes : err;
78}
79
80static int filter_write(u32 reg)
81{
82 /*
83 * MSRs writes usually happen all at once, and can easily saturate kmsg.
84 * Only allow one message every 30 seconds.
85 *
86 * It's possible to be smarter here and do it (for example) per-MSR, but
87 * it would certainly be more complex, and this is enough at least to
88 * avoid saturating the ring buffer.
89 */
90 static DEFINE_RATELIMIT_STATE(fw_rs, 30 * HZ, 1);
91
92 switch (allow_writes) {
93 case MSR_WRITES_ON: return 0;
94 case MSR_WRITES_OFF: return -EPERM;
95 default: break;
96 }
97
98 if (!__ratelimit(&fw_rs))
99 return 0;
100
101 pr_warn("Write to unrecognized MSR 0x%x by %s (pid: %d).\n",
102 reg, current->comm, current->pid);
103 pr_warn("See https://git.kernel.org/pub/scm/linux/kernel/git/tip/tip.git/about for details.\n");
104
105 return 0;
106}
107
108static ssize_t msr_write(struct file *file, const char __user *buf,
109 size_t count, loff_t *ppos)
110{
111 const u32 __user *tmp = (const u32 __user *)buf;
112 u32 data[2];
113 u32 reg = *ppos;
114 int cpu = iminor(file_inode(file));
115 int err = 0;
116 ssize_t bytes = 0;
117
118 err = security_locked_down(LOCKDOWN_MSR);
119 if (err)
120 return err;
121
122 err = filter_write(reg);
123 if (err)
124 return err;
125
126 if (count % 8)
127 return -EINVAL; /* Invalid chunk size */
128
129 for (; count; count -= 8) {
130 if (copy_from_user(&data, tmp, 8)) {
131 err = -EFAULT;
132 break;
133 }
134
135 add_taint(TAINT_CPU_OUT_OF_SPEC, LOCKDEP_STILL_OK);
136
137 err = wrmsr_safe_on_cpu(cpu, reg, data[0], data[1]);
138 if (err)
139 break;
140
141 tmp += 2;
142 bytes += 8;
143 }
144
145 return bytes ? bytes : err;
146}
147
148static long msr_ioctl(struct file *file, unsigned int ioc, unsigned long arg)
149{
150 u32 __user *uregs = (u32 __user *)arg;
151 u32 regs[8];
152 int cpu = iminor(file_inode(file));
153 int err;
154
155 switch (ioc) {
156 case X86_IOC_RDMSR_REGS:
157 if (!(file->f_mode & FMODE_READ)) {
158 err = -EBADF;
159 break;
160 }
161 if (copy_from_user(®s, uregs, sizeof(regs))) {
162 err = -EFAULT;
163 break;
164 }
165 err = rdmsr_safe_regs_on_cpu(cpu, regs);
166 if (err)
167 break;
168 if (copy_to_user(uregs, ®s, sizeof(regs)))
169 err = -EFAULT;
170 break;
171
172 case X86_IOC_WRMSR_REGS:
173 if (!(file->f_mode & FMODE_WRITE)) {
174 err = -EBADF;
175 break;
176 }
177 if (copy_from_user(®s, uregs, sizeof(regs))) {
178 err = -EFAULT;
179 break;
180 }
181 err = security_locked_down(LOCKDOWN_MSR);
182 if (err)
183 break;
184
185 err = filter_write(regs[1]);
186 if (err)
187 return err;
188
189 add_taint(TAINT_CPU_OUT_OF_SPEC, LOCKDEP_STILL_OK);
190
191 err = wrmsr_safe_regs_on_cpu(cpu, regs);
192 if (err)
193 break;
194 if (copy_to_user(uregs, ®s, sizeof(regs)))
195 err = -EFAULT;
196 break;
197
198 default:
199 err = -ENOTTY;
200 break;
201 }
202
203 return err;
204}
205
206static int msr_open(struct inode *inode, struct file *file)
207{
208 unsigned int cpu = iminor(file_inode(file));
209 struct cpuinfo_x86 *c;
210
211 if (!capable(CAP_SYS_RAWIO))
212 return -EPERM;
213
214 if (cpu >= nr_cpu_ids || !cpu_online(cpu))
215 return -ENXIO; /* No such CPU */
216
217 c = &cpu_data(cpu);
218 if (!cpu_has(c, X86_FEATURE_MSR))
219 return -EIO; /* MSR not supported */
220
221 return 0;
222}
223
224/*
225 * File operations we support
226 */
227static const struct file_operations msr_fops = {
228 .owner = THIS_MODULE,
229 .llseek = no_seek_end_llseek,
230 .read = msr_read,
231 .write = msr_write,
232 .open = msr_open,
233 .unlocked_ioctl = msr_ioctl,
234 .compat_ioctl = msr_ioctl,
235};
236
237static char *msr_devnode(const struct device *dev, umode_t *mode)
238{
239 return kasprintf(GFP_KERNEL, "cpu/%u/msr", MINOR(dev->devt));
240}
241
242static const struct class msr_class = {
243 .name = "msr",
244 .devnode = msr_devnode,
245};
246
247static int msr_device_create(unsigned int cpu)
248{
249 struct device *dev;
250
251 dev = device_create(&msr_class, NULL, MKDEV(MSR_MAJOR, cpu), NULL,
252 "msr%d", cpu);
253 return PTR_ERR_OR_ZERO(dev);
254}
255
256static int msr_device_destroy(unsigned int cpu)
257{
258 device_destroy(&msr_class, MKDEV(MSR_MAJOR, cpu));
259 return 0;
260}
261
262static int __init msr_init(void)
263{
264 int err;
265
266 if (__register_chrdev(MSR_MAJOR, 0, NR_CPUS, "cpu/msr", &msr_fops)) {
267 pr_err("unable to get major %d for msr\n", MSR_MAJOR);
268 return -EBUSY;
269 }
270 err = class_register(&msr_class);
271 if (err)
272 goto out_chrdev;
273
274 err = cpuhp_setup_state(CPUHP_AP_ONLINE_DYN, "x86/msr:online",
275 msr_device_create, msr_device_destroy);
276 if (err < 0)
277 goto out_class;
278 cpuhp_msr_state = err;
279 return 0;
280
281out_class:
282 class_unregister(&msr_class);
283out_chrdev:
284 __unregister_chrdev(MSR_MAJOR, 0, NR_CPUS, "cpu/msr");
285 return err;
286}
287module_init(msr_init);
288
289static void __exit msr_exit(void)
290{
291 cpuhp_remove_state(cpuhp_msr_state);
292 class_unregister(&msr_class);
293 __unregister_chrdev(MSR_MAJOR, 0, NR_CPUS, "cpu/msr");
294}
295module_exit(msr_exit)
296
297static int set_allow_writes(const char *val, const struct kernel_param *cp)
298{
299 /* val is NUL-terminated, see kernfs_fop_write() */
300 char *s = strstrip((char *)val);
301
302 if (!strcmp(s, "on"))
303 allow_writes = MSR_WRITES_ON;
304 else if (!strcmp(s, "off"))
305 allow_writes = MSR_WRITES_OFF;
306 else
307 allow_writes = MSR_WRITES_DEFAULT;
308
309 return 0;
310}
311
312static int get_allow_writes(char *buf, const struct kernel_param *kp)
313{
314 const char *res;
315
316 switch (allow_writes) {
317 case MSR_WRITES_ON: res = "on"; break;
318 case MSR_WRITES_OFF: res = "off"; break;
319 default: res = "default"; break;
320 }
321
322 return sprintf(buf, "%s\n", res);
323}
324
325static const struct kernel_param_ops allow_writes_ops = {
326 .set = set_allow_writes,
327 .get = get_allow_writes
328};
329
330module_param_cb(allow_writes, &allow_writes_ops, NULL, 0600);
331
332MODULE_AUTHOR("H. Peter Anvin <hpa@zytor.com>");
333MODULE_DESCRIPTION("x86 generic MSR driver");
334MODULE_LICENSE("GPL");
1// SPDX-License-Identifier: GPL-2.0-or-later
2/* ----------------------------------------------------------------------- *
3 *
4 * Copyright 2000-2008 H. Peter Anvin - All Rights Reserved
5 * Copyright 2009 Intel Corporation; author: H. Peter Anvin
6 *
7 * ----------------------------------------------------------------------- */
8
9/*
10 * x86 MSR access device
11 *
12 * This device is accessed by lseek() to the appropriate register number
13 * and then read/write in chunks of 8 bytes. A larger size means multiple
14 * reads or writes of the same register.
15 *
16 * This driver uses /dev/cpu/%d/msr where %d is the minor number, and on
17 * an SMP box will direct the access to CPU %d.
18 */
19
20#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
21
22#include <linux/module.h>
23
24#include <linux/types.h>
25#include <linux/errno.h>
26#include <linux/fcntl.h>
27#include <linux/init.h>
28#include <linux/poll.h>
29#include <linux/smp.h>
30#include <linux/major.h>
31#include <linux/fs.h>
32#include <linux/device.h>
33#include <linux/cpu.h>
34#include <linux/notifier.h>
35#include <linux/uaccess.h>
36#include <linux/gfp.h>
37#include <linux/security.h>
38
39#include <asm/cpufeature.h>
40#include <asm/msr.h>
41
42static struct class *msr_class;
43static enum cpuhp_state cpuhp_msr_state;
44
45enum allow_write_msrs {
46 MSR_WRITES_ON,
47 MSR_WRITES_OFF,
48 MSR_WRITES_DEFAULT,
49};
50
51static enum allow_write_msrs allow_writes = MSR_WRITES_DEFAULT;
52
53static ssize_t msr_read(struct file *file, char __user *buf,
54 size_t count, loff_t *ppos)
55{
56 u32 __user *tmp = (u32 __user *) buf;
57 u32 data[2];
58 u32 reg = *ppos;
59 int cpu = iminor(file_inode(file));
60 int err = 0;
61 ssize_t bytes = 0;
62
63 if (count % 8)
64 return -EINVAL; /* Invalid chunk size */
65
66 for (; count; count -= 8) {
67 err = rdmsr_safe_on_cpu(cpu, reg, &data[0], &data[1]);
68 if (err)
69 break;
70 if (copy_to_user(tmp, &data, 8)) {
71 err = -EFAULT;
72 break;
73 }
74 tmp += 2;
75 bytes += 8;
76 }
77
78 return bytes ? bytes : err;
79}
80
81static int filter_write(u32 reg)
82{
83 switch (allow_writes) {
84 case MSR_WRITES_ON: return 0;
85 case MSR_WRITES_OFF: return -EPERM;
86 default: break;
87 }
88
89 if (reg == MSR_IA32_ENERGY_PERF_BIAS)
90 return 0;
91
92 pr_err_ratelimited("Write to unrecognized MSR 0x%x by %s\n"
93 "Please report to x86@kernel.org\n",
94 reg, current->comm);
95
96 return 0;
97}
98
99static ssize_t msr_write(struct file *file, const char __user *buf,
100 size_t count, loff_t *ppos)
101{
102 const u32 __user *tmp = (const u32 __user *)buf;
103 u32 data[2];
104 u32 reg = *ppos;
105 int cpu = iminor(file_inode(file));
106 int err = 0;
107 ssize_t bytes = 0;
108
109 err = security_locked_down(LOCKDOWN_MSR);
110 if (err)
111 return err;
112
113 err = filter_write(reg);
114 if (err)
115 return err;
116
117 if (count % 8)
118 return -EINVAL; /* Invalid chunk size */
119
120 for (; count; count -= 8) {
121 if (copy_from_user(&data, tmp, 8)) {
122 err = -EFAULT;
123 break;
124 }
125
126 add_taint(TAINT_CPU_OUT_OF_SPEC, LOCKDEP_STILL_OK);
127
128 err = wrmsr_safe_on_cpu(cpu, reg, data[0], data[1]);
129 if (err)
130 break;
131
132 tmp += 2;
133 bytes += 8;
134 }
135
136 return bytes ? bytes : err;
137}
138
139static long msr_ioctl(struct file *file, unsigned int ioc, unsigned long arg)
140{
141 u32 __user *uregs = (u32 __user *)arg;
142 u32 regs[8];
143 int cpu = iminor(file_inode(file));
144 int err;
145
146 switch (ioc) {
147 case X86_IOC_RDMSR_REGS:
148 if (!(file->f_mode & FMODE_READ)) {
149 err = -EBADF;
150 break;
151 }
152 if (copy_from_user(®s, uregs, sizeof(regs))) {
153 err = -EFAULT;
154 break;
155 }
156 err = rdmsr_safe_regs_on_cpu(cpu, regs);
157 if (err)
158 break;
159 if (copy_to_user(uregs, ®s, sizeof(regs)))
160 err = -EFAULT;
161 break;
162
163 case X86_IOC_WRMSR_REGS:
164 if (!(file->f_mode & FMODE_WRITE)) {
165 err = -EBADF;
166 break;
167 }
168 if (copy_from_user(®s, uregs, sizeof(regs))) {
169 err = -EFAULT;
170 break;
171 }
172 err = security_locked_down(LOCKDOWN_MSR);
173 if (err)
174 break;
175 err = wrmsr_safe_regs_on_cpu(cpu, regs);
176 if (err)
177 break;
178 if (copy_to_user(uregs, ®s, sizeof(regs)))
179 err = -EFAULT;
180 break;
181
182 default:
183 err = -ENOTTY;
184 break;
185 }
186
187 return err;
188}
189
190static int msr_open(struct inode *inode, struct file *file)
191{
192 unsigned int cpu = iminor(file_inode(file));
193 struct cpuinfo_x86 *c;
194
195 if (!capable(CAP_SYS_RAWIO))
196 return -EPERM;
197
198 if (cpu >= nr_cpu_ids || !cpu_online(cpu))
199 return -ENXIO; /* No such CPU */
200
201 c = &cpu_data(cpu);
202 if (!cpu_has(c, X86_FEATURE_MSR))
203 return -EIO; /* MSR not supported */
204
205 return 0;
206}
207
208/*
209 * File operations we support
210 */
211static const struct file_operations msr_fops = {
212 .owner = THIS_MODULE,
213 .llseek = no_seek_end_llseek,
214 .read = msr_read,
215 .write = msr_write,
216 .open = msr_open,
217 .unlocked_ioctl = msr_ioctl,
218 .compat_ioctl = msr_ioctl,
219};
220
221static int msr_device_create(unsigned int cpu)
222{
223 struct device *dev;
224
225 dev = device_create(msr_class, NULL, MKDEV(MSR_MAJOR, cpu), NULL,
226 "msr%d", cpu);
227 return PTR_ERR_OR_ZERO(dev);
228}
229
230static int msr_device_destroy(unsigned int cpu)
231{
232 device_destroy(msr_class, MKDEV(MSR_MAJOR, cpu));
233 return 0;
234}
235
236static char *msr_devnode(struct device *dev, umode_t *mode)
237{
238 return kasprintf(GFP_KERNEL, "cpu/%u/msr", MINOR(dev->devt));
239}
240
241static int __init msr_init(void)
242{
243 int err;
244
245 if (__register_chrdev(MSR_MAJOR, 0, NR_CPUS, "cpu/msr", &msr_fops)) {
246 pr_err("unable to get major %d for msr\n", MSR_MAJOR);
247 return -EBUSY;
248 }
249 msr_class = class_create(THIS_MODULE, "msr");
250 if (IS_ERR(msr_class)) {
251 err = PTR_ERR(msr_class);
252 goto out_chrdev;
253 }
254 msr_class->devnode = msr_devnode;
255
256 err = cpuhp_setup_state(CPUHP_AP_ONLINE_DYN, "x86/msr:online",
257 msr_device_create, msr_device_destroy);
258 if (err < 0)
259 goto out_class;
260 cpuhp_msr_state = err;
261 return 0;
262
263out_class:
264 class_destroy(msr_class);
265out_chrdev:
266 __unregister_chrdev(MSR_MAJOR, 0, NR_CPUS, "cpu/msr");
267 return err;
268}
269module_init(msr_init);
270
271static void __exit msr_exit(void)
272{
273 cpuhp_remove_state(cpuhp_msr_state);
274 class_destroy(msr_class);
275 __unregister_chrdev(MSR_MAJOR, 0, NR_CPUS, "cpu/msr");
276}
277module_exit(msr_exit)
278
279static int set_allow_writes(const char *val, const struct kernel_param *cp)
280{
281 /* val is NUL-terminated, see kernfs_fop_write() */
282 char *s = strstrip((char *)val);
283
284 if (!strcmp(s, "on"))
285 allow_writes = MSR_WRITES_ON;
286 else if (!strcmp(s, "off"))
287 allow_writes = MSR_WRITES_OFF;
288 else
289 allow_writes = MSR_WRITES_DEFAULT;
290
291 return 0;
292}
293
294static int get_allow_writes(char *buf, const struct kernel_param *kp)
295{
296 const char *res;
297
298 switch (allow_writes) {
299 case MSR_WRITES_ON: res = "on"; break;
300 case MSR_WRITES_OFF: res = "off"; break;
301 default: res = "default"; break;
302 }
303
304 return sprintf(buf, "%s\n", res);
305}
306
307static const struct kernel_param_ops allow_writes_ops = {
308 .set = set_allow_writes,
309 .get = get_allow_writes
310};
311
312module_param_cb(allow_writes, &allow_writes_ops, NULL, 0600);
313
314MODULE_AUTHOR("H. Peter Anvin <hpa@zytor.com>");
315MODULE_DESCRIPTION("x86 generic MSR driver");
316MODULE_LICENSE("GPL");