Linux Audio

Check our new training course

Loading...
v5.4
  1// SPDX-License-Identifier: GPL-2.0-only
  2/*:
  3 * Hibernate support specific for ARM64
  4 *
  5 * Derived from work on ARM hibernation support by:
  6 *
  7 * Ubuntu project, hibernation support for mach-dove
  8 * Copyright (C) 2010 Nokia Corporation (Hiroshi Doyu)
  9 * Copyright (C) 2010 Texas Instruments, Inc. (Teerth Reddy et al.)
 10 *  https://lkml.org/lkml/2010/6/18/4
 11 *  https://lists.linux-foundation.org/pipermail/linux-pm/2010-June/027422.html
 12 *  https://patchwork.kernel.org/patch/96442/
 13 *
 14 * Copyright (C) 2006 Rafael J. Wysocki <rjw@sisk.pl>
 
 
 15 */
 16#define pr_fmt(x) "hibernate: " x
 17#include <linux/cpu.h>
 18#include <linux/kvm_host.h>
 19#include <linux/mm.h>
 20#include <linux/pm.h>
 21#include <linux/sched.h>
 22#include <linux/suspend.h>
 23#include <linux/utsname.h>
 24#include <linux/version.h>
 25
 26#include <asm/barrier.h>
 27#include <asm/cacheflush.h>
 28#include <asm/cputype.h>
 29#include <asm/daifflags.h>
 30#include <asm/irqflags.h>
 31#include <asm/kexec.h>
 32#include <asm/memory.h>
 33#include <asm/mmu_context.h>
 34#include <asm/pgalloc.h>
 35#include <asm/pgtable.h>
 36#include <asm/pgtable-hwdef.h>
 37#include <asm/sections.h>
 38#include <asm/smp.h>
 39#include <asm/smp_plat.h>
 40#include <asm/suspend.h>
 41#include <asm/sysreg.h>
 42#include <asm/virt.h>
 43
 44/*
 45 * Hibernate core relies on this value being 0 on resume, and marks it
 46 * __nosavedata assuming it will keep the resume kernel's '0' value. This
 47 * doesn't happen with either KASLR.
 48 *
 49 * defined as "__visible int in_suspend __nosavedata" in
 50 * kernel/power/hibernate.c
 51 */
 52extern int in_suspend;
 53
 54/* Do we need to reset el2? */
 55#define el2_reset_needed() (is_hyp_mode_available() && !is_kernel_in_hyp_mode())
 56
 57/* temporary el2 vectors in the __hibernate_exit_text section. */
 58extern char hibernate_el2_vectors[];
 59
 60/* hyp-stub vectors, used to restore el2 during resume from hibernate. */
 61extern char __hyp_stub_vectors[];
 62
 63/*
 64 * The logical cpu number we should resume on, initialised to a non-cpu
 65 * number.
 66 */
 67static int sleep_cpu = -EINVAL;
 68
 69/*
 70 * Values that may not change over hibernate/resume. We put the build number
 71 * and date in here so that we guarantee not to resume with a different
 72 * kernel.
 73 */
 74struct arch_hibernate_hdr_invariants {
 75	char		uts_version[__NEW_UTS_LEN + 1];
 76};
 77
 78/* These values need to be know across a hibernate/restore. */
 79static struct arch_hibernate_hdr {
 80	struct arch_hibernate_hdr_invariants invariants;
 81
 82	/* These are needed to find the relocated kernel if built with kaslr */
 83	phys_addr_t	ttbr1_el1;
 84	void		(*reenter_kernel)(void);
 85
 86	/*
 87	 * We need to know where the __hyp_stub_vectors are after restore to
 88	 * re-configure el2.
 89	 */
 90	phys_addr_t	__hyp_stub_vectors;
 91
 92	u64		sleep_cpu_mpidr;
 93} resume_hdr;
 94
 95static inline void arch_hdr_invariants(struct arch_hibernate_hdr_invariants *i)
 96{
 97	memset(i, 0, sizeof(*i));
 98	memcpy(i->uts_version, init_utsname()->version, sizeof(i->uts_version));
 99}
100
101int pfn_is_nosave(unsigned long pfn)
102{
103	unsigned long nosave_begin_pfn = sym_to_pfn(&__nosave_begin);
104	unsigned long nosave_end_pfn = sym_to_pfn(&__nosave_end - 1);
105
106	return ((pfn >= nosave_begin_pfn) && (pfn <= nosave_end_pfn)) ||
107		crash_is_nosave(pfn);
108}
109
110void notrace save_processor_state(void)
111{
112	WARN_ON(num_online_cpus() != 1);
113}
114
115void notrace restore_processor_state(void)
116{
117}
118
119int arch_hibernation_header_save(void *addr, unsigned int max_size)
120{
121	struct arch_hibernate_hdr *hdr = addr;
122
123	if (max_size < sizeof(*hdr))
124		return -EOVERFLOW;
125
126	arch_hdr_invariants(&hdr->invariants);
127	hdr->ttbr1_el1		= __pa_symbol(swapper_pg_dir);
128	hdr->reenter_kernel	= _cpu_resume;
129
130	/* We can't use __hyp_get_vectors() because kvm may still be loaded */
131	if (el2_reset_needed())
132		hdr->__hyp_stub_vectors = __pa_symbol(__hyp_stub_vectors);
133	else
134		hdr->__hyp_stub_vectors = 0;
135
136	/* Save the mpidr of the cpu we called cpu_suspend() on... */
137	if (sleep_cpu < 0) {
138		pr_err("Failing to hibernate on an unknown CPU.\n");
139		return -ENODEV;
140	}
141	hdr->sleep_cpu_mpidr = cpu_logical_map(sleep_cpu);
142	pr_info("Hibernating on CPU %d [mpidr:0x%llx]\n", sleep_cpu,
143		hdr->sleep_cpu_mpidr);
144
145	return 0;
146}
147EXPORT_SYMBOL(arch_hibernation_header_save);
148
149int arch_hibernation_header_restore(void *addr)
150{
151	int ret;
152	struct arch_hibernate_hdr_invariants invariants;
153	struct arch_hibernate_hdr *hdr = addr;
154
155	arch_hdr_invariants(&invariants);
156	if (memcmp(&hdr->invariants, &invariants, sizeof(invariants))) {
157		pr_crit("Hibernate image not generated by this kernel!\n");
158		return -EINVAL;
159	}
160
161	sleep_cpu = get_logical_index(hdr->sleep_cpu_mpidr);
162	pr_info("Hibernated on CPU %d [mpidr:0x%llx]\n", sleep_cpu,
163		hdr->sleep_cpu_mpidr);
164	if (sleep_cpu < 0) {
165		pr_crit("Hibernated on a CPU not known to this kernel!\n");
166		sleep_cpu = -EINVAL;
167		return -EINVAL;
168	}
169	if (!cpu_online(sleep_cpu)) {
170		pr_info("Hibernated on a CPU that is offline! Bringing CPU up.\n");
171		ret = cpu_up(sleep_cpu);
172		if (ret) {
173			pr_err("Failed to bring hibernate-CPU up!\n");
174			sleep_cpu = -EINVAL;
175			return ret;
176		}
177	}
178
179	resume_hdr = *hdr;
180
181	return 0;
182}
183EXPORT_SYMBOL(arch_hibernation_header_restore);
184
185/*
186 * Copies length bytes, starting at src_start into an new page,
187 * perform cache maintentance, then maps it at the specified address low
188 * address as executable.
189 *
190 * This is used by hibernate to copy the code it needs to execute when
191 * overwriting the kernel text. This function generates a new set of page
192 * tables, which it loads into ttbr0.
193 *
194 * Length is provided as we probably only want 4K of data, even on a 64K
195 * page system.
196 */
197static int create_safe_exec_page(void *src_start, size_t length,
198				 unsigned long dst_addr,
199				 phys_addr_t *phys_dst_addr,
200				 void *(*allocator)(gfp_t mask),
201				 gfp_t mask)
202{
203	int rc = 0;
204	pgd_t *trans_pgd;
205	pgd_t *pgdp;
206	pud_t *pudp;
207	pmd_t *pmdp;
208	pte_t *ptep;
209	unsigned long dst = (unsigned long)allocator(mask);
210
211	if (!dst) {
212		rc = -ENOMEM;
213		goto out;
214	}
215
216	memcpy((void *)dst, src_start, length);
217	__flush_icache_range(dst, dst + length);
218
219	trans_pgd = allocator(mask);
220	if (!trans_pgd) {
221		rc = -ENOMEM;
222		goto out;
223	}
224
225	pgdp = pgd_offset_raw(trans_pgd, dst_addr);
226	if (pgd_none(READ_ONCE(*pgdp))) {
227		pudp = allocator(mask);
228		if (!pudp) {
229			rc = -ENOMEM;
230			goto out;
231		}
232		pgd_populate(&init_mm, pgdp, pudp);
233	}
234
235	pudp = pud_offset(pgdp, dst_addr);
236	if (pud_none(READ_ONCE(*pudp))) {
237		pmdp = allocator(mask);
238		if (!pmdp) {
239			rc = -ENOMEM;
240			goto out;
241		}
242		pud_populate(&init_mm, pudp, pmdp);
243	}
244
245	pmdp = pmd_offset(pudp, dst_addr);
246	if (pmd_none(READ_ONCE(*pmdp))) {
247		ptep = allocator(mask);
248		if (!ptep) {
249			rc = -ENOMEM;
250			goto out;
251		}
252		pmd_populate_kernel(&init_mm, pmdp, ptep);
253	}
254
255	ptep = pte_offset_kernel(pmdp, dst_addr);
256	set_pte(ptep, pfn_pte(virt_to_pfn(dst), PAGE_KERNEL_EXEC));
257
258	/*
259	 * Load our new page tables. A strict BBM approach requires that we
260	 * ensure that TLBs are free of any entries that may overlap with the
261	 * global mappings we are about to install.
262	 *
263	 * For a real hibernate/resume cycle TTBR0 currently points to a zero
264	 * page, but TLBs may contain stale ASID-tagged entries (e.g. for EFI
265	 * runtime services), while for a userspace-driven test_resume cycle it
266	 * points to userspace page tables (and we must point it at a zero page
267	 * ourselves). Elsewhere we only (un)install the idmap with preemption
268	 * disabled, so T0SZ should be as required regardless.
269	 */
270	cpu_set_reserved_ttbr0();
271	local_flush_tlb_all();
272	write_sysreg(phys_to_ttbr(virt_to_phys(pgdp)), ttbr0_el1);
273	isb();
274
275	*phys_dst_addr = virt_to_phys((void *)dst);
276
277out:
278	return rc;
279}
280
/*
 * Call __flush_dcache_area() on the byte range [start, end). The arguments
 * are parenthesised so that expression arguments expand as intended.
 */
#define dcache_clean_range(start, end) \
	__flush_dcache_area((start), ((end) - (start)))
282
283int swsusp_arch_suspend(void)
284{
285	int ret = 0;
286	unsigned long flags;
287	struct sleep_stack_data state;
288
289	if (cpus_are_stuck_in_kernel()) {
290		pr_err("Can't hibernate: no mechanism to offline secondary CPUs.\n");
291		return -EBUSY;
292	}
293
294	flags = local_daif_save();
295
296	if (__cpu_suspend_enter(&state)) {
297		/* make the crash dump kernel image visible/saveable */
298		crash_prepare_suspend();
299
300		sleep_cpu = smp_processor_id();
301		ret = swsusp_save();
302	} else {
303		/* Clean kernel core startup/idle code to PoC*/
304		dcache_clean_range(__mmuoff_data_start, __mmuoff_data_end);
305		dcache_clean_range(__idmap_text_start, __idmap_text_end);
306
307		/* Clean kvm setup code to PoC? */
308		if (el2_reset_needed()) {
309			dcache_clean_range(__hyp_idmap_text_start, __hyp_idmap_text_end);
310			dcache_clean_range(__hyp_text_start, __hyp_text_end);
311		}
312
313		/* make the crash dump kernel image protected again */
314		crash_post_resume();
315
316		/*
317		 * Tell the hibernation core that we've just restored
318		 * the memory
319		 */
320		in_suspend = 0;
321
322		sleep_cpu = -EINVAL;
323		__cpu_suspend_exit();
324
325		/*
326		 * Just in case the boot kernel did turn the SSBD
327		 * mitigation off behind our back, let's set the state
328		 * to what we expect it to be.
329		 */
330		switch (arm64_get_ssbd_state()) {
331		case ARM64_SSBD_FORCE_ENABLE:
332		case ARM64_SSBD_KERNEL:
333			arm64_set_ssbd_mitigation(true);
334		}
335	}
336
337	local_daif_restore(flags);
338
339	return ret;
340}
341
342static void _copy_pte(pte_t *dst_ptep, pte_t *src_ptep, unsigned long addr)
343{
344	pte_t pte = READ_ONCE(*src_ptep);
345
346	if (pte_valid(pte)) {
347		/*
348		 * Resume will overwrite areas that may be marked
349		 * read only (code, rodata). Clear the RDONLY bit from
350		 * the temporary mappings we use during restore.
351		 */
352		set_pte(dst_ptep, pte_mkwrite(pte));
353	} else if (debug_pagealloc_enabled() && !pte_none(pte)) {
354		/*
355		 * debug_pagealloc will removed the PTE_VALID bit if
356		 * the page isn't in use by the resume kernel. It may have
357		 * been in use by the original kernel, in which case we need
358		 * to put it back in our copy to do the restore.
359		 *
360		 * Before marking this entry valid, check the pfn should
361		 * be mapped.
362		 */
363		BUG_ON(!pfn_valid(pte_pfn(pte)));
364
365		set_pte(dst_ptep, pte_mkpresent(pte_mkwrite(pte)));
366	}
367}
368
369static int copy_pte(pmd_t *dst_pmdp, pmd_t *src_pmdp, unsigned long start,
370		    unsigned long end)
371{
372	pte_t *src_ptep;
373	pte_t *dst_ptep;
374	unsigned long addr = start;
375
376	dst_ptep = (pte_t *)get_safe_page(GFP_ATOMIC);
377	if (!dst_ptep)
378		return -ENOMEM;
379	pmd_populate_kernel(&init_mm, dst_pmdp, dst_ptep);
380	dst_ptep = pte_offset_kernel(dst_pmdp, start);
381
382	src_ptep = pte_offset_kernel(src_pmdp, start);
383	do {
384		_copy_pte(dst_ptep, src_ptep, addr);
385	} while (dst_ptep++, src_ptep++, addr += PAGE_SIZE, addr != end);
386
387	return 0;
388}
389
390static int copy_pmd(pud_t *dst_pudp, pud_t *src_pudp, unsigned long start,
391		    unsigned long end)
392{
393	pmd_t *src_pmdp;
394	pmd_t *dst_pmdp;
395	unsigned long next;
396	unsigned long addr = start;
397
398	if (pud_none(READ_ONCE(*dst_pudp))) {
399		dst_pmdp = (pmd_t *)get_safe_page(GFP_ATOMIC);
400		if (!dst_pmdp)
401			return -ENOMEM;
402		pud_populate(&init_mm, dst_pudp, dst_pmdp);
403	}
404	dst_pmdp = pmd_offset(dst_pudp, start);
405
406	src_pmdp = pmd_offset(src_pudp, start);
407	do {
408		pmd_t pmd = READ_ONCE(*src_pmdp);
409
410		next = pmd_addr_end(addr, end);
411		if (pmd_none(pmd))
412			continue;
413		if (pmd_table(pmd)) {
414			if (copy_pte(dst_pmdp, src_pmdp, addr, next))
415				return -ENOMEM;
416		} else {
417			set_pmd(dst_pmdp,
418				__pmd(pmd_val(pmd) & ~PMD_SECT_RDONLY));
419		}
420	} while (dst_pmdp++, src_pmdp++, addr = next, addr != end);
421
422	return 0;
423}
424
425static int copy_pud(pgd_t *dst_pgdp, pgd_t *src_pgdp, unsigned long start,
426		    unsigned long end)
427{
428	pud_t *dst_pudp;
429	pud_t *src_pudp;
430	unsigned long next;
431	unsigned long addr = start;
432
433	if (pgd_none(READ_ONCE(*dst_pgdp))) {
434		dst_pudp = (pud_t *)get_safe_page(GFP_ATOMIC);
435		if (!dst_pudp)
436			return -ENOMEM;
437		pgd_populate(&init_mm, dst_pgdp, dst_pudp);
438	}
439	dst_pudp = pud_offset(dst_pgdp, start);
440
441	src_pudp = pud_offset(src_pgdp, start);
442	do {
443		pud_t pud = READ_ONCE(*src_pudp);
444
445		next = pud_addr_end(addr, end);
446		if (pud_none(pud))
447			continue;
448		if (pud_table(pud)) {
449			if (copy_pmd(dst_pudp, src_pudp, addr, next))
450				return -ENOMEM;
451		} else {
452			set_pud(dst_pudp,
453				__pud(pud_val(pud) & ~PMD_SECT_RDONLY));
454		}
455	} while (dst_pudp++, src_pudp++, addr = next, addr != end);
456
457	return 0;
458}
459
460static int copy_page_tables(pgd_t *dst_pgdp, unsigned long start,
461			    unsigned long end)
462{
463	unsigned long next;
464	unsigned long addr = start;
465	pgd_t *src_pgdp = pgd_offset_k(start);
466
467	dst_pgdp = pgd_offset_raw(dst_pgdp, start);
468	do {
469		next = pgd_addr_end(addr, end);
470		if (pgd_none(READ_ONCE(*src_pgdp)))
471			continue;
472		if (copy_pud(dst_pgdp, src_pgdp, addr, next))
473			return -ENOMEM;
474	} while (dst_pgdp++, src_pgdp++, addr = next, addr != end);
475
476	return 0;
477}
478
479/*
480 * Setup then Resume from the hibernate image using swsusp_arch_suspend_exit().
481 *
482 * Memory allocated by get_safe_page() will be dealt with by the hibernate code,
483 * we don't need to free it here.
484 */
485int swsusp_arch_resume(void)
486{
487	int rc = 0;
488	void *zero_page;
489	size_t exit_size;
490	pgd_t *tmp_pg_dir;
491	phys_addr_t phys_hibernate_exit;
492	void __noreturn (*hibernate_exit)(phys_addr_t, phys_addr_t, void *,
493					  void *, phys_addr_t, phys_addr_t);
494
495	/*
496	 * Restoring the memory image will overwrite the ttbr1 page tables.
497	 * Create a second copy of just the linear map, and use this when
498	 * restoring.
499	 */
500	tmp_pg_dir = (pgd_t *)get_safe_page(GFP_ATOMIC);
501	if (!tmp_pg_dir) {
502		pr_err("Failed to allocate memory for temporary page tables.\n");
503		rc = -ENOMEM;
504		goto out;
505	}
506	rc = copy_page_tables(tmp_pg_dir, PAGE_OFFSET, PAGE_END);
507	if (rc)
508		goto out;
509
510	/*
511	 * We need a zero page that is zero before & after resume in order to
512	 * to break before make on the ttbr1 page tables.
513	 */
514	zero_page = (void *)get_safe_page(GFP_ATOMIC);
515	if (!zero_page) {
516		pr_err("Failed to allocate zero page.\n");
517		rc = -ENOMEM;
518		goto out;
519	}
520
521	/*
522	 * Locate the exit code in the bottom-but-one page, so that *NULL
523	 * still has disastrous affects.
524	 */
525	hibernate_exit = (void *)PAGE_SIZE;
526	exit_size = __hibernate_exit_text_end - __hibernate_exit_text_start;
527	/*
528	 * Copy swsusp_arch_suspend_exit() to a safe page. This will generate
529	 * a new set of ttbr0 page tables and load them.
530	 */
531	rc = create_safe_exec_page(__hibernate_exit_text_start, exit_size,
532				   (unsigned long)hibernate_exit,
533				   &phys_hibernate_exit,
534				   (void *)get_safe_page, GFP_ATOMIC);
535	if (rc) {
536		pr_err("Failed to create safe executable page for hibernate_exit code.\n");
537		goto out;
538	}
539
540	/*
541	 * The hibernate exit text contains a set of el2 vectors, that will
542	 * be executed at el2 with the mmu off in order to reload hyp-stub.
543	 */
544	__flush_dcache_area(hibernate_exit, exit_size);
545
546	/*
547	 * KASLR will cause the el2 vectors to be in a different location in
548	 * the resumed kernel. Load hibernate's temporary copy into el2.
549	 *
550	 * We can skip this step if we booted at EL1, or are running with VHE.
551	 */
552	if (el2_reset_needed()) {
553		phys_addr_t el2_vectors = phys_hibernate_exit;  /* base */
554		el2_vectors += hibernate_el2_vectors -
555			       __hibernate_exit_text_start;     /* offset */
556
557		__hyp_set_vectors(el2_vectors);
558	}
559
560	hibernate_exit(virt_to_phys(tmp_pg_dir), resume_hdr.ttbr1_el1,
561		       resume_hdr.reenter_kernel, restore_pblist,
562		       resume_hdr.__hyp_stub_vectors, virt_to_phys(zero_page));
563
564out:
565	return rc;
566}
567
568int hibernate_resume_nonboot_cpu_disable(void)
569{
570	if (sleep_cpu < 0) {
571		pr_err("Failing to resume from hibernate on an unknown CPU.\n");
572		return -ENODEV;
573	}
574
575	return freeze_secondary_cpus(sleep_cpu);
576}
v4.17
 
  1/*:
  2 * Hibernate support specific for ARM64
  3 *
  4 * Derived from work on ARM hibernation support by:
  5 *
  6 * Ubuntu project, hibernation support for mach-dove
  7 * Copyright (C) 2010 Nokia Corporation (Hiroshi Doyu)
  8 * Copyright (C) 2010 Texas Instruments, Inc. (Teerth Reddy et al.)
  9 *  https://lkml.org/lkml/2010/6/18/4
 10 *  https://lists.linux-foundation.org/pipermail/linux-pm/2010-June/027422.html
 11 *  https://patchwork.kernel.org/patch/96442/
 12 *
 13 * Copyright (C) 2006 Rafael J. Wysocki <rjw@sisk.pl>
 14 *
 15 * License terms: GNU General Public License (GPL) version 2
 16 */
 17#define pr_fmt(x) "hibernate: " x
 18#include <linux/cpu.h>
 19#include <linux/kvm_host.h>
 20#include <linux/mm.h>
 21#include <linux/pm.h>
 22#include <linux/sched.h>
 23#include <linux/suspend.h>
 24#include <linux/utsname.h>
 25#include <linux/version.h>
 26
 27#include <asm/barrier.h>
 28#include <asm/cacheflush.h>
 29#include <asm/cputype.h>
 30#include <asm/daifflags.h>
 31#include <asm/irqflags.h>
 32#include <asm/kexec.h>
 33#include <asm/memory.h>
 34#include <asm/mmu_context.h>
 35#include <asm/pgalloc.h>
 36#include <asm/pgtable.h>
 37#include <asm/pgtable-hwdef.h>
 38#include <asm/sections.h>
 39#include <asm/smp.h>
 40#include <asm/smp_plat.h>
 41#include <asm/suspend.h>
 42#include <asm/sysreg.h>
 43#include <asm/virt.h>
 44
 45/*
 46 * Hibernate core relies on this value being 0 on resume, and marks it
 47 * __nosavedata assuming it will keep the resume kernel's '0' value. This
 48 * doesn't happen with either KASLR.
 49 *
 50 * defined as "__visible int in_suspend __nosavedata" in
 51 * kernel/power/hibernate.c
 52 */
 53extern int in_suspend;
 54
 55/* Do we need to reset el2? */
 56#define el2_reset_needed() (is_hyp_mode_available() && !is_kernel_in_hyp_mode())
 57
 58/* temporary el2 vectors in the __hibernate_exit_text section. */
 59extern char hibernate_el2_vectors[];
 60
 61/* hyp-stub vectors, used to restore el2 during resume from hibernate. */
 62extern char __hyp_stub_vectors[];
 63
 64/*
 65 * The logical cpu number we should resume on, initialised to a non-cpu
 66 * number.
 67 */
 68static int sleep_cpu = -EINVAL;
 69
 70/*
 71 * Values that may not change over hibernate/resume. We put the build number
 72 * and date in here so that we guarantee not to resume with a different
 73 * kernel.
 74 */
 75struct arch_hibernate_hdr_invariants {
 76	char		uts_version[__NEW_UTS_LEN + 1];
 77};
 78
 79/* These values need to be know across a hibernate/restore. */
 80static struct arch_hibernate_hdr {
 81	struct arch_hibernate_hdr_invariants invariants;
 82
 83	/* These are needed to find the relocated kernel if built with kaslr */
 84	phys_addr_t	ttbr1_el1;
 85	void		(*reenter_kernel)(void);
 86
 87	/*
 88	 * We need to know where the __hyp_stub_vectors are after restore to
 89	 * re-configure el2.
 90	 */
 91	phys_addr_t	__hyp_stub_vectors;
 92
 93	u64		sleep_cpu_mpidr;
 94} resume_hdr;
 95
 96static inline void arch_hdr_invariants(struct arch_hibernate_hdr_invariants *i)
 97{
 98	memset(i, 0, sizeof(*i));
 99	memcpy(i->uts_version, init_utsname()->version, sizeof(i->uts_version));
100}
101
102int pfn_is_nosave(unsigned long pfn)
103{
104	unsigned long nosave_begin_pfn = sym_to_pfn(&__nosave_begin);
105	unsigned long nosave_end_pfn = sym_to_pfn(&__nosave_end - 1);
106
107	return ((pfn >= nosave_begin_pfn) && (pfn <= nosave_end_pfn)) ||
108		crash_is_nosave(pfn);
109}
110
111void notrace save_processor_state(void)
112{
113	WARN_ON(num_online_cpus() != 1);
114}
115
116void notrace restore_processor_state(void)
117{
118}
119
120int arch_hibernation_header_save(void *addr, unsigned int max_size)
121{
122	struct arch_hibernate_hdr *hdr = addr;
123
124	if (max_size < sizeof(*hdr))
125		return -EOVERFLOW;
126
127	arch_hdr_invariants(&hdr->invariants);
128	hdr->ttbr1_el1		= __pa_symbol(swapper_pg_dir);
129	hdr->reenter_kernel	= _cpu_resume;
130
131	/* We can't use __hyp_get_vectors() because kvm may still be loaded */
132	if (el2_reset_needed())
133		hdr->__hyp_stub_vectors = __pa_symbol(__hyp_stub_vectors);
134	else
135		hdr->__hyp_stub_vectors = 0;
136
137	/* Save the mpidr of the cpu we called cpu_suspend() on... */
138	if (sleep_cpu < 0) {
139		pr_err("Failing to hibernate on an unknown CPU.\n");
140		return -ENODEV;
141	}
142	hdr->sleep_cpu_mpidr = cpu_logical_map(sleep_cpu);
143	pr_info("Hibernating on CPU %d [mpidr:0x%llx]\n", sleep_cpu,
144		hdr->sleep_cpu_mpidr);
145
146	return 0;
147}
148EXPORT_SYMBOL(arch_hibernation_header_save);
149
150int arch_hibernation_header_restore(void *addr)
151{
152	int ret;
153	struct arch_hibernate_hdr_invariants invariants;
154	struct arch_hibernate_hdr *hdr = addr;
155
156	arch_hdr_invariants(&invariants);
157	if (memcmp(&hdr->invariants, &invariants, sizeof(invariants))) {
158		pr_crit("Hibernate image not generated by this kernel!\n");
159		return -EINVAL;
160	}
161
162	sleep_cpu = get_logical_index(hdr->sleep_cpu_mpidr);
163	pr_info("Hibernated on CPU %d [mpidr:0x%llx]\n", sleep_cpu,
164		hdr->sleep_cpu_mpidr);
165	if (sleep_cpu < 0) {
166		pr_crit("Hibernated on a CPU not known to this kernel!\n");
167		sleep_cpu = -EINVAL;
168		return -EINVAL;
169	}
170	if (!cpu_online(sleep_cpu)) {
171		pr_info("Hibernated on a CPU that is offline! Bringing CPU up.\n");
172		ret = cpu_up(sleep_cpu);
173		if (ret) {
174			pr_err("Failed to bring hibernate-CPU up!\n");
175			sleep_cpu = -EINVAL;
176			return ret;
177		}
178	}
179
180	resume_hdr = *hdr;
181
182	return 0;
183}
184EXPORT_SYMBOL(arch_hibernation_header_restore);
185
186/*
187 * Copies length bytes, starting at src_start into an new page,
188 * perform cache maintentance, then maps it at the specified address low
189 * address as executable.
190 *
191 * This is used by hibernate to copy the code it needs to execute when
192 * overwriting the kernel text. This function generates a new set of page
193 * tables, which it loads into ttbr0.
194 *
195 * Length is provided as we probably only want 4K of data, even on a 64K
196 * page system.
197 */
198static int create_safe_exec_page(void *src_start, size_t length,
199				 unsigned long dst_addr,
200				 phys_addr_t *phys_dst_addr,
201				 void *(*allocator)(gfp_t mask),
202				 gfp_t mask)
203{
204	int rc = 0;
 
205	pgd_t *pgdp;
206	pud_t *pudp;
207	pmd_t *pmdp;
208	pte_t *ptep;
209	unsigned long dst = (unsigned long)allocator(mask);
210
211	if (!dst) {
212		rc = -ENOMEM;
213		goto out;
214	}
215
216	memcpy((void *)dst, src_start, length);
217	flush_icache_range(dst, dst + length);
 
 
 
 
 
 
218
219	pgdp = pgd_offset_raw(allocator(mask), dst_addr);
220	if (pgd_none(READ_ONCE(*pgdp))) {
221		pudp = allocator(mask);
222		if (!pudp) {
223			rc = -ENOMEM;
224			goto out;
225		}
226		pgd_populate(&init_mm, pgdp, pudp);
227	}
228
229	pudp = pud_offset(pgdp, dst_addr);
230	if (pud_none(READ_ONCE(*pudp))) {
231		pmdp = allocator(mask);
232		if (!pmdp) {
233			rc = -ENOMEM;
234			goto out;
235		}
236		pud_populate(&init_mm, pudp, pmdp);
237	}
238
239	pmdp = pmd_offset(pudp, dst_addr);
240	if (pmd_none(READ_ONCE(*pmdp))) {
241		ptep = allocator(mask);
242		if (!ptep) {
243			rc = -ENOMEM;
244			goto out;
245		}
246		pmd_populate_kernel(&init_mm, pmdp, ptep);
247	}
248
249	ptep = pte_offset_kernel(pmdp, dst_addr);
250	set_pte(ptep, pfn_pte(virt_to_pfn(dst), PAGE_KERNEL_EXEC));
251
252	/*
253	 * Load our new page tables. A strict BBM approach requires that we
254	 * ensure that TLBs are free of any entries that may overlap with the
255	 * global mappings we are about to install.
256	 *
257	 * For a real hibernate/resume cycle TTBR0 currently points to a zero
258	 * page, but TLBs may contain stale ASID-tagged entries (e.g. for EFI
259	 * runtime services), while for a userspace-driven test_resume cycle it
260	 * points to userspace page tables (and we must point it at a zero page
261	 * ourselves). Elsewhere we only (un)install the idmap with preemption
262	 * disabled, so T0SZ should be as required regardless.
263	 */
264	cpu_set_reserved_ttbr0();
265	local_flush_tlb_all();
266	write_sysreg(phys_to_ttbr(virt_to_phys(pgdp)), ttbr0_el1);
267	isb();
268
269	*phys_dst_addr = virt_to_phys((void *)dst);
270
271out:
272	return rc;
273}
274
/*
 * Call __flush_dcache_area() on the byte range [start, end). The arguments
 * are parenthesised so that expression arguments expand as intended.
 */
#define dcache_clean_range(start, end) \
	__flush_dcache_area((start), ((end) - (start)))
276
277int swsusp_arch_suspend(void)
278{
279	int ret = 0;
280	unsigned long flags;
281	struct sleep_stack_data state;
282
283	if (cpus_are_stuck_in_kernel()) {
284		pr_err("Can't hibernate: no mechanism to offline secondary CPUs.\n");
285		return -EBUSY;
286	}
287
288	flags = local_daif_save();
289
290	if (__cpu_suspend_enter(&state)) {
291		/* make the crash dump kernel image visible/saveable */
292		crash_prepare_suspend();
293
294		sleep_cpu = smp_processor_id();
295		ret = swsusp_save();
296	} else {
297		/* Clean kernel core startup/idle code to PoC*/
298		dcache_clean_range(__mmuoff_data_start, __mmuoff_data_end);
299		dcache_clean_range(__idmap_text_start, __idmap_text_end);
300
301		/* Clean kvm setup code to PoC? */
302		if (el2_reset_needed())
303			dcache_clean_range(__hyp_idmap_text_start, __hyp_idmap_text_end);
 
 
304
305		/* make the crash dump kernel image protected again */
306		crash_post_resume();
307
308		/*
309		 * Tell the hibernation core that we've just restored
310		 * the memory
311		 */
312		in_suspend = 0;
313
314		sleep_cpu = -EINVAL;
315		__cpu_suspend_exit();
 
 
 
 
 
 
 
 
 
 
 
316	}
317
318	local_daif_restore(flags);
319
320	return ret;
321}
322
323static void _copy_pte(pte_t *dst_ptep, pte_t *src_ptep, unsigned long addr)
324{
325	pte_t pte = READ_ONCE(*src_ptep);
326
327	if (pte_valid(pte)) {
328		/*
329		 * Resume will overwrite areas that may be marked
330		 * read only (code, rodata). Clear the RDONLY bit from
331		 * the temporary mappings we use during restore.
332		 */
333		set_pte(dst_ptep, pte_mkwrite(pte));
334	} else if (debug_pagealloc_enabled() && !pte_none(pte)) {
335		/*
336		 * debug_pagealloc will removed the PTE_VALID bit if
337		 * the page isn't in use by the resume kernel. It may have
338		 * been in use by the original kernel, in which case we need
339		 * to put it back in our copy to do the restore.
340		 *
341		 * Before marking this entry valid, check the pfn should
342		 * be mapped.
343		 */
344		BUG_ON(!pfn_valid(pte_pfn(pte)));
345
346		set_pte(dst_ptep, pte_mkpresent(pte_mkwrite(pte)));
347	}
348}
349
350static int copy_pte(pmd_t *dst_pmdp, pmd_t *src_pmdp, unsigned long start,
351		    unsigned long end)
352{
353	pte_t *src_ptep;
354	pte_t *dst_ptep;
355	unsigned long addr = start;
356
357	dst_ptep = (pte_t *)get_safe_page(GFP_ATOMIC);
358	if (!dst_ptep)
359		return -ENOMEM;
360	pmd_populate_kernel(&init_mm, dst_pmdp, dst_ptep);
361	dst_ptep = pte_offset_kernel(dst_pmdp, start);
362
363	src_ptep = pte_offset_kernel(src_pmdp, start);
364	do {
365		_copy_pte(dst_ptep, src_ptep, addr);
366	} while (dst_ptep++, src_ptep++, addr += PAGE_SIZE, addr != end);
367
368	return 0;
369}
370
371static int copy_pmd(pud_t *dst_pudp, pud_t *src_pudp, unsigned long start,
372		    unsigned long end)
373{
374	pmd_t *src_pmdp;
375	pmd_t *dst_pmdp;
376	unsigned long next;
377	unsigned long addr = start;
378
379	if (pud_none(READ_ONCE(*dst_pudp))) {
380		dst_pmdp = (pmd_t *)get_safe_page(GFP_ATOMIC);
381		if (!dst_pmdp)
382			return -ENOMEM;
383		pud_populate(&init_mm, dst_pudp, dst_pmdp);
384	}
385	dst_pmdp = pmd_offset(dst_pudp, start);
386
387	src_pmdp = pmd_offset(src_pudp, start);
388	do {
389		pmd_t pmd = READ_ONCE(*src_pmdp);
390
391		next = pmd_addr_end(addr, end);
392		if (pmd_none(pmd))
393			continue;
394		if (pmd_table(pmd)) {
395			if (copy_pte(dst_pmdp, src_pmdp, addr, next))
396				return -ENOMEM;
397		} else {
398			set_pmd(dst_pmdp,
399				__pmd(pmd_val(pmd) & ~PMD_SECT_RDONLY));
400		}
401	} while (dst_pmdp++, src_pmdp++, addr = next, addr != end);
402
403	return 0;
404}
405
406static int copy_pud(pgd_t *dst_pgdp, pgd_t *src_pgdp, unsigned long start,
407		    unsigned long end)
408{
409	pud_t *dst_pudp;
410	pud_t *src_pudp;
411	unsigned long next;
412	unsigned long addr = start;
413
414	if (pgd_none(READ_ONCE(*dst_pgdp))) {
415		dst_pudp = (pud_t *)get_safe_page(GFP_ATOMIC);
416		if (!dst_pudp)
417			return -ENOMEM;
418		pgd_populate(&init_mm, dst_pgdp, dst_pudp);
419	}
420	dst_pudp = pud_offset(dst_pgdp, start);
421
422	src_pudp = pud_offset(src_pgdp, start);
423	do {
424		pud_t pud = READ_ONCE(*src_pudp);
425
426		next = pud_addr_end(addr, end);
427		if (pud_none(pud))
428			continue;
429		if (pud_table(pud)) {
430			if (copy_pmd(dst_pudp, src_pudp, addr, next))
431				return -ENOMEM;
432		} else {
433			set_pud(dst_pudp,
434				__pud(pud_val(pud) & ~PMD_SECT_RDONLY));
435		}
436	} while (dst_pudp++, src_pudp++, addr = next, addr != end);
437
438	return 0;
439}
440
441static int copy_page_tables(pgd_t *dst_pgdp, unsigned long start,
442			    unsigned long end)
443{
444	unsigned long next;
445	unsigned long addr = start;
446	pgd_t *src_pgdp = pgd_offset_k(start);
447
448	dst_pgdp = pgd_offset_raw(dst_pgdp, start);
449	do {
450		next = pgd_addr_end(addr, end);
451		if (pgd_none(READ_ONCE(*src_pgdp)))
452			continue;
453		if (copy_pud(dst_pgdp, src_pgdp, addr, next))
454			return -ENOMEM;
455	} while (dst_pgdp++, src_pgdp++, addr = next, addr != end);
456
457	return 0;
458}
459
460/*
461 * Setup then Resume from the hibernate image using swsusp_arch_suspend_exit().
462 *
463 * Memory allocated by get_safe_page() will be dealt with by the hibernate code,
464 * we don't need to free it here.
465 */
466int swsusp_arch_resume(void)
467{
468	int rc = 0;
469	void *zero_page;
470	size_t exit_size;
471	pgd_t *tmp_pg_dir;
472	phys_addr_t phys_hibernate_exit;
473	void __noreturn (*hibernate_exit)(phys_addr_t, phys_addr_t, void *,
474					  void *, phys_addr_t, phys_addr_t);
475
476	/*
477	 * Restoring the memory image will overwrite the ttbr1 page tables.
478	 * Create a second copy of just the linear map, and use this when
479	 * restoring.
480	 */
481	tmp_pg_dir = (pgd_t *)get_safe_page(GFP_ATOMIC);
482	if (!tmp_pg_dir) {
483		pr_err("Failed to allocate memory for temporary page tables.\n");
484		rc = -ENOMEM;
485		goto out;
486	}
487	rc = copy_page_tables(tmp_pg_dir, PAGE_OFFSET, 0);
488	if (rc)
489		goto out;
490
491	/*
492	 * We need a zero page that is zero before & after resume in order to
493	 * to break before make on the ttbr1 page tables.
494	 */
495	zero_page = (void *)get_safe_page(GFP_ATOMIC);
496	if (!zero_page) {
497		pr_err("Failed to allocate zero page.\n");
498		rc = -ENOMEM;
499		goto out;
500	}
501
502	/*
503	 * Locate the exit code in the bottom-but-one page, so that *NULL
504	 * still has disastrous affects.
505	 */
506	hibernate_exit = (void *)PAGE_SIZE;
507	exit_size = __hibernate_exit_text_end - __hibernate_exit_text_start;
508	/*
509	 * Copy swsusp_arch_suspend_exit() to a safe page. This will generate
510	 * a new set of ttbr0 page tables and load them.
511	 */
512	rc = create_safe_exec_page(__hibernate_exit_text_start, exit_size,
513				   (unsigned long)hibernate_exit,
514				   &phys_hibernate_exit,
515				   (void *)get_safe_page, GFP_ATOMIC);
516	if (rc) {
517		pr_err("Failed to create safe executable page for hibernate_exit code.\n");
518		goto out;
519	}
520
521	/*
522	 * The hibernate exit text contains a set of el2 vectors, that will
523	 * be executed at el2 with the mmu off in order to reload hyp-stub.
524	 */
525	__flush_dcache_area(hibernate_exit, exit_size);
526
527	/*
528	 * KASLR will cause the el2 vectors to be in a different location in
529	 * the resumed kernel. Load hibernate's temporary copy into el2.
530	 *
531	 * We can skip this step if we booted at EL1, or are running with VHE.
532	 */
533	if (el2_reset_needed()) {
534		phys_addr_t el2_vectors = phys_hibernate_exit;  /* base */
535		el2_vectors += hibernate_el2_vectors -
536			       __hibernate_exit_text_start;     /* offset */
537
538		__hyp_set_vectors(el2_vectors);
539	}
540
541	hibernate_exit(virt_to_phys(tmp_pg_dir), resume_hdr.ttbr1_el1,
542		       resume_hdr.reenter_kernel, restore_pblist,
543		       resume_hdr.__hyp_stub_vectors, virt_to_phys(zero_page));
544
545out:
546	return rc;
547}
548
549int hibernate_resume_nonboot_cpu_disable(void)
550{
551	if (sleep_cpu < 0) {
552		pr_err("Failing to resume from hibernate on an unknown CPU.\n");
553		return -ENODEV;
554	}
555
556	return freeze_secondary_cpus(sleep_cpu);
557}