xref: /linux-6.15/kernel/kexec_file.c (revision 9f0552c9)
// SPDX-License-Identifier: GPL-2.0-only
/*
 * kexec: kexec_file_load system call
 *
 * Copyright (C) 2014 Red Hat Inc.
 * Authors:
 *      Vivek Goyal <vgoyal@redhat.com>
 */
9a43cac0dSDave Young 
10de90a6bcSMinfei Huang #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
11de90a6bcSMinfei Huang 
12a43cac0dSDave Young #include <linux/capability.h>
13a43cac0dSDave Young #include <linux/mm.h>
14a43cac0dSDave Young #include <linux/file.h>
15a43cac0dSDave Young #include <linux/slab.h>
16a43cac0dSDave Young #include <linux/kexec.h>
17735c2f90SAKASHI Takahiro #include <linux/memblock.h>
18a43cac0dSDave Young #include <linux/mutex.h>
19a43cac0dSDave Young #include <linux/list.h>
20b804defeSMimi Zohar #include <linux/fs.h>
217b8589ccSMimi Zohar #include <linux/ima.h>
22a43cac0dSDave Young #include <crypto/hash.h>
23a24d22b2SEric Biggers #include <crypto/sha2.h>
24babac4a8SAKASHI Takahiro #include <linux/elf.h>
25babac4a8SAKASHI Takahiro #include <linux/elfcore.h>
26babac4a8SAKASHI Takahiro #include <linux/kernel.h>
27b89999d0SScott Branden #include <linux/kernel_read_file.h>
28a43cac0dSDave Young #include <linux/syscalls.h>
29a43cac0dSDave Young #include <linux/vmalloc.h>
30a43cac0dSDave Young #include "kexec_internal.h"
31a43cac0dSDave Young 
#ifdef CONFIG_KEXEC_SIG
/*
 * When set, kimage_validate_signature() refuses any kernel image whose
 * signature check fails. The initial value follows CONFIG_KEXEC_SIG_FORCE.
 */
static bool sig_enforce = IS_ENABLED(CONFIG_KEXEC_SIG_FORCE);

/* Turn on enforcement of kexec image signature verification. */
void set_kexec_sig_enforced(void)
{
	sig_enforce = true;
}
#endif
40af16df54SCoiby Xu 
/* Forward declaration; used by the kexec_file_load syscall below. */
static int kexec_calculate_store_digests(struct kimage *image);

/*
 * Upper bound, in bytes, on a kernel or initrd file read by this code:
 * 4 GiB, or SSIZE_MAX if that is smaller.
 */
#define KEXEC_FILE_SIZE_MAX	min_t(s64, 4LL << 30, SSIZE_MAX)
45f4da7afeSPasha Tatashin 
469ec4ecefSAKASHI Takahiro /*
479ec4ecefSAKASHI Takahiro  * Currently this is the only default function that is exported as some
489ec4ecefSAKASHI Takahiro  * architectures need it to do additional handlings.
499ec4ecefSAKASHI Takahiro  * In the future, other default functions may be exported too if required.
509ec4ecefSAKASHI Takahiro  */
kexec_image_probe_default(struct kimage * image,void * buf,unsigned long buf_len)519ec4ecefSAKASHI Takahiro int kexec_image_probe_default(struct kimage *image, void *buf,
529ec4ecefSAKASHI Takahiro 			      unsigned long buf_len)
539ec4ecefSAKASHI Takahiro {
549ec4ecefSAKASHI Takahiro 	const struct kexec_file_ops * const *fops;
559ec4ecefSAKASHI Takahiro 	int ret = -ENOEXEC;
569ec4ecefSAKASHI Takahiro 
579ec4ecefSAKASHI Takahiro 	for (fops = &kexec_file_loaders[0]; *fops && (*fops)->probe; ++fops) {
589ec4ecefSAKASHI Takahiro 		ret = (*fops)->probe(buf, buf_len);
599ec4ecefSAKASHI Takahiro 		if (!ret) {
609ec4ecefSAKASHI Takahiro 			image->fops = *fops;
619ec4ecefSAKASHI Takahiro 			return ret;
629ec4ecefSAKASHI Takahiro 		}
639ec4ecefSAKASHI Takahiro 	}
649ec4ecefSAKASHI Takahiro 
659ec4ecefSAKASHI Takahiro 	return ret;
669ec4ecefSAKASHI Takahiro }
679ec4ecefSAKASHI Takahiro 
kexec_image_load_default(struct kimage * image)68fb15abdcSBjorn Helgaas static void *kexec_image_load_default(struct kimage *image)
699ec4ecefSAKASHI Takahiro {
709ec4ecefSAKASHI Takahiro 	if (!image->fops || !image->fops->load)
719ec4ecefSAKASHI Takahiro 		return ERR_PTR(-ENOEXEC);
729ec4ecefSAKASHI Takahiro 
739ec4ecefSAKASHI Takahiro 	return image->fops->load(image, image->kernel_buf,
749ec4ecefSAKASHI Takahiro 				 image->kernel_buf_len, image->initrd_buf,
759ec4ecefSAKASHI Takahiro 				 image->initrd_buf_len, image->cmdline_buf,
769ec4ecefSAKASHI Takahiro 				 image->cmdline_buf_len);
77a43cac0dSDave Young }
78a43cac0dSDave Young 
kexec_image_post_load_cleanup_default(struct kimage * image)7992a98a2bSAKASHI Takahiro int kexec_image_post_load_cleanup_default(struct kimage *image)
809ec4ecefSAKASHI Takahiro {
819ec4ecefSAKASHI Takahiro 	if (!image->fops || !image->fops->cleanup)
829ec4ecefSAKASHI Takahiro 		return 0;
839ec4ecefSAKASHI Takahiro 
849ec4ecefSAKASHI Takahiro 	return image->fops->cleanup(image->image_loader_data);
85a43cac0dSDave Young }
86a43cac0dSDave Young 
878aec395bSPhilipp Rudo /*
88a43cac0dSDave Young  * Free up memory used by kernel, initrd, and command line. This is temporary
89a43cac0dSDave Young  * memory allocation which is not needed any more after these buffers have
90a43cac0dSDave Young  * been loaded into separate segments and have been copied elsewhere.
91a43cac0dSDave Young  */
kimage_file_post_load_cleanup(struct kimage * image)92a43cac0dSDave Young void kimage_file_post_load_cleanup(struct kimage *image)
93a43cac0dSDave Young {
94a43cac0dSDave Young 	struct purgatory_info *pi = &image->purgatory_info;
95a43cac0dSDave Young 
96a43cac0dSDave Young 	vfree(image->kernel_buf);
97a43cac0dSDave Young 	image->kernel_buf = NULL;
98a43cac0dSDave Young 
99a43cac0dSDave Young 	vfree(image->initrd_buf);
100a43cac0dSDave Young 	image->initrd_buf = NULL;
101a43cac0dSDave Young 
102a43cac0dSDave Young 	kfree(image->cmdline_buf);
103a43cac0dSDave Young 	image->cmdline_buf = NULL;
104a43cac0dSDave Young 
105a43cac0dSDave Young 	vfree(pi->purgatory_buf);
106a43cac0dSDave Young 	pi->purgatory_buf = NULL;
107a43cac0dSDave Young 
108a43cac0dSDave Young 	vfree(pi->sechdrs);
109a43cac0dSDave Young 	pi->sechdrs = NULL;
110a43cac0dSDave Young 
111f31e3386SLakshmi Ramasubramanian #ifdef CONFIG_IMA_KEXEC
112f31e3386SLakshmi Ramasubramanian 	vfree(image->ima_buffer);
113f31e3386SLakshmi Ramasubramanian 	image->ima_buffer = NULL;
114f31e3386SLakshmi Ramasubramanian #endif /* CONFIG_IMA_KEXEC */
115f31e3386SLakshmi Ramasubramanian 
116a43cac0dSDave Young 	/* See if architecture has anything to cleanup post load */
117a43cac0dSDave Young 	arch_kimage_file_post_load_cleanup(image);
118a43cac0dSDave Young 
119a43cac0dSDave Young 	/*
120a43cac0dSDave Young 	 * Above call should have called into bootloader to free up
121a43cac0dSDave Young 	 * any data stored in kimage->image_loader_data. It should
122a43cac0dSDave Young 	 * be ok now to free it up.
123a43cac0dSDave Young 	 */
124a43cac0dSDave Young 	kfree(image->image_loader_data);
125a43cac0dSDave Young 	image->image_loader_data = NULL;
126cbc2fe9dSBaoquan He 
127cbc2fe9dSBaoquan He 	kexec_file_dbg_print = false;
128a43cac0dSDave Young }
129a43cac0dSDave Young 
13099d5cadfSJiri Bohac #ifdef CONFIG_KEXEC_SIG
#ifdef CONFIG_SIGNED_PE_FILE_VERIFICATION
/*
 * Verify the PE signature of a kernel image.
 *
 * The secondary keyring is tried first. The platform keyring is tried next
 * only if that attempt fails with -ENOKEY and
 * CONFIG_INTEGRITY_PLATFORM_KEYRING is enabled.
 *
 * Returns the result of the last verify_pefile_signature() call made.
 */
int kexec_kernel_verify_pe_sig(const char *kernel, unsigned long kernel_len)
{
	int err = verify_pefile_signature(kernel, kernel_len,
					  VERIFY_USE_SECONDARY_KEYRING,
					  VERIFYING_KEXEC_PE_SIGNATURE);

	if (err != -ENOKEY || !IS_ENABLED(CONFIG_INTEGRITY_PLATFORM_KEYRING))
		return err;

	return verify_pefile_signature(kernel, kernel_len,
				       VERIFY_USE_PLATFORM_KEYRING,
				       VERIFYING_KEXEC_PE_SIGNATURE);
}
#endif
147c903dae8SCoiby Xu 
kexec_image_verify_sig(struct kimage * image,void * buf,unsigned long buf_len)148689a7149SCoiby Xu static int kexec_image_verify_sig(struct kimage *image, void *buf,
149689a7149SCoiby Xu 				  unsigned long buf_len)
150689a7149SCoiby Xu {
151689a7149SCoiby Xu 	if (!image->fops || !image->fops->verify_sig) {
152689a7149SCoiby Xu 		pr_debug("kernel loader does not support signature verification.\n");
153689a7149SCoiby Xu 		return -EKEYREJECTED;
154689a7149SCoiby Xu 	}
155689a7149SCoiby Xu 
156689a7149SCoiby Xu 	return image->fops->verify_sig(buf, buf_len);
157689a7149SCoiby Xu }
158689a7149SCoiby Xu 
15999d5cadfSJiri Bohac static int
kimage_validate_signature(struct kimage * image)16099d5cadfSJiri Bohac kimage_validate_signature(struct kimage *image)
16199d5cadfSJiri Bohac {
16299d5cadfSJiri Bohac 	int ret;
16399d5cadfSJiri Bohac 
164689a7149SCoiby Xu 	ret = kexec_image_verify_sig(image, image->kernel_buf,
16599d5cadfSJiri Bohac 				     image->kernel_buf_len);
166fd7af71bSLianbo Jiang 	if (ret) {
16799d5cadfSJiri Bohac 
168af16df54SCoiby Xu 		if (sig_enforce) {
169fd7af71bSLianbo Jiang 			pr_notice("Enforced kernel signature verification failed (%d).\n", ret);
17099d5cadfSJiri Bohac 			return ret;
17199d5cadfSJiri Bohac 		}
17299d5cadfSJiri Bohac 
173fd7af71bSLianbo Jiang 		/*
174fd7af71bSLianbo Jiang 		 * If IMA is guaranteed to appraise a signature on the kexec
17529d3c1c8SMatthew Garrett 		 * image, permit it even if the kernel is otherwise locked
17629d3c1c8SMatthew Garrett 		 * down.
17729d3c1c8SMatthew Garrett 		 */
17829d3c1c8SMatthew Garrett 		if (!ima_appraise_signature(READING_KEXEC_IMAGE) &&
17929d3c1c8SMatthew Garrett 		    security_locked_down(LOCKDOWN_KEXEC))
18029d3c1c8SMatthew Garrett 			return -EPERM;
18129d3c1c8SMatthew Garrett 
182fd7af71bSLianbo Jiang 		pr_debug("kernel signature verification failed (%d).\n", ret);
18399d5cadfSJiri Bohac 	}
18499d5cadfSJiri Bohac 
185fd7af71bSLianbo Jiang 	return 0;
18699d5cadfSJiri Bohac }
18799d5cadfSJiri Bohac #endif
18899d5cadfSJiri Bohac 
189a43cac0dSDave Young /*
190a43cac0dSDave Young  * In file mode list of segments is prepared by kernel. Copy relevant
191a43cac0dSDave Young  * data from user space, do error checking, prepare segment list
192a43cac0dSDave Young  */
193a43cac0dSDave Young static int
kimage_file_prepare_segments(struct kimage * image,int kernel_fd,int initrd_fd,const char __user * cmdline_ptr,unsigned long cmdline_len,unsigned flags)194a43cac0dSDave Young kimage_file_prepare_segments(struct kimage *image, int kernel_fd, int initrd_fd,
195a43cac0dSDave Young 			     const char __user *cmdline_ptr,
196a43cac0dSDave Young 			     unsigned long cmdline_len, unsigned flags)
197a43cac0dSDave Young {
198f4da7afeSPasha Tatashin 	ssize_t ret;
199a43cac0dSDave Young 	void *ldata;
200a43cac0dSDave Young 
2010fa8e084SKees Cook 	ret = kernel_read_file_from_fd(kernel_fd, 0, &image->kernel_buf,
202f4da7afeSPasha Tatashin 				       KEXEC_FILE_SIZE_MAX, NULL,
203f4da7afeSPasha Tatashin 				       READING_KEXEC_IMAGE);
204f7a4f689SKees Cook 	if (ret < 0)
205a43cac0dSDave Young 		return ret;
206f7a4f689SKees Cook 	image->kernel_buf_len = ret;
207a85ee18cSBaoquan He 	kexec_dprintk("kernel: %p kernel_size: %#lx\n",
208a85ee18cSBaoquan He 		      image->kernel_buf, image->kernel_buf_len);
209a43cac0dSDave Young 
210a43cac0dSDave Young 	/* Call arch image probe handlers */
211a43cac0dSDave Young 	ret = arch_kexec_kernel_image_probe(image, image->kernel_buf,
212a43cac0dSDave Young 					    image->kernel_buf_len);
213a43cac0dSDave Young 	if (ret)
214a43cac0dSDave Young 		goto out;
215a43cac0dSDave Young 
21699d5cadfSJiri Bohac #ifdef CONFIG_KEXEC_SIG
21799d5cadfSJiri Bohac 	ret = kimage_validate_signature(image);
21899d5cadfSJiri Bohac 
21999d5cadfSJiri Bohac 	if (ret)
220a43cac0dSDave Young 		goto out;
221a43cac0dSDave Young #endif
222a43cac0dSDave Young 	/* It is possible that there no initramfs is being loaded */
223a43cac0dSDave Young 	if (!(flags & KEXEC_FILE_NO_INITRAMFS)) {
2240fa8e084SKees Cook 		ret = kernel_read_file_from_fd(initrd_fd, 0, &image->initrd_buf,
225f4da7afeSPasha Tatashin 					       KEXEC_FILE_SIZE_MAX, NULL,
226b804defeSMimi Zohar 					       READING_KEXEC_INITRAMFS);
227f7a4f689SKees Cook 		if (ret < 0)
228a43cac0dSDave Young 			goto out;
229f7a4f689SKees Cook 		image->initrd_buf_len = ret;
230f7a4f689SKees Cook 		ret = 0;
231a43cac0dSDave Young 	}
232a43cac0dSDave Young 
233a43cac0dSDave Young 	if (cmdline_len) {
234a9bd8dfaSAl Viro 		image->cmdline_buf = memdup_user(cmdline_ptr, cmdline_len);
235a9bd8dfaSAl Viro 		if (IS_ERR(image->cmdline_buf)) {
236a9bd8dfaSAl Viro 			ret = PTR_ERR(image->cmdline_buf);
237a9bd8dfaSAl Viro 			image->cmdline_buf = NULL;
238a43cac0dSDave Young 			goto out;
239a43cac0dSDave Young 		}
240a43cac0dSDave Young 
241a43cac0dSDave Young 		image->cmdline_buf_len = cmdline_len;
242a43cac0dSDave Young 
243a43cac0dSDave Young 		/* command line should be a string with last byte null */
244a43cac0dSDave Young 		if (image->cmdline_buf[cmdline_len - 1] != '\0') {
245a43cac0dSDave Young 			ret = -EINVAL;
246a43cac0dSDave Young 			goto out;
247a43cac0dSDave Young 		}
2486a31fcd4SPrakhar Srivastava 
2494834177eSTyler Hicks 		ima_kexec_cmdline(kernel_fd, image->cmdline_buf,
2506a31fcd4SPrakhar Srivastava 				  image->cmdline_buf_len - 1);
251a43cac0dSDave Young 	}
252a43cac0dSDave Young 
2536a31fcd4SPrakhar Srivastava 	/* IMA needs to pass the measurement list to the next kernel. */
2546a31fcd4SPrakhar Srivastava 	ima_add_kexec_buffer(image);
2556a31fcd4SPrakhar Srivastava 
256fb15abdcSBjorn Helgaas 	/* Call image load handler */
257fb15abdcSBjorn Helgaas 	ldata = kexec_image_load_default(image);
258a43cac0dSDave Young 
259a43cac0dSDave Young 	if (IS_ERR(ldata)) {
260a43cac0dSDave Young 		ret = PTR_ERR(ldata);
261a43cac0dSDave Young 		goto out;
262a43cac0dSDave Young 	}
263a43cac0dSDave Young 
264a43cac0dSDave Young 	image->image_loader_data = ldata;
265a43cac0dSDave Young out:
266a43cac0dSDave Young 	/* In case of error, free up all allocated memory in this function */
267a43cac0dSDave Young 	if (ret)
268a43cac0dSDave Young 		kimage_file_post_load_cleanup(image);
269a43cac0dSDave Young 	return ret;
270a43cac0dSDave Young }
271a43cac0dSDave Young 
272a43cac0dSDave Young static int
kimage_file_alloc_init(struct kimage ** rimage,int kernel_fd,int initrd_fd,const char __user * cmdline_ptr,unsigned long cmdline_len,unsigned long flags)273a43cac0dSDave Young kimage_file_alloc_init(struct kimage **rimage, int kernel_fd,
274a43cac0dSDave Young 		       int initrd_fd, const char __user *cmdline_ptr,
275a43cac0dSDave Young 		       unsigned long cmdline_len, unsigned long flags)
276a43cac0dSDave Young {
277a43cac0dSDave Young 	int ret;
278a43cac0dSDave Young 	struct kimage *image;
279a43cac0dSDave Young 	bool kexec_on_panic = flags & KEXEC_FILE_ON_CRASH;
280a43cac0dSDave Young 
281a43cac0dSDave Young 	image = do_kimage_alloc_init();
282a43cac0dSDave Young 	if (!image)
283a43cac0dSDave Young 		return -ENOMEM;
284a43cac0dSDave Young 
285cbc2fe9dSBaoquan He 	kexec_file_dbg_print = !!(flags & KEXEC_FILE_DEBUG);
286a43cac0dSDave Young 	image->file_mode = 1;
287a43cac0dSDave Young 
28802aff848SBaoquan He #ifdef CONFIG_CRASH_DUMP
289a43cac0dSDave Young 	if (kexec_on_panic) {
290a43cac0dSDave Young 		/* Enable special crash kernel control page alloc policy. */
291a43cac0dSDave Young 		image->control_page = crashk_res.start;
292a43cac0dSDave Young 		image->type = KEXEC_TYPE_CRASH;
293a43cac0dSDave Young 	}
29402aff848SBaoquan He #endif
295a43cac0dSDave Young 
296a43cac0dSDave Young 	ret = kimage_file_prepare_segments(image, kernel_fd, initrd_fd,
297a43cac0dSDave Young 					   cmdline_ptr, cmdline_len, flags);
298a43cac0dSDave Young 	if (ret)
299a43cac0dSDave Young 		goto out_free_image;
300a43cac0dSDave Young 
301a43cac0dSDave Young 	ret = sanity_check_segment_list(image);
302a43cac0dSDave Young 	if (ret)
303a43cac0dSDave Young 		goto out_free_post_load_bufs;
304a43cac0dSDave Young 
305a43cac0dSDave Young 	ret = -ENOMEM;
306a43cac0dSDave Young 	image->control_code_page = kimage_alloc_control_pages(image,
307a43cac0dSDave Young 					   get_order(KEXEC_CONTROL_PAGE_SIZE));
308a43cac0dSDave Young 	if (!image->control_code_page) {
309a43cac0dSDave Young 		pr_err("Could not allocate control_code_buffer\n");
310a43cac0dSDave Young 		goto out_free_post_load_bufs;
311a43cac0dSDave Young 	}
312a43cac0dSDave Young 
313a43cac0dSDave Young 	if (!kexec_on_panic) {
314a43cac0dSDave Young 		image->swap_page = kimage_alloc_control_pages(image, 0);
315a43cac0dSDave Young 		if (!image->swap_page) {
316a43cac0dSDave Young 			pr_err("Could not allocate swap buffer\n");
317a43cac0dSDave Young 			goto out_free_control_pages;
318a43cac0dSDave Young 		}
319a43cac0dSDave Young 	}
320a43cac0dSDave Young 
321a43cac0dSDave Young 	*rimage = image;
322a43cac0dSDave Young 	return 0;
323a43cac0dSDave Young out_free_control_pages:
324a43cac0dSDave Young 	kimage_free_page_list(&image->control_pages);
325a43cac0dSDave Young out_free_post_load_bufs:
326a43cac0dSDave Young 	kimage_file_post_load_cleanup(image);
327a43cac0dSDave Young out_free_image:
328a43cac0dSDave Young 	kfree(image);
329a43cac0dSDave Young 	return ret;
330a43cac0dSDave Young }
331a43cac0dSDave Young 
/*
 * kexec_file_load - load (or unload) a kexec image from file descriptors
 *
 * With KEXEC_FILE_UNLOAD the currently installed image of the selected type
 * is swapped out and freed. Otherwise a new image is built from kernel_fd,
 * initrd_fd and the user command line, and replaces the installed one.
 *
 * Returns 0 on success, -EPERM if the caller may not load this image type,
 * -EINVAL for unknown flag bits, -EBUSY if the kexec lock is already held,
 * or the error of the first step that failed.
 */
SYSCALL_DEFINE5(kexec_file_load, int, kernel_fd, int, initrd_fd,
		unsigned long, cmdline_len, const char __user *, cmdline_ptr,
		unsigned long, flags)
{
	struct kimage **dest_image, *image = NULL;
	int image_type = KEXEC_TYPE_DEFAULT;
	int ret = 0, i;

	if (flags & KEXEC_FILE_ON_CRASH)
		image_type = KEXEC_TYPE_CRASH;

	/* We only trust the superuser with rebooting the system. */
	if (!kexec_load_permitted(image_type))
		return -EPERM;

	/* Make sure we have a legal set of flags */
	if (flags != (flags & KEXEC_FILE_FLAGS))
		return -EINVAL;

	if (!kexec_trylock())
		return -EBUSY;

#ifdef CONFIG_CRASH_DUMP
	if (image_type == KEXEC_TYPE_CRASH) {
		dest_image = &kexec_crash_image;
		if (kexec_crash_image)
			arch_kexec_unprotect_crashkres();
	} else
#endif
		dest_image = &kexec_image;

	/* Unload: swap in the NULL image and free the old one below */
	if (flags & KEXEC_FILE_UNLOAD)
		goto exchange;

	/*
	 * In case of crash, new kernel gets loaded in reserved region. It is
	 * same memory where old crash kernel might be loaded. Free any
	 * current crash dump kernel before we corrupt it.
	 */
	if (flags & KEXEC_FILE_ON_CRASH)
		kimage_free(xchg(&kexec_crash_image, NULL));

	ret = kimage_file_alloc_init(&image, kernel_fd, initrd_fd, cmdline_ptr,
				     cmdline_len, flags);
	if (ret)
		goto out;

#ifdef CONFIG_CRASH_HOTPLUG
	if ((flags & KEXEC_FILE_ON_CRASH) && arch_crash_hotplug_support(image, flags))
		image->hotplug_support = 1;
#endif

	ret = machine_kexec_prepare(image);
	if (ret)
		goto out;

	/*
	 * Some architecture(like S390) may touch the crash memory before
	 * machine_kexec_prepare(), we must copy vmcoreinfo data after it.
	 */
	ret = kimage_crash_copy_vmcoreinfo(image);
	if (ret)
		goto out;

	ret = kexec_calculate_store_digests(image);
	if (ret)
		goto out;

	kexec_dprintk("nr_segments = %lu\n", image->nr_segments);
	for (i = 0; i < image->nr_segments; i++) {
		struct kexec_segment *ksegment = &image->segment[i];

		kexec_dprintk("segment[%d]: buf=0x%p bufsz=0x%zx mem=0x%lx memsz=0x%zx\n",
			      i, ksegment->buf, ksegment->bufsz, ksegment->mem,
			      ksegment->memsz);

		ret = kimage_load_segment(image, ksegment);
		if (ret)
			goto out;
	}

	kimage_terminate(image);

	ret = machine_kexec_post_load(image);
	if (ret)
		goto out;

	kexec_dprintk("kexec_file_load: type:%u, start:0x%lx head:0x%lx flags:0x%lx\n",
		      image->type, image->start, image->head, flags);
	/*
	 * Free up any temporary buffers allocated which are not needed
	 * after image has been loaded
	 */
	kimage_file_post_load_cleanup(image);
exchange:
	/* Install the new image; 'image' now refers to the one it replaced */
	image = xchg(dest_image, image);
out:
#ifdef CONFIG_CRASH_DUMP
	if ((flags & KEXEC_FILE_ON_CRASH) && kexec_crash_image)
		arch_kexec_protect_crashkres();
#endif

	kexec_unlock();
	/* Frees the replaced image, or the half-built one on failure */
	kimage_free(image);
	return ret;
}
439a43cac0dSDave Young 
locate_mem_hole_top_down(unsigned long start,unsigned long end,struct kexec_buf * kbuf)440a43cac0dSDave Young static int locate_mem_hole_top_down(unsigned long start, unsigned long end,
441a43cac0dSDave Young 				    struct kexec_buf *kbuf)
442a43cac0dSDave Young {
443a43cac0dSDave Young 	struct kimage *image = kbuf->image;
444a43cac0dSDave Young 	unsigned long temp_start, temp_end;
445a43cac0dSDave Young 
446a43cac0dSDave Young 	temp_end = min(end, kbuf->buf_max);
44718d565eaSYuntao Wang 	temp_start = temp_end - kbuf->memsz + 1;
448a43cac0dSDave Young 
449a43cac0dSDave Young 	do {
450a43cac0dSDave Young 		/* align down start */
45118d565eaSYuntao Wang 		temp_start = ALIGN_DOWN(temp_start, kbuf->buf_align);
452a43cac0dSDave Young 
453a43cac0dSDave Young 		if (temp_start < start || temp_start < kbuf->buf_min)
454a43cac0dSDave Young 			return 0;
455a43cac0dSDave Young 
456a43cac0dSDave Young 		temp_end = temp_start + kbuf->memsz - 1;
457a43cac0dSDave Young 
458a43cac0dSDave Young 		/*
459a43cac0dSDave Young 		 * Make sure this does not conflict with any of existing
460a43cac0dSDave Young 		 * segments
461a43cac0dSDave Young 		 */
462a43cac0dSDave Young 		if (kimage_is_destination_range(image, temp_start, temp_end)) {
463a43cac0dSDave Young 			temp_start = temp_start - PAGE_SIZE;
464a43cac0dSDave Young 			continue;
465a43cac0dSDave Young 		}
466a43cac0dSDave Young 
467*9f0552c9SSourabh Jain 		/* Make sure this does not conflict with exclude range */
468*9f0552c9SSourabh Jain 		if (arch_check_excluded_range(image, temp_start, temp_end)) {
469*9f0552c9SSourabh Jain 			temp_start = temp_start - PAGE_SIZE;
470*9f0552c9SSourabh Jain 			continue;
471*9f0552c9SSourabh Jain 		}
472*9f0552c9SSourabh Jain 
473a43cac0dSDave Young 		/* We found a suitable memory range */
474a43cac0dSDave Young 		break;
475a43cac0dSDave Young 	} while (1);
476a43cac0dSDave Young 
477a43cac0dSDave Young 	/* If we are here, we found a suitable memory range */
478a43cac0dSDave Young 	kbuf->mem = temp_start;
479a43cac0dSDave Young 
480a43cac0dSDave Young 	/* Success, stop navigating through remaining System RAM ranges */
481a43cac0dSDave Young 	return 1;
482a43cac0dSDave Young }
483a43cac0dSDave Young 
locate_mem_hole_bottom_up(unsigned long start,unsigned long end,struct kexec_buf * kbuf)484a43cac0dSDave Young static int locate_mem_hole_bottom_up(unsigned long start, unsigned long end,
485a43cac0dSDave Young 				     struct kexec_buf *kbuf)
486a43cac0dSDave Young {
487a43cac0dSDave Young 	struct kimage *image = kbuf->image;
488a43cac0dSDave Young 	unsigned long temp_start, temp_end;
489a43cac0dSDave Young 
490a43cac0dSDave Young 	temp_start = max(start, kbuf->buf_min);
491a43cac0dSDave Young 
492a43cac0dSDave Young 	do {
493a43cac0dSDave Young 		temp_start = ALIGN(temp_start, kbuf->buf_align);
494a43cac0dSDave Young 		temp_end = temp_start + kbuf->memsz - 1;
495a43cac0dSDave Young 
496a43cac0dSDave Young 		if (temp_end > end || temp_end > kbuf->buf_max)
497a43cac0dSDave Young 			return 0;
498a43cac0dSDave Young 		/*
499a43cac0dSDave Young 		 * Make sure this does not conflict with any of existing
500a43cac0dSDave Young 		 * segments
501a43cac0dSDave Young 		 */
502a43cac0dSDave Young 		if (kimage_is_destination_range(image, temp_start, temp_end)) {
503a43cac0dSDave Young 			temp_start = temp_start + PAGE_SIZE;
504a43cac0dSDave Young 			continue;
505a43cac0dSDave Young 		}
506a43cac0dSDave Young 
507*9f0552c9SSourabh Jain 		/* Make sure this does not conflict with exclude range */
508*9f0552c9SSourabh Jain 		if (arch_check_excluded_range(image, temp_start, temp_end)) {
509*9f0552c9SSourabh Jain 			temp_start = temp_start + PAGE_SIZE;
510*9f0552c9SSourabh Jain 			continue;
511*9f0552c9SSourabh Jain 		}
512*9f0552c9SSourabh Jain 
513a43cac0dSDave Young 		/* We found a suitable memory range */
514a43cac0dSDave Young 		break;
515a43cac0dSDave Young 	} while (1);
516a43cac0dSDave Young 
517a43cac0dSDave Young 	/* If we are here, we found a suitable memory range */
518a43cac0dSDave Young 	kbuf->mem = temp_start;
519a43cac0dSDave Young 
520a43cac0dSDave Young 	/* Success, stop navigating through remaining System RAM ranges */
521a43cac0dSDave Young 	return 1;
522a43cac0dSDave Young }
523a43cac0dSDave Young 
locate_mem_hole_callback(struct resource * res,void * arg)5241d2e733bSTom Lendacky static int locate_mem_hole_callback(struct resource *res, void *arg)
525a43cac0dSDave Young {
526a43cac0dSDave Young 	struct kexec_buf *kbuf = (struct kexec_buf *)arg;
5271d2e733bSTom Lendacky 	u64 start = res->start, end = res->end;
528a43cac0dSDave Young 	unsigned long sz = end - start + 1;
529a43cac0dSDave Young 
530a43cac0dSDave Young 	/* Returning 0 will take to next memory range */
5313fe4f499SDavid Hildenbrand 
5323fe4f499SDavid Hildenbrand 	/* Don't use memory that will be detected and handled by a driver. */
5337cf603d1SDavid Hildenbrand 	if (res->flags & IORESOURCE_SYSRAM_DRIVER_MANAGED)
5343fe4f499SDavid Hildenbrand 		return 0;
5353fe4f499SDavid Hildenbrand 
536a43cac0dSDave Young 	if (sz < kbuf->memsz)
537a43cac0dSDave Young 		return 0;
538a43cac0dSDave Young 
539a43cac0dSDave Young 	if (end < kbuf->buf_min || start > kbuf->buf_max)
540a43cac0dSDave Young 		return 0;
541a43cac0dSDave Young 
542a43cac0dSDave Young 	/*
543a43cac0dSDave Young 	 * Allocate memory top down with-in ram range. Otherwise bottom up
544a43cac0dSDave Young 	 * allocation.
545a43cac0dSDave Young 	 */
546a43cac0dSDave Young 	if (kbuf->top_down)
547a43cac0dSDave Young 		return locate_mem_hole_top_down(start, end, kbuf);
548a43cac0dSDave Young 	return locate_mem_hole_bottom_up(start, end, kbuf);
549a43cac0dSDave Young }
550a43cac0dSDave Young 
#ifdef CONFIG_ARCH_KEEP_MEMBLOCK
/*
 * Call @func on free memblock ranges until it returns non-zero.
 *
 * For a crash image only crashk_res is offered. Otherwise the free ranges
 * are visited from the top when kbuf->top_down is set and from the bottom
 * when it is not.
 *
 * Returns the first non-zero value from @func, or 0 if no call returned one.
 */
static int kexec_walk_memblock(struct kexec_buf *kbuf,
			       int (*func)(struct resource *, void *))
{
	struct resource res = { };
	phys_addr_t mstart, mend;
	int ret = 0;
	u64 i;

#ifdef CONFIG_CRASH_DUMP
	if (kbuf->image->type == KEXEC_TYPE_CRASH)
		return func(&crashk_res, kbuf);
#endif

	/*
	 * Using MEMBLOCK_NONE will properly skip MEMBLOCK_DRIVER_MANAGED. See
	 * IORESOURCE_SYSRAM_DRIVER_MANAGED handling in
	 * locate_mem_hole_callback().
	 *
	 * In memblock, end points to the first byte after the range while in
	 * kexec, end points to the last byte in the range; hence "mend - 1"
	 * in both loops.
	 */
	if (!kbuf->top_down) {
		for_each_free_mem_range(i, NUMA_NO_NODE, MEMBLOCK_NONE,
					&mstart, &mend, NULL) {
			res.start = mstart;
			res.end = mend - 1;
			ret = func(&res, kbuf);
			if (ret)
				break;
		}
	} else {
		for_each_free_mem_range_reverse(i, NUMA_NO_NODE, MEMBLOCK_NONE,
						&mstart, &mend, NULL) {
			res.start = mstart;
			res.end = mend - 1;
			ret = func(&res, kbuf);
			if (ret)
				break;
		}
	}

	return ret;
}
#else
/* Without CONFIG_ARCH_KEEP_MEMBLOCK this stub never calls @func. */
static int kexec_walk_memblock(struct kexec_buf *kbuf,
			       int (*func)(struct resource *, void *))
{
	return 0;
}
#endif
609735c2f90SAKASHI Takahiro 
61060fe3910SThiago Jung Bauermann /**
611735c2f90SAKASHI Takahiro  * kexec_walk_resources - call func(data) on free memory regions
61260fe3910SThiago Jung Bauermann  * @kbuf:	Context info for the search. Also passed to @func.
61360fe3910SThiago Jung Bauermann  * @func:	Function to call for each memory region.
61460fe3910SThiago Jung Bauermann  *
61560fe3910SThiago Jung Bauermann  * Return: The memory walk will stop when func returns a non-zero value
61660fe3910SThiago Jung Bauermann  * and that value will be returned. If all free regions are visited without
61760fe3910SThiago Jung Bauermann  * func returning non-zero, then zero will be returned.
61860fe3910SThiago Jung Bauermann  */
kexec_walk_resources(struct kexec_buf * kbuf,int (* func)(struct resource *,void *))619735c2f90SAKASHI Takahiro static int kexec_walk_resources(struct kexec_buf *kbuf,
6201d2e733bSTom Lendacky 				int (*func)(struct resource *, void *))
62160fe3910SThiago Jung Bauermann {
62202aff848SBaoquan He #ifdef CONFIG_CRASH_DUMP
62360fe3910SThiago Jung Bauermann 	if (kbuf->image->type == KEXEC_TYPE_CRASH)
62460fe3910SThiago Jung Bauermann 		return walk_iomem_res_desc(crashk_res.desc,
62560fe3910SThiago Jung Bauermann 					   IORESOURCE_SYSTEM_RAM | IORESOURCE_BUSY,
62660fe3910SThiago Jung Bauermann 					   crashk_res.start, crashk_res.end,
62760fe3910SThiago Jung Bauermann 					   kbuf, func);
62802aff848SBaoquan He #endif
62902aff848SBaoquan He 	if (kbuf->top_down)
630b3ba2341SBaoquan He 		return walk_system_ram_res_rev(0, ULONG_MAX, kbuf, func);
63160fe3910SThiago Jung Bauermann 	else
63260fe3910SThiago Jung Bauermann 		return walk_system_ram_res(0, ULONG_MAX, kbuf, func);
63360fe3910SThiago Jung Bauermann }
63460fe3910SThiago Jung Bauermann 
635ec2b9bfaSThiago Jung Bauermann /**
636e2e806f9SThiago Jung Bauermann  * kexec_locate_mem_hole - find free memory for the purgatory or the next kernel
637e2e806f9SThiago Jung Bauermann  * @kbuf:	Parameters for the memory search.
638e2e806f9SThiago Jung Bauermann  *
639e2e806f9SThiago Jung Bauermann  * On success, kbuf->mem will have the start address of the memory region found.
640e2e806f9SThiago Jung Bauermann  *
641e2e806f9SThiago Jung Bauermann  * Return: 0 on success, negative errno on error.
642e2e806f9SThiago Jung Bauermann  */
kexec_locate_mem_hole(struct kexec_buf * kbuf)643e2e806f9SThiago Jung Bauermann int kexec_locate_mem_hole(struct kexec_buf *kbuf)
644e2e806f9SThiago Jung Bauermann {
645e2e806f9SThiago Jung Bauermann 	int ret;
646e2e806f9SThiago Jung Bauermann 
647b6664ba4SAKASHI Takahiro 	/* Arch knows where to place */
648b6664ba4SAKASHI Takahiro 	if (kbuf->mem != KEXEC_BUF_MEM_UNKNOWN)
649b6664ba4SAKASHI Takahiro 		return 0;
650b6664ba4SAKASHI Takahiro 
651350e88baSMike Rapoport 	if (!IS_ENABLED(CONFIG_ARCH_KEEP_MEMBLOCK))
652735c2f90SAKASHI Takahiro 		ret = kexec_walk_resources(kbuf, locate_mem_hole_callback);
653735c2f90SAKASHI Takahiro 	else
654735c2f90SAKASHI Takahiro 		ret = kexec_walk_memblock(kbuf, locate_mem_hole_callback);
655e2e806f9SThiago Jung Bauermann 
656e2e806f9SThiago Jung Bauermann 	return ret == 1 ? 0 : -EADDRNOTAVAIL;
657e2e806f9SThiago Jung Bauermann }
658e2e806f9SThiago Jung Bauermann 
659e2e806f9SThiago Jung Bauermann /**
660ec2b9bfaSThiago Jung Bauermann  * kexec_add_buffer - place a buffer in a kexec segment
661ec2b9bfaSThiago Jung Bauermann  * @kbuf:	Buffer contents and memory parameters.
662ec2b9bfaSThiago Jung Bauermann  *
66355e2b696SWenyu Liu  * This function assumes that kexec_lock is held.
664ec2b9bfaSThiago Jung Bauermann  * On successful return, @kbuf->mem will have the physical address of
665ec2b9bfaSThiago Jung Bauermann  * the buffer in memory.
666ec2b9bfaSThiago Jung Bauermann  *
667ec2b9bfaSThiago Jung Bauermann  * Return: 0 on success, negative errno on error.
668a43cac0dSDave Young  */
kexec_add_buffer(struct kexec_buf * kbuf)669ec2b9bfaSThiago Jung Bauermann int kexec_add_buffer(struct kexec_buf *kbuf)
670a43cac0dSDave Young {
671a43cac0dSDave Young 	struct kexec_segment *ksegment;
672a43cac0dSDave Young 	int ret;
673a43cac0dSDave Young 
674a43cac0dSDave Young 	/* Currently adding segment this way is allowed only in file mode */
675ec2b9bfaSThiago Jung Bauermann 	if (!kbuf->image->file_mode)
676a43cac0dSDave Young 		return -EINVAL;
677a43cac0dSDave Young 
678ec2b9bfaSThiago Jung Bauermann 	if (kbuf->image->nr_segments >= KEXEC_SEGMENT_MAX)
679a43cac0dSDave Young 		return -EINVAL;
680a43cac0dSDave Young 
681a43cac0dSDave Young 	/*
682a43cac0dSDave Young 	 * Make sure we are not trying to add buffer after allocating
683a43cac0dSDave Young 	 * control pages. All segments need to be placed first before
684a43cac0dSDave Young 	 * any control pages are allocated. As control page allocation
685a43cac0dSDave Young 	 * logic goes through list of segments to make sure there are
686a43cac0dSDave Young 	 * no destination overlaps.
687a43cac0dSDave Young 	 */
688ec2b9bfaSThiago Jung Bauermann 	if (!list_empty(&kbuf->image->control_pages)) {
689a43cac0dSDave Young 		WARN_ON(1);
690a43cac0dSDave Young 		return -EINVAL;
691a43cac0dSDave Young 	}
692a43cac0dSDave Young 
693ec2b9bfaSThiago Jung Bauermann 	/* Ensure minimum alignment needed for segments. */
694ec2b9bfaSThiago Jung Bauermann 	kbuf->memsz = ALIGN(kbuf->memsz, PAGE_SIZE);
695ec2b9bfaSThiago Jung Bauermann 	kbuf->buf_align = max(kbuf->buf_align, PAGE_SIZE);
696a43cac0dSDave Young 
697a43cac0dSDave Young 	/* Walk the RAM ranges and allocate a suitable range for the buffer */
698f891f197SHari Bathini 	ret = arch_kexec_locate_mem_hole(kbuf);
699e2e806f9SThiago Jung Bauermann 	if (ret)
700e2e806f9SThiago Jung Bauermann 		return ret;
701a43cac0dSDave Young 
702a43cac0dSDave Young 	/* Found a suitable memory range */
703ec2b9bfaSThiago Jung Bauermann 	ksegment = &kbuf->image->segment[kbuf->image->nr_segments];
704a43cac0dSDave Young 	ksegment->kbuf = kbuf->buffer;
705a43cac0dSDave Young 	ksegment->bufsz = kbuf->bufsz;
706a43cac0dSDave Young 	ksegment->mem = kbuf->mem;
707a43cac0dSDave Young 	ksegment->memsz = kbuf->memsz;
708ec2b9bfaSThiago Jung Bauermann 	kbuf->image->nr_segments++;
709a43cac0dSDave Young 	return 0;
710a43cac0dSDave Young }
711a43cac0dSDave Young 
712a43cac0dSDave Young /* Calculate and store the digest of segments */
kexec_calculate_store_digests(struct kimage * image)713a43cac0dSDave Young static int kexec_calculate_store_digests(struct kimage *image)
714a43cac0dSDave Young {
715a43cac0dSDave Young 	struct crypto_shash *tfm;
716a43cac0dSDave Young 	struct shash_desc *desc;
717a43cac0dSDave Young 	int ret = 0, i, j, zero_buf_sz, sha_region_sz;
718a43cac0dSDave Young 	size_t desc_size, nullsz;
719a43cac0dSDave Young 	char *digest;
720a43cac0dSDave Young 	void *zero_buf;
721a43cac0dSDave Young 	struct kexec_sha_region *sha_regions;
722a43cac0dSDave Young 	struct purgatory_info *pi = &image->purgatory_info;
723a43cac0dSDave Young 
724e6265fe7SEric DeVolder 	if (!IS_ENABLED(CONFIG_ARCH_SUPPORTS_KEXEC_PURGATORY))
725b799a09fSAKASHI Takahiro 		return 0;
726b799a09fSAKASHI Takahiro 
727a43cac0dSDave Young 	zero_buf = __va(page_to_pfn(ZERO_PAGE(0)) << PAGE_SHIFT);
728a43cac0dSDave Young 	zero_buf_sz = PAGE_SIZE;
729a43cac0dSDave Young 
730a43cac0dSDave Young 	tfm = crypto_alloc_shash("sha256", 0, 0);
731a43cac0dSDave Young 	if (IS_ERR(tfm)) {
732a43cac0dSDave Young 		ret = PTR_ERR(tfm);
733a43cac0dSDave Young 		goto out;
734a43cac0dSDave Young 	}
735a43cac0dSDave Young 
736a43cac0dSDave Young 	desc_size = crypto_shash_descsize(tfm) + sizeof(*desc);
737a43cac0dSDave Young 	desc = kzalloc(desc_size, GFP_KERNEL);
738a43cac0dSDave Young 	if (!desc) {
739a43cac0dSDave Young 		ret = -ENOMEM;
740a43cac0dSDave Young 		goto out_free_tfm;
741a43cac0dSDave Young 	}
742a43cac0dSDave Young 
743a43cac0dSDave Young 	sha_region_sz = KEXEC_SEGMENT_MAX * sizeof(struct kexec_sha_region);
744a43cac0dSDave Young 	sha_regions = vzalloc(sha_region_sz);
74531d82c2cSJia-Ju Bai 	if (!sha_regions) {
74631d82c2cSJia-Ju Bai 		ret = -ENOMEM;
747a43cac0dSDave Young 		goto out_free_desc;
74831d82c2cSJia-Ju Bai 	}
749a43cac0dSDave Young 
750a43cac0dSDave Young 	desc->tfm   = tfm;
751a43cac0dSDave Young 
752a43cac0dSDave Young 	ret = crypto_shash_init(desc);
753a43cac0dSDave Young 	if (ret < 0)
754a43cac0dSDave Young 		goto out_free_sha_regions;
755a43cac0dSDave Young 
756a43cac0dSDave Young 	digest = kzalloc(SHA256_DIGEST_SIZE, GFP_KERNEL);
757a43cac0dSDave Young 	if (!digest) {
758a43cac0dSDave Young 		ret = -ENOMEM;
759a43cac0dSDave Young 		goto out_free_sha_regions;
760a43cac0dSDave Young 	}
761a43cac0dSDave Young 
762a43cac0dSDave Young 	for (j = i = 0; i < image->nr_segments; i++) {
763a43cac0dSDave Young 		struct kexec_segment *ksegment;
764a43cac0dSDave Young 
765f7cc804aSEric DeVolder #ifdef CONFIG_CRASH_HOTPLUG
766f7cc804aSEric DeVolder 		/* Exclude elfcorehdr segment to allow future changes via hotplug */
7676dacd79dSPetr Tesarik 		if (i == image->elfcorehdr_index)
768f7cc804aSEric DeVolder 			continue;
769f7cc804aSEric DeVolder #endif
770f7cc804aSEric DeVolder 
771a43cac0dSDave Young 		ksegment = &image->segment[i];
772a43cac0dSDave Young 		/*
773a43cac0dSDave Young 		 * Skip purgatory as it will be modified once we put digest
774a43cac0dSDave Young 		 * info in purgatory.
775a43cac0dSDave Young 		 */
776a43cac0dSDave Young 		if (ksegment->kbuf == pi->purgatory_buf)
777a43cac0dSDave Young 			continue;
778a43cac0dSDave Young 
779a43cac0dSDave Young 		ret = crypto_shash_update(desc, ksegment->kbuf,
780a43cac0dSDave Young 					  ksegment->bufsz);
781a43cac0dSDave Young 		if (ret)
782a43cac0dSDave Young 			break;
783a43cac0dSDave Young 
784a43cac0dSDave Young 		/*
785a43cac0dSDave Young 		 * Assume rest of the buffer is filled with zero and
786a43cac0dSDave Young 		 * update digest accordingly.
787a43cac0dSDave Young 		 */
788a43cac0dSDave Young 		nullsz = ksegment->memsz - ksegment->bufsz;
789a43cac0dSDave Young 		while (nullsz) {
790a43cac0dSDave Young 			unsigned long bytes = nullsz;
791a43cac0dSDave Young 
792a43cac0dSDave Young 			if (bytes > zero_buf_sz)
793a43cac0dSDave Young 				bytes = zero_buf_sz;
794a43cac0dSDave Young 			ret = crypto_shash_update(desc, zero_buf, bytes);
795a43cac0dSDave Young 			if (ret)
796a43cac0dSDave Young 				break;
797a43cac0dSDave Young 			nullsz -= bytes;
798a43cac0dSDave Young 		}
799a43cac0dSDave Young 
800a43cac0dSDave Young 		if (ret)
801a43cac0dSDave Young 			break;
802a43cac0dSDave Young 
803a43cac0dSDave Young 		sha_regions[j].start = ksegment->mem;
804a43cac0dSDave Young 		sha_regions[j].len = ksegment->memsz;
805a43cac0dSDave Young 		j++;
806a43cac0dSDave Young 	}
807a43cac0dSDave Young 
808a43cac0dSDave Young 	if (!ret) {
809a43cac0dSDave Young 		ret = crypto_shash_final(desc, digest);
810a43cac0dSDave Young 		if (ret)
811a43cac0dSDave Young 			goto out_free_digest;
81240c50c1fSThomas Gleixner 		ret = kexec_purgatory_get_set_symbol(image, "purgatory_sha_regions",
813a43cac0dSDave Young 						     sha_regions, sha_region_sz, 0);
814a43cac0dSDave Young 		if (ret)
815a43cac0dSDave Young 			goto out_free_digest;
816a43cac0dSDave Young 
81740c50c1fSThomas Gleixner 		ret = kexec_purgatory_get_set_symbol(image, "purgatory_sha256_digest",
818a43cac0dSDave Young 						     digest, SHA256_DIGEST_SIZE, 0);
819a43cac0dSDave Young 		if (ret)
820a43cac0dSDave Young 			goto out_free_digest;
821a43cac0dSDave Young 	}
822a43cac0dSDave Young 
823a43cac0dSDave Young out_free_digest:
824a43cac0dSDave Young 	kfree(digest);
825a43cac0dSDave Young out_free_sha_regions:
826a43cac0dSDave Young 	vfree(sha_regions);
827a43cac0dSDave Young out_free_desc:
828a43cac0dSDave Young 	kfree(desc);
829a43cac0dSDave Young out_free_tfm:
830a43cac0dSDave Young 	kfree(tfm);
831a43cac0dSDave Young out:
832a43cac0dSDave Young 	return ret;
833a43cac0dSDave Young }
834a43cac0dSDave Young 
835e6265fe7SEric DeVolder #ifdef CONFIG_ARCH_SUPPORTS_KEXEC_PURGATORY
83693045705SPhilipp Rudo /*
83793045705SPhilipp Rudo  * kexec_purgatory_setup_kbuf - prepare buffer to load purgatory.
83893045705SPhilipp Rudo  * @pi:		Purgatory to be loaded.
83993045705SPhilipp Rudo  * @kbuf:	Buffer to setup.
84093045705SPhilipp Rudo  *
84193045705SPhilipp Rudo  * Allocates the memory needed for the buffer. Caller is responsible to free
84293045705SPhilipp Rudo  * the memory after use.
84393045705SPhilipp Rudo  *
84493045705SPhilipp Rudo  * Return: 0 on success, negative errno on error.
84593045705SPhilipp Rudo  */
kexec_purgatory_setup_kbuf(struct purgatory_info * pi,struct kexec_buf * kbuf)84693045705SPhilipp Rudo static int kexec_purgatory_setup_kbuf(struct purgatory_info *pi,
84793045705SPhilipp Rudo 				      struct kexec_buf *kbuf)
848a43cac0dSDave Young {
84993045705SPhilipp Rudo 	const Elf_Shdr *sechdrs;
85093045705SPhilipp Rudo 	unsigned long bss_align;
85193045705SPhilipp Rudo 	unsigned long bss_sz;
85293045705SPhilipp Rudo 	unsigned long align;
85393045705SPhilipp Rudo 	int i, ret;
85493045705SPhilipp Rudo 
85593045705SPhilipp Rudo 	sechdrs = (void *)pi->ehdr + pi->ehdr->e_shoff;
8563be3f61dSPhilipp Rudo 	kbuf->buf_align = bss_align = 1;
8573be3f61dSPhilipp Rudo 	kbuf->bufsz = bss_sz = 0;
85893045705SPhilipp Rudo 
85993045705SPhilipp Rudo 	for (i = 0; i < pi->ehdr->e_shnum; i++) {
86093045705SPhilipp Rudo 		if (!(sechdrs[i].sh_flags & SHF_ALLOC))
86193045705SPhilipp Rudo 			continue;
86293045705SPhilipp Rudo 
86393045705SPhilipp Rudo 		align = sechdrs[i].sh_addralign;
86493045705SPhilipp Rudo 		if (sechdrs[i].sh_type != SHT_NOBITS) {
86593045705SPhilipp Rudo 			if (kbuf->buf_align < align)
86693045705SPhilipp Rudo 				kbuf->buf_align = align;
86793045705SPhilipp Rudo 			kbuf->bufsz = ALIGN(kbuf->bufsz, align);
86893045705SPhilipp Rudo 			kbuf->bufsz += sechdrs[i].sh_size;
86993045705SPhilipp Rudo 		} else {
87093045705SPhilipp Rudo 			if (bss_align < align)
87193045705SPhilipp Rudo 				bss_align = align;
87293045705SPhilipp Rudo 			bss_sz = ALIGN(bss_sz, align);
87393045705SPhilipp Rudo 			bss_sz += sechdrs[i].sh_size;
87493045705SPhilipp Rudo 		}
87593045705SPhilipp Rudo 	}
87693045705SPhilipp Rudo 	kbuf->bufsz = ALIGN(kbuf->bufsz, bss_align);
87793045705SPhilipp Rudo 	kbuf->memsz = kbuf->bufsz + bss_sz;
87893045705SPhilipp Rudo 	if (kbuf->buf_align < bss_align)
87993045705SPhilipp Rudo 		kbuf->buf_align = bss_align;
88093045705SPhilipp Rudo 
88193045705SPhilipp Rudo 	kbuf->buffer = vzalloc(kbuf->bufsz);
88293045705SPhilipp Rudo 	if (!kbuf->buffer)
88393045705SPhilipp Rudo 		return -ENOMEM;
88493045705SPhilipp Rudo 	pi->purgatory_buf = kbuf->buffer;
88593045705SPhilipp Rudo 
88693045705SPhilipp Rudo 	ret = kexec_add_buffer(kbuf);
88793045705SPhilipp Rudo 	if (ret)
88893045705SPhilipp Rudo 		goto out;
88993045705SPhilipp Rudo 
89093045705SPhilipp Rudo 	return 0;
89193045705SPhilipp Rudo out:
89293045705SPhilipp Rudo 	vfree(pi->purgatory_buf);
89393045705SPhilipp Rudo 	pi->purgatory_buf = NULL;
89493045705SPhilipp Rudo 	return ret;
89593045705SPhilipp Rudo }
896a43cac0dSDave Young 
897a43cac0dSDave Young /*
89893045705SPhilipp Rudo  * kexec_purgatory_setup_sechdrs - prepares the pi->sechdrs buffer.
89993045705SPhilipp Rudo  * @pi:		Purgatory to be loaded.
90093045705SPhilipp Rudo  * @kbuf:	Buffer prepared to store purgatory.
90193045705SPhilipp Rudo  *
90293045705SPhilipp Rudo  * Allocates the memory needed for the buffer. Caller is responsible to free
90393045705SPhilipp Rudo  * the memory after use.
90493045705SPhilipp Rudo  *
90593045705SPhilipp Rudo  * Return: 0 on success, negative errno on error.
906a43cac0dSDave Young  */
kexec_purgatory_setup_sechdrs(struct purgatory_info * pi,struct kexec_buf * kbuf)90793045705SPhilipp Rudo static int kexec_purgatory_setup_sechdrs(struct purgatory_info *pi,
90893045705SPhilipp Rudo 					 struct kexec_buf *kbuf)
90993045705SPhilipp Rudo {
91093045705SPhilipp Rudo 	unsigned long bss_addr;
91193045705SPhilipp Rudo 	unsigned long offset;
9124df3504eSSimon Horman 	size_t sechdrs_size;
91393045705SPhilipp Rudo 	Elf_Shdr *sechdrs;
91493045705SPhilipp Rudo 	int i;
915a43cac0dSDave Young 
9168da0b724SPhilipp Rudo 	/*
9178da0b724SPhilipp Rudo 	 * The section headers in kexec_purgatory are read-only. In order to
9188da0b724SPhilipp Rudo 	 * have them modifiable make a temporary copy.
9198da0b724SPhilipp Rudo 	 */
9204df3504eSSimon Horman 	sechdrs_size = array_size(sizeof(Elf_Shdr), pi->ehdr->e_shnum);
9214df3504eSSimon Horman 	sechdrs = vzalloc(sechdrs_size);
922a43cac0dSDave Young 	if (!sechdrs)
923a43cac0dSDave Young 		return -ENOMEM;
9244df3504eSSimon Horman 	memcpy(sechdrs, (void *)pi->ehdr + pi->ehdr->e_shoff, sechdrs_size);
92593045705SPhilipp Rudo 	pi->sechdrs = sechdrs;
926a43cac0dSDave Young 
927620f697cSPhilipp Rudo 	offset = 0;
928620f697cSPhilipp Rudo 	bss_addr = kbuf->mem + kbuf->bufsz;
929f1b1cca3SPhilipp Rudo 	kbuf->image->start = pi->ehdr->e_entry;
930a43cac0dSDave Young 
931a43cac0dSDave Young 	for (i = 0; i < pi->ehdr->e_shnum; i++) {
93293045705SPhilipp Rudo 		unsigned long align;
933620f697cSPhilipp Rudo 		void *src, *dst;
93493045705SPhilipp Rudo 
935a43cac0dSDave Young 		if (!(sechdrs[i].sh_flags & SHF_ALLOC))
936a43cac0dSDave Young 			continue;
937a43cac0dSDave Young 
938a43cac0dSDave Young 		align = sechdrs[i].sh_addralign;
939f1b1cca3SPhilipp Rudo 		if (sechdrs[i].sh_type == SHT_NOBITS) {
940f1b1cca3SPhilipp Rudo 			bss_addr = ALIGN(bss_addr, align);
941f1b1cca3SPhilipp Rudo 			sechdrs[i].sh_addr = bss_addr;
942f1b1cca3SPhilipp Rudo 			bss_addr += sechdrs[i].sh_size;
943f1b1cca3SPhilipp Rudo 			continue;
944f1b1cca3SPhilipp Rudo 		}
945f1b1cca3SPhilipp Rudo 
946620f697cSPhilipp Rudo 		offset = ALIGN(offset, align);
9478652d44fSRicardo Ribalda 
9488652d44fSRicardo Ribalda 		/*
9498652d44fSRicardo Ribalda 		 * Check if the segment contains the entry point, if so,
9508652d44fSRicardo Ribalda 		 * calculate the value of image->start based on it.
9518652d44fSRicardo Ribalda 		 * If the compiler has produced more than one .text section
9528652d44fSRicardo Ribalda 		 * (Eg: .text.hot), they are generally after the main .text
9538652d44fSRicardo Ribalda 		 * section, and they shall not be used to calculate
9548652d44fSRicardo Ribalda 		 * image->start. So do not re-calculate image->start if it
9558652d44fSRicardo Ribalda 		 * is not set to the initial value, and warn the user so they
9568652d44fSRicardo Ribalda 		 * have a chance to fix their purgatory's linker script.
9578652d44fSRicardo Ribalda 		 */
958f1b1cca3SPhilipp Rudo 		if (sechdrs[i].sh_flags & SHF_EXECINSTR &&
959f1b1cca3SPhilipp Rudo 		    pi->ehdr->e_entry >= sechdrs[i].sh_addr &&
960f1b1cca3SPhilipp Rudo 		    pi->ehdr->e_entry < (sechdrs[i].sh_addr
9618652d44fSRicardo Ribalda 					 + sechdrs[i].sh_size) &&
9628652d44fSRicardo Ribalda 		    !WARN_ON(kbuf->image->start != pi->ehdr->e_entry)) {
963f1b1cca3SPhilipp Rudo 			kbuf->image->start -= sechdrs[i].sh_addr;
964620f697cSPhilipp Rudo 			kbuf->image->start += kbuf->mem + offset;
965f1b1cca3SPhilipp Rudo 		}
966f1b1cca3SPhilipp Rudo 
9678da0b724SPhilipp Rudo 		src = (void *)pi->ehdr + sechdrs[i].sh_offset;
968620f697cSPhilipp Rudo 		dst = pi->purgatory_buf + offset;
969620f697cSPhilipp Rudo 		memcpy(dst, src, sechdrs[i].sh_size);
970620f697cSPhilipp Rudo 
971620f697cSPhilipp Rudo 		sechdrs[i].sh_addr = kbuf->mem + offset;
9728da0b724SPhilipp Rudo 		sechdrs[i].sh_offset = offset;
973620f697cSPhilipp Rudo 		offset += sechdrs[i].sh_size;
974a43cac0dSDave Young 	}
975a43cac0dSDave Young 
97693045705SPhilipp Rudo 	return 0;
977a43cac0dSDave Young }
978a43cac0dSDave Young 
kexec_apply_relocations(struct kimage * image)979a43cac0dSDave Young static int kexec_apply_relocations(struct kimage *image)
980a43cac0dSDave Young {
981a43cac0dSDave Young 	int i, ret;
982a43cac0dSDave Young 	struct purgatory_info *pi = &image->purgatory_info;
9838aec395bSPhilipp Rudo 	const Elf_Shdr *sechdrs;
984a43cac0dSDave Young 
9858aec395bSPhilipp Rudo 	sechdrs = (void *)pi->ehdr + pi->ehdr->e_shoff;
9868aec395bSPhilipp Rudo 
987a43cac0dSDave Young 	for (i = 0; i < pi->ehdr->e_shnum; i++) {
9888aec395bSPhilipp Rudo 		const Elf_Shdr *relsec;
9898aec395bSPhilipp Rudo 		const Elf_Shdr *symtab;
9908aec395bSPhilipp Rudo 		Elf_Shdr *section;
991a43cac0dSDave Young 
9928aec395bSPhilipp Rudo 		relsec = sechdrs + i;
9938aec395bSPhilipp Rudo 
9948aec395bSPhilipp Rudo 		if (relsec->sh_type != SHT_RELA &&
9958aec395bSPhilipp Rudo 		    relsec->sh_type != SHT_REL)
996a43cac0dSDave Young 			continue;
997a43cac0dSDave Young 
998a43cac0dSDave Young 		/*
999a43cac0dSDave Young 		 * For section of type SHT_RELA/SHT_REL,
1000a43cac0dSDave Young 		 * ->sh_link contains section header index of associated
1001a43cac0dSDave Young 		 * symbol table. And ->sh_info contains section header
1002a43cac0dSDave Young 		 * index of section to which relocations apply.
1003a43cac0dSDave Young 		 */
10048aec395bSPhilipp Rudo 		if (relsec->sh_info >= pi->ehdr->e_shnum ||
10058aec395bSPhilipp Rudo 		    relsec->sh_link >= pi->ehdr->e_shnum)
1006a43cac0dSDave Young 			return -ENOEXEC;
1007a43cac0dSDave Young 
10088aec395bSPhilipp Rudo 		section = pi->sechdrs + relsec->sh_info;
10098aec395bSPhilipp Rudo 		symtab = sechdrs + relsec->sh_link;
1010a43cac0dSDave Young 
1011a43cac0dSDave Young 		if (!(section->sh_flags & SHF_ALLOC))
1012a43cac0dSDave Young 			continue;
1013a43cac0dSDave Young 
1014a43cac0dSDave Young 		/*
1015a43cac0dSDave Young 		 * symtab->sh_link contain section header index of associated
1016a43cac0dSDave Young 		 * string table.
1017a43cac0dSDave Young 		 */
1018a43cac0dSDave Young 		if (symtab->sh_link >= pi->ehdr->e_shnum)
1019a43cac0dSDave Young 			/* Invalid section number? */
1020a43cac0dSDave Young 			continue;
1021a43cac0dSDave Young 
1022a43cac0dSDave Young 		/*
1023a43cac0dSDave Young 		 * Respective architecture needs to provide support for applying
1024a43cac0dSDave Young 		 * relocations of type SHT_RELA/SHT_REL.
1025a43cac0dSDave Young 		 */
10268aec395bSPhilipp Rudo 		if (relsec->sh_type == SHT_RELA)
10278aec395bSPhilipp Rudo 			ret = arch_kexec_apply_relocations_add(pi, section,
10288aec395bSPhilipp Rudo 							       relsec, symtab);
10298aec395bSPhilipp Rudo 		else if (relsec->sh_type == SHT_REL)
10308aec395bSPhilipp Rudo 			ret = arch_kexec_apply_relocations(pi, section,
10318aec395bSPhilipp Rudo 							   relsec, symtab);
1032a43cac0dSDave Young 		if (ret)
1033a43cac0dSDave Young 			return ret;
1034a43cac0dSDave Young 	}
1035a43cac0dSDave Young 
1036a43cac0dSDave Young 	return 0;
1037a43cac0dSDave Young }
1038a43cac0dSDave Young 
10393be3f61dSPhilipp Rudo /*
10403be3f61dSPhilipp Rudo  * kexec_load_purgatory - Load and relocate the purgatory object.
10413be3f61dSPhilipp Rudo  * @image:	Image to add the purgatory to.
10423be3f61dSPhilipp Rudo  * @kbuf:	Memory parameters to use.
10433be3f61dSPhilipp Rudo  *
10443be3f61dSPhilipp Rudo  * Allocates the memory needed for image->purgatory_info.sechdrs and
10453be3f61dSPhilipp Rudo  * image->purgatory_info.purgatory_buf/kbuf->buffer. Caller is responsible
10463be3f61dSPhilipp Rudo  * to free the memory after use.
10473be3f61dSPhilipp Rudo  *
10483be3f61dSPhilipp Rudo  * Return: 0 on success, negative errno on error.
10493be3f61dSPhilipp Rudo  */
kexec_load_purgatory(struct kimage * image,struct kexec_buf * kbuf)10503be3f61dSPhilipp Rudo int kexec_load_purgatory(struct kimage *image, struct kexec_buf *kbuf)
1051a43cac0dSDave Young {
1052a43cac0dSDave Young 	struct purgatory_info *pi = &image->purgatory_info;
1053a43cac0dSDave Young 	int ret;
1054a43cac0dSDave Young 
1055a43cac0dSDave Young 	if (kexec_purgatory_size <= 0)
1056a43cac0dSDave Young 		return -EINVAL;
1057a43cac0dSDave Young 
105865c225d3SPhilipp Rudo 	pi->ehdr = (const Elf_Ehdr *)kexec_purgatory;
1059a43cac0dSDave Young 
10603be3f61dSPhilipp Rudo 	ret = kexec_purgatory_setup_kbuf(pi, kbuf);
1061a43cac0dSDave Young 	if (ret)
1062a43cac0dSDave Young 		return ret;
1063a43cac0dSDave Young 
10643be3f61dSPhilipp Rudo 	ret = kexec_purgatory_setup_sechdrs(pi, kbuf);
106593045705SPhilipp Rudo 	if (ret)
106693045705SPhilipp Rudo 		goto out_free_kbuf;
106793045705SPhilipp Rudo 
1068a43cac0dSDave Young 	ret = kexec_apply_relocations(image);
1069a43cac0dSDave Young 	if (ret)
1070a43cac0dSDave Young 		goto out;
1071a43cac0dSDave Young 
1072a43cac0dSDave Young 	return 0;
1073a43cac0dSDave Young out:
1074a43cac0dSDave Young 	vfree(pi->sechdrs);
1075070c43eeSThiago Jung Bauermann 	pi->sechdrs = NULL;
107693045705SPhilipp Rudo out_free_kbuf:
1077a43cac0dSDave Young 	vfree(pi->purgatory_buf);
1078070c43eeSThiago Jung Bauermann 	pi->purgatory_buf = NULL;
1079a43cac0dSDave Young 	return ret;
1080a43cac0dSDave Young }
1081a43cac0dSDave Young 
1082961d921aSPhilipp Rudo /*
1083961d921aSPhilipp Rudo  * kexec_purgatory_find_symbol - find a symbol in the purgatory
1084961d921aSPhilipp Rudo  * @pi:		Purgatory to search in.
1085961d921aSPhilipp Rudo  * @name:	Name of the symbol.
1086961d921aSPhilipp Rudo  *
1087961d921aSPhilipp Rudo  * Return: pointer to symbol in read-only symtab on success, NULL on error.
1088961d921aSPhilipp Rudo  */
kexec_purgatory_find_symbol(struct purgatory_info * pi,const char * name)1089961d921aSPhilipp Rudo static const Elf_Sym *kexec_purgatory_find_symbol(struct purgatory_info *pi,
1090a43cac0dSDave Young 						  const char *name)
1091a43cac0dSDave Young {
1092961d921aSPhilipp Rudo 	const Elf_Shdr *sechdrs;
109365c225d3SPhilipp Rudo 	const Elf_Ehdr *ehdr;
1094961d921aSPhilipp Rudo 	const Elf_Sym *syms;
1095a43cac0dSDave Young 	const char *strtab;
1096961d921aSPhilipp Rudo 	int i, k;
1097a43cac0dSDave Young 
1098961d921aSPhilipp Rudo 	if (!pi->ehdr)
1099a43cac0dSDave Young 		return NULL;
1100a43cac0dSDave Young 
1101a43cac0dSDave Young 	ehdr = pi->ehdr;
1102961d921aSPhilipp Rudo 	sechdrs = (void *)ehdr + ehdr->e_shoff;
1103a43cac0dSDave Young 
1104a43cac0dSDave Young 	for (i = 0; i < ehdr->e_shnum; i++) {
1105a43cac0dSDave Young 		if (sechdrs[i].sh_type != SHT_SYMTAB)
1106a43cac0dSDave Young 			continue;
1107a43cac0dSDave Young 
1108a43cac0dSDave Young 		if (sechdrs[i].sh_link >= ehdr->e_shnum)
1109a43cac0dSDave Young 			/* Invalid strtab section number */
1110a43cac0dSDave Young 			continue;
1111961d921aSPhilipp Rudo 		strtab = (void *)ehdr + sechdrs[sechdrs[i].sh_link].sh_offset;
1112961d921aSPhilipp Rudo 		syms = (void *)ehdr + sechdrs[i].sh_offset;
1113a43cac0dSDave Young 
1114a43cac0dSDave Young 		/* Go through symbols for a match */
1115a43cac0dSDave Young 		for (k = 0; k < sechdrs[i].sh_size/sizeof(Elf_Sym); k++) {
1116a43cac0dSDave Young 			if (ELF_ST_BIND(syms[k].st_info) != STB_GLOBAL)
1117a43cac0dSDave Young 				continue;
1118a43cac0dSDave Young 
1119a43cac0dSDave Young 			if (strcmp(strtab + syms[k].st_name, name) != 0)
1120a43cac0dSDave Young 				continue;
1121a43cac0dSDave Young 
1122a43cac0dSDave Young 			if (syms[k].st_shndx == SHN_UNDEF ||
1123a43cac0dSDave Young 			    syms[k].st_shndx >= ehdr->e_shnum) {
1124a43cac0dSDave Young 				pr_debug("Symbol: %s has bad section index %d.\n",
1125a43cac0dSDave Young 						name, syms[k].st_shndx);
1126a43cac0dSDave Young 				return NULL;
1127a43cac0dSDave Young 			}
1128a43cac0dSDave Young 
1129a43cac0dSDave Young 			/* Found the symbol we are looking for */
1130a43cac0dSDave Young 			return &syms[k];
1131a43cac0dSDave Young 		}
1132a43cac0dSDave Young 	}
1133a43cac0dSDave Young 
1134a43cac0dSDave Young 	return NULL;
1135a43cac0dSDave Young }
1136a43cac0dSDave Young 
kexec_purgatory_get_symbol_addr(struct kimage * image,const char * name)1137a43cac0dSDave Young void *kexec_purgatory_get_symbol_addr(struct kimage *image, const char *name)
1138a43cac0dSDave Young {
1139a43cac0dSDave Young 	struct purgatory_info *pi = &image->purgatory_info;
1140961d921aSPhilipp Rudo 	const Elf_Sym *sym;
1141a43cac0dSDave Young 	Elf_Shdr *sechdr;
1142a43cac0dSDave Young 
1143a43cac0dSDave Young 	sym = kexec_purgatory_find_symbol(pi, name);
1144a43cac0dSDave Young 	if (!sym)
1145a43cac0dSDave Young 		return ERR_PTR(-EINVAL);
1146a43cac0dSDave Young 
1147a43cac0dSDave Young 	sechdr = &pi->sechdrs[sym->st_shndx];
1148a43cac0dSDave Young 
1149a43cac0dSDave Young 	/*
1150a43cac0dSDave Young 	 * Returns the address where symbol will finally be loaded after
1151a43cac0dSDave Young 	 * kexec_load_segment()
1152a43cac0dSDave Young 	 */
1153a43cac0dSDave Young 	return (void *)(sechdr->sh_addr + sym->st_value);
1154a43cac0dSDave Young }
1155a43cac0dSDave Young 
1156a43cac0dSDave Young /*
1157a43cac0dSDave Young  * Get or set value of a symbol. If "get_value" is true, symbol value is
1158a43cac0dSDave Young  * returned in buf otherwise symbol value is set based on value in buf.
1159a43cac0dSDave Young  */
kexec_purgatory_get_set_symbol(struct kimage * image,const char * name,void * buf,unsigned int size,bool get_value)1160a43cac0dSDave Young int kexec_purgatory_get_set_symbol(struct kimage *image, const char *name,
1161a43cac0dSDave Young 				   void *buf, unsigned int size, bool get_value)
1162a43cac0dSDave Young {
1163a43cac0dSDave Young 	struct purgatory_info *pi = &image->purgatory_info;
1164961d921aSPhilipp Rudo 	const Elf_Sym *sym;
1165961d921aSPhilipp Rudo 	Elf_Shdr *sec;
1166a43cac0dSDave Young 	char *sym_buf;
1167a43cac0dSDave Young 
1168a43cac0dSDave Young 	sym = kexec_purgatory_find_symbol(pi, name);
1169a43cac0dSDave Young 	if (!sym)
1170a43cac0dSDave Young 		return -EINVAL;
1171a43cac0dSDave Young 
1172a43cac0dSDave Young 	if (sym->st_size != size) {
1173a43cac0dSDave Young 		pr_err("symbol %s size mismatch: expected %lu actual %u\n",
1174a43cac0dSDave Young 		       name, (unsigned long)sym->st_size, size);
1175a43cac0dSDave Young 		return -EINVAL;
1176a43cac0dSDave Young 	}
1177a43cac0dSDave Young 
1178961d921aSPhilipp Rudo 	sec = pi->sechdrs + sym->st_shndx;
1179a43cac0dSDave Young 
1180961d921aSPhilipp Rudo 	if (sec->sh_type == SHT_NOBITS) {
1181a43cac0dSDave Young 		pr_err("symbol %s is in a bss section. Cannot %s\n", name,
1182a43cac0dSDave Young 		       get_value ? "get" : "set");
1183a43cac0dSDave Young 		return -EINVAL;
1184a43cac0dSDave Young 	}
1185a43cac0dSDave Young 
11868da0b724SPhilipp Rudo 	sym_buf = (char *)pi->purgatory_buf + sec->sh_offset + sym->st_value;
1187a43cac0dSDave Young 
1188a43cac0dSDave Young 	if (get_value)
1189a43cac0dSDave Young 		memcpy((void *)buf, sym_buf, size);
1190a43cac0dSDave Young 	else
1191a43cac0dSDave Young 		memcpy((void *)sym_buf, buf, size);
1192a43cac0dSDave Young 
1193a43cac0dSDave Young 	return 0;
1194a43cac0dSDave Young }
1195e6265fe7SEric DeVolder #endif /* CONFIG_ARCH_SUPPORTS_KEXEC_PURGATORY */
1196