// SPDX-License-Identifier: GPL-2.0-only
/*
 * powerpc code to implement the kexec_file_load syscall
 *
 * Copyright (C) 2004  Adam Litke (agl@us.ibm.com)
 * Copyright (C) 2004  IBM Corp.
 * Copyright (C) 2004,2005  Milton D Miller II, IBM Corporation
 * Copyright (C) 2005  R Sharada (sharada@in.ibm.com)
 * Copyright (C) 2006  Mohan Kumar M (mohan@in.ibm.com)
 * Copyright (C) 2016  IBM Corporation
 *
 * Based on kexec-tools' kexec-elf-ppc64.c, fs2dt.c.
 * Heavily modified for the kernel by
 * Thiago Jung Bauermann <bauerman@linux.vnet.ibm.com>.
 */
16*4882a593Smuzhiyun
17*4882a593Smuzhiyun #include <linux/slab.h>
18*4882a593Smuzhiyun #include <linux/kexec.h>
19*4882a593Smuzhiyun #include <linux/of_fdt.h>
20*4882a593Smuzhiyun #include <linux/libfdt.h>
21*4882a593Smuzhiyun #include <asm/setup.h>
22*4882a593Smuzhiyun #include <asm/ima.h>
23*4882a593Smuzhiyun
24*4882a593Smuzhiyun #define SLAVE_CODE_SIZE 256 /* First 0x100 bytes */
25*4882a593Smuzhiyun
26*4882a593Smuzhiyun /**
27*4882a593Smuzhiyun * setup_kdump_cmdline - Prepend "elfcorehdr=<addr> " to command line
28*4882a593Smuzhiyun * of kdump kernel for exporting the core.
29*4882a593Smuzhiyun * @image: Kexec image
30*4882a593Smuzhiyun * @cmdline: Command line parameters to update.
31*4882a593Smuzhiyun * @cmdline_len: Length of the cmdline parameters.
32*4882a593Smuzhiyun *
33*4882a593Smuzhiyun * kdump segment must be setup before calling this function.
34*4882a593Smuzhiyun *
35*4882a593Smuzhiyun * Returns new cmdline buffer for kdump kernel on success, NULL otherwise.
36*4882a593Smuzhiyun */
setup_kdump_cmdline(struct kimage * image,char * cmdline,unsigned long cmdline_len)37*4882a593Smuzhiyun char *setup_kdump_cmdline(struct kimage *image, char *cmdline,
38*4882a593Smuzhiyun unsigned long cmdline_len)
39*4882a593Smuzhiyun {
40*4882a593Smuzhiyun int elfcorehdr_strlen;
41*4882a593Smuzhiyun char *cmdline_ptr;
42*4882a593Smuzhiyun
43*4882a593Smuzhiyun cmdline_ptr = kzalloc(COMMAND_LINE_SIZE, GFP_KERNEL);
44*4882a593Smuzhiyun if (!cmdline_ptr)
45*4882a593Smuzhiyun return NULL;
46*4882a593Smuzhiyun
47*4882a593Smuzhiyun elfcorehdr_strlen = sprintf(cmdline_ptr, "elfcorehdr=0x%lx ",
48*4882a593Smuzhiyun image->arch.elfcorehdr_addr);
49*4882a593Smuzhiyun
50*4882a593Smuzhiyun if (elfcorehdr_strlen + cmdline_len > COMMAND_LINE_SIZE) {
51*4882a593Smuzhiyun pr_err("Appending elfcorehdr=<addr> exceeds cmdline size\n");
52*4882a593Smuzhiyun kfree(cmdline_ptr);
53*4882a593Smuzhiyun return NULL;
54*4882a593Smuzhiyun }
55*4882a593Smuzhiyun
56*4882a593Smuzhiyun memcpy(cmdline_ptr + elfcorehdr_strlen, cmdline, cmdline_len);
57*4882a593Smuzhiyun // Ensure it's nul terminated
58*4882a593Smuzhiyun cmdline_ptr[COMMAND_LINE_SIZE - 1] = '\0';
59*4882a593Smuzhiyun return cmdline_ptr;
60*4882a593Smuzhiyun }
61*4882a593Smuzhiyun
62*4882a593Smuzhiyun /**
63*4882a593Smuzhiyun * setup_purgatory - initialize the purgatory's global variables
64*4882a593Smuzhiyun * @image: kexec image.
65*4882a593Smuzhiyun * @slave_code: Slave code for the purgatory.
66*4882a593Smuzhiyun * @fdt: Flattened device tree for the next kernel.
67*4882a593Smuzhiyun * @kernel_load_addr: Address where the kernel is loaded.
68*4882a593Smuzhiyun * @fdt_load_addr: Address where the flattened device tree is loaded.
69*4882a593Smuzhiyun *
70*4882a593Smuzhiyun * Return: 0 on success, or negative errno on error.
71*4882a593Smuzhiyun */
setup_purgatory(struct kimage * image,const void * slave_code,const void * fdt,unsigned long kernel_load_addr,unsigned long fdt_load_addr)72*4882a593Smuzhiyun int setup_purgatory(struct kimage *image, const void *slave_code,
73*4882a593Smuzhiyun const void *fdt, unsigned long kernel_load_addr,
74*4882a593Smuzhiyun unsigned long fdt_load_addr)
75*4882a593Smuzhiyun {
76*4882a593Smuzhiyun unsigned int *slave_code_buf, master_entry;
77*4882a593Smuzhiyun int ret;
78*4882a593Smuzhiyun
79*4882a593Smuzhiyun slave_code_buf = kmalloc(SLAVE_CODE_SIZE, GFP_KERNEL);
80*4882a593Smuzhiyun if (!slave_code_buf)
81*4882a593Smuzhiyun return -ENOMEM;
82*4882a593Smuzhiyun
83*4882a593Smuzhiyun /* Get the slave code from the new kernel and put it in purgatory. */
84*4882a593Smuzhiyun ret = kexec_purgatory_get_set_symbol(image, "purgatory_start",
85*4882a593Smuzhiyun slave_code_buf, SLAVE_CODE_SIZE,
86*4882a593Smuzhiyun true);
87*4882a593Smuzhiyun if (ret) {
88*4882a593Smuzhiyun kfree(slave_code_buf);
89*4882a593Smuzhiyun return ret;
90*4882a593Smuzhiyun }
91*4882a593Smuzhiyun
92*4882a593Smuzhiyun master_entry = slave_code_buf[0];
93*4882a593Smuzhiyun memcpy(slave_code_buf, slave_code, SLAVE_CODE_SIZE);
94*4882a593Smuzhiyun slave_code_buf[0] = master_entry;
95*4882a593Smuzhiyun ret = kexec_purgatory_get_set_symbol(image, "purgatory_start",
96*4882a593Smuzhiyun slave_code_buf, SLAVE_CODE_SIZE,
97*4882a593Smuzhiyun false);
98*4882a593Smuzhiyun kfree(slave_code_buf);
99*4882a593Smuzhiyun
100*4882a593Smuzhiyun ret = kexec_purgatory_get_set_symbol(image, "kernel", &kernel_load_addr,
101*4882a593Smuzhiyun sizeof(kernel_load_addr), false);
102*4882a593Smuzhiyun if (ret)
103*4882a593Smuzhiyun return ret;
104*4882a593Smuzhiyun ret = kexec_purgatory_get_set_symbol(image, "dt_offset", &fdt_load_addr,
105*4882a593Smuzhiyun sizeof(fdt_load_addr), false);
106*4882a593Smuzhiyun if (ret)
107*4882a593Smuzhiyun return ret;
108*4882a593Smuzhiyun
109*4882a593Smuzhiyun return 0;
110*4882a593Smuzhiyun }
111*4882a593Smuzhiyun
/**
 * delete_fdt_mem_rsv - delete memory reservation with given address and size
 * @fdt:   Flattened device tree whose memory reservations are searched.
 * @start: Start address the reservation must have.
 * @size:  Size the reservation must have.
 *
 * Walks the memory reservation entries in order and removes the first one
 * whose address and size both match exactly. Entries that only overlap the
 * range are left untouched.
 *
 * Return: 0 on success, -ENOENT if no entry matches, or -EINVAL if an entry
 * cannot be read or the matching entry cannot be deleted.
 */
int delete_fdt_mem_rsv(void *fdt, unsigned long start, unsigned long size)
{
	int total = fdt_num_mem_rsv(fdt);
	int idx;

	for (idx = 0; idx < total; idx++) {
		uint64_t entry_addr, entry_len;

		if (fdt_get_mem_rsv(fdt, idx, &entry_addr, &entry_len)) {
			pr_err("Malformed device tree.\n");
			return -EINVAL;
		}

		/* Not the reservation we are after; keep looking. */
		if (entry_addr != start || entry_len != size)
			continue;

		if (fdt_del_mem_rsv(fdt, idx)) {
			pr_err("Error deleting device tree reservation.\n");
			return -EINVAL;
		}

		return 0;
	}

	return -ENOENT;
}
143*4882a593Smuzhiyun
144*4882a593Smuzhiyun /*
145*4882a593Smuzhiyun * setup_new_fdt - modify /chosen and memory reservation for the next kernel
146*4882a593Smuzhiyun * @image: kexec image being loaded.
147*4882a593Smuzhiyun * @fdt: Flattened device tree for the next kernel.
148*4882a593Smuzhiyun * @initrd_load_addr: Address where the next initrd will be loaded.
149*4882a593Smuzhiyun * @initrd_len: Size of the next initrd, or 0 if there will be none.
150*4882a593Smuzhiyun * @cmdline: Command line for the next kernel, or NULL if there will
151*4882a593Smuzhiyun * be none.
152*4882a593Smuzhiyun *
153*4882a593Smuzhiyun * Return: 0 on success, or negative errno on error.
154*4882a593Smuzhiyun */
setup_new_fdt(const struct kimage * image,void * fdt,unsigned long initrd_load_addr,unsigned long initrd_len,const char * cmdline)155*4882a593Smuzhiyun int setup_new_fdt(const struct kimage *image, void *fdt,
156*4882a593Smuzhiyun unsigned long initrd_load_addr, unsigned long initrd_len,
157*4882a593Smuzhiyun const char *cmdline)
158*4882a593Smuzhiyun {
159*4882a593Smuzhiyun int ret, chosen_node;
160*4882a593Smuzhiyun const void *prop;
161*4882a593Smuzhiyun
162*4882a593Smuzhiyun /* Remove memory reservation for the current device tree. */
163*4882a593Smuzhiyun ret = delete_fdt_mem_rsv(fdt, __pa(initial_boot_params),
164*4882a593Smuzhiyun fdt_totalsize(initial_boot_params));
165*4882a593Smuzhiyun if (ret == 0)
166*4882a593Smuzhiyun pr_debug("Removed old device tree reservation.\n");
167*4882a593Smuzhiyun else if (ret != -ENOENT)
168*4882a593Smuzhiyun return ret;
169*4882a593Smuzhiyun
170*4882a593Smuzhiyun chosen_node = fdt_path_offset(fdt, "/chosen");
171*4882a593Smuzhiyun if (chosen_node == -FDT_ERR_NOTFOUND) {
172*4882a593Smuzhiyun chosen_node = fdt_add_subnode(fdt, fdt_path_offset(fdt, "/"),
173*4882a593Smuzhiyun "chosen");
174*4882a593Smuzhiyun if (chosen_node < 0) {
175*4882a593Smuzhiyun pr_err("Error creating /chosen.\n");
176*4882a593Smuzhiyun return -EINVAL;
177*4882a593Smuzhiyun }
178*4882a593Smuzhiyun } else if (chosen_node < 0) {
179*4882a593Smuzhiyun pr_err("Malformed device tree: error reading /chosen.\n");
180*4882a593Smuzhiyun return -EINVAL;
181*4882a593Smuzhiyun }
182*4882a593Smuzhiyun
183*4882a593Smuzhiyun /* Did we boot using an initrd? */
184*4882a593Smuzhiyun prop = fdt_getprop(fdt, chosen_node, "linux,initrd-start", NULL);
185*4882a593Smuzhiyun if (prop) {
186*4882a593Smuzhiyun uint64_t tmp_start, tmp_end, tmp_size;
187*4882a593Smuzhiyun
188*4882a593Smuzhiyun tmp_start = fdt64_to_cpu(*((const fdt64_t *) prop));
189*4882a593Smuzhiyun
190*4882a593Smuzhiyun prop = fdt_getprop(fdt, chosen_node, "linux,initrd-end", NULL);
191*4882a593Smuzhiyun if (!prop) {
192*4882a593Smuzhiyun pr_err("Malformed device tree.\n");
193*4882a593Smuzhiyun return -EINVAL;
194*4882a593Smuzhiyun }
195*4882a593Smuzhiyun tmp_end = fdt64_to_cpu(*((const fdt64_t *) prop));
196*4882a593Smuzhiyun
197*4882a593Smuzhiyun /*
198*4882a593Smuzhiyun * kexec reserves exact initrd size, while firmware may
199*4882a593Smuzhiyun * reserve a multiple of PAGE_SIZE, so check for both.
200*4882a593Smuzhiyun */
201*4882a593Smuzhiyun tmp_size = tmp_end - tmp_start;
202*4882a593Smuzhiyun ret = delete_fdt_mem_rsv(fdt, tmp_start, tmp_size);
203*4882a593Smuzhiyun if (ret == -ENOENT)
204*4882a593Smuzhiyun ret = delete_fdt_mem_rsv(fdt, tmp_start,
205*4882a593Smuzhiyun round_up(tmp_size, PAGE_SIZE));
206*4882a593Smuzhiyun if (ret == 0)
207*4882a593Smuzhiyun pr_debug("Removed old initrd reservation.\n");
208*4882a593Smuzhiyun else if (ret != -ENOENT)
209*4882a593Smuzhiyun return ret;
210*4882a593Smuzhiyun
211*4882a593Smuzhiyun /* If there's no new initrd, delete the old initrd's info. */
212*4882a593Smuzhiyun if (initrd_len == 0) {
213*4882a593Smuzhiyun ret = fdt_delprop(fdt, chosen_node,
214*4882a593Smuzhiyun "linux,initrd-start");
215*4882a593Smuzhiyun if (ret) {
216*4882a593Smuzhiyun pr_err("Error deleting linux,initrd-start.\n");
217*4882a593Smuzhiyun return -EINVAL;
218*4882a593Smuzhiyun }
219*4882a593Smuzhiyun
220*4882a593Smuzhiyun ret = fdt_delprop(fdt, chosen_node, "linux,initrd-end");
221*4882a593Smuzhiyun if (ret) {
222*4882a593Smuzhiyun pr_err("Error deleting linux,initrd-end.\n");
223*4882a593Smuzhiyun return -EINVAL;
224*4882a593Smuzhiyun }
225*4882a593Smuzhiyun }
226*4882a593Smuzhiyun }
227*4882a593Smuzhiyun
228*4882a593Smuzhiyun if (initrd_len) {
229*4882a593Smuzhiyun ret = fdt_setprop_u64(fdt, chosen_node,
230*4882a593Smuzhiyun "linux,initrd-start",
231*4882a593Smuzhiyun initrd_load_addr);
232*4882a593Smuzhiyun if (ret < 0)
233*4882a593Smuzhiyun goto err;
234*4882a593Smuzhiyun
235*4882a593Smuzhiyun /* initrd-end is the first address after the initrd image. */
236*4882a593Smuzhiyun ret = fdt_setprop_u64(fdt, chosen_node, "linux,initrd-end",
237*4882a593Smuzhiyun initrd_load_addr + initrd_len);
238*4882a593Smuzhiyun if (ret < 0)
239*4882a593Smuzhiyun goto err;
240*4882a593Smuzhiyun
241*4882a593Smuzhiyun ret = fdt_add_mem_rsv(fdt, initrd_load_addr, initrd_len);
242*4882a593Smuzhiyun if (ret) {
243*4882a593Smuzhiyun pr_err("Error reserving initrd memory: %s\n",
244*4882a593Smuzhiyun fdt_strerror(ret));
245*4882a593Smuzhiyun return -EINVAL;
246*4882a593Smuzhiyun }
247*4882a593Smuzhiyun }
248*4882a593Smuzhiyun
249*4882a593Smuzhiyun if (cmdline != NULL) {
250*4882a593Smuzhiyun ret = fdt_setprop_string(fdt, chosen_node, "bootargs", cmdline);
251*4882a593Smuzhiyun if (ret < 0)
252*4882a593Smuzhiyun goto err;
253*4882a593Smuzhiyun } else {
254*4882a593Smuzhiyun ret = fdt_delprop(fdt, chosen_node, "bootargs");
255*4882a593Smuzhiyun if (ret && ret != -FDT_ERR_NOTFOUND) {
256*4882a593Smuzhiyun pr_err("Error deleting bootargs.\n");
257*4882a593Smuzhiyun return -EINVAL;
258*4882a593Smuzhiyun }
259*4882a593Smuzhiyun }
260*4882a593Smuzhiyun
261*4882a593Smuzhiyun if (image->type == KEXEC_TYPE_CRASH) {
262*4882a593Smuzhiyun /*
263*4882a593Smuzhiyun * Avoid elfcorehdr from being stomped on in kdump kernel by
264*4882a593Smuzhiyun * setting up memory reserve map.
265*4882a593Smuzhiyun */
266*4882a593Smuzhiyun ret = fdt_add_mem_rsv(fdt, image->arch.elfcorehdr_addr,
267*4882a593Smuzhiyun image->arch.elf_headers_sz);
268*4882a593Smuzhiyun if (ret) {
269*4882a593Smuzhiyun pr_err("Error reserving elfcorehdr memory: %s\n",
270*4882a593Smuzhiyun fdt_strerror(ret));
271*4882a593Smuzhiyun goto err;
272*4882a593Smuzhiyun }
273*4882a593Smuzhiyun }
274*4882a593Smuzhiyun
275*4882a593Smuzhiyun ret = setup_ima_buffer(image, fdt, chosen_node);
276*4882a593Smuzhiyun if (ret) {
277*4882a593Smuzhiyun pr_err("Error setting up the new device tree.\n");
278*4882a593Smuzhiyun return ret;
279*4882a593Smuzhiyun }
280*4882a593Smuzhiyun
281*4882a593Smuzhiyun ret = fdt_setprop(fdt, chosen_node, "linux,booted-from-kexec", NULL, 0);
282*4882a593Smuzhiyun if (ret)
283*4882a593Smuzhiyun goto err;
284*4882a593Smuzhiyun
285*4882a593Smuzhiyun return 0;
286*4882a593Smuzhiyun
287*4882a593Smuzhiyun err:
288*4882a593Smuzhiyun pr_err("Error setting up the new device tree.\n");
289*4882a593Smuzhiyun return -EINVAL;
290*4882a593Smuzhiyun }
291