]> git.proxmox.com Git - mirror_qemu.git/blob - hw/ppc/spapr_nvdimm.c
Merge remote-tracking branch 'remotes/vivier2/tags/trivial-branch-for-6.0-pull-reques...
[mirror_qemu.git] / hw / ppc / spapr_nvdimm.c
1 /*
2 * QEMU PAPR Storage Class Memory Interfaces
3 *
4 * Copyright (c) 2019-2020, IBM Corporation.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a copy
7 * of this software and associated documentation files (the "Software"), to deal
8 * in the Software without restriction, including without limitation the rights
9 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
10 * copies of the Software, and to permit persons to whom the Software is
11 * furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice shall be included in
14 * all copies or substantial portions of the Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
22 * THE SOFTWARE.
23 */
24 #include "qemu/osdep.h"
25 #include "qapi/error.h"
26 #include "hw/ppc/spapr_drc.h"
27 #include "hw/ppc/spapr_nvdimm.h"
28 #include "hw/mem/nvdimm.h"
29 #include "qemu/nvdimm-utils.h"
30 #include "qemu/option.h"
31 #include "hw/ppc/fdt.h"
32 #include "qemu/range.h"
33 #include "sysemu/sysemu.h"
34 #include "hw/ppc/spapr_numa.h"
35
36 bool spapr_nvdimm_validate(HotplugHandler *hotplug_dev, NVDIMMDevice *nvdimm,
37 uint64_t size, Error **errp)
38 {
39 const MachineClass *mc = MACHINE_GET_CLASS(hotplug_dev);
40 const MachineState *ms = MACHINE(hotplug_dev);
41 const char *nvdimm_opt = qemu_opt_get(qemu_get_machine_opts(), "nvdimm");
42 g_autofree char *uuidstr = NULL;
43 QemuUUID uuid;
44 int ret;
45
46 if (!mc->nvdimm_supported) {
47 error_setg(errp, "NVDIMM hotplug not supported for this machine");
48 return false;
49 }
50
51 /*
52 * NVDIMM support went live in 5.1 without considering that, in
53 * other archs, the user needs to enable NVDIMM support with the
54 * 'nvdimm' machine option and the default behavior is NVDIMM
55 * support disabled. It is too late to roll back to the standard
56 * behavior without breaking 5.1 guests. What we can do is to
57 * ensure that, if the user sets nvdimm=off, we error out
58 * regardless of being 5.1 or newer.
59 */
60 if (!ms->nvdimms_state->is_enabled && nvdimm_opt) {
61 error_setg(errp, "nvdimm device found but 'nvdimm=off' was set");
62 return false;
63 }
64
65 if (object_property_get_int(OBJECT(nvdimm), NVDIMM_LABEL_SIZE_PROP,
66 &error_abort) == 0) {
67 error_setg(errp, "PAPR requires NVDIMM devices to have label-size set");
68 return false;
69 }
70
71 if (size % SPAPR_MINIMUM_SCM_BLOCK_SIZE) {
72 error_setg(errp, "PAPR requires NVDIMM memory size (excluding label)"
73 " to be a multiple of %" PRIu64 "MB",
74 SPAPR_MINIMUM_SCM_BLOCK_SIZE / MiB);
75 return false;
76 }
77
78 uuidstr = object_property_get_str(OBJECT(nvdimm), NVDIMM_UUID_PROP,
79 &error_abort);
80 ret = qemu_uuid_parse(uuidstr, &uuid);
81 g_assert(!ret);
82
83 if (qemu_uuid_is_null(&uuid)) {
84 error_setg(errp, "NVDIMM device requires the uuid to be set");
85 return false;
86 }
87
88 return true;
89 }
90
91
92 void spapr_add_nvdimm(DeviceState *dev, uint64_t slot)
93 {
94 SpaprDrc *drc;
95 bool hotplugged = spapr_drc_hotplugged(dev);
96
97 drc = spapr_drc_by_id(TYPE_SPAPR_DRC_PMEM, slot);
98 g_assert(drc);
99
100 /*
101 * pc_dimm_get_free_slot() provided a free slot at pre-plug. The
102 * corresponding DRC is thus assumed to be attachable.
103 */
104 spapr_drc_attach(drc, dev);
105
106 if (hotplugged) {
107 spapr_hotplug_req_add_by_index(drc);
108 }
109 }
110
111 static int spapr_dt_nvdimm(SpaprMachineState *spapr, void *fdt,
112 int parent_offset, NVDIMMDevice *nvdimm)
113 {
114 int child_offset;
115 char *buf;
116 SpaprDrc *drc;
117 uint32_t drc_idx;
118 uint32_t node = object_property_get_uint(OBJECT(nvdimm), PC_DIMM_NODE_PROP,
119 &error_abort);
120 uint64_t slot = object_property_get_uint(OBJECT(nvdimm), PC_DIMM_SLOT_PROP,
121 &error_abort);
122 uint64_t lsize = nvdimm->label_size;
123 uint64_t size = object_property_get_int(OBJECT(nvdimm), PC_DIMM_SIZE_PROP,
124 NULL);
125
126 drc = spapr_drc_by_id(TYPE_SPAPR_DRC_PMEM, slot);
127 g_assert(drc);
128
129 drc_idx = spapr_drc_index(drc);
130
131 buf = g_strdup_printf("ibm,pmemory@%x", drc_idx);
132 child_offset = fdt_add_subnode(fdt, parent_offset, buf);
133 g_free(buf);
134
135 _FDT(child_offset);
136
137 _FDT((fdt_setprop_cell(fdt, child_offset, "reg", drc_idx)));
138 _FDT((fdt_setprop_string(fdt, child_offset, "compatible", "ibm,pmemory")));
139 _FDT((fdt_setprop_string(fdt, child_offset, "device_type", "ibm,pmemory")));
140
141 spapr_numa_write_associativity_dt(spapr, fdt, child_offset, node);
142
143 buf = qemu_uuid_unparse_strdup(&nvdimm->uuid);
144 _FDT((fdt_setprop_string(fdt, child_offset, "ibm,unit-guid", buf)));
145 g_free(buf);
146
147 _FDT((fdt_setprop_cell(fdt, child_offset, "ibm,my-drc-index", drc_idx)));
148
149 _FDT((fdt_setprop_u64(fdt, child_offset, "ibm,block-size",
150 SPAPR_MINIMUM_SCM_BLOCK_SIZE)));
151 _FDT((fdt_setprop_u64(fdt, child_offset, "ibm,number-of-blocks",
152 size / SPAPR_MINIMUM_SCM_BLOCK_SIZE)));
153 _FDT((fdt_setprop_cell(fdt, child_offset, "ibm,metadata-size", lsize)));
154
155 _FDT((fdt_setprop_string(fdt, child_offset, "ibm,pmem-application",
156 "operating-system")));
157 _FDT(fdt_setprop(fdt, child_offset, "ibm,cache-flush-required", NULL, 0));
158
159 return child_offset;
160 }
161
162 int spapr_pmem_dt_populate(SpaprDrc *drc, SpaprMachineState *spapr,
163 void *fdt, int *fdt_start_offset, Error **errp)
164 {
165 NVDIMMDevice *nvdimm = NVDIMM(drc->dev);
166
167 *fdt_start_offset = spapr_dt_nvdimm(spapr, fdt, 0, nvdimm);
168
169 return 0;
170 }
171
172 void spapr_dt_persistent_memory(SpaprMachineState *spapr, void *fdt)
173 {
174 int offset = fdt_subnode_offset(fdt, 0, "persistent-memory");
175 GSList *iter, *nvdimms = nvdimm_get_device_list();
176
177 if (offset < 0) {
178 offset = fdt_add_subnode(fdt, 0, "persistent-memory");
179 _FDT(offset);
180 _FDT((fdt_setprop_cell(fdt, offset, "#address-cells", 0x1)));
181 _FDT((fdt_setprop_cell(fdt, offset, "#size-cells", 0x0)));
182 _FDT((fdt_setprop_string(fdt, offset, "device_type",
183 "ibm,persistent-memory")));
184 }
185
186 /* Create DT entries for cold plugged NVDIMM devices */
187 for (iter = nvdimms; iter; iter = iter->next) {
188 NVDIMMDevice *nvdimm = iter->data;
189
190 spapr_dt_nvdimm(spapr, fdt, offset, nvdimm);
191 }
192 g_slist_free(nvdimms);
193
194 return;
195 }
196
197 static target_ulong h_scm_read_metadata(PowerPCCPU *cpu,
198 SpaprMachineState *spapr,
199 target_ulong opcode,
200 target_ulong *args)
201 {
202 uint32_t drc_index = args[0];
203 uint64_t offset = args[1];
204 uint64_t len = args[2];
205 SpaprDrc *drc = spapr_drc_by_index(drc_index);
206 NVDIMMDevice *nvdimm;
207 NVDIMMClass *ddc;
208 uint64_t data = 0;
209 uint8_t buf[8] = { 0 };
210
211 if (!drc || !drc->dev ||
212 spapr_drc_type(drc) != SPAPR_DR_CONNECTOR_TYPE_PMEM) {
213 return H_PARAMETER;
214 }
215
216 if (len != 1 && len != 2 &&
217 len != 4 && len != 8) {
218 return H_P3;
219 }
220
221 nvdimm = NVDIMM(drc->dev);
222 if ((offset + len < offset) ||
223 (nvdimm->label_size < len + offset)) {
224 return H_P2;
225 }
226
227 ddc = NVDIMM_GET_CLASS(nvdimm);
228 ddc->read_label_data(nvdimm, buf, len, offset);
229
230 switch (len) {
231 case 1:
232 data = ldub_p(buf);
233 break;
234 case 2:
235 data = lduw_be_p(buf);
236 break;
237 case 4:
238 data = ldl_be_p(buf);
239 break;
240 case 8:
241 data = ldq_be_p(buf);
242 break;
243 default:
244 g_assert_not_reached();
245 }
246
247 args[0] = data;
248
249 return H_SUCCESS;
250 }
251
252 static target_ulong h_scm_write_metadata(PowerPCCPU *cpu,
253 SpaprMachineState *spapr,
254 target_ulong opcode,
255 target_ulong *args)
256 {
257 uint32_t drc_index = args[0];
258 uint64_t offset = args[1];
259 uint64_t data = args[2];
260 uint64_t len = args[3];
261 SpaprDrc *drc = spapr_drc_by_index(drc_index);
262 NVDIMMDevice *nvdimm;
263 NVDIMMClass *ddc;
264 uint8_t buf[8] = { 0 };
265
266 if (!drc || !drc->dev ||
267 spapr_drc_type(drc) != SPAPR_DR_CONNECTOR_TYPE_PMEM) {
268 return H_PARAMETER;
269 }
270
271 if (len != 1 && len != 2 &&
272 len != 4 && len != 8) {
273 return H_P4;
274 }
275
276 nvdimm = NVDIMM(drc->dev);
277 if ((offset + len < offset) ||
278 (nvdimm->label_size < len + offset)) {
279 return H_P2;
280 }
281
282 switch (len) {
283 case 1:
284 if (data & 0xffffffffffffff00) {
285 return H_P2;
286 }
287 stb_p(buf, data);
288 break;
289 case 2:
290 if (data & 0xffffffffffff0000) {
291 return H_P2;
292 }
293 stw_be_p(buf, data);
294 break;
295 case 4:
296 if (data & 0xffffffff00000000) {
297 return H_P2;
298 }
299 stl_be_p(buf, data);
300 break;
301 case 8:
302 stq_be_p(buf, data);
303 break;
304 default:
305 g_assert_not_reached();
306 }
307
308 ddc = NVDIMM_GET_CLASS(nvdimm);
309 ddc->write_label_data(nvdimm, buf, len, offset);
310
311 return H_SUCCESS;
312 }
313
314 static target_ulong h_scm_bind_mem(PowerPCCPU *cpu, SpaprMachineState *spapr,
315 target_ulong opcode, target_ulong *args)
316 {
317 uint32_t drc_index = args[0];
318 uint64_t starting_idx = args[1];
319 uint64_t no_of_scm_blocks_to_bind = args[2];
320 uint64_t target_logical_mem_addr = args[3];
321 uint64_t continue_token = args[4];
322 uint64_t size;
323 uint64_t total_no_of_scm_blocks;
324 SpaprDrc *drc = spapr_drc_by_index(drc_index);
325 hwaddr addr;
326 NVDIMMDevice *nvdimm;
327
328 if (!drc || !drc->dev ||
329 spapr_drc_type(drc) != SPAPR_DR_CONNECTOR_TYPE_PMEM) {
330 return H_PARAMETER;
331 }
332
333 /*
334 * Currently continue token should be zero qemu has already bound
335 * everything and this hcall doesnt return H_BUSY.
336 */
337 if (continue_token > 0) {
338 return H_P5;
339 }
340
341 /* Currently qemu assigns the address. */
342 if (target_logical_mem_addr != 0xffffffffffffffff) {
343 return H_OVERLAP;
344 }
345
346 nvdimm = NVDIMM(drc->dev);
347
348 size = object_property_get_uint(OBJECT(nvdimm),
349 PC_DIMM_SIZE_PROP, &error_abort);
350
351 total_no_of_scm_blocks = size / SPAPR_MINIMUM_SCM_BLOCK_SIZE;
352
353 if (starting_idx > total_no_of_scm_blocks) {
354 return H_P2;
355 }
356
357 if (((starting_idx + no_of_scm_blocks_to_bind) < starting_idx) ||
358 ((starting_idx + no_of_scm_blocks_to_bind) > total_no_of_scm_blocks)) {
359 return H_P3;
360 }
361
362 addr = object_property_get_uint(OBJECT(nvdimm),
363 PC_DIMM_ADDR_PROP, &error_abort);
364
365 addr += starting_idx * SPAPR_MINIMUM_SCM_BLOCK_SIZE;
366
367 /* Already bound, Return target logical address in R5 */
368 args[1] = addr;
369 args[2] = no_of_scm_blocks_to_bind;
370
371 return H_SUCCESS;
372 }
373
374 static target_ulong h_scm_unbind_mem(PowerPCCPU *cpu, SpaprMachineState *spapr,
375 target_ulong opcode, target_ulong *args)
376 {
377 uint32_t drc_index = args[0];
378 uint64_t starting_scm_logical_addr = args[1];
379 uint64_t no_of_scm_blocks_to_unbind = args[2];
380 uint64_t continue_token = args[3];
381 uint64_t size_to_unbind;
382 Range blockrange = range_empty;
383 Range nvdimmrange = range_empty;
384 SpaprDrc *drc = spapr_drc_by_index(drc_index);
385 NVDIMMDevice *nvdimm;
386 uint64_t size, addr;
387
388 if (!drc || !drc->dev ||
389 spapr_drc_type(drc) != SPAPR_DR_CONNECTOR_TYPE_PMEM) {
390 return H_PARAMETER;
391 }
392
393 /* continue_token should be zero as this hcall doesn't return H_BUSY. */
394 if (continue_token > 0) {
395 return H_P4;
396 }
397
398 /* Check if starting_scm_logical_addr is block aligned */
399 if (!QEMU_IS_ALIGNED(starting_scm_logical_addr,
400 SPAPR_MINIMUM_SCM_BLOCK_SIZE)) {
401 return H_P2;
402 }
403
404 size_to_unbind = no_of_scm_blocks_to_unbind * SPAPR_MINIMUM_SCM_BLOCK_SIZE;
405 if (no_of_scm_blocks_to_unbind == 0 || no_of_scm_blocks_to_unbind !=
406 size_to_unbind / SPAPR_MINIMUM_SCM_BLOCK_SIZE) {
407 return H_P3;
408 }
409
410 nvdimm = NVDIMM(drc->dev);
411 size = object_property_get_int(OBJECT(nvdimm), PC_DIMM_SIZE_PROP,
412 &error_abort);
413 addr = object_property_get_int(OBJECT(nvdimm), PC_DIMM_ADDR_PROP,
414 &error_abort);
415
416 range_init_nofail(&nvdimmrange, addr, size);
417 range_init_nofail(&blockrange, starting_scm_logical_addr, size_to_unbind);
418
419 if (!range_contains_range(&nvdimmrange, &blockrange)) {
420 return H_P3;
421 }
422
423 args[1] = no_of_scm_blocks_to_unbind;
424
425 /* let unplug take care of actual unbind */
426 return H_SUCCESS;
427 }
428
429 #define H_UNBIND_SCOPE_ALL 0x1
430 #define H_UNBIND_SCOPE_DRC 0x2
431
432 static target_ulong h_scm_unbind_all(PowerPCCPU *cpu, SpaprMachineState *spapr,
433 target_ulong opcode, target_ulong *args)
434 {
435 uint64_t target_scope = args[0];
436 uint32_t drc_index = args[1];
437 uint64_t continue_token = args[2];
438 NVDIMMDevice *nvdimm;
439 uint64_t size;
440 uint64_t no_of_scm_blocks_unbound = 0;
441
442 /* continue_token should be zero as this hcall doesn't return H_BUSY. */
443 if (continue_token > 0) {
444 return H_P4;
445 }
446
447 if (target_scope == H_UNBIND_SCOPE_DRC) {
448 SpaprDrc *drc = spapr_drc_by_index(drc_index);
449
450 if (!drc || !drc->dev ||
451 spapr_drc_type(drc) != SPAPR_DR_CONNECTOR_TYPE_PMEM) {
452 return H_P2;
453 }
454
455 nvdimm = NVDIMM(drc->dev);
456 size = object_property_get_int(OBJECT(nvdimm), PC_DIMM_SIZE_PROP,
457 &error_abort);
458
459 no_of_scm_blocks_unbound = size / SPAPR_MINIMUM_SCM_BLOCK_SIZE;
460 } else if (target_scope == H_UNBIND_SCOPE_ALL) {
461 GSList *list, *nvdimms;
462
463 nvdimms = nvdimm_get_device_list();
464 for (list = nvdimms; list; list = list->next) {
465 nvdimm = list->data;
466 size = object_property_get_int(OBJECT(nvdimm), PC_DIMM_SIZE_PROP,
467 &error_abort);
468
469 no_of_scm_blocks_unbound += size / SPAPR_MINIMUM_SCM_BLOCK_SIZE;
470 }
471 g_slist_free(nvdimms);
472 } else {
473 return H_PARAMETER;
474 }
475
476 args[1] = no_of_scm_blocks_unbound;
477
478 /* let unplug take care of actual unbind */
479 return H_SUCCESS;
480 }
481
482 static void spapr_scm_register_types(void)
483 {
484 /* qemu/scm specific hcalls */
485 spapr_register_hypercall(H_SCM_READ_METADATA, h_scm_read_metadata);
486 spapr_register_hypercall(H_SCM_WRITE_METADATA, h_scm_write_metadata);
487 spapr_register_hypercall(H_SCM_BIND_MEM, h_scm_bind_mem);
488 spapr_register_hypercall(H_SCM_UNBIND_MEM, h_scm_unbind_mem);
489 spapr_register_hypercall(H_SCM_UNBIND_ALL, h_scm_unbind_all);
490 }
491
492 type_init(spapr_scm_register_types)