xref: /qemu/hw/mem/cxl_type3.c (revision c7b64948)
1 #include "qemu/osdep.h"
2 #include "qemu/units.h"
3 #include "qemu/error-report.h"
4 #include "qapi/qapi-commands-cxl.h"
5 #include "hw/mem/memory-device.h"
6 #include "hw/mem/pc-dimm.h"
7 #include "hw/pci/pci.h"
8 #include "hw/qdev-properties.h"
9 #include "qapi/error.h"
10 #include "qemu/log.h"
11 #include "qemu/module.h"
12 #include "qemu/pmem.h"
13 #include "qemu/range.h"
14 #include "qemu/rcu.h"
15 #include "sysemu/hostmem.h"
16 #include "sysemu/numa.h"
17 #include "hw/cxl/cxl.h"
18 #include "hw/pci/msix.h"
19 
20 #define DWORD_BYTE 4
21 
22 /* Default CDAT entries for a memory region */
23 enum {
24     CT3_CDAT_DSMAS,
25     CT3_CDAT_DSLBIS0,
26     CT3_CDAT_DSLBIS1,
27     CT3_CDAT_DSLBIS2,
28     CT3_CDAT_DSLBIS3,
29     CT3_CDAT_DSEMTS,
30     CT3_CDAT_NUM_ENTRIES
31 };
32 
33 static int ct3_build_cdat_entries_for_mr(CDATSubHeader **cdat_table,
34                                          int dsmad_handle, MemoryRegion *mr,
35                                          bool is_pmem, uint64_t dpa_base)
36 {
37     g_autofree CDATDsmas *dsmas = NULL;
38     g_autofree CDATDslbis *dslbis0 = NULL;
39     g_autofree CDATDslbis *dslbis1 = NULL;
40     g_autofree CDATDslbis *dslbis2 = NULL;
41     g_autofree CDATDslbis *dslbis3 = NULL;
42     g_autofree CDATDsemts *dsemts = NULL;
43 
44     dsmas = g_malloc(sizeof(*dsmas));
45     if (!dsmas) {
46         return -ENOMEM;
47     }
48     *dsmas = (CDATDsmas) {
49         .header = {
50             .type = CDAT_TYPE_DSMAS,
51             .length = sizeof(*dsmas),
52         },
53         .DSMADhandle = dsmad_handle,
54         .flags = is_pmem ? CDAT_DSMAS_FLAG_NV : 0,
55         .DPA_base = dpa_base,
56         .DPA_length = memory_region_size(mr),
57     };
58 
59     /* For now, no memory side cache, plausiblish numbers */
60     dslbis0 = g_malloc(sizeof(*dslbis0));
61     if (!dslbis0) {
62         return -ENOMEM;
63     }
64     *dslbis0 = (CDATDslbis) {
65         .header = {
66             .type = CDAT_TYPE_DSLBIS,
67             .length = sizeof(*dslbis0),
68         },
69         .handle = dsmad_handle,
70         .flags = HMAT_LB_MEM_MEMORY,
71         .data_type = HMAT_LB_DATA_READ_LATENCY,
72         .entry_base_unit = 10000, /* 10ns base */
73         .entry[0] = 15, /* 150ns */
74     };
75 
76     dslbis1 = g_malloc(sizeof(*dslbis1));
77     if (!dslbis1) {
78         return -ENOMEM;
79     }
80     *dslbis1 = (CDATDslbis) {
81         .header = {
82             .type = CDAT_TYPE_DSLBIS,
83             .length = sizeof(*dslbis1),
84         },
85         .handle = dsmad_handle,
86         .flags = HMAT_LB_MEM_MEMORY,
87         .data_type = HMAT_LB_DATA_WRITE_LATENCY,
88         .entry_base_unit = 10000,
89         .entry[0] = 25, /* 250ns */
90     };
91 
92     dslbis2 = g_malloc(sizeof(*dslbis2));
93     if (!dslbis2) {
94         return -ENOMEM;
95     }
96     *dslbis2 = (CDATDslbis) {
97         .header = {
98             .type = CDAT_TYPE_DSLBIS,
99             .length = sizeof(*dslbis2),
100         },
101         .handle = dsmad_handle,
102         .flags = HMAT_LB_MEM_MEMORY,
103         .data_type = HMAT_LB_DATA_READ_BANDWIDTH,
104         .entry_base_unit = 1000, /* GB/s */
105         .entry[0] = 16,
106     };
107 
108     dslbis3 = g_malloc(sizeof(*dslbis3));
109     if (!dslbis3) {
110         return -ENOMEM;
111     }
112     *dslbis3 = (CDATDslbis) {
113         .header = {
114             .type = CDAT_TYPE_DSLBIS,
115             .length = sizeof(*dslbis3),
116         },
117         .handle = dsmad_handle,
118         .flags = HMAT_LB_MEM_MEMORY,
119         .data_type = HMAT_LB_DATA_WRITE_BANDWIDTH,
120         .entry_base_unit = 1000, /* GB/s */
121         .entry[0] = 16,
122     };
123 
124     dsemts = g_malloc(sizeof(*dsemts));
125     if (!dsemts) {
126         return -ENOMEM;
127     }
128     *dsemts = (CDATDsemts) {
129         .header = {
130             .type = CDAT_TYPE_DSEMTS,
131             .length = sizeof(*dsemts),
132         },
133         .DSMAS_handle = dsmad_handle,
134         /*
135          * NV: Reserved - the non volatile from DSMAS matters
136          * V: EFI_MEMORY_SP
137          */
138         .EFI_memory_type_attr = is_pmem ? 2 : 1,
139         .DPA_offset = 0,
140         .DPA_length = memory_region_size(mr),
141     };
142 
143     /* Header always at start of structure */
144     cdat_table[CT3_CDAT_DSMAS] = g_steal_pointer(&dsmas);
145     cdat_table[CT3_CDAT_DSLBIS0] = g_steal_pointer(&dslbis0);
146     cdat_table[CT3_CDAT_DSLBIS1] = g_steal_pointer(&dslbis1);
147     cdat_table[CT3_CDAT_DSLBIS2] = g_steal_pointer(&dslbis2);
148     cdat_table[CT3_CDAT_DSLBIS3] = g_steal_pointer(&dslbis3);
149     cdat_table[CT3_CDAT_DSEMTS] = g_steal_pointer(&dsemts);
150 
151     return 0;
152 }
153 
154 static int ct3_build_cdat_table(CDATSubHeader ***cdat_table, void *priv)
155 {
156     g_autofree CDATSubHeader **table = NULL;
157     CXLType3Dev *ct3d = priv;
158     MemoryRegion *volatile_mr = NULL, *nonvolatile_mr = NULL;
159     int dsmad_handle = 0;
160     int cur_ent = 0;
161     int len = 0;
162     int rc, i;
163 
164     if (!ct3d->hostpmem && !ct3d->hostvmem) {
165         return 0;
166     }
167 
168     if (ct3d->hostvmem) {
169         volatile_mr = host_memory_backend_get_memory(ct3d->hostvmem);
170         if (!volatile_mr) {
171             return -EINVAL;
172         }
173         len += CT3_CDAT_NUM_ENTRIES;
174     }
175 
176     if (ct3d->hostpmem) {
177         nonvolatile_mr = host_memory_backend_get_memory(ct3d->hostpmem);
178         if (!nonvolatile_mr) {
179             return -EINVAL;
180         }
181         len += CT3_CDAT_NUM_ENTRIES;
182     }
183 
184     table = g_malloc0(len * sizeof(*table));
185     if (!table) {
186         return -ENOMEM;
187     }
188 
189     /* Now fill them in */
190     if (volatile_mr) {
191         rc = ct3_build_cdat_entries_for_mr(table, dsmad_handle++, volatile_mr,
192                                            false, 0);
193         if (rc < 0) {
194             return rc;
195         }
196         cur_ent = CT3_CDAT_NUM_ENTRIES;
197     }
198 
199     if (nonvolatile_mr) {
200         rc = ct3_build_cdat_entries_for_mr(&(table[cur_ent]), dsmad_handle++,
201                                            nonvolatile_mr, true,
202                                            (volatile_mr ?
203                                             memory_region_size(volatile_mr) : 0));
204         if (rc < 0) {
205             goto error_cleanup;
206         }
207         cur_ent += CT3_CDAT_NUM_ENTRIES;
208     }
209     assert(len == cur_ent);
210 
211     *cdat_table = g_steal_pointer(&table);
212 
213     return len;
214 error_cleanup:
215     for (i = 0; i < cur_ent; i++) {
216         g_free(table[i]);
217     }
218     return rc;
219 }
220 
221 static void ct3_free_cdat_table(CDATSubHeader **cdat_table, int num, void *priv)
222 {
223     int i;
224 
225     for (i = 0; i < num; i++) {
226         g_free(cdat_table[i]);
227     }
228     g_free(cdat_table);
229 }
230 
231 static bool cxl_doe_cdat_rsp(DOECap *doe_cap)
232 {
233     CDATObject *cdat = &CXL_TYPE3(doe_cap->pdev)->cxl_cstate.cdat;
234     uint16_t ent;
235     void *base;
236     uint32_t len;
237     CDATReq *req = pcie_doe_get_write_mbox_ptr(doe_cap);
238     CDATRsp rsp;
239 
240     assert(cdat->entry_len);
241 
242     /* Discard if request length mismatched */
243     if (pcie_doe_get_obj_len(req) <
244         DIV_ROUND_UP(sizeof(CDATReq), DWORD_BYTE)) {
245         return false;
246     }
247 
248     ent = req->entry_handle;
249     base = cdat->entry[ent].base;
250     len = cdat->entry[ent].length;
251 
252     rsp = (CDATRsp) {
253         .header = {
254             .vendor_id = CXL_VENDOR_ID,
255             .data_obj_type = CXL_DOE_TABLE_ACCESS,
256             .reserved = 0x0,
257             .length = DIV_ROUND_UP((sizeof(rsp) + len), DWORD_BYTE),
258         },
259         .rsp_code = CXL_DOE_TAB_RSP,
260         .table_type = CXL_DOE_TAB_TYPE_CDAT,
261         .entry_handle = (ent < cdat->entry_len - 1) ?
262                         ent + 1 : CXL_DOE_TAB_ENT_MAX,
263     };
264 
265     memcpy(doe_cap->read_mbox, &rsp, sizeof(rsp));
266     memcpy(doe_cap->read_mbox + DIV_ROUND_UP(sizeof(rsp), DWORD_BYTE),
267            base, len);
268 
269     doe_cap->read_mbox_len += rsp.header.length;
270 
271     return true;
272 }
273 
274 static uint32_t ct3d_config_read(PCIDevice *pci_dev, uint32_t addr, int size)
275 {
276     CXLType3Dev *ct3d = CXL_TYPE3(pci_dev);
277     uint32_t val;
278 
279     if (pcie_doe_read_config(&ct3d->doe_cdat, addr, size, &val)) {
280         return val;
281     }
282 
283     return pci_default_read_config(pci_dev, addr, size);
284 }
285 
286 static void ct3d_config_write(PCIDevice *pci_dev, uint32_t addr, uint32_t val,
287                               int size)
288 {
289     CXLType3Dev *ct3d = CXL_TYPE3(pci_dev);
290 
291     pcie_doe_write_config(&ct3d->doe_cdat, addr, val, size);
292     pci_default_write_config(pci_dev, addr, val, size);
293     pcie_aer_write_config(pci_dev, addr, val, size);
294 }
295 
296 /*
297  * Null value of all Fs suggested by IEEE RA guidelines for use of
298  * EU, OUI and CID
299  */
300 #define UI64_NULL ~(0ULL)
301 
302 static void build_dvsecs(CXLType3Dev *ct3d)
303 {
304     CXLComponentState *cxl_cstate = &ct3d->cxl_cstate;
305     uint8_t *dvsec;
306     uint32_t range1_size_hi, range1_size_lo,
307              range1_base_hi = 0, range1_base_lo = 0,
308              range2_size_hi = 0, range2_size_lo = 0,
309              range2_base_hi = 0, range2_base_lo = 0;
310 
311     /*
312      * Volatile memory is mapped as (0x0)
313      * Persistent memory is mapped at (volatile->size)
314      */
315     if (ct3d->hostvmem) {
316         range1_size_hi = ct3d->hostvmem->size >> 32;
317         range1_size_lo = (2 << 5) | (2 << 2) | 0x3 |
318                          (ct3d->hostvmem->size & 0xF0000000);
319         if (ct3d->hostpmem) {
320             range2_size_hi = ct3d->hostpmem->size >> 32;
321             range2_size_lo = (2 << 5) | (2 << 2) | 0x3 |
322                              (ct3d->hostpmem->size & 0xF0000000);
323         }
324     } else {
325         range1_size_hi = ct3d->hostpmem->size >> 32;
326         range1_size_lo = (2 << 5) | (2 << 2) | 0x3 |
327                          (ct3d->hostpmem->size & 0xF0000000);
328     }
329 
330     dvsec = (uint8_t *)&(CXLDVSECDevice){
331         .cap = 0x1e,
332         .ctrl = 0x2,
333         .status2 = 0x2,
334         .range1_size_hi = range1_size_hi,
335         .range1_size_lo = range1_size_lo,
336         .range1_base_hi = range1_base_hi,
337         .range1_base_lo = range1_base_lo,
338         .range2_size_hi = range2_size_hi,
339         .range2_size_lo = range2_size_lo,
340         .range2_base_hi = range2_base_hi,
341         .range2_base_lo = range2_base_lo,
342     };
343     cxl_component_create_dvsec(cxl_cstate, CXL2_TYPE3_DEVICE,
344                                PCIE_CXL_DEVICE_DVSEC_LENGTH,
345                                PCIE_CXL_DEVICE_DVSEC,
346                                PCIE_CXL2_DEVICE_DVSEC_REVID, dvsec);
347 
348     dvsec = (uint8_t *)&(CXLDVSECRegisterLocator){
349         .rsvd         = 0,
350         .reg0_base_lo = RBI_COMPONENT_REG | CXL_COMPONENT_REG_BAR_IDX,
351         .reg0_base_hi = 0,
352         .reg1_base_lo = RBI_CXL_DEVICE_REG | CXL_DEVICE_REG_BAR_IDX,
353         .reg1_base_hi = 0,
354     };
355     cxl_component_create_dvsec(cxl_cstate, CXL2_TYPE3_DEVICE,
356                                REG_LOC_DVSEC_LENGTH, REG_LOC_DVSEC,
357                                REG_LOC_DVSEC_REVID, dvsec);
358     dvsec = (uint8_t *)&(CXLDVSECDeviceGPF){
359         .phase2_duration = 0x603, /* 3 seconds */
360         .phase2_power = 0x33, /* 0x33 miliwatts */
361     };
362     cxl_component_create_dvsec(cxl_cstate, CXL2_TYPE3_DEVICE,
363                                GPF_DEVICE_DVSEC_LENGTH, GPF_DEVICE_DVSEC,
364                                GPF_DEVICE_DVSEC_REVID, dvsec);
365 
366     dvsec = (uint8_t *)&(CXLDVSECPortFlexBus){
367         .cap                     = 0x26, /* 68B, IO, Mem, non-MLD */
368         .ctrl                    = 0x02, /* IO always enabled */
369         .status                  = 0x26, /* same as capabilities */
370         .rcvd_mod_ts_data_phase1 = 0xef, /* WTF? */
371     };
372     cxl_component_create_dvsec(cxl_cstate, CXL2_TYPE3_DEVICE,
373                                PCIE_FLEXBUS_PORT_DVSEC_LENGTH_2_0,
374                                PCIE_FLEXBUS_PORT_DVSEC,
375                                PCIE_FLEXBUS_PORT_DVSEC_REVID_2_0, dvsec);
376 }
377 
378 static void hdm_decoder_commit(CXLType3Dev *ct3d, int which)
379 {
380     ComponentRegisters *cregs = &ct3d->cxl_cstate.crb;
381     uint32_t *cache_mem = cregs->cache_mem_registers;
382     uint32_t ctrl;
383 
384     assert(which == 0);
385 
386     ctrl = ldl_le_p(cache_mem + R_CXL_HDM_DECODER0_CTRL);
387     /* TODO: Sanity checks that the decoder is possible */
388     ctrl = FIELD_DP32(ctrl, CXL_HDM_DECODER0_CTRL, ERR, 0);
389     ctrl = FIELD_DP32(ctrl, CXL_HDM_DECODER0_CTRL, COMMITTED, 1);
390 
391     stl_le_p(cache_mem + R_CXL_HDM_DECODER0_CTRL, ctrl);
392 }
393 
394 static void hdm_decoder_uncommit(CXLType3Dev *ct3d, int which)
395 {
396     ComponentRegisters *cregs = &ct3d->cxl_cstate.crb;
397     uint32_t *cache_mem = cregs->cache_mem_registers;
398     uint32_t ctrl;
399 
400     assert(which == 0);
401 
402     ctrl = ldl_le_p(cache_mem + R_CXL_HDM_DECODER0_CTRL);
403 
404     ctrl = FIELD_DP32(ctrl, CXL_HDM_DECODER0_CTRL, ERR, 0);
405     ctrl = FIELD_DP32(ctrl, CXL_HDM_DECODER0_CTRL, COMMITTED, 0);
406 
407     stl_le_p(cache_mem + R_CXL_HDM_DECODER0_CTRL, ctrl);
408 }
409 
410 static int ct3d_qmp_uncor_err_to_cxl(CxlUncorErrorType qmp_err)
411 {
412     switch (qmp_err) {
413     case CXL_UNCOR_ERROR_TYPE_CACHE_DATA_PARITY:
414         return CXL_RAS_UNC_ERR_CACHE_DATA_PARITY;
415     case CXL_UNCOR_ERROR_TYPE_CACHE_ADDRESS_PARITY:
416         return CXL_RAS_UNC_ERR_CACHE_ADDRESS_PARITY;
417     case CXL_UNCOR_ERROR_TYPE_CACHE_BE_PARITY:
418         return CXL_RAS_UNC_ERR_CACHE_BE_PARITY;
419     case CXL_UNCOR_ERROR_TYPE_CACHE_DATA_ECC:
420         return CXL_RAS_UNC_ERR_CACHE_DATA_ECC;
421     case CXL_UNCOR_ERROR_TYPE_MEM_DATA_PARITY:
422         return CXL_RAS_UNC_ERR_MEM_DATA_PARITY;
423     case CXL_UNCOR_ERROR_TYPE_MEM_ADDRESS_PARITY:
424         return CXL_RAS_UNC_ERR_MEM_ADDRESS_PARITY;
425     case CXL_UNCOR_ERROR_TYPE_MEM_BE_PARITY:
426         return CXL_RAS_UNC_ERR_MEM_BE_PARITY;
427     case CXL_UNCOR_ERROR_TYPE_MEM_DATA_ECC:
428         return CXL_RAS_UNC_ERR_MEM_DATA_ECC;
429     case CXL_UNCOR_ERROR_TYPE_REINIT_THRESHOLD:
430         return CXL_RAS_UNC_ERR_REINIT_THRESHOLD;
431     case CXL_UNCOR_ERROR_TYPE_RSVD_ENCODING:
432         return CXL_RAS_UNC_ERR_RSVD_ENCODING;
433     case CXL_UNCOR_ERROR_TYPE_POISON_RECEIVED:
434         return CXL_RAS_UNC_ERR_POISON_RECEIVED;
435     case CXL_UNCOR_ERROR_TYPE_RECEIVER_OVERFLOW:
436         return CXL_RAS_UNC_ERR_RECEIVER_OVERFLOW;
437     case CXL_UNCOR_ERROR_TYPE_INTERNAL:
438         return CXL_RAS_UNC_ERR_INTERNAL;
439     case CXL_UNCOR_ERROR_TYPE_CXL_IDE_TX:
440         return CXL_RAS_UNC_ERR_CXL_IDE_TX;
441     case CXL_UNCOR_ERROR_TYPE_CXL_IDE_RX:
442         return CXL_RAS_UNC_ERR_CXL_IDE_RX;
443     default:
444         return -EINVAL;
445     }
446 }
447 
448 static int ct3d_qmp_cor_err_to_cxl(CxlCorErrorType qmp_err)
449 {
450     switch (qmp_err) {
451     case CXL_COR_ERROR_TYPE_CACHE_DATA_ECC:
452         return CXL_RAS_COR_ERR_CACHE_DATA_ECC;
453     case CXL_COR_ERROR_TYPE_MEM_DATA_ECC:
454         return CXL_RAS_COR_ERR_MEM_DATA_ECC;
455     case CXL_COR_ERROR_TYPE_CRC_THRESHOLD:
456         return CXL_RAS_COR_ERR_CRC_THRESHOLD;
457     case CXL_COR_ERROR_TYPE_RETRY_THRESHOLD:
458         return CXL_RAS_COR_ERR_RETRY_THRESHOLD;
459     case CXL_COR_ERROR_TYPE_CACHE_POISON_RECEIVED:
460         return CXL_RAS_COR_ERR_CACHE_POISON_RECEIVED;
461     case CXL_COR_ERROR_TYPE_MEM_POISON_RECEIVED:
462         return CXL_RAS_COR_ERR_MEM_POISON_RECEIVED;
463     case CXL_COR_ERROR_TYPE_PHYSICAL:
464         return CXL_RAS_COR_ERR_PHYSICAL;
465     default:
466         return -EINVAL;
467     }
468 }
469 
470 static void ct3d_reg_write(void *opaque, hwaddr offset, uint64_t value,
471                            unsigned size)
472 {
473     CXLComponentState *cxl_cstate = opaque;
474     ComponentRegisters *cregs = &cxl_cstate->crb;
475     CXLType3Dev *ct3d = container_of(cxl_cstate, CXLType3Dev, cxl_cstate);
476     uint32_t *cache_mem = cregs->cache_mem_registers;
477     bool should_commit = false;
478     bool should_uncommit = false;
479     int which_hdm = -1;
480 
481     assert(size == 4);
482     g_assert(offset < CXL2_COMPONENT_CM_REGION_SIZE);
483 
484     switch (offset) {
485     case A_CXL_HDM_DECODER0_CTRL:
486         should_commit = FIELD_EX32(value, CXL_HDM_DECODER0_CTRL, COMMIT);
487         should_uncommit = !should_commit;
488         which_hdm = 0;
489         break;
490     case A_CXL_RAS_UNC_ERR_STATUS:
491     {
492         uint32_t capctrl = ldl_le_p(cache_mem + R_CXL_RAS_ERR_CAP_CTRL);
493         uint32_t fe = FIELD_EX32(capctrl, CXL_RAS_ERR_CAP_CTRL, FIRST_ERROR_POINTER);
494         CXLError *cxl_err;
495         uint32_t unc_err;
496 
497         /*
498          * If single bit written that corresponds to the first error
499          * pointer being cleared, update the status and header log.
500          */
501         if (!QTAILQ_EMPTY(&ct3d->error_list)) {
502             if ((1 << fe) ^ value) {
503                 CXLError *cxl_next;
504                 /*
505                  * Software is using wrong flow for multiple header recording
506                  * Following behavior in PCIe r6.0 and assuming multiple
507                  * header support. Implementation defined choice to clear all
508                  * matching records if more than one bit set - which corresponds
509                  * closest to behavior of hardware not capable of multiple
510                  * header recording.
511                  */
512                 QTAILQ_FOREACH_SAFE(cxl_err, &ct3d->error_list, node, cxl_next) {
513                     if ((1 << cxl_err->type) & value) {
514                         QTAILQ_REMOVE(&ct3d->error_list, cxl_err, node);
515                         g_free(cxl_err);
516                     }
517                 }
518             } else {
519                 /* Done with previous FE, so drop from list */
520                 cxl_err = QTAILQ_FIRST(&ct3d->error_list);
521                 QTAILQ_REMOVE(&ct3d->error_list, cxl_err, node);
522                 g_free(cxl_err);
523             }
524 
525             /*
526              * If there is another FE, then put that in place and update
527              * the header log
528              */
529             if (!QTAILQ_EMPTY(&ct3d->error_list)) {
530                 uint32_t *header_log = &cache_mem[R_CXL_RAS_ERR_HEADER0];
531                 int i;
532 
533                 cxl_err = QTAILQ_FIRST(&ct3d->error_list);
534                 for (i = 0; i < CXL_RAS_ERR_HEADER_NUM; i++) {
535                     stl_le_p(header_log + i, cxl_err->header[i]);
536                 }
537                 capctrl = FIELD_DP32(capctrl, CXL_RAS_ERR_CAP_CTRL,
538                                      FIRST_ERROR_POINTER, cxl_err->type);
539             } else {
540                 /*
541                  * If no more errors, then follow recomendation of PCI spec
542                  * r6.0 6.2.4.2 to set the first error pointer to a status
543                  * bit that will never be used.
544                  */
545                 capctrl = FIELD_DP32(capctrl, CXL_RAS_ERR_CAP_CTRL,
546                                      FIRST_ERROR_POINTER,
547                                      CXL_RAS_UNC_ERR_CXL_UNUSED);
548             }
549             stl_le_p((uint8_t *)cache_mem + A_CXL_RAS_ERR_CAP_CTRL, capctrl);
550         }
551         unc_err = 0;
552         QTAILQ_FOREACH(cxl_err, &ct3d->error_list, node) {
553             unc_err |= 1 << cxl_err->type;
554         }
555         stl_le_p((uint8_t *)cache_mem + offset, unc_err);
556 
557         return;
558     }
559     case A_CXL_RAS_COR_ERR_STATUS:
560     {
561         uint32_t rw1c = value;
562         uint32_t temp = ldl_le_p((uint8_t *)cache_mem + offset);
563         temp &= ~rw1c;
564         stl_le_p((uint8_t *)cache_mem + offset, temp);
565         return;
566     }
567     default:
568         break;
569     }
570 
571     stl_le_p((uint8_t *)cache_mem + offset, value);
572     if (should_commit) {
573         hdm_decoder_commit(ct3d, which_hdm);
574     } else if (should_uncommit) {
575         hdm_decoder_uncommit(ct3d, which_hdm);
576     }
577 }
578 
579 static bool cxl_setup_memory(CXLType3Dev *ct3d, Error **errp)
580 {
581     DeviceState *ds = DEVICE(ct3d);
582 
583     if (!ct3d->hostmem && !ct3d->hostvmem && !ct3d->hostpmem) {
584         error_setg(errp, "at least one memdev property must be set");
585         return false;
586     } else if (ct3d->hostmem && ct3d->hostpmem) {
587         error_setg(errp, "[memdev] cannot be used with new "
588                          "[persistent-memdev] property");
589         return false;
590     } else if (ct3d->hostmem) {
591         /* Use of hostmem property implies pmem */
592         ct3d->hostpmem = ct3d->hostmem;
593         ct3d->hostmem = NULL;
594     }
595 
596     if (ct3d->hostpmem && !ct3d->lsa) {
597         error_setg(errp, "lsa property must be set for persistent devices");
598         return false;
599     }
600 
601     if (ct3d->hostvmem) {
602         MemoryRegion *vmr;
603         char *v_name;
604 
605         vmr = host_memory_backend_get_memory(ct3d->hostvmem);
606         if (!vmr) {
607             error_setg(errp, "volatile memdev must have backing device");
608             return false;
609         }
610         memory_region_set_nonvolatile(vmr, false);
611         memory_region_set_enabled(vmr, true);
612         host_memory_backend_set_mapped(ct3d->hostvmem, true);
613         if (ds->id) {
614             v_name = g_strdup_printf("cxl-type3-dpa-vmem-space:%s", ds->id);
615         } else {
616             v_name = g_strdup("cxl-type3-dpa-vmem-space");
617         }
618         address_space_init(&ct3d->hostvmem_as, vmr, v_name);
619         ct3d->cxl_dstate.vmem_size = memory_region_size(vmr);
620         ct3d->cxl_dstate.mem_size += memory_region_size(vmr);
621         g_free(v_name);
622     }
623 
624     if (ct3d->hostpmem) {
625         MemoryRegion *pmr;
626         char *p_name;
627 
628         pmr = host_memory_backend_get_memory(ct3d->hostpmem);
629         if (!pmr) {
630             error_setg(errp, "persistent memdev must have backing device");
631             return false;
632         }
633         memory_region_set_nonvolatile(pmr, true);
634         memory_region_set_enabled(pmr, true);
635         host_memory_backend_set_mapped(ct3d->hostpmem, true);
636         if (ds->id) {
637             p_name = g_strdup_printf("cxl-type3-dpa-pmem-space:%s", ds->id);
638         } else {
639             p_name = g_strdup("cxl-type3-dpa-pmem-space");
640         }
641         address_space_init(&ct3d->hostpmem_as, pmr, p_name);
642         ct3d->cxl_dstate.pmem_size = memory_region_size(pmr);
643         ct3d->cxl_dstate.mem_size += memory_region_size(pmr);
644         g_free(p_name);
645     }
646 
647     return true;
648 }
649 
650 static DOEProtocol doe_cdat_prot[] = {
651     { CXL_VENDOR_ID, CXL_DOE_TABLE_ACCESS, cxl_doe_cdat_rsp },
652     { }
653 };
654 
655 static void ct3_realize(PCIDevice *pci_dev, Error **errp)
656 {
657     CXLType3Dev *ct3d = CXL_TYPE3(pci_dev);
658     CXLComponentState *cxl_cstate = &ct3d->cxl_cstate;
659     ComponentRegisters *regs = &cxl_cstate->crb;
660     MemoryRegion *mr = &regs->component_registers;
661     uint8_t *pci_conf = pci_dev->config;
662     unsigned short msix_num = 1;
663     int i, rc;
664 
665     QTAILQ_INIT(&ct3d->error_list);
666 
667     if (!cxl_setup_memory(ct3d, errp)) {
668         return;
669     }
670 
671     pci_config_set_prog_interface(pci_conf, 0x10);
672 
673     pcie_endpoint_cap_init(pci_dev, 0x80);
674     if (ct3d->sn != UI64_NULL) {
675         pcie_dev_ser_num_init(pci_dev, 0x100, ct3d->sn);
676         cxl_cstate->dvsec_offset = 0x100 + 0x0c;
677     } else {
678         cxl_cstate->dvsec_offset = 0x100;
679     }
680 
681     ct3d->cxl_cstate.pdev = pci_dev;
682     build_dvsecs(ct3d);
683 
684     regs->special_ops = g_new0(MemoryRegionOps, 1);
685     regs->special_ops->write = ct3d_reg_write;
686 
687     cxl_component_register_block_init(OBJECT(pci_dev), cxl_cstate,
688                                       TYPE_CXL_TYPE3);
689 
690     pci_register_bar(
691         pci_dev, CXL_COMPONENT_REG_BAR_IDX,
692         PCI_BASE_ADDRESS_SPACE_MEMORY | PCI_BASE_ADDRESS_MEM_TYPE_64, mr);
693 
694     cxl_device_register_block_init(OBJECT(pci_dev), &ct3d->cxl_dstate);
695     pci_register_bar(pci_dev, CXL_DEVICE_REG_BAR_IDX,
696                      PCI_BASE_ADDRESS_SPACE_MEMORY |
697                          PCI_BASE_ADDRESS_MEM_TYPE_64,
698                      &ct3d->cxl_dstate.device_registers);
699 
700     /* MSI(-X) Initailization */
701     rc = msix_init_exclusive_bar(pci_dev, msix_num, 4, NULL);
702     if (rc) {
703         goto err_address_space_free;
704     }
705     for (i = 0; i < msix_num; i++) {
706         msix_vector_use(pci_dev, i);
707     }
708 
709     /* DOE Initailization */
710     pcie_doe_init(pci_dev, &ct3d->doe_cdat, 0x190, doe_cdat_prot, true, 0);
711 
712     cxl_cstate->cdat.build_cdat_table = ct3_build_cdat_table;
713     cxl_cstate->cdat.free_cdat_table = ct3_free_cdat_table;
714     cxl_cstate->cdat.private = ct3d;
715     cxl_doe_cdat_init(cxl_cstate, errp);
716     if (*errp) {
717         goto err_free_special_ops;
718     }
719 
720     pcie_cap_deverr_init(pci_dev);
721     /* Leave a bit of room for expansion */
722     rc = pcie_aer_init(pci_dev, PCI_ERR_VER, 0x200, PCI_ERR_SIZEOF, NULL);
723     if (rc) {
724         goto err_release_cdat;
725     }
726 
727     return;
728 
729 err_release_cdat:
730     cxl_doe_cdat_release(cxl_cstate);
731 err_free_special_ops:
732     g_free(regs->special_ops);
733 err_address_space_free:
734     if (ct3d->hostpmem) {
735         address_space_destroy(&ct3d->hostpmem_as);
736     }
737     if (ct3d->hostvmem) {
738         address_space_destroy(&ct3d->hostvmem_as);
739     }
740     return;
741 }
742 
743 static void ct3_exit(PCIDevice *pci_dev)
744 {
745     CXLType3Dev *ct3d = CXL_TYPE3(pci_dev);
746     CXLComponentState *cxl_cstate = &ct3d->cxl_cstate;
747     ComponentRegisters *regs = &cxl_cstate->crb;
748 
749     pcie_aer_exit(pci_dev);
750     cxl_doe_cdat_release(cxl_cstate);
751     g_free(regs->special_ops);
752     if (ct3d->hostpmem) {
753         address_space_destroy(&ct3d->hostpmem_as);
754     }
755     if (ct3d->hostvmem) {
756         address_space_destroy(&ct3d->hostvmem_as);
757     }
758 }
759 
760 /* TODO: Support multiple HDM decoders and DPA skip */
761 static bool cxl_type3_dpa(CXLType3Dev *ct3d, hwaddr host_addr, uint64_t *dpa)
762 {
763     uint32_t *cache_mem = ct3d->cxl_cstate.crb.cache_mem_registers;
764     uint64_t decoder_base, decoder_size, hpa_offset;
765     uint32_t hdm0_ctrl;
766     int ig, iw;
767 
768     decoder_base = (((uint64_t)cache_mem[R_CXL_HDM_DECODER0_BASE_HI] << 32) |
769                     cache_mem[R_CXL_HDM_DECODER0_BASE_LO]);
770     if ((uint64_t)host_addr < decoder_base) {
771         return false;
772     }
773 
774     hpa_offset = (uint64_t)host_addr - decoder_base;
775 
776     decoder_size = ((uint64_t)cache_mem[R_CXL_HDM_DECODER0_SIZE_HI] << 32) |
777         cache_mem[R_CXL_HDM_DECODER0_SIZE_LO];
778     if (hpa_offset >= decoder_size) {
779         return false;
780     }
781 
782     hdm0_ctrl = cache_mem[R_CXL_HDM_DECODER0_CTRL];
783     iw = FIELD_EX32(hdm0_ctrl, CXL_HDM_DECODER0_CTRL, IW);
784     ig = FIELD_EX32(hdm0_ctrl, CXL_HDM_DECODER0_CTRL, IG);
785 
786     *dpa = (MAKE_64BIT_MASK(0, 8 + ig) & hpa_offset) |
787         ((MAKE_64BIT_MASK(8 + ig + iw, 64 - 8 - ig - iw) & hpa_offset) >> iw);
788 
789     return true;
790 }
791 
792 static int cxl_type3_hpa_to_as_and_dpa(CXLType3Dev *ct3d,
793                                        hwaddr host_addr,
794                                        unsigned int size,
795                                        AddressSpace **as,
796                                        uint64_t *dpa_offset)
797 {
798     MemoryRegion *vmr = NULL, *pmr = NULL;
799 
800     if (ct3d->hostvmem) {
801         vmr = host_memory_backend_get_memory(ct3d->hostvmem);
802     }
803     if (ct3d->hostpmem) {
804         pmr = host_memory_backend_get_memory(ct3d->hostpmem);
805     }
806 
807     if (!vmr && !pmr) {
808         return -ENODEV;
809     }
810 
811     if (!cxl_type3_dpa(ct3d, host_addr, dpa_offset)) {
812         return -EINVAL;
813     }
814 
815     if (*dpa_offset > ct3d->cxl_dstate.mem_size) {
816         return -EINVAL;
817     }
818 
819     if (vmr) {
820         if (*dpa_offset < memory_region_size(vmr)) {
821             *as = &ct3d->hostvmem_as;
822         } else {
823             *as = &ct3d->hostpmem_as;
824             *dpa_offset -= memory_region_size(vmr);
825         }
826     } else {
827         *as = &ct3d->hostpmem_as;
828     }
829 
830     return 0;
831 }
832 
833 MemTxResult cxl_type3_read(PCIDevice *d, hwaddr host_addr, uint64_t *data,
834                            unsigned size, MemTxAttrs attrs)
835 {
836     uint64_t dpa_offset = 0;
837     AddressSpace *as = NULL;
838     int res;
839 
840     res = cxl_type3_hpa_to_as_and_dpa(CXL_TYPE3(d), host_addr, size,
841                                       &as, &dpa_offset);
842     if (res) {
843         return MEMTX_ERROR;
844     }
845 
846     return address_space_read(as, dpa_offset, attrs, data, size);
847 }
848 
849 MemTxResult cxl_type3_write(PCIDevice *d, hwaddr host_addr, uint64_t data,
850                             unsigned size, MemTxAttrs attrs)
851 {
852     uint64_t dpa_offset = 0;
853     AddressSpace *as = NULL;
854     int res;
855 
856     res = cxl_type3_hpa_to_as_and_dpa(CXL_TYPE3(d), host_addr, size,
857                                       &as, &dpa_offset);
858     if (res) {
859         return MEMTX_ERROR;
860     }
861 
862     return address_space_write(as, dpa_offset, attrs, &data, size);
863 }
864 
865 static void ct3d_reset(DeviceState *dev)
866 {
867     CXLType3Dev *ct3d = CXL_TYPE3(dev);
868     uint32_t *reg_state = ct3d->cxl_cstate.crb.cache_mem_registers;
869     uint32_t *write_msk = ct3d->cxl_cstate.crb.cache_mem_regs_write_mask;
870 
871     cxl_component_register_init_common(reg_state, write_msk, CXL2_TYPE3_DEVICE);
872     cxl_device_register_init_common(&ct3d->cxl_dstate);
873 }
874 
875 static Property ct3_props[] = {
876     DEFINE_PROP_LINK("memdev", CXLType3Dev, hostmem, TYPE_MEMORY_BACKEND,
877                      HostMemoryBackend *), /* for backward compatibility */
878     DEFINE_PROP_LINK("persistent-memdev", CXLType3Dev, hostpmem,
879                      TYPE_MEMORY_BACKEND, HostMemoryBackend *),
880     DEFINE_PROP_LINK("volatile-memdev", CXLType3Dev, hostvmem,
881                      TYPE_MEMORY_BACKEND, HostMemoryBackend *),
882     DEFINE_PROP_LINK("lsa", CXLType3Dev, lsa, TYPE_MEMORY_BACKEND,
883                      HostMemoryBackend *),
884     DEFINE_PROP_UINT64("sn", CXLType3Dev, sn, UI64_NULL),
885     DEFINE_PROP_STRING("cdat", CXLType3Dev, cxl_cstate.cdat.filename),
886     DEFINE_PROP_END_OF_LIST(),
887 };
888 
889 static uint64_t get_lsa_size(CXLType3Dev *ct3d)
890 {
891     MemoryRegion *mr;
892 
893     if (!ct3d->lsa) {
894         return 0;
895     }
896 
897     mr = host_memory_backend_get_memory(ct3d->lsa);
898     return memory_region_size(mr);
899 }
900 
901 static void validate_lsa_access(MemoryRegion *mr, uint64_t size,
902                                 uint64_t offset)
903 {
904     assert(offset + size <= memory_region_size(mr));
905     assert(offset + size > offset);
906 }
907 
908 static uint64_t get_lsa(CXLType3Dev *ct3d, void *buf, uint64_t size,
909                     uint64_t offset)
910 {
911     MemoryRegion *mr;
912     void *lsa;
913 
914     if (!ct3d->lsa) {
915         return 0;
916     }
917 
918     mr = host_memory_backend_get_memory(ct3d->lsa);
919     validate_lsa_access(mr, size, offset);
920 
921     lsa = memory_region_get_ram_ptr(mr) + offset;
922     memcpy(buf, lsa, size);
923 
924     return size;
925 }
926 
927 static void set_lsa(CXLType3Dev *ct3d, const void *buf, uint64_t size,
928                     uint64_t offset)
929 {
930     MemoryRegion *mr;
931     void *lsa;
932 
933     if (!ct3d->lsa) {
934         return;
935     }
936 
937     mr = host_memory_backend_get_memory(ct3d->lsa);
938     validate_lsa_access(mr, size, offset);
939 
940     lsa = memory_region_get_ram_ptr(mr) + offset;
941     memcpy(lsa, buf, size);
942     memory_region_set_dirty(mr, offset, size);
943 
944     /*
945      * Just like the PMEM, if the guest is not allowed to exit gracefully, label
946      * updates will get lost.
947      */
948 }
949 
950 /* For uncorrectable errors include support for multiple header recording */
951 void qmp_cxl_inject_uncorrectable_errors(const char *path,
952                                          CXLUncorErrorRecordList *errors,
953                                          Error **errp)
954 {
955     Object *obj = object_resolve_path(path, NULL);
956     static PCIEAERErr err = {};
957     CXLType3Dev *ct3d;
958     CXLError *cxl_err;
959     uint32_t *reg_state;
960     uint32_t unc_err;
961     bool first;
962 
963     if (!obj) {
964         error_setg(errp, "Unable to resolve path");
965         return;
966     }
967 
968     if (!object_dynamic_cast(obj, TYPE_CXL_TYPE3)) {
969         error_setg(errp, "Path does not point to a CXL type 3 device");
970         return;
971     }
972 
973     err.status = PCI_ERR_UNC_INTN;
974     err.source_id = pci_requester_id(PCI_DEVICE(obj));
975     err.flags = 0;
976 
977     ct3d = CXL_TYPE3(obj);
978 
979     first = QTAILQ_EMPTY(&ct3d->error_list);
980     reg_state = ct3d->cxl_cstate.crb.cache_mem_registers;
981     while (errors) {
982         uint32List *header = errors->value->header;
983         uint8_t header_count = 0;
984         int cxl_err_code;
985 
986         cxl_err_code = ct3d_qmp_uncor_err_to_cxl(errors->value->type);
987         if (cxl_err_code < 0) {
988             error_setg(errp, "Unknown error code");
989             return;
990         }
991 
992         /* If the error is masked, nothing to do here */
993         if (!((1 << cxl_err_code) &
994               ~ldl_le_p(reg_state + R_CXL_RAS_UNC_ERR_MASK))) {
995             errors = errors->next;
996             continue;
997         }
998 
999         cxl_err = g_malloc0(sizeof(*cxl_err));
1000         if (!cxl_err) {
1001             return;
1002         }
1003 
1004         cxl_err->type = cxl_err_code;
1005         while (header && header_count < 32) {
1006             cxl_err->header[header_count++] = header->value;
1007             header = header->next;
1008         }
1009         if (header_count > 32) {
1010             error_setg(errp, "Header must be 32 DWORD or less");
1011             return;
1012         }
1013         QTAILQ_INSERT_TAIL(&ct3d->error_list, cxl_err, node);
1014 
1015         errors = errors->next;
1016     }
1017 
1018     if (first && !QTAILQ_EMPTY(&ct3d->error_list)) {
1019         uint32_t *cache_mem = ct3d->cxl_cstate.crb.cache_mem_registers;
1020         uint32_t capctrl = ldl_le_p(cache_mem + R_CXL_RAS_ERR_CAP_CTRL);
1021         uint32_t *header_log = &cache_mem[R_CXL_RAS_ERR_HEADER0];
1022         int i;
1023 
1024         cxl_err = QTAILQ_FIRST(&ct3d->error_list);
1025         for (i = 0; i < CXL_RAS_ERR_HEADER_NUM; i++) {
1026             stl_le_p(header_log + i, cxl_err->header[i]);
1027         }
1028 
1029         capctrl = FIELD_DP32(capctrl, CXL_RAS_ERR_CAP_CTRL,
1030                              FIRST_ERROR_POINTER, cxl_err->type);
1031         stl_le_p(cache_mem + R_CXL_RAS_ERR_CAP_CTRL, capctrl);
1032     }
1033 
1034     unc_err = 0;
1035     QTAILQ_FOREACH(cxl_err, &ct3d->error_list, node) {
1036         unc_err |= (1 << cxl_err->type);
1037     }
1038     if (!unc_err) {
1039         return;
1040     }
1041 
1042     stl_le_p(reg_state + R_CXL_RAS_UNC_ERR_STATUS, unc_err);
1043     pcie_aer_inject_error(PCI_DEVICE(obj), &err);
1044 
1045     return;
1046 }
1047 
1048 void qmp_cxl_inject_correctable_error(const char *path, CxlCorErrorType type,
1049                                       Error **errp)
1050 {
1051     static PCIEAERErr err = {};
1052     Object *obj = object_resolve_path(path, NULL);
1053     CXLType3Dev *ct3d;
1054     uint32_t *reg_state;
1055     uint32_t cor_err;
1056     int cxl_err_type;
1057 
1058     if (!obj) {
1059         error_setg(errp, "Unable to resolve path");
1060         return;
1061     }
1062     if (!object_dynamic_cast(obj, TYPE_CXL_TYPE3)) {
1063         error_setg(errp, "Path does not point to a CXL type 3 device");
1064         return;
1065     }
1066 
1067     err.status = PCI_ERR_COR_INTERNAL;
1068     err.source_id = pci_requester_id(PCI_DEVICE(obj));
1069     err.flags = PCIE_AER_ERR_IS_CORRECTABLE;
1070 
1071     ct3d = CXL_TYPE3(obj);
1072     reg_state = ct3d->cxl_cstate.crb.cache_mem_registers;
1073     cor_err = ldl_le_p(reg_state + R_CXL_RAS_COR_ERR_STATUS);
1074 
1075     cxl_err_type = ct3d_qmp_cor_err_to_cxl(type);
1076     if (cxl_err_type < 0) {
1077         error_setg(errp, "Invalid COR error");
1078         return;
1079     }
1080     /* If the error is masked, nothting to do here */
1081     if (!((1 << cxl_err_type) & ~ldl_le_p(reg_state + R_CXL_RAS_COR_ERR_MASK))) {
1082         return;
1083     }
1084 
1085     cor_err |= (1 << cxl_err_type);
1086     stl_le_p(reg_state + R_CXL_RAS_COR_ERR_STATUS, cor_err);
1087 
1088     pcie_aer_inject_error(PCI_DEVICE(obj), &err);
1089 }
1090 
1091 static void ct3_class_init(ObjectClass *oc, void *data)
1092 {
1093     DeviceClass *dc = DEVICE_CLASS(oc);
1094     PCIDeviceClass *pc = PCI_DEVICE_CLASS(oc);
1095     CXLType3Class *cvc = CXL_TYPE3_CLASS(oc);
1096 
1097     pc->realize = ct3_realize;
1098     pc->exit = ct3_exit;
1099     pc->class_id = PCI_CLASS_MEMORY_CXL;
1100     pc->vendor_id = PCI_VENDOR_ID_INTEL;
1101     pc->device_id = 0xd93; /* LVF for now */
1102     pc->revision = 1;
1103 
1104     pc->config_write = ct3d_config_write;
1105     pc->config_read = ct3d_config_read;
1106 
1107     set_bit(DEVICE_CATEGORY_STORAGE, dc->categories);
1108     dc->desc = "CXL Memory Device (Type 3)";
1109     dc->reset = ct3d_reset;
1110     device_class_set_props(dc, ct3_props);
1111 
1112     cvc->get_lsa_size = get_lsa_size;
1113     cvc->get_lsa = get_lsa;
1114     cvc->set_lsa = set_lsa;
1115 }
1116 
1117 static const TypeInfo ct3d_info = {
1118     .name = TYPE_CXL_TYPE3,
1119     .parent = TYPE_PCI_DEVICE,
1120     .class_size = sizeof(struct CXLType3Class),
1121     .class_init = ct3_class_init,
1122     .instance_size = sizeof(CXLType3Dev),
1123     .interfaces = (InterfaceInfo[]) {
1124         { INTERFACE_CXL_DEVICE },
1125         { INTERFACE_PCIE_DEVICE },
1126         {}
1127     },
1128 };
1129 
1130 static void ct3d_registers(void)
1131 {
1132     type_register_static(&ct3d_info);
1133 }
1134 
1135 type_init(ct3d_registers);
1136