xref: /qemu/hw/pci/msi.c (revision bf8d4924)
1 /*
2  * msi.c
3  *
4  * Copyright (c) 2010 Isaku Yamahata <yamahata at valinux co jp>
5  *                    VA Linux Systems Japan K.K.
6  *
7  * This program is free software; you can redistribute it and/or modify
8  * it under the terms of the GNU General Public License as published by
9  * the Free Software Foundation; either version 2 of the License, or
10  * (at your option) any later version.
11 
12  * This program is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15  * GNU General Public License for more details.
16 
17  * You should have received a copy of the GNU General Public License along
18  * with this program; if not, see <http://www.gnu.org/licenses/>.
19  */
20 
21 #include "qemu/osdep.h"
22 #include "hw/pci/msi.h"
23 #include "hw/xen/xen.h"
24 #include "qemu/range.h"
25 
26 /* PCI_MSI_ADDRESS_LO */
27 #define PCI_MSI_ADDRESS_LO_MASK         (~0x3)
28 
29 /* If we get rid of cap allocator, we won't need those. */
30 #define PCI_MSI_32_SIZEOF       0x0a
31 #define PCI_MSI_64_SIZEOF       0x0e
32 #define PCI_MSI_32M_SIZEOF      0x14
33 #define PCI_MSI_64M_SIZEOF      0x18
34 
35 #define PCI_MSI_VECTORS_MAX     32
36 
37 /*
38  * Flag for interrupt controllers to declare broken MSI/MSI-X support.
39  * values: false - broken; true - non-broken.
40  *
41  * Setting this flag to false will remove MSI/MSI-X capability from all devices.
42  *
43  * It is preferable for controllers to set this to true (non-broken) even if
44  * they do not actually support MSI/MSI-X: guests normally probe the controller
45  * type and do not attempt to enable MSI/MSI-X with interrupt controllers not
46  * supporting such, so removing the capability is not required, and
47  * it seems cleaner to have a given device look the same for all boards.
48  *
49  * TODO: some existing controllers violate the above rule. Identify and fix them.
50  */
51 bool msi_nonbroken;
52 
53 /* If we get rid of cap allocator, we won't need this. */
54 static inline uint8_t msi_cap_sizeof(uint16_t flags)
55 {
56     switch (flags & (PCI_MSI_FLAGS_MASKBIT | PCI_MSI_FLAGS_64BIT)) {
57     case PCI_MSI_FLAGS_MASKBIT | PCI_MSI_FLAGS_64BIT:
58         return PCI_MSI_64M_SIZEOF;
59     case PCI_MSI_FLAGS_64BIT:
60         return PCI_MSI_64_SIZEOF;
61     case PCI_MSI_FLAGS_MASKBIT:
62         return PCI_MSI_32M_SIZEOF;
63     case 0:
64         return PCI_MSI_32_SIZEOF;
65     default:
66         abort();
67         break;
68     }
69     return 0;
70 }
71 
72 //#define MSI_DEBUG
73 
74 #ifdef MSI_DEBUG
75 # define MSI_DPRINTF(fmt, ...)                                          \
76     fprintf(stderr, "%s:%d " fmt, __func__, __LINE__, ## __VA_ARGS__)
77 #else
78 # define MSI_DPRINTF(fmt, ...)  do { } while (0)
79 #endif
80 #define MSI_DEV_PRINTF(dev, fmt, ...)                                   \
81     MSI_DPRINTF("%s:%x " fmt, (dev)->name, (dev)->devfn, ## __VA_ARGS__)
82 
83 static inline unsigned int msi_nr_vectors(uint16_t flags)
84 {
85     return 1U <<
86         ((flags & PCI_MSI_FLAGS_QSIZE) >> ctz32(PCI_MSI_FLAGS_QSIZE));
87 }
88 
89 static inline uint8_t msi_flags_off(const PCIDevice* dev)
90 {
91     return dev->msi_cap + PCI_MSI_FLAGS;
92 }
93 
94 static inline uint8_t msi_address_lo_off(const PCIDevice* dev)
95 {
96     return dev->msi_cap + PCI_MSI_ADDRESS_LO;
97 }
98 
99 static inline uint8_t msi_address_hi_off(const PCIDevice* dev)
100 {
101     return dev->msi_cap + PCI_MSI_ADDRESS_HI;
102 }
103 
104 static inline uint8_t msi_data_off(const PCIDevice* dev, bool msi64bit)
105 {
106     return dev->msi_cap + (msi64bit ? PCI_MSI_DATA_64 : PCI_MSI_DATA_32);
107 }
108 
109 static inline uint8_t msi_mask_off(const PCIDevice* dev, bool msi64bit)
110 {
111     return dev->msi_cap + (msi64bit ? PCI_MSI_MASK_64 : PCI_MSI_MASK_32);
112 }
113 
114 static inline uint8_t msi_pending_off(const PCIDevice* dev, bool msi64bit)
115 {
116     return dev->msi_cap + (msi64bit ? PCI_MSI_PENDING_64 : PCI_MSI_PENDING_32);
117 }
118 
119 /*
120  * Special API for POWER to configure the vectors through
121  * a side channel. Should never be used by devices.
122  */
123 void msi_set_message(PCIDevice *dev, MSIMessage msg)
124 {
125     uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev));
126     bool msi64bit = flags & PCI_MSI_FLAGS_64BIT;
127 
128     if (msi64bit) {
129         pci_set_quad(dev->config + msi_address_lo_off(dev), msg.address);
130     } else {
131         pci_set_long(dev->config + msi_address_lo_off(dev), msg.address);
132     }
133     pci_set_word(dev->config + msi_data_off(dev, msi64bit), msg.data);
134 }
135 
136 MSIMessage msi_get_message(PCIDevice *dev, unsigned int vector)
137 {
138     uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev));
139     bool msi64bit = flags & PCI_MSI_FLAGS_64BIT;
140     unsigned int nr_vectors = msi_nr_vectors(flags);
141     MSIMessage msg;
142 
143     assert(vector < nr_vectors);
144 
145     if (msi64bit) {
146         msg.address = pci_get_quad(dev->config + msi_address_lo_off(dev));
147     } else {
148         msg.address = pci_get_long(dev->config + msi_address_lo_off(dev));
149     }
150 
151     /* upper bit 31:16 is zero */
152     msg.data = pci_get_word(dev->config + msi_data_off(dev, msi64bit));
153     if (nr_vectors > 1) {
154         msg.data &= ~(nr_vectors - 1);
155         msg.data |= vector;
156     }
157 
158     return msg;
159 }
160 
161 bool msi_enabled(const PCIDevice *dev)
162 {
163     return msi_present(dev) &&
164         (pci_get_word(dev->config + msi_flags_off(dev)) &
165          PCI_MSI_FLAGS_ENABLE);
166 }
167 
168 /*
169  * Make PCI device @dev MSI-capable.
170  * Non-zero @offset puts capability MSI at that offset in PCI config
171  * space.
172  * @nr_vectors is the number of MSI vectors (1, 2, 4, 8, 16 or 32).
173  * If @msi64bit, make the device capable of sending a 64-bit message
174  * address.
175  * If @msi_per_vector_mask, make the device support per-vector masking.
176  * Return 0 on success, return -errno on error.
177  *
178  * -ENOTSUP means lacking msi support for a msi-capable platform.
179  * -EINVAL means capability overlap, happens when @offset is non-zero,
180  *  also means a programming error, except device assignment, which can check
181  *  if a real HW is broken.
182  */
183 int msi_init(struct PCIDevice *dev, uint8_t offset,
184              unsigned int nr_vectors, bool msi64bit, bool msi_per_vector_mask)
185 {
186     unsigned int vectors_order;
187     uint16_t flags;
188     uint8_t cap_size;
189     int config_offset;
190 
191     if (!msi_nonbroken) {
192         return -ENOTSUP;
193     }
194 
195     MSI_DEV_PRINTF(dev,
196                    "init offset: 0x%"PRIx8" vector: %"PRId8
197                    " 64bit %d mask %d\n",
198                    offset, nr_vectors, msi64bit, msi_per_vector_mask);
199 
200     assert(!(nr_vectors & (nr_vectors - 1)));   /* power of 2 */
201     assert(nr_vectors > 0);
202     assert(nr_vectors <= PCI_MSI_VECTORS_MAX);
203     /* the nr of MSI vectors is up to 32 */
204     vectors_order = ctz32(nr_vectors);
205 
206     flags = vectors_order << ctz32(PCI_MSI_FLAGS_QMASK);
207     if (msi64bit) {
208         flags |= PCI_MSI_FLAGS_64BIT;
209     }
210     if (msi_per_vector_mask) {
211         flags |= PCI_MSI_FLAGS_MASKBIT;
212     }
213 
214     cap_size = msi_cap_sizeof(flags);
215     config_offset = pci_add_capability(dev, PCI_CAP_ID_MSI, offset, cap_size);
216     if (config_offset < 0) {
217         return config_offset;
218     }
219 
220     dev->msi_cap = config_offset;
221     dev->cap_present |= QEMU_PCI_CAP_MSI;
222 
223     pci_set_word(dev->config + msi_flags_off(dev), flags);
224     pci_set_word(dev->wmask + msi_flags_off(dev),
225                  PCI_MSI_FLAGS_QSIZE | PCI_MSI_FLAGS_ENABLE);
226     pci_set_long(dev->wmask + msi_address_lo_off(dev),
227                  PCI_MSI_ADDRESS_LO_MASK);
228     if (msi64bit) {
229         pci_set_long(dev->wmask + msi_address_hi_off(dev), 0xffffffff);
230     }
231     pci_set_word(dev->wmask + msi_data_off(dev, msi64bit), 0xffff);
232 
233     if (msi_per_vector_mask) {
234         /* Make mask bits 0 to nr_vectors - 1 writable. */
235         pci_set_long(dev->wmask + msi_mask_off(dev, msi64bit),
236                      0xffffffff >> (PCI_MSI_VECTORS_MAX - nr_vectors));
237     }
238 
239     return 0;
240 }
241 
242 void msi_uninit(struct PCIDevice *dev)
243 {
244     uint16_t flags;
245     uint8_t cap_size;
246 
247     if (!msi_present(dev)) {
248         return;
249     }
250     flags = pci_get_word(dev->config + msi_flags_off(dev));
251     cap_size = msi_cap_sizeof(flags);
252     pci_del_capability(dev, PCI_CAP_ID_MSI, cap_size);
253     dev->cap_present &= ~QEMU_PCI_CAP_MSI;
254 
255     MSI_DEV_PRINTF(dev, "uninit\n");
256 }
257 
258 void msi_reset(PCIDevice *dev)
259 {
260     uint16_t flags;
261     bool msi64bit;
262 
263     if (!msi_present(dev)) {
264         return;
265     }
266 
267     flags = pci_get_word(dev->config + msi_flags_off(dev));
268     flags &= ~(PCI_MSI_FLAGS_QSIZE | PCI_MSI_FLAGS_ENABLE);
269     msi64bit = flags & PCI_MSI_FLAGS_64BIT;
270 
271     pci_set_word(dev->config + msi_flags_off(dev), flags);
272     pci_set_long(dev->config + msi_address_lo_off(dev), 0);
273     if (msi64bit) {
274         pci_set_long(dev->config + msi_address_hi_off(dev), 0);
275     }
276     pci_set_word(dev->config + msi_data_off(dev, msi64bit), 0);
277     if (flags & PCI_MSI_FLAGS_MASKBIT) {
278         pci_set_long(dev->config + msi_mask_off(dev, msi64bit), 0);
279         pci_set_long(dev->config + msi_pending_off(dev, msi64bit), 0);
280     }
281     MSI_DEV_PRINTF(dev, "reset\n");
282 }
283 
284 static bool msi_is_masked(const PCIDevice *dev, unsigned int vector)
285 {
286     uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev));
287     uint32_t mask, data;
288     bool msi64bit = flags & PCI_MSI_FLAGS_64BIT;
289     assert(vector < PCI_MSI_VECTORS_MAX);
290 
291     if (!(flags & PCI_MSI_FLAGS_MASKBIT)) {
292         return false;
293     }
294 
295     data = pci_get_word(dev->config + msi_data_off(dev, msi64bit));
296     if (xen_is_pirq_msi(data)) {
297         return false;
298     }
299 
300     mask = pci_get_long(dev->config +
301                         msi_mask_off(dev, flags & PCI_MSI_FLAGS_64BIT));
302     return mask & (1U << vector);
303 }
304 
305 void msi_notify(PCIDevice *dev, unsigned int vector)
306 {
307     uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev));
308     bool msi64bit = flags & PCI_MSI_FLAGS_64BIT;
309     unsigned int nr_vectors = msi_nr_vectors(flags);
310     MSIMessage msg;
311 
312     assert(vector < nr_vectors);
313     if (msi_is_masked(dev, vector)) {
314         assert(flags & PCI_MSI_FLAGS_MASKBIT);
315         pci_long_test_and_set_mask(
316             dev->config + msi_pending_off(dev, msi64bit), 1U << vector);
317         MSI_DEV_PRINTF(dev, "pending vector 0x%x\n", vector);
318         return;
319     }
320 
321     msg = msi_get_message(dev, vector);
322 
323     MSI_DEV_PRINTF(dev,
324                    "notify vector 0x%x"
325                    " address: 0x%"PRIx64" data: 0x%"PRIx32"\n",
326                    vector, msg.address, msg.data);
327     msi_send_message(dev, msg);
328 }
329 
330 void msi_send_message(PCIDevice *dev, MSIMessage msg)
331 {
332     MemTxAttrs attrs = {};
333 
334     attrs.requester_id = pci_requester_id(dev);
335     address_space_stl_le(&dev->bus_master_as, msg.address, msg.data,
336                          attrs, NULL);
337 }
338 
339 /* Normally called by pci_default_write_config(). */
340 void msi_write_config(PCIDevice *dev, uint32_t addr, uint32_t val, int len)
341 {
342     uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev));
343     bool msi64bit = flags & PCI_MSI_FLAGS_64BIT;
344     bool msi_per_vector_mask = flags & PCI_MSI_FLAGS_MASKBIT;
345     unsigned int nr_vectors;
346     uint8_t log_num_vecs;
347     uint8_t log_max_vecs;
348     unsigned int vector;
349     uint32_t pending;
350 
351     if (!msi_present(dev) ||
352         !ranges_overlap(addr, len, dev->msi_cap, msi_cap_sizeof(flags))) {
353         return;
354     }
355 
356 #ifdef MSI_DEBUG
357     MSI_DEV_PRINTF(dev, "addr 0x%"PRIx32" val 0x%"PRIx32" len %d\n",
358                    addr, val, len);
359     MSI_DEV_PRINTF(dev, "ctrl: 0x%"PRIx16" address: 0x%"PRIx32,
360                    flags,
361                    pci_get_long(dev->config + msi_address_lo_off(dev)));
362     if (msi64bit) {
363         fprintf(stderr, " address-hi: 0x%"PRIx32,
364                 pci_get_long(dev->config + msi_address_hi_off(dev)));
365     }
366     fprintf(stderr, " data: 0x%"PRIx16,
367             pci_get_word(dev->config + msi_data_off(dev, msi64bit)));
368     if (flags & PCI_MSI_FLAGS_MASKBIT) {
369         fprintf(stderr, " mask 0x%"PRIx32" pending 0x%"PRIx32,
370                 pci_get_long(dev->config + msi_mask_off(dev, msi64bit)),
371                 pci_get_long(dev->config + msi_pending_off(dev, msi64bit)));
372     }
373     fprintf(stderr, "\n");
374 #endif
375 
376     if (!(flags & PCI_MSI_FLAGS_ENABLE)) {
377         return;
378     }
379 
380     /*
381      * Now MSI is enabled, clear INTx# interrupts.
382      * the driver is prohibited from writing enable bit to mask
383      * a service request. But the guest OS could do this.
384      * So we just discard the interrupts as moderate fallback.
385      *
386      * 6.8.3.3. Enabling Operation
387      *   While enabled for MSI or MSI-X operation, a function is prohibited
388      *   from using its INTx# pin (if implemented) to request
389      *   service (MSI, MSI-X, and INTx# are mutually exclusive).
390      */
391     pci_device_deassert_intx(dev);
392 
393     /*
394      * nr_vectors might be set bigger than capable. So clamp it.
395      * This is not legal by spec, so we can do anything we like,
396      * just don't crash the host
397      */
398     log_num_vecs =
399         (flags & PCI_MSI_FLAGS_QSIZE) >> ctz32(PCI_MSI_FLAGS_QSIZE);
400     log_max_vecs =
401         (flags & PCI_MSI_FLAGS_QMASK) >> ctz32(PCI_MSI_FLAGS_QMASK);
402     if (log_num_vecs > log_max_vecs) {
403         flags &= ~PCI_MSI_FLAGS_QSIZE;
404         flags |= log_max_vecs << ctz32(PCI_MSI_FLAGS_QSIZE);
405         pci_set_word(dev->config + msi_flags_off(dev), flags);
406     }
407 
408     if (!msi_per_vector_mask) {
409         /* if per vector masking isn't supported,
410            there is no pending interrupt. */
411         return;
412     }
413 
414     nr_vectors = msi_nr_vectors(flags);
415 
416     /* This will discard pending interrupts, if any. */
417     pending = pci_get_long(dev->config + msi_pending_off(dev, msi64bit));
418     pending &= 0xffffffff >> (PCI_MSI_VECTORS_MAX - nr_vectors);
419     pci_set_long(dev->config + msi_pending_off(dev, msi64bit), pending);
420 
421     /* deliver pending interrupts which are unmasked */
422     for (vector = 0; vector < nr_vectors; ++vector) {
423         if (msi_is_masked(dev, vector) || !(pending & (1U << vector))) {
424             continue;
425         }
426 
427         pci_long_test_and_clear_mask(
428             dev->config + msi_pending_off(dev, msi64bit), 1U << vector);
429         msi_notify(dev, vector);
430     }
431 }
432 
433 unsigned int msi_nr_vectors_allocated(const PCIDevice *dev)
434 {
435     uint16_t flags = pci_get_word(dev->config + msi_flags_off(dev));
436     return msi_nr_vectors(flags);
437 }
438