2 * QEMU rocker switch emulation - PCI device
4 * Copyright (c) 2014 Scott Feldman <sfeldma@gmail.com>
5 * Copyright (c) 2014 Jiri Pirko <jiri@resnulli.us>
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version 2 of the License, or
10 * (at your option) any later version.
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
18 #include "qemu/osdep.h"
20 #include "hw/pci/pci.h"
21 #include "hw/pci/msix.h"
25 #include "qemu/bitops.h"
26 #include "qmp-commands.h"
29 #include "rocker_hw.h"
30 #include "rocker_fp.h"
31 #include "rocker_desc.h"
32 #include "rocker_tlv.h"
33 #include "rocker_world.h"
34 #include "rocker_of_dpa.h"
/*
 * Rocker device state: MSI-X BAR, user-configurable switch properties,
 * front-panel ports, register backings, worlds and list linkage.
 * (Excerpt: not every member of the structure is visible here.)
 */
/* memory region registered as the MSI-X BAR in pci_rocker_init() */
42 MemoryRegion msix_bar;
44 /* switch configuration */
45 char *name; /* switch name */
46 char *world_name; /* world name */
47 uint32_t fp_ports; /* front-panel port count */
/* peers array filled in by the "ports" array property */
48 NICPeers *fp_ports_peers;
49 MACAddr fp_start_macaddr; /* front-panel port 0 mac addr */
50 uint64_t switch_id; /* switch id */
52 /* front-panel ports */
53 FpPort *fp_port[ROCKER_FP_PORTS_MAX];
55 /* register backings */
/* backings for the ROCKER_TEST_DMA_ADDR / ROCKER_TEST_DMA_SIZE registers */
58 dma_addr_t test_dma_addr;
59 uint32_t test_dma_size;
60 uint64_t lower32; /* lower 32-bit val in 2-part 64-bit access */
/* one slot per enum rocker_world_type value */
66 World *worlds[ROCKER_WORLD_TYPE_MAX];
/* linkage in the file-level "rockers" list */
69 QLIST_ENTRY(rocker) next;
/* Type name string; also assigned to r->name in pci_rocker_init(). */
72 #define ROCKER "rocker"
/* Checked cast (OBJECT_CHECK) from an object pointer to Rocker. */
74 #define to_rocker(obj) \
75 OBJECT_CHECK(Rocker, (obj), ROCKER)
/* List of rocker devices; filled by pci_rocker_init(), searched by
 * rocker_find(), emptied by pci_rocker_uninit(). */
77 static QLIST_HEAD(, rocker) rockers;
/*
 * Look up a rocker switch by name.
 *
 * Walks the file-level "rockers" list and compares each entry's name with
 * @name using strcmp().  Callers in this file treat a false (NULL) result
 * as "not found"; the return statements themselves are not visible in this
 * excerpt.
 */
79 Rocker *rocker_find(const char *name)
83 QLIST_FOREACH(r, &rockers, next)
84 if (strcmp(r->name, name) == 0) {
/*
 * Return the world of the requested @type for switch @r.
 *
 * r->worlds[] is only indexed when @type is below ROCKER_WORLD_TYPE_MAX;
 * the result for an out-of-range type is not visible in this excerpt.
 */
91 World *rocker_get_world(Rocker *r, enum rocker_world_type type)
93 if (type < ROCKER_WORLD_TYPE_MAX) {
94 return r->worlds[type];
/*
 * QMP query handler: describe the rocker switch called @name.
 *
 * Looks the switch up with rocker_find() and reports
 * "rocker %s not found" through @errp on the failure path.  Otherwise a
 * zero-initialised RockerSwitch is allocated and filled with a copy of the
 * switch name, its switch id and its front-panel port count.
 */
99 RockerSwitch *qmp_query_rocker(const char *name, Error **errp)
101 RockerSwitch *rocker;
104 r = rocker_find(name);
106 error_setg(errp, "rocker %s not found", name);
110 rocker = g_new0(RockerSwitch, 1);
/* the name is duplicated, so the result does not alias r->name */
111 rocker->name = g_strdup(r->name);
112 rocker->id = r->switch_id;
113 rocker->ports = r->fp_ports;
/*
 * QMP query handler: list the front-panel ports of the switch @name.
 *
 * Reports "rocker %s not found" through @errp when the lookup fails.
 * Ports are visited from the highest index down to 0; for each one a
 * zeroed list node and a zeroed value are allocated and handed to
 * fp_port_get_info().  How nodes are linked into @list is not visible in
 * this excerpt.
 */
118 RockerPortList *qmp_query_rocker_ports(const char *name, Error **errp)
120 RockerPortList *list = NULL;
124 r = rocker_find(name);
126 error_setg(errp, "rocker %s not found", name);
/* NOTE(review): relies on i being a signed type for "i >= 0" to terminate */
130 for (i = r->fp_ports - 1; i >= 0; i--) {
131 RockerPortList *info = g_malloc0(sizeof(*info));
132 info->value = g_malloc0(sizeof(*info->value));
133 struct fp_port *port = r->fp_port[i];
135 fp_port_get_info(port, info);
/*
 * Accessor taking a Rocker and returning a uint32_t; presumably the
 * front-panel port count (body not visible in this excerpt - TODO confirm).
 */
143 uint32_t rocker_fp_ports(Rocker *r)
/*
 * Map a tx descriptor ring to its 1-based physical port number.
 *
 * Ring index 2 maps to pport 1, index 4 to pport 2, and so on
 * (integer division, so no check is made here that the index is even).
 */
148 static uint32_t rocker_get_pport_by_tx_ring(Rocker *r,
151 return (desc_ring_index(ring) - 2) / 2 + 1;
/*
 * Consume one tx descriptor: parse its TLVs, DMA-read every fragment from
 * guest memory into a local iovec and hand the packet to the egress port.
 *
 * Returns 0 or a negative ROCKER_E* code:
 *   -ROCKER_ENXIO   on the early failure path right after desc_get_buf()
 *   -ROCKER_EINVAL  missing FRAGS TLV, bad pport, missing offload
 *                   parameters, or a malformed fragment TLV
 *   -ROCKER_ENOMEM  fragment buffer allocation returned NULL
 * Otherwise the result of fp_port_eg() is stored in err.
 */
154 static int tx_consume(Rocker *r, DescInfo *info)
156 PCIDevice *dev = PCI_DEVICE(r);
157 char *buf = desc_get_buf(info, true);
159 RockerTlv *tlvs[ROCKER_TLV_TX_MAX + 1];
/* zero-initialised so the cleanup loop can free unused slots safely */
160 struct iovec iov[ROCKER_TX_FRAGS_MAX] = { { 0, }, };
163 uint16_t tx_offload = ROCKER_TX_OFFLOAD_NONE;
164 uint16_t tx_l3_csum_off = 0;
165 uint16_t tx_tso_mss = 0;
166 uint16_t tx_tso_hdr_len = 0;
173 return -ROCKER_ENXIO;
176 rocker_tlv_parse(tlvs, ROCKER_TLV_TX_MAX, buf, desc_tlv_size(info));
/* a tx descriptor without fragments carries no packet */
178 if (!tlvs[ROCKER_TLV_TX_FRAGS]) {
179 return -ROCKER_EINVAL;
/* the destination port is implied by which tx ring the descriptor is on */
182 pport = rocker_get_pport_by_tx_ring(r, desc_get_ring(info));
183 if (!fp_port_from_pport(pport, &port)) {
184 return -ROCKER_EINVAL;
187 if (tlvs[ROCKER_TLV_TX_OFFLOAD]) {
188 tx_offload = rocker_tlv_get_u8(tlvs[ROCKER_TLV_TX_OFFLOAD]);
/* each offload mode requires its own parameter TLVs to be present */
191 switch (tx_offload) {
192 case ROCKER_TX_OFFLOAD_L3_CSUM:
193 if (!tlvs[ROCKER_TLV_TX_L3_CSUM_OFF]) {
194 return -ROCKER_EINVAL;
197 case ROCKER_TX_OFFLOAD_TSO:
198 if (!tlvs[ROCKER_TLV_TX_TSO_MSS] ||
199 !tlvs[ROCKER_TLV_TX_TSO_HDR_LEN]) {
200 return -ROCKER_EINVAL;
/*
 * Offload parameters are read before the fragment loop: that loop reuses
 * tlvs[] for the nested fragment attributes.
 */
205 if (tlvs[ROCKER_TLV_TX_L3_CSUM_OFF]) {
206 tx_l3_csum_off = rocker_tlv_get_le16(tlvs[ROCKER_TLV_TX_L3_CSUM_OFF]);
209 if (tlvs[ROCKER_TLV_TX_TSO_MSS]) {
210 tx_tso_mss = rocker_tlv_get_le16(tlvs[ROCKER_TLV_TX_TSO_MSS]);
213 if (tlvs[ROCKER_TLV_TX_TSO_HDR_LEN]) {
214 tx_tso_hdr_len = rocker_tlv_get_le16(tlvs[ROCKER_TLV_TX_TSO_HDR_LEN]);
217 rocker_tlv_for_each_nested(tlv_frag, tlvs[ROCKER_TLV_TX_FRAGS], rem) {
221 if (rocker_tlv_type(tlv_frag) != ROCKER_TLV_TX_FRAG) {
222 err = -ROCKER_EINVAL;
226 rocker_tlv_parse_nested(tlvs, ROCKER_TLV_TX_FRAG_ATTR_MAX, tlv_frag);
228 if (!tlvs[ROCKER_TLV_TX_FRAG_ATTR_ADDR] ||
229 !tlvs[ROCKER_TLV_TX_FRAG_ATTR_LEN]) {
230 err = -ROCKER_EINVAL;
234 frag_addr = rocker_tlv_get_le64(tlvs[ROCKER_TLV_TX_FRAG_ATTR_ADDR]);
235 frag_len = rocker_tlv_get_le16(tlvs[ROCKER_TLV_TX_FRAG_ATTR_LEN]);
/*
 * Bounds check comes before iov[] is written.
 * NOTE(review): no error code is assigned on this path in the visible
 * lines - confirm the caller is told the packet was dropped.
 */
237 if (iovcnt >= ROCKER_TX_FRAGS_MAX) {
238 goto err_too_many_frags;
240 iov[iovcnt].iov_len = frag_len;
241 iov[iovcnt].iov_base = g_malloc(frag_len);
/*
 * NOTE(review): g_malloc() aborts on allocation failure and returns NULL
 * only for a zero-byte request, so this branch appears to trigger for
 * zero-length fragments rather than for out-of-memory - confirm.
 */
242 if (!iov[iovcnt].iov_base) {
243 err = -ROCKER_ENOMEM;
247 if (pci_dma_read(dev, frag_addr, iov[iovcnt].iov_base,
248 iov[iovcnt].iov_len)) {
256 /* XXX perform Tx offloads */
257 /* XXX silence compiler for now */
258 tx_l3_csum_off += tx_tso_mss = tx_tso_hdr_len = 0;
261 err = fp_port_eg(r->fp_port[port], iov, iovcnt);
/* frees every slot; unused ones are NULL and g_free(NULL) is a no-op */
267 for (i = 0; i < ROCKER_TX_FRAGS_MAX; i++) {
268 g_free(iov[i].iov_base);
/*
 * Handle the GET_PORT_SETTINGS command.
 *
 * Parses the nested command TLVs, resolves the requested pport to a
 * front-panel port, gathers its settings and writes them back into @buf
 * as a ROCKER_TLV_CMD_INFO nest.
 *
 * Returns -ROCKER_EINVAL when the PPORT TLV is missing or does not map to
 * a port, -ROCKER_EMSGSIZE when the reply does not fit the descriptor
 * buffer, otherwise the result of desc_set_buf().
 */
274 static int cmd_get_port_settings(Rocker *r,
275 DescInfo *info, char *buf,
276 RockerTlv *cmd_info_tlv)
278 RockerTlv *tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_MAX + 1];
289 enum rocker_world_type mode;
294 rocker_tlv_parse_nested(tlvs, ROCKER_TLV_CMD_PORT_SETTINGS_MAX,
297 if (!tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_PPORT]) {
298 return -ROCKER_EINVAL;
301 pport = rocker_tlv_get_le32(tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_PPORT]);
302 if (!fp_port_from_pport(pport, &port)) {
303 return -ROCKER_EINVAL;
305 fp_port = r->fp_port[port];
307 err = fp_port_get_settings(fp_port, &speed, &duplex, &autoneg);
312 fp_port_get_macaddr(fp_port, &macaddr);
313 mode = world_type(fp_port_get_world(fp_port));
314 learning = fp_port_get_learning(fp_port);
315 phys_name = fp_port_get_name(fp_port);
/* size budget: one term per TLV emitted below, in the same order */
317 tlv_size = rocker_tlv_total_size(0) + /* nest */
318 rocker_tlv_total_size(sizeof(uint32_t)) + /* pport */
319 rocker_tlv_total_size(sizeof(uint32_t)) + /* speed */
320 rocker_tlv_total_size(sizeof(uint8_t)) + /* duplex */
321 rocker_tlv_total_size(sizeof(uint8_t)) + /* autoneg */
322 rocker_tlv_total_size(sizeof(macaddr.a)) + /* macaddr */
323 rocker_tlv_total_size(sizeof(uint8_t)) + /* mode */
324 rocker_tlv_total_size(sizeof(uint8_t)) + /* learning */
325 rocker_tlv_total_size(strlen(phys_name));
327 if (tlv_size > desc_buf_size(info)) {
328 return -ROCKER_EMSGSIZE;
332 nest = rocker_tlv_nest_start(buf, &pos, ROCKER_TLV_CMD_INFO);
333 rocker_tlv_put_le32(buf, &pos, ROCKER_TLV_CMD_PORT_SETTINGS_PPORT, pport);
334 rocker_tlv_put_le32(buf, &pos, ROCKER_TLV_CMD_PORT_SETTINGS_SPEED, speed);
335 rocker_tlv_put_u8(buf, &pos, ROCKER_TLV_CMD_PORT_SETTINGS_DUPLEX, duplex);
336 rocker_tlv_put_u8(buf, &pos, ROCKER_TLV_CMD_PORT_SETTINGS_AUTONEG, autoneg);
337 rocker_tlv_put(buf, &pos, ROCKER_TLV_CMD_PORT_SETTINGS_MACADDR,
338 sizeof(macaddr.a), macaddr.a);
339 rocker_tlv_put_u8(buf, &pos, ROCKER_TLV_CMD_PORT_SETTINGS_MODE, mode);
340 rocker_tlv_put_u8(buf, &pos, ROCKER_TLV_CMD_PORT_SETTINGS_LEARNING,
/* the name is written with strlen() bytes, i.e. without its NUL terminator */
342 rocker_tlv_put(buf, &pos, ROCKER_TLV_CMD_PORT_SETTINGS_PHYS_NAME,
343 strlen(phys_name), phys_name);
344 rocker_tlv_nest_end(buf, &pos, nest);
346 return desc_set_buf(info, tlv_size);
/*
 * Handle the SET_PORT_SETTINGS command.
 *
 * The PPORT TLV is mandatory and must map to a front-panel port; every
 * other setting is applied only when its TLV is present.  Returns
 * -ROCKER_EINVAL for a missing/invalid pport, a MAC address TLV that
 * fails the length check, an out-of-range mode, or a mode that differs
 * from the port's current world.
 */
349 static int cmd_set_port_settings(Rocker *r,
350 RockerTlv *cmd_info_tlv)
352 RockerTlv *tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_MAX + 1];
361 enum rocker_world_type mode;
364 rocker_tlv_parse_nested(tlvs, ROCKER_TLV_CMD_PORT_SETTINGS_MAX,
367 if (!tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_PPORT]) {
368 return -ROCKER_EINVAL;
371 pport = rocker_tlv_get_le32(tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_PPORT]);
372 if (!fp_port_from_pport(pport, &port)) {
373 return -ROCKER_EINVAL;
375 fp_port = r->fp_port[port];
/* speed, duplex and autoneg are only applied when all three are supplied */
377 if (tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_SPEED] &&
378 tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_DUPLEX] &&
379 tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_AUTONEG]) {
381 speed = rocker_tlv_get_le32(tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_SPEED]);
382 duplex = rocker_tlv_get_u8(tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_DUPLEX]);
383 autoneg = rocker_tlv_get_u8(tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_AUTONEG]);
385 err = fp_port_set_settings(fp_port, speed, duplex, autoneg);
391 if (tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_MACADDR]) {
/* the TLV payload length is checked before the address is used */
392 if (rocker_tlv_len(tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_MACADDR]) !=
394 return -ROCKER_EINVAL;
397 rocker_tlv_data(tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_MACADDR]),
399 fp_port_set_macaddr(fp_port, &macaddr);
402 if (tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_MODE]) {
403 mode = rocker_tlv_get_u8(tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_MODE]);
/* range-check before mode is used as an index into r->worlds[] */
404 if (mode >= ROCKER_WORLD_TYPE_MAX) {
405 return -ROCKER_EINVAL;
407 /* We don't support world change. */
408 if (!fp_port_check_world(fp_port, r->worlds[mode])) {
409 return -ROCKER_EINVAL;
413 if (tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_LEARNING]) {
415 rocker_tlv_get_u8(tlvs[ROCKER_TLV_CMD_PORT_SETTINGS_LEARNING]);
416 fp_port_set_learning(fp_port, learning);
/*
 * Consume one descriptor from the command ring.
 *
 * Parses the top-level TLVs, requires both CMD_TYPE and CMD_INFO, then
 * dispatches on the command type: the OF-DPA flow/group commands go to
 * the OF-DPA world through world_do_cmd(), the port-settings commands to
 * cmd_get_port_settings() / cmd_set_port_settings().  The remaining
 * branch sets -ROCKER_EINVAL.  -ROCKER_ENXIO is returned on the early
 * failure path after desc_get_buf().
 */
422 static int cmd_consume(Rocker *r, DescInfo *info)
424 char *buf = desc_get_buf(info, false);
425 RockerTlv *tlvs[ROCKER_TLV_CMD_MAX + 1];
432 return -ROCKER_ENXIO;
435 rocker_tlv_parse(tlvs, ROCKER_TLV_CMD_MAX, buf, desc_tlv_size(info));
437 if (!tlvs[ROCKER_TLV_CMD_TYPE] || !tlvs[ROCKER_TLV_CMD_INFO]) {
438 return -ROCKER_EINVAL;
441 cmd = rocker_tlv_get_le16(tlvs[ROCKER_TLV_CMD_TYPE]);
442 info_tlv = tlvs[ROCKER_TLV_CMD_INFO];
444 /* This might be reworked to something like this:
445 * Every world will have an array of command handlers from
446 * ROCKER_TLV_CMD_TYPE_UNSPEC to ROCKER_TLV_CMD_TYPE_MAX. There is
447 * up to each world to implement whatever command it want.
448 * It can reference "generic" commands as cmd_set_port_settings or
449 * cmd_get_port_settings
453 case ROCKER_TLV_CMD_TYPE_OF_DPA_FLOW_ADD:
454 case ROCKER_TLV_CMD_TYPE_OF_DPA_FLOW_MOD:
455 case ROCKER_TLV_CMD_TYPE_OF_DPA_FLOW_DEL:
456 case ROCKER_TLV_CMD_TYPE_OF_DPA_FLOW_GET_STATS:
457 case ROCKER_TLV_CMD_TYPE_OF_DPA_GROUP_ADD:
458 case ROCKER_TLV_CMD_TYPE_OF_DPA_GROUP_MOD:
459 case ROCKER_TLV_CMD_TYPE_OF_DPA_GROUP_DEL:
460 case ROCKER_TLV_CMD_TYPE_OF_DPA_GROUP_GET_STATS:
461 world = r->worlds[ROCKER_WORLD_TYPE_OF_DPA];
462 err = world_do_cmd(world, info, buf, cmd, info_tlv);
464 case ROCKER_TLV_CMD_TYPE_GET_PORT_SETTINGS:
465 err = cmd_get_port_settings(r, info, buf, info_tlv);
467 case ROCKER_TLV_CMD_TYPE_SET_PORT_SETTINGS:
468 err = cmd_set_port_settings(r, info_tlv);
471 err = -ROCKER_EINVAL;
/*
 * Raise MSI-X @vector on the rocker PCI device.
 *
 * Vectors at or above ROCKER_MSIX_VEC_COUNT(r->fp_ports) are reported as
 * incorrect through DPRINTF; the statement that skips msix_notify() for
 * them is not visible in this excerpt.
 */
478 static void rocker_msix_irq(Rocker *r, unsigned vector)
480 PCIDevice *dev = PCI_DEVICE(r);
482 DPRINTF("MSI-X notify request for vector %d\n", vector);
483 if (vector >= ROCKER_MSIX_VEC_COUNT(r->fp_ports)) {
484 DPRINTF("incorrect vector %d\n", vector);
487 msix_notify(dev, vector);
/*
 * Post a LINK_CHANGED event for @pport on the event ring.
 *
 * Fetches a descriptor from the event ring, writes the event type plus a
 * nested info TLV (pport, link-up flag), then posts the descriptor and
 * raises the event MSI-X vector when desc_ring_post_desc() asks for it.
 *
 * Error codes seen in this function: -ROCKER_ENOBUFS, -ROCKER_EMSGSIZE
 * (descriptor buffer too small) and -ROCKER_ENOMEM; otherwise err is the
 * result of desc_set_buf().
 */
490 int rocker_event_link_changed(Rocker *r, uint32_t pport, bool link_up)
492 DescRing *ring = r->rings[ROCKER_RING_EVENT];
493 DescInfo *info = desc_ring_fetch_desc(ring);
501 return -ROCKER_ENOBUFS;
/*
 * NOTE(review): the event type is budgeted as uint16_t here but written
 * with rocker_tlv_put_le32() below - confirm the budget still covers it.
 */
504 tlv_size = rocker_tlv_total_size(sizeof(uint16_t)) + /* event type */
505 rocker_tlv_total_size(0) + /* nest */
506 rocker_tlv_total_size(sizeof(uint32_t)) + /* pport */
507 rocker_tlv_total_size(sizeof(uint8_t)); /* link up */
509 if (tlv_size > desc_buf_size(info)) {
510 err = -ROCKER_EMSGSIZE;
514 buf = desc_get_buf(info, false);
516 err = -ROCKER_ENOMEM;
521 rocker_tlv_put_le32(buf, &pos, ROCKER_TLV_EVENT_TYPE,
522 ROCKER_TLV_EVENT_TYPE_LINK_CHANGED);
523 nest = rocker_tlv_nest_start(buf, &pos, ROCKER_TLV_EVENT_INFO);
524 rocker_tlv_put_le32(buf, &pos, ROCKER_TLV_EVENT_LINK_CHANGED_PPORT, pport);
525 rocker_tlv_put_u8(buf, &pos, ROCKER_TLV_EVENT_LINK_CHANGED_LINKUP,
527 rocker_tlv_nest_end(buf, &pos, nest);
529 err = desc_set_buf(info, tlv_size);
/* the descriptor is posted with err as its completion status */
533 if (desc_ring_post_desc(ring, err)) {
534 rocker_msix_irq(r, ROCKER_MSIX_VEC_EVENT);
/*
 * Post a MAC_VLAN_SEEN event (pport, MAC address, VLAN id) on the event
 * ring.
 *
 * @pport must map to a front-panel port (-ROCKER_EINVAL otherwise).  The
 * port's learning flag is consulted before a descriptor is fetched; what
 * is returned when learning is off is not visible in this excerpt.
 * Other error codes seen here: -ROCKER_ENOBUFS, -ROCKER_EMSGSIZE and
 * -ROCKER_ENOMEM; otherwise err is the result of desc_set_buf().
 */
540 int rocker_event_mac_vlan_seen(Rocker *r, uint32_t pport, uint8_t *addr,
543 DescRing *ring = r->rings[ROCKER_RING_EVENT];
553 if (!fp_port_from_pport(pport, &port)) {
554 return -ROCKER_EINVAL;
556 fp_port = r->fp_port[port];
557 if (!fp_port_get_learning(fp_port)) {
561 info = desc_ring_fetch_desc(ring);
563 return -ROCKER_ENOBUFS;
/*
 * NOTE(review): the event type is budgeted as uint16_t here but written
 * with rocker_tlv_put_le32() below - confirm the budget still covers it.
 */
566 tlv_size = rocker_tlv_total_size(sizeof(uint16_t)) + /* event type */
567 rocker_tlv_total_size(0) + /* nest */
568 rocker_tlv_total_size(sizeof(uint32_t)) + /* pport */
569 rocker_tlv_total_size(ETH_ALEN) + /* mac addr */
570 rocker_tlv_total_size(sizeof(uint16_t)); /* vlan_id */
572 if (tlv_size > desc_buf_size(info)) {
573 err = -ROCKER_EMSGSIZE;
577 buf = desc_get_buf(info, false);
579 err = -ROCKER_ENOMEM;
584 rocker_tlv_put_le32(buf, &pos, ROCKER_TLV_EVENT_TYPE,
585 ROCKER_TLV_EVENT_TYPE_MAC_VLAN_SEEN);
586 nest = rocker_tlv_nest_start(buf, &pos, ROCKER_TLV_EVENT_INFO);
587 rocker_tlv_put_le32(buf, &pos, ROCKER_TLV_EVENT_MAC_VLAN_PPORT, pport);
588 rocker_tlv_put(buf, &pos, ROCKER_TLV_EVENT_MAC_VLAN_MAC, ETH_ALEN, addr);
/* vlan_id uses the plain u16 put, unlike the le32 puts above */
589 rocker_tlv_put_u16(buf, &pos, ROCKER_TLV_EVENT_MAC_VLAN_VLAN_ID, vlan_id);
590 rocker_tlv_nest_end(buf, &pos, nest);
592 err = desc_set_buf(info, tlv_size);
596 if (desc_ring_post_desc(ring, err)) {
597 rocker_msix_irq(r, ROCKER_MSIX_VEC_EVENT);
/*
 * Return the rx descriptor ring of a 1-based physical port:
 * pport 1 uses ring 3, pport 2 uses ring 5, and so on.
 * No range check on pport is performed in the visible code.
 */
603 static DescRing *rocker_get_rx_ring_by_pport(Rocker *r,
606 return r->rings[(pport - 1) * 2 + 3];
/*
 * Deliver a received packet to the guest on the rx ring of @pport.
 *
 * Fetches an rx descriptor, reads the guest-provided fragment address and
 * maximum length from it, copies the iovec into a temporary buffer,
 * DMA-writes it to the fragment address and rewrites the descriptor TLVs
 * (flags, csum, frag addr, frag max len, frag len).  The descriptor is
 * then posted and the port's rx MSI-X vector raised when
 * desc_ring_post_desc() asks for it.
 *
 * Error codes seen here: -ROCKER_ENOBUFS, -ROCKER_EINVAL (fragment TLVs
 * missing), -ROCKER_EMSGSIZE (packet larger than the fragment, or TLVs
 * larger than the descriptor buffer) and -ROCKER_ENOMEM.
 */
609 int rx_produce(World *world, uint32_t pport,
610 const struct iovec *iov, int iovcnt, uint8_t copy_to_cpu)
612 Rocker *r = world_rocker(world);
613 PCIDevice *dev = (PCIDevice *)r;
614 DescRing *ring = rocker_get_rx_ring_by_pport(r, pport);
615 DescInfo *info = desc_ring_fetch_desc(ring);
617 size_t data_size = iov_size(iov, iovcnt);
619 uint16_t rx_flags = 0;
620 uint16_t rx_csum = 0;
622 RockerTlv *tlvs[ROCKER_TLV_RX_MAX + 1];
624 uint16_t frag_max_len;
629 return -ROCKER_ENOBUFS;
632 buf = desc_get_buf(info, false);
637 rocker_tlv_parse(tlvs, ROCKER_TLV_RX_MAX, buf, desc_tlv_size(info));
/* the descriptor must say where the packet goes and how much room there is */
639 if (!tlvs[ROCKER_TLV_RX_FRAG_ADDR] ||
640 !tlvs[ROCKER_TLV_RX_FRAG_MAX_LEN]) {
641 err = -ROCKER_EINVAL;
645 frag_addr = rocker_tlv_get_le64(tlvs[ROCKER_TLV_RX_FRAG_ADDR]);
646 frag_max_len = rocker_tlv_get_le16(tlvs[ROCKER_TLV_RX_FRAG_MAX_LEN]);
648 if (data_size > frag_max_len) {
649 err = -ROCKER_EMSGSIZE;
654 rx_flags |= ROCKER_RX_FLAGS_FWD_OFFLOAD;
657 /* XXX calc rx flags/csum */
659 tlv_size = rocker_tlv_total_size(sizeof(uint16_t)) + /* flags */
660 rocker_tlv_total_size(sizeof(uint16_t)) + /* csum */
661 rocker_tlv_total_size(sizeof(uint64_t)) + /* frag addr */
662 rocker_tlv_total_size(sizeof(uint16_t)) + /* frag max len */
663 rocker_tlv_total_size(sizeof(uint16_t)); /* frag len */
665 if (tlv_size > desc_buf_size(info)) {
666 err = -ROCKER_EMSGSIZE;
671 * iov dma write can be optimized in similar way e1000 does it in
672 * e1000_receive_iov. But maybe if would make sense to introduce
673 * generic helper iov_dma_write.
/* the iovec is flattened into one bounce buffer before the DMA write */
676 data = g_malloc(data_size);
678 err = -ROCKER_ENOMEM;
681 iov_to_buf(iov, iovcnt, 0, data, data_size);
682 pci_dma_write(dev, frag_addr, data, data_size);
686 rocker_tlv_put_le16(buf, &pos, ROCKER_TLV_RX_FLAGS, rx_flags);
687 rocker_tlv_put_le16(buf, &pos, ROCKER_TLV_RX_CSUM, rx_csum);
688 rocker_tlv_put_le64(buf, &pos, ROCKER_TLV_RX_FRAG_ADDR, frag_addr);
689 rocker_tlv_put_le16(buf, &pos, ROCKER_TLV_RX_FRAG_MAX_LEN, frag_max_len);
690 rocker_tlv_put_le16(buf, &pos, ROCKER_TLV_RX_FRAG_LEN, data_size);
692 err = desc_set_buf(info, tlv_size);
695 if (desc_ring_post_desc(ring, err)) {
696 rocker_msix_irq(r, ROCKER_MSIX_VEC_RX(pport - 1));
/*
 * Send a packet out of the front-panel port identified by @pport.
 *
 * Returns -ROCKER_EINVAL when @pport does not map to a port, otherwise
 * the result of fp_port_eg().
 */
702 int rocker_port_eg(Rocker *r, uint32_t pport,
703 const struct iovec *iov, int iovcnt)
708 if (!fp_port_from_pport(pport, &port)) {
709 return -ROCKER_EINVAL;
712 fp_port = r->fp_port[port];
714 return fp_port_eg(fp_port, iov, iovcnt);
/*
 * Execute a test-DMA control command written to ROCKER_TEST_DMA_CTRL.
 *
 * A scratch buffer of r->test_dma_size bytes is prepared according to
 * @val: CLEAR zero-fills it, FILL sets every byte to 0x96, INVERT first
 * reads the current guest memory at r->test_dma_addr and then processes
 * it byte by byte (loop body not visible in this excerpt).  The buffer is
 * written back to guest memory and the test MSI-X vector is raised.
 * Unknown control values are only logged.
 */
717 static void rocker_test_dma_ctrl(Rocker *r, uint32_t val)
719 PCIDevice *dev = PCI_DEVICE(r);
/* the size comes from the guest-writable ROCKER_TEST_DMA_SIZE register */
723 buf = g_malloc(r->test_dma_size);
726 DPRINTF("test dma buffer alloc failed");
731 case ROCKER_TEST_DMA_CTRL_CLEAR:
732 memset(buf, 0, r->test_dma_size);
734 case ROCKER_TEST_DMA_CTRL_FILL:
735 memset(buf, 0x96, r->test_dma_size);
737 case ROCKER_TEST_DMA_CTRL_INVERT:
738 pci_dma_read(dev, r->test_dma_addr, buf, r->test_dma_size);
739 for (i = 0; i < r->test_dma_size; i++) {
744 DPRINTF("not test dma control val=0x%08x\n", val);
747 pci_dma_write(dev, r->test_dma_addr, buf, r->test_dma_size);
749 rocker_msix_irq(r, ROCKER_MSIX_VEC_TEST);
/* Forward declaration: rocker_reset() is defined later in this file. */
755 static void rocker_reset(DeviceState *dev);
/*
 * Handle a write to the control register: when the ROCKER_CONTROL_RESET
 * bit is set in @val the whole device is reset.
 */
757 static void rocker_control(Rocker *r, uint32_t val)
759 if (val & ROCKER_CONTROL_RESET) {
760 rocker_reset(DEVICE(r));
/*
 * Number of descriptor rings of the device: two fixed rings (command and
 * event, see the ring setup in pci_rocker_init()) plus a tx/rx pair for
 * every front-panel port.
 */
764 static int rocker_pci_ring_count(Rocker *r)
769 * - tx and rx ring per each port
771 return 2 + (2 * r->fp_ports);
/*
 * Tell whether @addr falls into the per-ring DMA descriptor register
 * window, i.e. the half-open range starting at ROCKER_DMA_DESC_BASE and
 * spanning ROCKER_DMA_DESC_SIZE bytes for every existing ring.
 */
774 static bool rocker_addr_is_desc_reg(Rocker *r, hwaddr addr)
776 hwaddr start = ROCKER_DMA_DESC_BASE;
777 hwaddr end = start + (ROCKER_DMA_DESC_SIZE * rocker_pci_ring_count(r));
779 return addr >= start && addr < end;
/*
 * Apply a write to the PORT_PHYS_ENABLE register.
 *
 * Bit (i + 1) of @new carries the requested state of front-panel port i
 * (bit 0 is not used by this loop).  Ports whose state already matches
 * are left alone; the others are enabled or disabled.
 */
782 static void rocker_port_phys_enable_write(Rocker *r, uint64_t new)
789 for (i = 0; i < r->fp_ports; i++) {
790 fp_port = r->fp_port[i];
791 old_enabled = fp_port_enabled(fp_port);
792 new_enabled = (new >> (i + 1)) & 0x1;
793 if (new_enabled == old_enabled) {
797 fp_port_enable(r->fp_port[i]);
799 fp_port_disable(r->fp_port[i]);
/*
 * 32-bit register write handler.
 *
 * Addresses inside the DMA descriptor window are decoded into a ring
 * index and a register offset and forwarded to the desc_ring_* setters.
 * 64-bit registers are written in two halves: the low half is parked in
 * r->lower32 and combined with the high half when the "+ 4" address is
 * written.  Unhandled addresses are only logged.
 */
804 static void rocker_io_writel(void *opaque, hwaddr addr, uint32_t val)
808 if (rocker_addr_is_desc_reg(r, addr)) {
809 unsigned index = ROCKER_RING_INDEX(addr);
810 unsigned offset = addr & ROCKER_DMA_DESC_MASK;
/* low half of the ring base address: remember it until the high half arrives */
813 case ROCKER_DMA_DESC_ADDR_OFFSET:
814 r->lower32 = (uint64_t)val;
816 case ROCKER_DMA_DESC_ADDR_OFFSET + 4:
817 desc_ring_set_base_addr(r->rings[index],
818 ((uint64_t)val) << 32 | r->lower32);
821 case ROCKER_DMA_DESC_SIZE_OFFSET:
822 desc_ring_set_size(r->rings[index], val);
/* head and credits updates raise the ring's MSI-X vector on a true result */
824 case ROCKER_DMA_DESC_HEAD_OFFSET:
825 if (desc_ring_set_head(r->rings[index], val)) {
826 rocker_msix_irq(r, desc_ring_get_msix_vector(r->rings[index]));
829 case ROCKER_DMA_DESC_CTRL_OFFSET:
830 desc_ring_set_ctrl(r->rings[index], val);
832 case ROCKER_DMA_DESC_CREDITS_OFFSET:
833 if (desc_ring_ret_credits(r->rings[index], val)) {
834 rocker_msix_irq(r, desc_ring_get_msix_vector(r->rings[index]));
838 DPRINTF("not implemented dma reg write(l) addr=0x" TARGET_FMT_plx
839 " val=0x%08x (ring %d, addr=0x%02x)\n",
840 addr, val, index, offset);
847 case ROCKER_TEST_REG:
/* low halves of the 64-bit registers all share the single lower32 latch */
850 case ROCKER_TEST_REG64:
851 case ROCKER_TEST_DMA_ADDR:
852 case ROCKER_PORT_PHYS_ENABLE:
853 r->lower32 = (uint64_t)val;
855 case ROCKER_TEST_REG64 + 4:
856 r->test_reg64 = ((uint64_t)val) << 32 | r->lower32;
/* the written value is used directly as the MSI-X vector number */
859 case ROCKER_TEST_IRQ:
860 rocker_msix_irq(r, val);
862 case ROCKER_TEST_DMA_SIZE:
863 r->test_dma_size = val;
865 case ROCKER_TEST_DMA_ADDR + 4:
866 r->test_dma_addr = ((uint64_t)val) << 32 | r->lower32;
869 case ROCKER_TEST_DMA_CTRL:
870 rocker_test_dma_ctrl(r, val);
873 rocker_control(r, val);
875 case ROCKER_PORT_PHYS_ENABLE + 4:
876 rocker_port_phys_enable_write(r, ((uint64_t)val) << 32 | r->lower32);
880 DPRINTF("not implemented write(l) addr=0x" TARGET_FMT_plx
881 " val=0x%08x\n", addr, val);
/*
 * 64-bit register write handler.
 *
 * Inside the DMA descriptor window only the ring base address can be
 * written as a quad word.  Outside it, the cases visible here are the
 * 64-bit test register, the test DMA address and the port enable bitmap.
 * Everything else is only logged.
 */
886 static void rocker_io_writeq(void *opaque, hwaddr addr, uint64_t val)
890 if (rocker_addr_is_desc_reg(r, addr)) {
891 unsigned index = ROCKER_RING_INDEX(addr);
892 unsigned offset = addr & ROCKER_DMA_DESC_MASK;
895 case ROCKER_DMA_DESC_ADDR_OFFSET:
896 desc_ring_set_base_addr(r->rings[index], val);
899 DPRINTF("not implemented dma reg write(q) addr=0x" TARGET_FMT_plx
900 " val=0x" TARGET_FMT_plx " (ring %d, offset=0x%02x)\n",
901 addr, val, index, offset);
908 case ROCKER_TEST_REG64:
911 case ROCKER_TEST_DMA_ADDR:
912 r->test_dma_addr = val;
914 case ROCKER_PORT_PHYS_ENABLE:
915 rocker_port_phys_enable_write(r, val);
918 DPRINTF("not implemented write(q) addr=0x" TARGET_FMT_plx
919 " val=0x" TARGET_FMT_plx "\n", addr, val);
/* Expands to a switch case that returns the register's own spelling. */
925 #define regname(reg) case (reg): return #reg
/*
 * Produce a human-readable register name for the debug traces in
 * rocker_mmio_read() / rocker_mmio_write().
 *
 * DMA descriptor registers are formatted as "Ring[<ring>] <REG>", where
 * <ring> is "cmd", "event" or "rx-N"/"tx-N" (odd ring indexes are rx).
 * The text is built in a function-local static buffer, so a later call
 * overwrites the previous result.  Other registers are named through the
 * regname() cases.
 */
926 static const char *rocker_reg_name(void *opaque, hwaddr addr)
930 if (rocker_addr_is_desc_reg(r, addr)) {
931 unsigned index = ROCKER_RING_INDEX(addr);
932 unsigned offset = addr & ROCKER_DMA_DESC_MASK;
933 static char buf[100];
938 sprintf(ring_name, "cmd");
941 sprintf(ring_name, "event");
944 sprintf(ring_name, "%s-%d", index % 2 ? "rx" : "tx",
949 case ROCKER_DMA_DESC_ADDR_OFFSET:
950 sprintf(buf, "Ring[%s] ADDR", ring_name);
952 case ROCKER_DMA_DESC_ADDR_OFFSET+4:
953 sprintf(buf, "Ring[%s] ADDR+4", ring_name);
955 case ROCKER_DMA_DESC_SIZE_OFFSET:
956 sprintf(buf, "Ring[%s] SIZE", ring_name);
958 case ROCKER_DMA_DESC_HEAD_OFFSET:
959 sprintf(buf, "Ring[%s] HEAD", ring_name);
961 case ROCKER_DMA_DESC_TAIL_OFFSET:
962 sprintf(buf, "Ring[%s] TAIL", ring_name);
964 case ROCKER_DMA_DESC_CTRL_OFFSET:
965 sprintf(buf, "Ring[%s] CTRL", ring_name);
967 case ROCKER_DMA_DESC_CREDITS_OFFSET:
968 sprintf(buf, "Ring[%s] CREDITS", ring_name);
971 sprintf(buf, "Ring[%s] ???", ring_name);
976 regname(ROCKER_BOGUS_REG0);
977 regname(ROCKER_BOGUS_REG1);
978 regname(ROCKER_BOGUS_REG2);
979 regname(ROCKER_BOGUS_REG3);
980 regname(ROCKER_TEST_REG);
981 regname(ROCKER_TEST_REG64);
982 regname(ROCKER_TEST_REG64+4);
983 regname(ROCKER_TEST_IRQ);
984 regname(ROCKER_TEST_DMA_ADDR);
985 regname(ROCKER_TEST_DMA_ADDR+4);
986 regname(ROCKER_TEST_DMA_SIZE);
987 regname(ROCKER_TEST_DMA_CTRL);
988 regname(ROCKER_CONTROL);
989 regname(ROCKER_PORT_PHYS_COUNT);
990 regname(ROCKER_PORT_PHYS_LINK_STATUS);
991 regname(ROCKER_PORT_PHYS_LINK_STATUS+4);
992 regname(ROCKER_PORT_PHYS_ENABLE);
993 regname(ROCKER_PORT_PHYS_ENABLE+4);
994 regname(ROCKER_SWITCH_ID);
995 regname(ROCKER_SWITCH_ID+4);
/*
 * Second definition with the same signature; presumably the variant
 * compiled when debug output is disabled - the preprocessor lines that
 * select between the two are not visible in this excerpt.
 */
1001 static const char *rocker_reg_name(void *opaque, hwaddr addr)
/*
 * MemoryRegionOps write callback for BAR0: trace the access, then hand
 * it to rocker_io_writel() or rocker_io_writeq().  The size test that
 * chooses between the two is not visible in this excerpt.
 */
1007 static void rocker_mmio_write(void *opaque, hwaddr addr, uint64_t val,
1010 DPRINTF("Write %s addr " TARGET_FMT_plx
1011 ", size %u, val " TARGET_FMT_plx "\n",
1012 rocker_reg_name(opaque, addr), addr, size, val);
1016 rocker_io_writel(opaque, addr, val);
1019 rocker_io_writeq(opaque, addr, val);
1024 static uint64_t rocker_port_phys_link_status(Rocker *r)
1027 uint64_t status = 0;
1029 for (i = 0; i < r->fp_ports; i++) {
1030 FpPort *port = r->fp_port[i];
1032 if (fp_port_get_link_up(port)) {
1033 status |= 1 << (i + 1);
1039 static uint64_t rocker_port_phys_enable_read(Rocker *r)
1044 for (i = 0; i < r->fp_ports; i++) {
1045 FpPort *port = r->fp_port[i];
1047 if (fp_port_enabled(port)) {
1048 ret |= 1 << (i + 1);
/*
 * 32-bit register read handler.
 *
 * Addresses inside the DMA descriptor window are decoded into a ring
 * index and a register offset and answered from the desc_ring_* getters.
 * 64-bit registers are exposed as two halves: the base address returns
 * the low 32 bits and "+ 4" the high 32 bits.  Reads of the test
 * registers return twice the stored value.  Unhandled addresses are only
 * logged.
 */
1054 static uint32_t rocker_io_readl(void *opaque, hwaddr addr)
1059 if (rocker_addr_is_desc_reg(r, addr)) {
1060 unsigned index = ROCKER_RING_INDEX(addr);
1061 unsigned offset = addr & ROCKER_DMA_DESC_MASK;
1064 case ROCKER_DMA_DESC_ADDR_OFFSET:
1065 ret = (uint32_t)desc_ring_get_base_addr(r->rings[index]);
1067 case ROCKER_DMA_DESC_ADDR_OFFSET + 4:
1068 ret = (uint32_t)(desc_ring_get_base_addr(r->rings[index]) >> 32);
1070 case ROCKER_DMA_DESC_SIZE_OFFSET:
1071 ret = desc_ring_get_size(r->rings[index]);
1073 case ROCKER_DMA_DESC_HEAD_OFFSET:
1074 ret = desc_ring_get_head(r->rings[index]);
1076 case ROCKER_DMA_DESC_TAIL_OFFSET:
1077 ret = desc_ring_get_tail(r->rings[index]);
1079 case ROCKER_DMA_DESC_CREDITS_OFFSET:
1080 ret = desc_ring_get_credits(r->rings[index]);
1083 DPRINTF("not implemented dma reg read(l) addr=0x" TARGET_FMT_plx
1084 " (ring %d, addr=0x%02x)\n", addr, index, offset);
1092 case ROCKER_BOGUS_REG0:
1093 case ROCKER_BOGUS_REG1:
1094 case ROCKER_BOGUS_REG2:
1095 case ROCKER_BOGUS_REG3:
/* test registers read back as twice the stored value */
1098 case ROCKER_TEST_REG:
1099 ret = r->test_reg * 2;
1101 case ROCKER_TEST_REG64:
1102 ret = (uint32_t)(r->test_reg64 * 2);
1104 case ROCKER_TEST_REG64 + 4:
1105 ret = (uint32_t)((r->test_reg64 * 2) >> 32);
1107 case ROCKER_TEST_DMA_SIZE:
1108 ret = r->test_dma_size;
1110 case ROCKER_TEST_DMA_ADDR:
1111 ret = (uint32_t)r->test_dma_addr;
1113 case ROCKER_TEST_DMA_ADDR + 4:
1114 ret = (uint32_t)(r->test_dma_addr >> 32);
1116 case ROCKER_PORT_PHYS_COUNT:
/* each half of a 64-bit bitmap recomputes the full bitmap independently */
1119 case ROCKER_PORT_PHYS_LINK_STATUS:
1120 ret = (uint32_t)rocker_port_phys_link_status(r);
1122 case ROCKER_PORT_PHYS_LINK_STATUS + 4:
1123 ret = (uint32_t)(rocker_port_phys_link_status(r) >> 32);
1125 case ROCKER_PORT_PHYS_ENABLE:
1126 ret = (uint32_t)rocker_port_phys_enable_read(r);
1128 case ROCKER_PORT_PHYS_ENABLE + 4:
1129 ret = (uint32_t)(rocker_port_phys_enable_read(r) >> 32);
1131 case ROCKER_SWITCH_ID:
1132 ret = (uint32_t)r->switch_id;
1134 case ROCKER_SWITCH_ID + 4:
1135 ret = (uint32_t)(r->switch_id >> 32);
1138 DPRINTF("not implemented read(l) addr=0x" TARGET_FMT_plx "\n", addr);
/*
 * 64-bit register read handler.
 *
 * Inside the DMA descriptor window only the ring base address can be
 * read as a quad word.  Outside it, the cases visible here are the bogus
 * registers 0 and 2 (constant pattern), the 64-bit test register (twice
 * the stored value), the test DMA address, the link-status and enable
 * bitmaps and the switch id.  Everything else is only logged.
 */
1145 static uint64_t rocker_io_readq(void *opaque, hwaddr addr)
1150 if (rocker_addr_is_desc_reg(r, addr)) {
1151 unsigned index = ROCKER_RING_INDEX(addr);
1152 unsigned offset = addr & ROCKER_DMA_DESC_MASK;
1154 switch (addr & ROCKER_DMA_DESC_MASK) {
1155 case ROCKER_DMA_DESC_ADDR_OFFSET:
1156 ret = desc_ring_get_base_addr(r->rings[index]);
1159 DPRINTF("not implemented dma reg read(q) addr=0x" TARGET_FMT_plx
1160 " (ring %d, addr=0x%02x)\n", addr, index, offset);
1168 case ROCKER_BOGUS_REG0:
1169 case ROCKER_BOGUS_REG2:
1170 ret = 0xDEADBABEDEADBABEULL;
1172 case ROCKER_TEST_REG64:
1173 ret = r->test_reg64 * 2;
1175 case ROCKER_TEST_DMA_ADDR:
1176 ret = r->test_dma_addr;
1178 case ROCKER_PORT_PHYS_LINK_STATUS:
1179 ret = rocker_port_phys_link_status(r);
1181 case ROCKER_PORT_PHYS_ENABLE:
1182 ret = rocker_port_phys_enable_read(r);
1184 case ROCKER_SWITCH_ID:
1188 DPRINTF("not implemented read(q) addr=0x" TARGET_FMT_plx "\n", addr);
/*
 * MemoryRegionOps read callback for BAR0: trace the access, then answer
 * it from rocker_io_readl() or rocker_io_readq().  The size test that
 * chooses between the two is not visible in this excerpt.
 */
1195 static uint64_t rocker_mmio_read(void *opaque, hwaddr addr, unsigned size)
1197 DPRINTF("Read %s addr " TARGET_FMT_plx ", size %u\n",
1198 rocker_reg_name(opaque, addr), addr, size);
1202 return rocker_io_readl(opaque, addr);
1204 return rocker_io_readq(opaque, addr);
/*
 * Access callbacks for the BAR0 register region (see the
 * memory_region_init_io() call in pci_rocker_init()): little-endian,
 * 4- to 8-byte accesses.  The two min/max pairs presumably belong to the
 * .valid and .impl sub-structures, whose opening lines are not visible in
 * this excerpt.
 */
1210 static const MemoryRegionOps rocker_mmio_ops = {
1211 .read = rocker_mmio_read,
1212 .write = rocker_mmio_write,
1213 .endianness = DEVICE_LITTLE_ENDIAN,
1215 .min_access_size = 4,
1216 .max_access_size = 8,
1219 .min_access_size = 4,
1220 .max_access_size = 8,
/* Release MSI-X vectors 0 .. @num_vectors - 1 of the device. */
1224 static void rocker_msix_vectors_unuse(Rocker *r,
1225 unsigned int num_vectors)
1227 PCIDevice *dev = PCI_DEVICE(r);
1230 for (i = 0; i < num_vectors; i++) {
1231 msix_vector_unuse(dev, i);
/*
 * Mark MSI-X vectors 0 .. @num_vectors - 1 as used.
 *
 * On the unwind path the vectors claimed so far (indexes below i) are
 * released again through rocker_msix_vectors_unuse().
 */
1235 static int rocker_msix_vectors_use(Rocker *r,
1236 unsigned int num_vectors)
1238 PCIDevice *dev = PCI_DEVICE(r);
1242 for (i = 0; i < num_vectors; i++) {
1243 err = msix_vector_use(dev, i);
1251 rocker_msix_vectors_unuse(r, i);
/*
 * Set up MSI-X for the device: initialise the MSI-X structures with
 * ROCKER_MSIX_VEC_COUNT(fp_ports) vectors (table and PBA both in the
 * MSI-X BAR) and mark all vectors as used.  When claiming the vectors
 * fails, the MSI-X setup is torn down again.
 */
1255 static int rocker_msix_init(Rocker *r)
1257 PCIDevice *dev = PCI_DEVICE(r);
1260 err = msix_init(dev, ROCKER_MSIX_VEC_COUNT(r->fp_ports),
1262 ROCKER_PCI_MSIX_BAR_IDX, ROCKER_PCI_MSIX_TABLE_OFFSET,
1264 ROCKER_PCI_MSIX_BAR_IDX, ROCKER_PCI_MSIX_PBA_OFFSET,
1270 err = rocker_msix_vectors_use(r, ROCKER_MSIX_VEC_COUNT(r->fp_ports));
1272 goto err_msix_vectors_use;
1277 err_msix_vectors_use:
1278 msix_uninit(dev, &r->msix_bar, &r->msix_bar);
/*
 * Tear down MSI-X for the device.
 *
 * NOTE(review): msix_uninit() runs before the vectors are released, the
 * reverse of the set-up order in rocker_msix_init() - confirm that
 * msix_vector_unuse() is safe to call after msix_uninit().
 */
1282 static void rocker_msix_uninit(Rocker *r)
1284 PCIDevice *dev = PCI_DEVICE(r);
1286 msix_uninit(dev, &r->msix_bar, &r->msix_bar);
1287 rocker_msix_vectors_unuse(r, ROCKER_MSIX_VEC_COUNT(r->fp_ports));
/*
 * Find the world whose world_name() equals @name among r->worlds[].
 * Returns the matching world; pci_rocker_init() treats a NULL result as
 * "requested world does not exist".
 */
1290 static World *rocker_world_type_by_name(Rocker *r, const char *name)
1294 for (i = 0; i < ROCKER_WORLD_TYPE_MAX; i++) {
1295 if (strcmp(name, world_name(r->worlds[i])) == 0) {
1296 return r->worlds[i];
/*
 * PCI init callback (installed as k->init in rocker_class_init()).
 *
 * Steps visible in this excerpt, in order:
 *   1. allocate the worlds and pick the default world by name (falling
 *      back to the OF-DPA world's name when none was configured);
 *   2. register the register BAR and the MSI-X BAR, then initialise MSI-X;
 *   3. validate the switch properties: name (must not already be
 *      registered, length limited to MAX_ROCKER_NAME_LEN), start MAC
 *      address (a default with a per-switch increment of byte 4 is used
 *      when it is all zero), switch id (derived from the MAC address when
 *      zero) and port count (clamped to ROCKER_FP_PORTS_MAX);
 *   4. allocate the descriptor rings: cmd, event, then alternating tx
 *      (even index) and rx (odd index) rings;
 *   5. allocate the front-panel ports and attach them to the default
 *      world;
 *   6. insert the device into the "rockers" list.
 * The tail of the function unwinds these steps in reverse on failure.
 */
1302 static int pci_rocker_init(PCIDevice *dev)
1304 Rocker *r = to_rocker(dev);
1305 const MACAddr zero = { .a = { 0, 0, 0, 0, 0, 0 } };
1306 const MACAddr dflt = { .a = { 0x52, 0x54, 0x00, 0x12, 0x35, 0x01 } };
/* counts switches that received the default MAC address */
1307 static int sw_index;
1310 /* allocate worlds */
1312 r->worlds[ROCKER_WORLD_TYPE_OF_DPA] = of_dpa_world_alloc(r);
1314 for (i = 0; i < ROCKER_WORLD_TYPE_MAX; i++) {
1315 if (!r->worlds[i]) {
1317 goto err_world_alloc;
1321 if (!r->world_name) {
1322 r->world_name = g_strdup(world_name(r->worlds[ROCKER_WORLD_TYPE_OF_DPA]));
1325 r->world_dflt = rocker_world_type_by_name(r, r->world_name);
1326 if (!r->world_dflt) {
1328 "rocker: requested world \"%s\" does not exist\n",
1331 goto err_world_type_by_name;
1334 /* set up memory-mapped region at BAR0 */
1336 memory_region_init_io(&r->mmio, OBJECT(r), &rocker_mmio_ops, r,
1337 "rocker-mmio", ROCKER_PCI_BAR0_SIZE);
1338 pci_register_bar(dev, ROCKER_PCI_BAR0_IDX,
1339 PCI_BASE_ADDRESS_SPACE_MEMORY, &r->mmio);
1341 /* set up memory-mapped region for MSI-X */
1343 memory_region_init(&r->msix_bar, OBJECT(r), "rocker-msix-bar",
1344 ROCKER_PCI_MSIX_BAR_SIZE);
1345 pci_register_bar(dev, ROCKER_PCI_MSIX_BAR_IDX,
1346 PCI_BASE_ADDRESS_SPACE_MEMORY, &r->msix_bar);
1350 err = rocker_msix_init(r);
1355 /* validate switch properties */
1358 r->name = g_strdup(ROCKER);
/* switch names must be unique among registered rockers */
1361 if (rocker_find(r->name)) {
1366 /* Rocker name is passed in port name requests to OS with the intention
1367 * that the name is used in interface names. Limit the length of the
1368 * rocker name to avoid naming problems in the OS. Also, adding the
1369 * port number as p# and unganged breakout b#, where # is at most 2
1370 * digits, so leave room for it too (-1 for string terminator, -3 for
1373 #define ROCKER_IFNAMSIZ 16
1374 #define MAX_ROCKER_NAME_LEN (ROCKER_IFNAMSIZ - 1 - 3 - 3)
1375 if (strlen(r->name) > MAX_ROCKER_NAME_LEN) {
1377 "rocker: name too long; please shorten to at most %d chars\n",
1378 MAX_ROCKER_NAME_LEN);
1382 if (memcmp(&r->fp_start_macaddr, &zero, sizeof(zero)) == 0) {
1383 memcpy(&r->fp_start_macaddr, &dflt, sizeof(dflt));
1384 r->fp_start_macaddr.a[4] += (sw_index++);
1387 if (!r->switch_id) {
1388 memcpy(&r->switch_id, &r->fp_start_macaddr,
1389 sizeof(r->fp_start_macaddr));
1392 if (r->fp_ports > ROCKER_FP_PORTS_MAX) {
1393 r->fp_ports = ROCKER_FP_PORTS_MAX;
1396 r->rings = g_new(DescRing *, rocker_pci_ring_count(r));
1398 goto err_rings_alloc;
1401 /* Rings are ordered like this:
1412 for (i = 0; i < rocker_pci_ring_count(r); i++) {
1413 DescRing *ring = desc_ring_alloc(r, i);
1416 goto err_ring_alloc;
1419 if (i == ROCKER_RING_CMD) {
1420 desc_ring_set_consume(ring, cmd_consume, ROCKER_MSIX_VEC_CMD);
1421 } else if (i == ROCKER_RING_EVENT) {
1422 desc_ring_set_consume(ring, NULL, ROCKER_MSIX_VEC_EVENT);
1423 } else if (i % 2 == 0) {
1424 desc_ring_set_consume(ring, tx_consume,
1425 ROCKER_MSIX_VEC_TX((i - 2) / 2));
1426 } else if (i % 2 == 1) {
1427 desc_ring_set_consume(ring, NULL, ROCKER_MSIX_VEC_RX((i - 3) / 2));
1433 for (i = 0; i < r->fp_ports; i++) {
1435 fp_port_alloc(r, r->name, &r->fp_start_macaddr,
1436 i, &r->fp_ports_peers[i]);
1439 goto err_port_alloc;
1442 r->fp_port[i] = port;
1443 fp_port_set_world(port, r->world_dflt);
1446 QLIST_INSERT_HEAD(&rockers, r, next);
1451 for (--i; i >= 0; i--) {
1452 FpPort *port = r->fp_port[i];
1455 i = rocker_pci_ring_count(r);
1457 for (--i; i >= 0; i--) {
1458 desc_ring_free(r->rings[i]);
1463 rocker_msix_uninit(r);
1465 object_unparent(OBJECT(&r->msix_bar));
1466 object_unparent(OBJECT(&r->mmio));
1467 err_world_type_by_name:
1469 for (i = 0; i < ROCKER_WORLD_TYPE_MAX; i++) {
1471 world_free(r->worlds[i]);
/*
 * PCI exit callback (installed as k->exit in rocker_class_init()).
 *
 * Removes the device from the "rockers" list, then releases what
 * pci_rocker_init() set up: the front-panel ports (slots are cleared to
 * NULL), descriptor rings, MSI-X, both memory regions, the worlds and
 * the peers array.
 */
1477 static void pci_rocker_uninit(PCIDevice *dev)
1479 Rocker *r = to_rocker(dev);
1482 QLIST_REMOVE(r, next);
1484 for (i = 0; i < r->fp_ports; i++) {
1485 FpPort *port = r->fp_port[i];
1488 r->fp_port[i] = NULL;
1491 for (i = 0; i < rocker_pci_ring_count(r); i++) {
1493 desc_ring_free(r->rings[i]);
1498 rocker_msix_uninit(r);
1499 object_unparent(OBJECT(&r->msix_bar));
1500 object_unparent(OBJECT(&r->mmio));
1502 for (i = 0; i < ROCKER_WORLD_TYPE_MAX; i++) {
1504 world_free(r->worlds[i]);
1507 g_free(r->fp_ports_peers);
/*
 * Device reset handler (installed as dc->reset, also triggered by the
 * guest through rocker_control()).
 *
 * Resets every world, resets every front-panel port and re-attaches it
 * to the default world, clears the test DMA address/size registers and
 * resets all descriptor rings.
 */
1510 static void rocker_reset(DeviceState *dev)
1512 Rocker *r = to_rocker(dev);
1515 for (i = 0; i < ROCKER_WORLD_TYPE_MAX; i++) {
1517 world_reset(r->worlds[i]);
1520 for (i = 0; i < r->fp_ports; i++) {
1521 fp_port_reset(r->fp_port[i]);
1522 fp_port_set_world(r->fp_port[i], r->world_dflt);
1527 r->test_dma_addr = 0;
1528 r->test_dma_size = 0;
1530 for (i = 0; i < rocker_pci_ring_count(r); i++) {
1531 desc_ring_reset(r->rings[i]);
1534 DPRINTF("Reset done\n");
/*
 * User-settable device properties: switch name, world name, MAC address
 * of the first front-panel port, switch id, and the "ports" array of
 * netdev peers (its length is stored in fp_ports, its elements in
 * fp_ports_peers).
 */
1537 static Property rocker_properties[] = {
1538 DEFINE_PROP_STRING("name", Rocker, name),
1539 DEFINE_PROP_STRING("world", Rocker, world_name),
1540 DEFINE_PROP_MACADDR("fp_start_macaddr", Rocker,
1542 DEFINE_PROP_UINT64("switch_id", Rocker,
1544 DEFINE_PROP_ARRAY("ports", Rocker, fp_ports,
1545 fp_ports_peers, qdev_prop_netdev, NICPeers),
1546 DEFINE_PROP_END_OF_LIST(),
/*
 * VMState description installed as dc->vmsd in rocker_class_init(); its
 * members are not visible in this excerpt.
 */
1549 static const VMStateDescription rocker_vmsd = {
/*
 * Class initialiser: wires the PCI init/exit callbacks and PCI ids, puts
 * the device in the network category and installs the description,
 * reset handler, property list and VMState description.
 */
1554 static void rocker_class_init(ObjectClass *klass, void *data)
1556 DeviceClass *dc = DEVICE_CLASS(klass);
1557 PCIDeviceClass *k = PCI_DEVICE_CLASS(klass);
1559 k->init = pci_rocker_init;
1560 k->exit = pci_rocker_uninit;
1561 k->vendor_id = PCI_VENDOR_ID_REDHAT;
1562 k->device_id = PCI_DEVICE_ID_REDHAT_ROCKER;
1563 k->revision = ROCKER_PCI_REVISION;
1564 k->class_id = PCI_CLASS_NETWORK_OTHER;
1565 set_bit(DEVICE_CATEGORY_NETWORK, dc->categories);
1566 dc->desc = "Rocker Switch";
1567 dc->reset = rocker_reset;
1568 dc->props = rocker_properties;
1569 dc->vmsd = &rocker_vmsd;
/*
 * Type registration record: a PCI device subtype whose instances are
 * sizeof(Rocker) bytes and whose class is set up by rocker_class_init().
 */
1572 static const TypeInfo rocker_info = {
1574 .parent = TYPE_PCI_DEVICE,
1575 .instance_size = sizeof(Rocker),
1576 .class_init = rocker_class_init,
/* Register the rocker type; hooked up through type_init() below. */
1579 static void rocker_register_types(void)
1581 type_register_static(&rocker_info);
1584 type_init(rocker_register_types)