struct config_data cdata;
 
 static __rte_always_inline void
-work(struct rte_mbuf *m)
+exchange_mac(struct rte_mbuf *m)
 {
        struct ether_hdr *eth;
        struct ether_addr addr;
 
        /* change mac addresses on packet (to use mbuf data) */
-       /*
-        * FIXME Swap mac address properly and also handle the
-        * case for both odd and even number of stages that the
-        * addresses end up the same at the end of the pipeline
-        */
        eth = rte_pktmbuf_mtod(m, struct ether_hdr *);
        ether_addr_copy(ð->d_addr, &addr);
        ether_addr_copy(&addr, ð->d_addr);
+}
 
+static __rte_always_inline void
+work(void)
+{
        /* do a number of cycles of work per packet */
        volatile uint64_t start_tsc = rte_rdtsc();
        while (rte_rdtsc() < start_tsc + cdata.worker_cycles)
 
                ev.op = RTE_EVENT_OP_FORWARD;
                ev.sched_type = cdata.queue_type;
 
-               work(ev.mbuf);
+               work();
 
                while (rte_event_enqueue_burst(dev_id, port_id, &ev, 1) != 1)
                        rte_pause();
                        events[i].op = RTE_EVENT_OP_FORWARD;
                        events[i].sched_type = cdata.queue_type;
 
-                       work(events[i].mbuf);
+                       work();
                }
                uint16_t nb_tx = rte_event_enqueue_burst(dev_id, port_id,
                                events, nb_rx);
                received++;
                uint8_t outport = packet.mbuf->port;
 
+               exchange_mac(packet.mbuf);
                rte_eth_tx_buffer(outport, 0, fdata->tx_buf[outport],
                                packet.mbuf);
 
                received += n;
                for (i = 0; i < n; i++) {
                        uint8_t outport = packets[i].mbuf->port;
+
+                       exchange_mac(packets[i].mbuf);
                        rte_eth_tx_buffer(outport, 0, fdata->tx_buf[outport],
                                        packets[i].mbuf);