summaryrefslogtreecommitdiffstats
path: root/test/test_vxlan.py
blob: c74efe7d062c690bfc4abb080937bd0f477c0bff (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
#!/usr/bin/env python

import socket
from util import ip4n_range, ip4_range, reassemble4
import unittest
from framework import VppTestCase, VppTestRunner
from template_bd import BridgeDomain

from scapy.layers.l2 import Ether, Raw
from scapy.layers.inet import IP, UDP
from scapy.layers.vxlan import VXLAN
from scapy.utils import atol
from vpp_ip_route import VppIpRoute, VppRoutePath
from vpp_ip import INVALID_INDEX


class TestVxlan(BridgeDomain, VppTestCase):
    """ VXLAN Test Case """

    # Class-level state (dport, flags, mcast_* and the *_bd ids) is assigned
    # in setUpClass and shared by every test in this case.

    def __init__(self, *args):
        # Both bases are initialised explicitly; BridgeDomain takes no
        # arguments while VppTestCase receives the unittest arguments.
        BridgeDomain.__init__(self)
        VppTestCase.__init__(self, *args)

    def encapsulate(self, pkt, vni):
        """
        Wrap a payload frame in VXLAN/UDP/IP/Ethernet headers addressed
        from the pg0 remote peer to VPP's pg0 address.

        :param pkt: inner frame to encapsulate
        :param vni: VXLAN network identifier to put in the VXLAN header
        :returns: the encapsulated scapy packet
        """
        return (Ether(src=self.pg0.remote_mac, dst=self.pg0.local_mac) /
                IP(src=self.pg0.remote_ip4, dst=self.pg0.local_ip4) /
                UDP(sport=self.dport, dport=self.dport, chksum=0) /
                VXLAN(vni=vni, flags=self.flags) /
                pkt)

    def ip_range(self, start, end):
        """ range of remote ip's """
        return ip4_range(self.pg0.remote_ip4, start, end)

    def encap_mcast(self, pkt, src_ip, src_mac, vni):
        """
        Wrap a payload frame in VXLAN/UDP/IP/Ethernet headers addressed to
        the test multicast group.

        :param pkt: inner frame to encapsulate
        :param src_ip: outer IPv4 source address
        :param src_mac: outer Ethernet source address
        :param vni: VXLAN network identifier to put in the VXLAN header
        :returns: the encapsulated scapy packet
        """
        return (Ether(src=src_mac, dst=self.mcast_mac) /
                IP(src=src_ip, dst=self.mcast_ip4) /
                UDP(sport=self.dport, dport=self.dport, chksum=0) /
                VXLAN(vni=vni, flags=self.flags) /
                pkt)

    def decapsulate(self, pkt):
        """
        Strip the VXLAN header and return the inner payload.

        Asserts that the VXLAN flags field equals 0x8 (the I flag) before
        returning the payload.

        :param pkt: packet containing a VXLAN layer
        :returns: the payload carried after the VXLAN header
        """
        # check if is set I flag
        self.assertEqual(pkt[VXLAN].flags, 0x8)
        return pkt[VXLAN].payload

    def check_encapsulation(self, pkt, vni, local_only=False, mcast_pkt=False):
        """
        Verify the outer headers of a VXLAN packet emitted by VPP.

        :param pkt: captured packet to inspect
        :param vni: VNI the packet is expected to carry
        :param local_only: when True only the source (VPP side) addresses
            are checked and the destination MAC/IP checks are skipped
        :param mcast_pkt: when True the destination MAC/IP are compared with
            the multicast group instead of the pg0 remote peer
        """
        # TODO: add error messages
        # Verify source MAC is VPP_MAC and destination MAC is MY_MAC resolved
        #  by VPP using ARP.
        self.assertEqual(pkt[Ether].src, self.pg0.local_mac)
        if not local_only:
            if not mcast_pkt:
                self.assertEqual(pkt[Ether].dst, self.pg0.remote_mac)
            else:
                self.assertEqual(pkt[Ether].dst, type(self).mcast_mac)
        # Verify VXLAN tunnel source IP is VPP_IP and destination IP is MY_IP.
        self.assertEqual(pkt[IP].src, self.pg0.local_ip4)
        if not local_only:
            if not mcast_pkt:
                self.assertEqual(pkt[IP].dst, self.pg0.remote_ip4)
            else:
                self.assertEqual(pkt[IP].dst, type(self).mcast_ip4)
        # Verify UDP destination port is VXLAN 4789, source UDP port could be
        #  arbitrary.
        self.assertEqual(pkt[UDP].dport, type(self).dport)
        # TODO: checksum check
        # Verify VNI
        self.assertEqual(pkt[VXLAN].vni, vni)

    @classmethod
    def create_vxlan_flood_test_bd(cls, vni, n_ucast_tunnels):
        """
        Create unicast VXLAN tunnels and attach each one to bridge domain
        ``vni``.

        :param vni: used both as the tunnel VNI and as the bridge domain id
        :param n_ucast_tunnels: number of unicast tunnels to create
        """
        # Create n_ucast_tunnels ucast vxlan tunnels under bd
        ip_range_start = 10
        ip_range_end = ip_range_start + n_ucast_tunnels
        next_hop_address = cls.pg0.remote_ip4
        for dest_ip4 in ip4_range(next_hop_address, ip_range_start,
                                  ip_range_end):
            # add host route so dest_ip4 will not be resolved
            rip = VppIpRoute(cls, dest_ip4, 32,
                             [VppRoutePath(next_hop_address,
                                           INVALID_INDEX)],
                             register=False)
            rip.add_vpp_config()
            dest_ip4n = socket.inet_pton(socket.AF_INET, dest_ip4)

            r = cls.vapi.vxlan_add_del_tunnel(src_address=cls.pg0.local_ip4n,
                                              dst_address=dest_ip4n, vni=vni)
            # Keyword form, matching the other bridge calls in this class.
            cls.vapi.sw_interface_set_l2_bridge(rx_sw_if_index=r.sw_if_index,
                                                bd_id=vni)

    @classmethod
    def add_del_shared_mcast_dst_load(cls, is_add):
        """
        add or del tunnels sharing the same mcast dst
        to test vxlan ref_count mechanism

        :param is_add: 1 to add the tunnels, 0 to delete them
        :raises ValueError: if the API reply carries sw_if_index 0xffffffff
        """
        n_shared_dst_tunnels = 20
        vni_start = 10000
        vni_end = vni_start + n_shared_dst_tunnels
        for vni in range(vni_start, vni_end):
            r = cls.vapi.vxlan_add_del_tunnel(src_address=cls.pg0.local_ip4n,
                                              dst_address=cls.mcast_ip4n,
                                              mcast_sw_if_index=1,
                                              is_add=is_add, vni=vni)
            if r.sw_if_index == 0xffffffff:
                raise ValueError("bad sw_if_index: ~0")

    @classmethod
    def add_shared_mcast_dst_load(cls):
        """ Add the tunnels that share one multicast destination. """
        cls.add_del_shared_mcast_dst_load(is_add=1)

    @classmethod
    def del_shared_mcast_dst_load(cls):
        """ Delete the tunnels that share one multicast destination. """
        cls.add_del_shared_mcast_dst_load(is_add=0)

    @classmethod
    def add_del_mcast_tunnels_load(cls, is_add):
        """
        add or del tunnels to test vxlan stability

        :param is_add: 1 to add the tunnels, 0 to delete them
        """
        n_distinct_dst_tunnels = 200
        ip_range_start = 10
        ip_range_end = ip_range_start + n_distinct_dst_tunnels
        for dest_ip4n in ip4n_range(cls.mcast_ip4n, ip_range_start,
                                    ip_range_end):
            # The VNI is taken from the fourth byte of the destination
            # address (presumably the packed IPv4 last octet - confirm
            # against ip4n_range).
            vni = bytearray(dest_ip4n)[3]
            cls.vapi.vxlan_add_del_tunnel(src_address=cls.pg0.local_ip4n,
                                          dst_address=dest_ip4n,
                                          mcast_sw_if_index=1, is_add=is_add,
                                          vni=vni)

    @classmethod
    def add_mcast_tunnels_load(cls):
        """ Add the tunnels with distinct multicast destinations. """
        cls.add_del_mcast_tunnels_load(is_add=1)

    @classmethod
    def del_mcast_tunnels_load(cls):
        """ Delete the tunnels with distinct multicast destinations. """
        cls.add_del_mcast_tunnels_load(is_add=0)

    # Class method to start the VXLAN test case.
    #  Overrides setUpClass method in VppTestCase class.
    #  Python try..except statement is used to ensure that the tear down of
    #  the class will be executed even if exception is raised.
    #  @param cls The class pointer.
    @classmethod
    def setUpClass(cls):
        super(TestVxlan, cls).setUpClass()

        try:
            cls.dport = 4789
            cls.flags = 0x8

            # Create 4 pg interfaces (pg0..pg3) and bring them up.
            cls.create_pg_interfaces(range(4))
            for pg in cls.pg_interfaces:
                pg.admin_up()

            # Configure IPv4 addresses on VPP pg0.
            cls.pg0.config_ip4()

            # Resolve MAC address for VPP's IP address on pg0.
            cls.pg0.resolve_arp()

            # Our Multicast address
            cls.mcast_ip4 = '239.1.1.1'
            cls.mcast_ip4n = socket.inet_pton(socket.AF_INET, cls.mcast_ip4)
            # Multicast MAC: 01:00:5e prefix followed by the low 23 bits of
            # the group address.
            iplong = atol(cls.mcast_ip4)
            cls.mcast_mac = "01:00:5e:%02x:%02x:%02x" % (
                (iplong >> 16) & 0x7F, (iplong >> 8) & 0xFF, iplong & 0xFF)

            # Create VXLAN VTEP on VPP pg0, and put vxlan_tunnel0 and pg1
            #  into BD.
            cls.single_tunnel_bd = 1
            r = cls.vapi.vxlan_add_del_tunnel(src_address=cls.pg0.local_ip4n,
                                              dst_address=cls.pg0.remote_ip4n,
                                              vni=cls.single_tunnel_bd)
            cls.vapi.sw_interface_set_l2_bridge(rx_sw_if_index=r.sw_if_index,
                                                bd_id=cls.single_tunnel_bd)
            cls.vapi.sw_interface_set_l2_bridge(
                rx_sw_if_index=cls.pg1.sw_if_index, bd_id=cls.single_tunnel_bd)

            # Setup vni 2 to test multicast flooding
            cls.n_ucast_tunnels = 10
            cls.mcast_flood_bd = 2
            cls.create_vxlan_flood_test_bd(cls.mcast_flood_bd,
                                           cls.n_ucast_tunnels)
            r = cls.vapi.vxlan_add_del_tunnel(src_address=cls.pg0.local_ip4n,
                                              dst_address=cls.mcast_ip4n,
                                              mcast_sw_if_index=1,
                                              vni=cls.mcast_flood_bd)
            cls.vapi.sw_interface_set_l2_bridge(rx_sw_if_index=r.sw_if_index,
                                                bd_id=cls.mcast_flood_bd)
            cls.vapi.sw_interface_set_l2_bridge(
                rx_sw_if_index=cls.pg2.sw_if_index, bd_id=cls.mcast_flood_bd)

            # Add and delete mcast tunnels to check stability
            cls.add_shared_mcast_dst_load()
            cls.add_mcast_tunnels_load()
            cls.del_shared_mcast_dst_load()
            cls.del_mcast_tunnels_load()

            # Setup vni 3 to test unicast flooding
            cls.ucast_flood_bd = 3
            cls.create_vxlan_flood_test_bd(cls.ucast_flood_bd,
                                           cls.n_ucast_tunnels)
            cls.vapi.sw_interface_set_l2_bridge(
                rx_sw_if_index=cls.pg3.sw_if_index, bd_id=cls.ucast_flood_bd)
        except Exception:
            # Run the class tear down before propagating the failure.
            super(TestVxlan, cls).tearDownClass()
            raise

    @classmethod
    def tearDownClass(cls):
        super(TestVxlan, cls).tearDownClass()

    def test_encap_big_packet(self):
        """ Encapsulation test send big frame from pg1
        Verify receipt of encapsulated frames on pg0
        """

        self.vapi.sw_interface_set_mtu(self.pg0.sw_if_index, [1500, 0, 0, 0])

        # The payload must be a bytes literal: a text string would be
        # UTF-8 encoded on Python 3, turning every '\xa5' into two bytes
        # and doubling the frame size.
        frame = (Ether(src='00:00:00:00:00:02', dst='00:00:00:00:00:01') /
                 IP(src='4.3.2.1', dst='1.2.3.4') /
                 UDP(sport=20000, dport=10000) /
                 Raw(b'\xa5' * 1450))

        self.pg1.add_stream([frame])

        self.pg0.enable_capture()

        self.pg_start()

        # Two frames are expected on pg0; they are reassembled and the
        # result, prefixed with the first captured frame, is checked for
        # correct encapsulation.
        out = self.pg0.get_capture(2)
        ether = out[0]
        pkt = reassemble4(out)
        pkt = ether / pkt
        self.check_encapsulation(pkt, self.single_tunnel_bd)

        # decapsulate() also asserts the VXLAN I flag.
        payload = self.decapsulate(pkt)
        # TODO: Scapy bug?
        # self.assert_eq_pkts(payload, frame)

    # Method to define VPP actions before tear down of the test case.
    #  Overrides tearDown method in VppTestCase class.
    #  @param self The object pointer.
    def tearDown(self):
        super(TestVxlan, self).tearDown()

    def show_commands_at_teardown(self):
        """ Log the state of the three bridge domains and the tunnels. """
        self.logger.info(self.vapi.cli("show bridge-domain 1 detail"))
        self.logger.info(self.vapi.cli("show bridge-domain 2 detail"))
        self.logger.info(self.vapi.cli("show bridge-domain 3 detail"))
        self.logger.info(self.vapi.cli("show vxlan tunnel"))


# Run this module's tests with the VPP test runner when executed as a script.
if __name__ == '__main__':
    unittest.main(testRunner=VppTestRunner)
class="o">= ptd->next; while (n_left >= 8) { CLIB_PREFETCH (mb + 8, CLIB_CACHE_LINE_BYTES, LOAD); dpdk_prefetch_buffer_x4 (mb + 4); b[0] = vlib_buffer_from_rte_mbuf (mb[0]); b[1] = vlib_buffer_from_rte_mbuf (mb[1]); b[2] = vlib_buffer_from_rte_mbuf (mb[2]); b[3] = vlib_buffer_from_rte_mbuf (mb[3]); clib_memcpy64_x4 (b[0], b[1], b[2], b[3], &ptd->buffer_template); dpdk_prefetch_mbuf_x4 (mb + 4); or_flags |= dpdk_ol_flags_extract (mb, flags, 4); flags += 4; /* we temporary store relative offset of ethertype into next[x] so we can prefetch and get it faster later */ off = mb[0]->data_off; next[0] = off + STRUCT_OFFSET_OF (ethernet_header_t, type); off -= RTE_PKTMBUF_HEADROOM; vnet_buffer (b[0])->l2_hdr_offset = off; b[0]->current_data = off; off = mb[1]->data_off; next[1] = off + STRUCT_OFFSET_OF (ethernet_header_t, type); off -= RTE_PKTMBUF_HEADROOM; vnet_buffer (b[1])->l2_hdr_offset = off; b[1]->current_data = off; off = mb[2]->data_off; next[2] = off + STRUCT_OFFSET_OF (ethernet_header_t, type); off -= RTE_PKTMBUF_HEADROOM; vnet_buffer (b[2])->l2_hdr_offset = off; b[2]->current_data = off; off = mb[3]->data_off; next[3] = off + STRUCT_OFFSET_OF (ethernet_header_t, type); off -= RTE_PKTMBUF_HEADROOM; vnet_buffer (b[3])->l2_hdr_offset = off; b[3]->current_data = off; b[0]->current_length = mb[0]->data_len; b[1]->current_length = mb[1]->data_len; b[2]->current_length = mb[2]->data_len; b[3]->current_length = mb[3]->data_len; n_bytes += mb[0]->data_len; n_bytes += mb[1]->data_len; n_bytes += mb[2]->data_len; n_bytes += mb[3]->data_len; if (maybe_multiseg) { n_bytes += dpdk_process_subseq_segs (vm, b[0], mb[0], fl); n_bytes += dpdk_process_subseq_segs (vm, b[1], mb[1], fl); n_bytes += dpdk_process_subseq_segs (vm, b[2], mb[2], fl); n_bytes += dpdk_process_subseq_segs (vm, b[3], mb[3], fl); } VLIB_BUFFER_TRACE_TRAJECTORY_INIT (b[0]); VLIB_BUFFER_TRACE_TRAJECTORY_INIT (b[1]); VLIB_BUFFER_TRACE_TRAJECTORY_INIT (b[2]); VLIB_BUFFER_TRACE_TRAJECTORY_INIT (b[3]); /* next */ mb 
+= 4; n_left -= 4; next += 4; } while (n_left) { b[0] = vlib_buffer_from_rte_mbuf (mb[0]); clib_memcpy (b[0], &ptd->buffer_template, 64); or_flags |= dpdk_ol_flags_extract (mb, flags, 1); flags += 1; off = mb[0]->data_off; next[0] = off + STRUCT_OFFSET_OF (ethernet_header_t, type); off -= RTE_PKTMBUF_HEADROOM; vnet_buffer (b[0])->l2_hdr_offset = off; b[0]->current_data = off; b[0]->current_length = mb[0]->data_len; n_bytes += mb[0]->data_len; if (maybe_multiseg) n_bytes += dpdk_process_subseq_segs (vm, b[0], mb[0], fl); VLIB_BUFFER_TRACE_TRAJECTORY_INIT (b[0]); /* next */ mb += 1; n_left -= 1; next += 1; } *or_flagsp = or_flags; return n_bytes; } static_always_inline void dpdk_set_next_from_etype (vlib_main_t * vm, vlib_node_runtime_t * node, dpdk_per_thread_data_t * ptd, uword n_rx_packets) { vlib_buffer_t *b[4]; i16 adv[4]; u16 etype[4]; struct rte_mbuf **mb = ptd->mbufs; u8 *flags = ptd->flags; u16 *next = ptd->next; u32 n_left = n_rx_packets; while (n_left >= 12) { dpdk_prefetch_buffer_data_x4 (mb + 8); dpdk_prefetch_buffer_x4 (mb + 8); b[0] = vlib_buffer_from_rte_mbuf (mb[0]); b[1] = vlib_buffer_from_rte_mbuf (mb[1]); b[2] = vlib_buffer_from_rte_mbuf (mb[2]); b[3] = vlib_buffer_from_rte_mbuf (mb[3]); etype[0] = *(u16 *) ((u8 *) mb[0] + next[0] + sizeof (vlib_buffer_t)); etype[1] = *(u16 *) ((u8 *) mb[1] + next[1] + sizeof (vlib_buffer_t)); etype[2] = *(u16 *) ((u8 *) mb[2] + next[2] + sizeof (vlib_buffer_t)); etype[3] = *(u16 *) ((u8 *) mb[3] + next[3] + sizeof (vlib_buffer_t)); next[0] = dpdk_rx_next (node, etype[0], flags[0]); next[1] = dpdk_rx_next (node, etype[1], flags[1]); next[2] = dpdk_rx_next (node, etype[2], flags[2]); next[3] = dpdk_rx_next (node, etype[3], flags[3]); adv[0] = device_input_next_node_advance[next[0]]; adv[1] = device_input_next_node_advance[next[1]]; adv[2] = device_input_next_node_advance[next[2]]; adv[3] = device_input_next_node_advance[next[3]]; b[0]->current_data += adv[0]; b[1]->current_data += adv[1]; b[2]->current_data += 
adv[2]; b[3]->current_data += adv[3]; b[0]->current_length -= adv[0]; b[1]->current_length -= adv[1]; b[2]->current_length -= adv[2]; b[3]->current_length -= adv[3]; /* next */ next += 4; mb += 4; n_left -= 4; flags += 4; } while (n_left) { b[0] = vlib_buffer_from_rte_mbuf (mb[0]); next[0] = *(u16 *) ((u8 *) mb[0] + next[0] + sizeof (vlib_buffer_t)); next[0] = dpdk_rx_next (node, next[0], flags[0]); adv[0] = device_input_next_node_advance[next[0]]; b[0]->current_data += adv[0]; b[0]->current_length -= adv[0]; /* next */ next += 1; mb += 1; n_left -= 1; flags += 1; } } static_always_inline void dpdk_process_flow_offload (dpdk_device_t * xd, dpdk_per_thread_data_t * ptd, uword n_rx_packets) { uword n; dpdk_flow_lookup_entry_t *fle; vlib_buffer_t *b0; /* TODO prefetch and quad-loop */ for (n = 0; n < n_rx_packets; n++) { if ((ptd->flags[n] & (1 << DPDK_RX_F_FDIR)) == 0) continue; fle = vec_elt_at_index (xd->flow_lookup_entries, ptd->mbufs[n]->hash.fdir.hi); if (fle->next_index != (u16) ~ 0) ptd->next[n] = fle->next_index; if (fle->flow_id != ~0) { b0 = vlib_buffer_from_rte_mbuf (ptd->mbufs[n]); b0->flow_id = fle->flow_id; } if (fle->buffer_advance != ~0) { b0 = vlib_buffer_from_rte_mbuf (ptd->mbufs[n]); vlib_buffer_advance (b0, fle->buffer_advance); } } } static_always_inline u32 dpdk_device_input (vlib_main_t * vm, dpdk_main_t * dm, dpdk_device_t * xd, vlib_node_runtime_t * node, u32 thread_index, u16 queue_id) { uword n_rx_packets = 0, n_rx_bytes; u32 n_left, n_trace; u32 *buffers; u32 next_index = VNET_DEVICE_INPUT_NEXT_ETHERNET_INPUT; struct rte_mbuf **mb; vlib_buffer_t *b0; int known_next = 0; u16 *next; u8 or_flags; u32 n; dpdk_per_thread_data_t *ptd = vec_elt_at_index (dm->per_thread_data, thread_index); vlib_buffer_t *bt = &ptd->buffer_template; if ((xd->flags & DPDK_DEVICE_FLAG_ADMIN_UP) == 0) return 0; /* get up to DPDK_RX_BURST_SZ buffers from PMD */ while (n_rx_packets < DPDK_RX_BURST_SZ) { n = rte_eth_rx_burst (xd->device_index, queue_id, ptd->mbufs + 
n_rx_packets, DPDK_RX_BURST_SZ - n_rx_packets); n_rx_packets += n; if (n < 32) break; } if (n_rx_packets == 0) return 0; /* Update buffer template */ vnet_buffer (bt)->sw_if_index[VLIB_RX] = xd->sw_if_index; bt->error = node->errors[DPDK_ERROR_NONE]; /* as DPDK is allocating empty buffers from mempool provided before interface start for each queue, it is safe to store this in the template */ bt->buffer_pool_index = xd->buffer_pool_for_queue[queue_id]; /* receive burst of packets from DPDK PMD */ if (PREDICT_FALSE (xd->per_interface_next_index != ~0)) { known_next = 1; next_index = xd->per_interface_next_index; } /* as all packets belong to thr same interface feature arc lookup can be don once and result stored in the buffer template */ if (PREDICT_FALSE (vnet_device_input_have_features (xd->sw_if_index))) { vnet_feature_start_device_input_x1 (xd->sw_if_index, &next_index, bt); known_next = 1; } if (xd->flags & DPDK_DEVICE_FLAG_MAYBE_MULTISEG) n_rx_bytes = dpdk_process_rx_burst (vm, ptd, n_rx_packets, 1, &or_flags); else n_rx_bytes = dpdk_process_rx_burst (vm, ptd, n_rx_packets, 0, &or_flags); if (PREDICT_FALSE (known_next)) { for (n = 0; n < n_rx_packets; n++) ptd->next[n] = next_index; vnet_buffer (bt)->feature_arc_index = 0; bt->current_config_index = 0; } else dpdk_set_next_from_etype (vm, node, ptd, n_rx_packets); /* flow offload - process if rx flow offlaod enabled and at least one packet is marked */ if (PREDICT_FALSE ((xd->flags & DPDK_DEVICE_FLAG_RX_FLOW_OFFLOAD) && (or_flags & (1 << DPDK_RX_F_FDIR)))) dpdk_process_flow_offload (xd, ptd, n_rx_packets); /* is at least one packet marked as ip4 checksum bad? 
*/ if (PREDICT_FALSE (or_flags & (1 << DPDK_RX_F_CKSUM_BAD))) for (n = 0; n < n_rx_packets; n++) { if ((ptd->flags[n] & (1 << DPDK_RX_F_CKSUM_BAD)) == 0) continue; if (ptd->next[n] != VNET_DEVICE_INPUT_NEXT_IP4_INPUT) continue; b0 = vlib_buffer_from_rte_mbuf (ptd->mbufs[n]); b0->error = node->errors[DPDK_ERROR_IP_CHECKSUM_ERROR]; ptd->next[n] = VNET_DEVICE_INPUT_NEXT_DROP; } /* enqueue buffers to the next node */ vlib_get_buffer_indices_with_offset (vm, (void **) ptd->mbufs, ptd->buffers, n_rx_packets, sizeof (struct rte_mbuf)); n_left = n_rx_packets; next = ptd->next; buffers = ptd->buffers; mb = ptd->mbufs; while (n_left) { u32 n_left_to_next; u32 *to_next; vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next); #ifdef CLIB_HAVE_VEC256 while (n_left >= 16 && n_left_to_next >= 16) { u16x16 next16 = u16x16_load_unaligned (next); if (u16x16_is_all_equal (next16, next_index)) { clib_memcpy (to_next, buffers, 16 * sizeof (u32)); to_next += 16; n_left_to_next -= 16; buffers += 16; n_left -= 16; next += 16; mb += 16; } else { clib_memcpy (to_next, buffers, 4 * sizeof (u32)); to_next += 4; n_left_to_next -= 4; vlib_validate_buffer_enqueue_x4 (vm, node, next_index, to_next, n_left_to_next, buffers[0], buffers[1], buffers[2], buffers[3], next[0], next[1], next[2], next[3]); /* next */ buffers += 4; n_left -= 4; next += 4; mb += 4; } } #endif while (n_left >= 4 && n_left_to_next >= 4) { clib_memcpy (to_next, buffers, 4 * sizeof (u32)); to_next += 4; n_left_to_next -= 4; vlib_validate_buffer_enqueue_x4 (vm, node, next_index, to_next, n_left_to_next, buffers[0], buffers[1], buffers[2], buffers[3], next[0], next[1], next[2], next[3]); /* next */ buffers += 4; n_left -= 4; next += 4; mb += 4; } while (n_left && n_left_to_next) { clib_memcpy (to_next, buffers, 1 * sizeof (u32)); to_next += 1; n_left_to_next -= 1; vlib_validate_buffer_enqueue_x1 (vm, node, next_index, to_next, n_left_to_next, buffers[0], next[0]); /* next */ buffers += 1; n_left -= 1; next += 1; mb 
+= 1; } vlib_put_next_frame (vm, node, next_index, n_left_to_next); } /* packet trace if enabled */ if ((n_trace = vlib_get_trace_count (vm, node))) { n_left = n_rx_packets; buffers = ptd->buffers; mb = ptd->mbufs; next = ptd->next; while (n_trace && n_left) { b0 = vlib_get_buffer (vm, buffers[0]); vlib_trace_buffer (vm, node, next[0], b0, /* follow_chain */ 0); dpdk_rx_trace_t *t0 = vlib_add_trace (vm, node, b0, sizeof t0[0]); t0->queue_index = queue_id; t0->device_index = xd->device_index; t0->buffer_index = vlib_get_buffer_index (vm, b0); clib_memcpy (&t0->mb, mb[0], sizeof t0->mb); clib_memcpy (&t0->buffer, b0, sizeof b0[0] - sizeof b0->pre_data); clib_memcpy (t0->buffer.pre_data, b0->data, sizeof t0->buffer.pre_data); clib_memcpy (&t0->data, mb[0]->buf_addr + mb[0]->data_off, sizeof t0->data); n_trace--; n_left--; buffers++; mb++; next++; } vlib_set_trace_count (vm, node, n_trace); } vlib_increment_combined_counter (vnet_get_main ()->interface_main.combined_sw_if_counters + VNET_INTERFACE_COUNTER_RX, thread_index, xd->sw_if_index, n_rx_packets, n_rx_bytes); vnet_device_increment_rx_packets (thread_index, n_rx_packets); return n_rx_packets; } uword CLIB_CPU_OPTIMIZED CLIB_MULTIARCH_FN (dpdk_input) (vlib_main_t * vm, vlib_node_runtime_t * node, vlib_frame_t * f) { dpdk_main_t *dm = &dpdk_main; dpdk_device_t *xd; uword n_rx_packets = 0; vnet_device_input_runtime_t *rt = (void *) node->runtime_data; vnet_device_and_queue_t *dq; u32 thread_index = node->thread_index; /* * Poll all devices on this cpu for input/interrupts. 
*/ /* *INDENT-OFF* */ foreach_device_and_queue (dq, rt->devices_and_queues) { xd = vec_elt_at_index(dm->devices, dq->dev_instance); if (PREDICT_FALSE (xd->flags & DPDK_DEVICE_FLAG_BOND_SLAVE)) continue; /* Do not poll slave to a bonded interface */ n_rx_packets += dpdk_device_input (vm, dm, xd, node, thread_index, dq->queue_id); } /* *INDENT-ON* */ poll_rate_limit (dm); return n_rx_packets; } #ifndef CLIB_MULTIARCH_VARIANT /* *INDENT-OFF* */ VLIB_REGISTER_NODE (dpdk_input_node) = { .function = dpdk_input, .type = VLIB_NODE_TYPE_INPUT, .name = "dpdk-input", .sibling_of = "device-input", /* Will be enabled if/when hardware is detected. */ .state = VLIB_NODE_STATE_DISABLED, .format_buffer = format_ethernet_header_with_length, .format_trace = format_dpdk_rx_trace, .n_errors = DPDK_N_ERROR, .error_strings = dpdk_error_strings, }; /* *INDENT-ON* */ vlib_node_function_t __clib_weak dpdk_input_avx512; vlib_node_function_t __clib_weak dpdk_input_avx2; #if __x86_64__ static void __clib_constructor dpdk_input_multiarch_select (void) { if (dpdk_input_avx512 && clib_cpu_supports_avx512f ()) dpdk_input_node.function = dpdk_input_avx512; else if (dpdk_input_avx2 && clib_cpu_supports_avx2 ()) dpdk_input_node.function = dpdk_input_avx2; } #endif #endif /* * fd.io coding-style-patch-verification: ON * * Local Variables: * eval: (c-set-style "gnu") * End: */