summaryrefslogtreecommitdiffstats
path: root/src/svm/svm_common.h
blob: ce07c37b24ed895066de11893a9bab83ab5105d0 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
/*
 *------------------------------------------------------------------
 * Copyright (c) 2009 Cisco and/or its affiliates.
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at:
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *------------------------------------------------------------------
 */

#ifndef __included_svm_common_h__
#define __included_svm_common_h__

#include <stdarg.h>
#include <pthread.h>
#include <vppinfra/types.h>

/*
 * Value stored in svm_region_t.version; per the note below it is written
 * to declare the region ready.
 */
#define SVM_VERSION ((1<<16) | 1)	/* set to declare region ready. */

/*
 * Region flag bits. Both svm_region_t and svm_map_region_args_t carry a
 * `flags` member; presumably these are the bits stored there -- confirm
 * against the implementation.
 */
#define SVM_FLAGS_MHEAP (1<<0)	/* region contains an mheap */
#define SVM_FLAGS_FILE  (1<<1)	/* region backed by one or more files */
#define SVM_FLAGS_NODATA (1<<2)	/* region will be further subdivided */
/* NOTE(review): meaning is not documented in this header -- confirm. */
#define SVM_FLAGS_NEED_DATA_INIT (1<<3)

#define SVM_PVT_MHEAP_SIZE (128<<10)	/* region's private mheap (128k) */

/*
 * Per-region header. The trailing layout note says the region's own heap
 * starts on the page after this structure, and that data_base points at
 * the region's payload.
 *
 * NOTE(review): the layout note mentions a 64K heap while
 * SVM_PVT_MHEAP_SIZE is 128k -- confirm which figure is current.
 * NOTE(review): member order and sizes are presumably relied upon by
 * every process mapping the region; do not reorder without checking.
 */
typedef struct svm_region_
{
  volatile uword version;	/* see SVM_VERSION */
  pthread_mutex_t mutex;
  pthread_cond_t condvar;
  int mutex_owner_pid;		/* in case of trouble */
  int mutex_owner_tag;
  uword flags;			/* presumably SVM_FLAGS_* bits -- confirm */
  uword virtual_base;		/* base of the region object */
  uword virtual_size;
  void *region_heap;
  void *data_base;		/* data portion base address */
  void *data_heap;		/* data heap, if any */
  volatile void *user_ctx;	/* user context pointer */
  /* stuff allocated in the region's heap */
  uword bitmap_size;		/* nbits in virtual alloc bitmap */
  uword *bitmap;		/* the bitmap */
  char *region_name;
  char *backing_file;
  char **filenames;
  uword *client_pids;
  /* pad */

  /* next page:
   * (64K) clib heap for the region itself
   *
   * data_base -> whatever is in this region
   */

} svm_region_t;

/*
 * Argument bundle describing a region to map. It is the parameter type of
 * svm_region_find_or_create(), svm_region_init_mapped_region(),
 * svm_region_init_args() and shm_name_from_svm_map_region_args().
 *
 * Note that size and pvt_heap_size are u64 while baseva and
 * backing_mmap_size are uword.
 */
typedef struct svm_map_region_args_
{
  const char *root_path;	/* NULL means use the truly global arena */
  const char *name;
  uword baseva;
  u64 size;
  u64 pvt_heap_size;
  uword flags;			/* presumably SVM_FLAGS_* bits -- confirm */
  char *backing_file;
  uword backing_mmap_size;
  /* uid, gid to own the svm region(s) */
  int uid;
  int gid;
} svm_map_region_args_t;

/*
 * Memory mapped to high addresses for session/vppcom/vcl/etc...
 *
 * The base is chosen per word size: 8GB on 64-bit builds, 3.5GB on
 * 32-bit builds. Any other word size is a compile-time error.
 *
 * NOTE(review): __WORDSIZE is not defined in this header; presumably it
 * comes from the C library headers pulled in above -- confirm on
 * platforms whose libc does not provide it.
 */
#if __WORDSIZE == 64
#define HIGH_SEGMENT_BASEVA (8ULL   << 30)	/* 8GB */
#elif __WORDSIZE == 32
#define HIGH_SEGMENT_BASEVA (3584UL << 20)	/* 3.5GB */
#else
#error "unknown __WORDSIZE"
#endif

/*
 * Memory shared across all router instances. Packet buffers, etc
 * Base should be "out of the way," and size should be big enough to
 * cover everything we plan to put here.
 *
 * The base address is obtained at run time through
 * svm_get_global_region_base_va (); there is no compile-time
 * SVM_GLOBAL_REGION_BASEVA constant in this header.
 */
#define SVM_GLOBAL_REGION_SIZE    (64<<20)
#define SVM_GLOBAL_REGION_NAME "/global_vm"
u64 svm_get_global_region_base_va (void);

/*
 * Memory shared across individual router instances.
 *
 * The overlay region starts immediately after the global region. Because
 * the global base is a function call, SVM_OVERLAY_REGION_BASEVA is a
 * run-time expression and cannot be used where a constant expression is
 * required (static initializers, array bounds, #if).
 */
#define SVM_OVERLAY_REGION_BASEVA \
               (svm_get_global_region_base_va () + SVM_GLOBAL_REGION_SIZE)
#define SVM_OVERLAY_REGION_SIZE   (1<<20)
#define SVM_OVERLAY_REGION_BASENAME "/overlay_vm"

/*
 * One entry of the subregion pool held in svm_main_region_t.subregions.
 * Only the name is recorded here.
 */
typedef struct
{
  u8 *subregion_name;
} svm_subregion_t;

/*
 * Bookkeeping for the main region: the pool of subregions plus the
 * root path and the uid/gid recorded for it.
 */
typedef struct
{
  svm_subregion_t *subregions;	/* subregion pool */
  uword *name_hash;		/* presumably keyed by subregion name -- confirm */
  u8 *root_path;
  int uid;
  int gid;
} svm_main_region_t;


/*
 * Region API. Only the prototypes are visible in this header; behaviour
 * must be confirmed against the implementation.
 *
 * NOTE(review): svm_region_init_chroot() returns int while the other
 * svm_region_init*() entry points return void -- callers of the void
 * variants have no status to check.
 * NOTE(review): svm_region_unmap() and svm_region_unmap_client() take
 * void *; presumably the argument is an svm_region_t * -- confirm.
 */
void *svm_region_find_or_create (svm_map_region_args_t * a);
void svm_region_init (void);
void svm_region_init_mapped_region (svm_map_region_args_t * a,
				    svm_region_t * rp);
int svm_region_init_chroot (const char *root_path);
void svm_region_init_chroot_uid_gid (const char *root_path, int uid, int gid);
void svm_region_init_args (svm_map_region_args_t * a);
void svm_region_exit (void);
void svm_region_exit_client (void);
void svm_region_unmap (void *rp_arg);
void svm_region_unmap_client (void *rp_arg);
void svm_client_scan (const char *root_path);
void svm_client_scan_this_region_nolock (svm_region_t * rp);
u8 *shm_name_from_svm_map_region_args (svm_map_region_args_t * a);
/* Takes (u8 *, va_list *): the reason <stdarg.h> is included above. */
u8 *format_svm_region (u8 * s, va_list * args);

svm_region_t *svm_get_root_rp (void);

#endif /* __included_svm_common_h__ */

/*
 * fd.io coding-style-patch-verification: ON
 *
 * Local Variables:
 * eval: (c-set-style "gnu")
 * End:
 */
s = format (s, "PPPoE decap error - session for session_id %d does not exist", t->session_id); } return s; } VLIB_NODE_FN (pppoe_input_node) (vlib_main_t * vm, vlib_node_runtime_t * node, vlib_frame_t * from_frame) { u32 n_left_from, next_index, * from, * to_next; pppoe_main_t * pem = &pppoe_main; vnet_main_t * vnm = pem->vnet_main; vnet_interface_main_t * im = &vnm->interface_main; u32 pkts_decapsulated = 0; u32 thread_index = vlib_get_thread_index(); u32 stats_sw_if_index, stats_n_packets, stats_n_bytes; pppoe_entry_key_t cached_key; pppoe_entry_result_t cached_result; from = vlib_frame_vector_args (from_frame); n_left_from = from_frame->n_vectors; /* Clear the one-entry cache in case session table was updated */ cached_key.raw = ~0; cached_result.raw = ~0; /* warning be gone */ next_index = node->cached_next_index; stats_sw_if_index = node->runtime_data[0]; stats_n_packets = stats_n_bytes = 0; while (n_left_from > 0) { u32 n_left_to_next; vlib_get_next_frame (vm, node, next_index, to_next, n_left_to_next); while (n_left_from >= 4 && n_left_to_next >= 2) { u32 bi0, bi1; vlib_buffer_t * b0, * b1; u32 next0, next1; ethernet_header_t *h0, *h1; pppoe_header_t * pppoe0, * pppoe1; u16 ppp_proto0 = 0, ppp_proto1 = 0; pppoe_session_t * t0, * t1; u32 error0, error1; u32 sw_if_index0, sw_if_index1, len0, len1; pppoe_entry_key_t key0, key1; pppoe_entry_result_t result0, result1; u32 bucket0, bucket1; /* Prefetch next iteration. 
*/ { vlib_buffer_t * p2, * p3; p2 = vlib_get_buffer (vm, from[2]); p3 = vlib_get_buffer (vm, from[3]); vlib_prefetch_buffer_header (p2, LOAD); vlib_prefetch_buffer_header (p3, LOAD); CLIB_PREFETCH (p2->data, 2*CLIB_CACHE_LINE_BYTES, LOAD); CLIB_PREFETCH (p3->data, 2*CLIB_CACHE_LINE_BYTES, LOAD); } bi0 = from[0]; bi1 = from[1]; to_next[0] = bi0; to_next[1] = bi1; from += 2; to_next += 2; n_left_to_next -= 2; n_left_from -= 2; b0 = vlib_get_buffer (vm, bi0); b1 = vlib_get_buffer (vm, bi1); error0 = 0; error1 = 0; /* leaves current_data pointing at the pppoe header */ pppoe0 = vlib_buffer_get_current (b0); pppoe1 = vlib_buffer_get_current (b1); ppp_proto0 = clib_net_to_host_u16(pppoe0->ppp_proto); ppp_proto1 = clib_net_to_host_u16(pppoe1->ppp_proto); /* Manipulate packet 0 */ if ((ppp_proto0 != PPP_PROTOCOL_ip4) && (ppp_proto0 != PPP_PROTOCOL_ip6)) { error0 = PPPOE_ERROR_CONTROL_PLANE; next0 = PPPOE_INPUT_NEXT_CP_INPUT; goto trace0; } /* get client mac */ vlib_buffer_reset(b0); h0 = vlib_buffer_get_current (b0); pppoe_lookup_1 (&pem->session_table, &cached_key, &cached_result, h0->src_address, pppoe0->session_id, &key0, &bucket0, &result0); if (PREDICT_FALSE (result0.fields.session_index == ~0)) { error0 = PPPOE_ERROR_NO_SUCH_SESSION; next0 = PPPOE_INPUT_NEXT_DROP; goto trace0; } t0 = pool_elt_at_index (pem->sessions, result0.fields.session_index); /* Pop Eth and PPPoE header */ vlib_buffer_advance(b0, sizeof(*h0)+sizeof(*pppoe0)); next0 = (ppp_proto0==PPP_PROTOCOL_ip4)? 
PPPOE_INPUT_NEXT_IP4_INPUT : PPPOE_INPUT_NEXT_IP6_INPUT; sw_if_index0 = t0->sw_if_index; len0 = vlib_buffer_length_in_chain (vm, b0); pkts_decapsulated ++; stats_n_packets += 1; stats_n_bytes += len0; /* Batch stats increment on the same pppoe session so counter is not incremented per packet */ if (PREDICT_FALSE (sw_if_index0 != stats_sw_if_index)) { stats_n_packets -= 1; stats_n_bytes -= len0; if (stats_n_packets) vlib_increment_combined_counter (im->combined_sw_if_counters + VNET_INTERFACE_COUNTER_RX, thread_index, stats_sw_if_index, stats_n_packets, stats_n_bytes); stats_n_packets = 1; stats_n_bytes = len0; stats_sw_if_index = sw_if_index0; } trace0: b0->error = error0 ? node->errors[error0] : 0; if (PREDICT_FALSE(b0->flags & VLIB_BUFFER_IS_TRACED)) { pppoe_rx_trace_t *tr = vlib_add_trace (vm, node, b0, sizeof (*tr)); tr->next_index = next0; tr->error = error0; tr->session_index = result0.fields.session_index; tr->session_id = clib_net_to_host_u32(pppoe0->session_id); } /* Manipulate packet 1 */ if ((ppp_proto1 != PPP_PROTOCOL_ip4) && (ppp_proto1 != PPP_PROTOCOL_ip6)) { error1 = PPPOE_ERROR_CONTROL_PLANE; next1 = PPPOE_INPUT_NEXT_CP_INPUT; goto trace1; } /* get client mac */ vlib_buffer_reset(b1); h1 = vlib_buffer_get_current (b1); pppoe_lookup_1 (&pem->session_table, &cached_key, &cached_result, h1->src_address, pppoe1->session_id, &key1, &bucket1, &result1); if (PREDICT_FALSE (result1.fields.session_index == ~0)) { error1 = PPPOE_ERROR_NO_SUCH_SESSION; next1 = PPPOE_INPUT_NEXT_DROP; goto trace1; } t1 = pool_elt_at_index (pem->sessions, result1.fields.session_index); /* Pop Eth and PPPoE header */ vlib_buffer_advance(b1, sizeof(*h1)+sizeof(*pppoe1)); next1 = (ppp_proto1==PPP_PROTOCOL_ip4)? 
PPPOE_INPUT_NEXT_IP4_INPUT : PPPOE_INPUT_NEXT_IP6_INPUT; sw_if_index1 = t1->sw_if_index; len1 = vlib_buffer_length_in_chain (vm, b1); pkts_decapsulated ++; stats_n_packets += 1; stats_n_bytes += len1; /* Batch stats increment on the same pppoe session so counter is not incremented per packet */ if (PREDICT_FALSE (sw_if_index1 != stats_sw_if_index)) { stats_n_packets -= 1; stats_n_bytes -= len1; if (stats_n_packets) vlib_increment_combined_counter (im->combined_sw_if_counters + VNET_INTERFACE_COUNTER_RX, thread_index, stats_sw_if_index, stats_n_packets, stats_n_bytes); stats_n_packets = 1; stats_n_bytes = len1; stats_sw_if_index = sw_if_index1; } trace1: b1->error = error1 ? node->errors[error1] : 0; if (PREDICT_FALSE(b1->flags & VLIB_BUFFER_IS_TRACED)) { pppoe_rx_trace_t *tr = vlib_add_trace (vm, node, b1, sizeof (*tr)); tr->next_index = next1; tr->error = error1; tr->session_index = result1.fields.session_index; tr->session_id = clib_net_to_host_u32(pppoe1->session_id); } vlib_validate_buffer_enqueue_x2 (vm, node, next_index, to_next, n_left_to_next, bi0, bi1, next0, next1); } while (n_left_from > 0 && n_left_to_next > 0) { u32 bi0; vlib_buffer_t * b0; u32 next0; ethernet_header_t *h0; pppoe_header_t * pppoe0; u16 ppp_proto0 = 0; pppoe_session_t * t0; u32 error0; u32 sw_if_index0, len0; pppoe_entry_key_t key0; pppoe_entry_result_t result0; u32 bucket0; bi0 = from[0]; to_next[0] = bi0; from += 1; to_next += 1; n_left_from -= 1; n_left_to_next -= 1; b0 = vlib_get_buffer (vm, bi0); error0 = 0; /* leaves current_data pointing at the pppoe header */ pppoe0 = vlib_buffer_get_current (b0); ppp_proto0 = clib_net_to_host_u16(pppoe0->ppp_proto); if ((ppp_proto0 != PPP_PROTOCOL_ip4) && (ppp_proto0 != PPP_PROTOCOL_ip6)) { error0 = PPPOE_ERROR_CONTROL_PLANE; next0 = PPPOE_INPUT_NEXT_CP_INPUT; goto trace00; } /* get client mac */ vlib_buffer_reset(b0); h0 = vlib_buffer_get_current (b0); pppoe_lookup_1 (&pem->session_table, &cached_key, &cached_result, h0->src_address, 
pppoe0->session_id, &key0, &bucket0, &result0); if (PREDICT_FALSE (result0.fields.session_index == ~0)) { error0 = PPPOE_ERROR_NO_SUCH_SESSION; next0 = PPPOE_INPUT_NEXT_DROP; goto trace00; } t0 = pool_elt_at_index (pem->sessions, result0.fields.session_index); /* Pop Eth and PPPoE header */ vlib_buffer_advance(b0, sizeof(*h0)+sizeof(*pppoe0)); next0 = (ppp_proto0==PPP_PROTOCOL_ip4)? PPPOE_INPUT_NEXT_IP4_INPUT : PPPOE_INPUT_NEXT_IP6_INPUT; sw_if_index0 = t0->sw_if_index; len0 = vlib_buffer_length_in_chain (vm, b0); pkts_decapsulated ++; stats_n_packets += 1; stats_n_bytes += len0; /* Batch stats increment on the same pppoe session so counter is not incremented per packet */ if (PREDICT_FALSE (sw_if_index0 != stats_sw_if_index)) { stats_n_packets -= 1; stats_n_bytes -= len0; if (stats_n_packets) vlib_increment_combined_counter (im->combined_sw_if_counters + VNET_INTERFACE_COUNTER_RX, thread_index, stats_sw_if_index, stats_n_packets, stats_n_bytes); stats_n_packets = 1; stats_n_bytes = len0; stats_sw_if_index = sw_if_index0; } trace00: b0->error = error0 ? node->errors[error0] : 0; if (PREDICT_FALSE(b0->flags & VLIB_BUFFER_IS_TRACED)) { pppoe_rx_trace_t *tr = vlib_add_trace (vm, node, b0, sizeof (*tr)); tr->next_index = next0; tr->error = error0; tr->session_index = result0.fields.session_index; tr->session_id = clib_net_to_host_u16(pppoe0->session_id); } vlib_validate_buffer_enqueue_x1 (vm, node, next_index, to_next, n_left_to_next, bi0, next0); } vlib_put_next_frame (vm, node, next_index, n_left_to_next); } /* Do we still need this now that session tx stats is kept? 
*/ vlib_node_increment_counter (vm, pppoe_input_node.index, PPPOE_ERROR_DECAPSULATED, pkts_decapsulated); /* Increment any remaining batch stats */ if (stats_n_packets) { vlib_increment_combined_counter (im->combined_sw_if_counters + VNET_INTERFACE_COUNTER_RX, thread_index, stats_sw_if_index, stats_n_packets, stats_n_bytes); node->runtime_data[0] = stats_sw_if_index; } return from_frame->n_vectors; } static char * pppoe_error_strings[] = { #define pppoe_error(n,s) s, #include <pppoe/pppoe_error.def> #undef pppoe_error #undef _ }; VLIB_REGISTER_NODE (pppoe_input_node) = { .name = "pppoe-input", /* Takes a vector of packets. */ .vector_size = sizeof (u32), .n_errors = PPPOE_N_ERROR, .error_strings = pppoe_error_strings, .n_next_nodes = PPPOE_INPUT_N_NEXT, .next_nodes = { #define _(s,n) [PPPOE_INPUT_NEXT_##s] = n, foreach_pppoe_input_next #undef _ }, .format_trace = format_pppoe_rx_trace, };