diff --git a/VNFs/DPPD-PROX/handle_lat.c b/VNFs/DPPD-PROX/handle_lat.c
index 3962b21d..c7a45b60 100644
--- a/VNFs/DPPD-PROX/handle_lat.c
+++ b/VNFs/DPPD-PROX/handle_lat.c
@@ -106,19 +106,26 @@ struct task_lat {
 	struct lat_test lt[2];
 	struct lat_test *lat_test;
 	uint32_t generator_count;
+	uint16_t min_pkt_len;
 	struct early_loss_detect *eld;
 	struct rx_pkt_meta_data *rx_pkt_meta;
-	uint64_t link_speed;
 	// Following fields are only used when starting or stopping, not in general runtime
 	uint64_t *prev_tx_packet_index;
 	FILE *fp_rx;
 	FILE *fp_tx;
 	struct prox_port_cfg *port;
+	uint64_t *bytes_to_tsc;
 };
-
-static uint32_t diff_or_zero(uint32_t a, uint32_t b)
+/* This function calculates the difference between rx_time and tx_time.
+ * Both values are uint32_t (see handle_lat_bulk).
+ * rx_time should be higher than tx_time... except every UINT32_MAX
+ * cycles, when rx_time overflows.
+ * As the return value is also uint32_t, returning (rx_time - tx_time)
+ * is also fine when it overflows.
+ */
+static uint32_t diff_time(uint32_t rx_time, uint32_t tx_time)
 {
-	return a < b? 0 : a - b;
+	return rx_time - tx_time;
 }
 
 struct lat_test *task_lat_get_latency_meassurement(struct task_lat *task)
@@ -257,7 +264,7 @@ static uint64_t lat_latency_buffer_get_min_tsc(struct task_lat *task)
 
 static uint64_t lat_info_get_lat_tsc(struct lat_info *lat_info)
 {
-	uint64_t lat = diff_or_zero(lat_info->rx_time, lat_info->tx_time);
+	uint64_t lat = diff_time(lat_info->rx_time, lat_info->tx_time);
 
 	return lat << LATENCY_ACCURACY;
 }
@@ -422,25 +429,19 @@ static void task_lat_store_lat_buf(struct task_lat *task, uint64_t rx_packet_ind
 	lat_info->tx_err = tx_err;
 }
 
-static uint32_t task_lat_early_loss_detect(struct task_lat *task, struct unique_id *unique_id)
+static uint32_t task_lat_early_loss_detect(struct task_lat *task, uint32_t packet_id, uint8_t generator_id)
 {
-	struct early_loss_detect *eld;
-	uint8_t generator_id;
-	uint32_t packet_index;
-
-	unique_id_get(unique_id, &generator_id, &packet_index);
-
-	if (generator_id >= task->generator_count)
-		return 0;
-
-	eld = &task->eld[generator_id];
-
-	return early_loss_detect_add(eld, packet_index);
+	struct early_loss_detect *eld = &task->eld[generator_id];
+	return early_loss_detect_add(eld, packet_id);
 }
 
-static uint64_t tsc_extrapolate_backward(uint64_t link_speed, uint64_t tsc_from, uint64_t bytes, uint64_t tsc_minimum)
+static uint64_t tsc_extrapolate_backward(struct task_lat *task, uint64_t tsc_from, uint64_t bytes, uint64_t tsc_minimum)
 {
-	uint64_t tsc = tsc_from - (rte_get_tsc_hz()*bytes)/link_speed;
+#ifdef NO_EXTRAPOLATION
+	uint64_t tsc = tsc_from;
+#else
+	uint64_t tsc = tsc_from - task->bytes_to_tsc[bytes];
+#endif
 	if (likely(tsc > tsc_minimum))
 		return tsc;
 	else
@@ -496,9 +497,7 @@ static int task_lat_can_store_latency(struct task_lat *task)
 
 static void task_lat_store_lat(struct task_lat *task, uint64_t rx_packet_index, uint64_t rx_time, uint64_t tx_time, uint64_t rx_error, uint64_t tx_error, uint32_t packet_id, uint8_t generator_id)
 {
-	if (tx_time == 0)
-		return;
-	uint32_t lat_tsc = diff_or_zero(rx_time, tx_time) << LATENCY_ACCURACY;
+	uint32_t lat_tsc = diff_time(rx_time, tx_time) << LATENCY_ACCURACY;
 
 	lat_test_add_latency(task->lat_test, lat_tsc, rx_error + tx_error);
 
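The new diff_time() above leans on modulo-2^32 arithmetic: subtracting two uint32_t timestamps gives the correct elapsed time even when the rx timestamp has wrapped past UINT32_MAX since the packet was sent, which is why the old diff_or_zero() clamp is no longer needed. A standalone sketch of that wrap-around behaviour (illustrative only, not part of the patch; the names and values are made up):

/* Sketch only: unsigned subtraction is modulo 2^32, so the latency is still
 * correct when rx_time has wrapped past UINT32_MAX while tx_time has not. */
#include <assert.h>
#include <stdint.h>

static uint32_t diff_time_demo(uint32_t rx_time, uint32_t tx_time)
{
	return rx_time - tx_time;
}

int main(void)
{
	uint32_t tx_time = UINT32_MAX - 5;   /* stamped just before the counter wraps */
	uint32_t rx_time = 10;               /* stamped just after the wrap */

	assert(diff_time_demo(rx_time, tx_time) == 16);  /* 6 ticks to the wrap + 10 after it */
	return 0;
}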
@@ -510,9 +509,7 @@ static void task_lat_store_lat(struct task_lat *task, uint64_t rx_packet_index,
 static int handle_lat_bulk(struct task_base *tbase, struct rte_mbuf **mbufs, uint16_t n_pkts)
 {
 	struct task_lat *task = (struct task_lat *)tbase;
-	uint64_t rx_time_err;
-
-	uint32_t pkt_rx_time, pkt_tx_time;
+	int rc;
 
 	if (n_pkts == 0) {
 		task->begin = tbase->aux->tsc_rx.before;
@@ -521,8 +518,12 @@ static int handle_lat_bulk(struct task_base *tbase, struct rte_mbuf **mbufs, uin
 
 	task_lat_update_lat_test(task);
 
-	const uint64_t rx_tsc = tbase->aux->tsc_rx.after;
-	uint32_t tx_time_err = 0;
+	// Remember those packets with bad length or bad signature
+	uint32_t non_dp_count = 0;
+	uint64_t pkt_bad_len_sig = 0;
+#define BIT64_SET(a64, bit)	a64 |= (((uint64_t)1) << (bit & 63))
+#define BIT64_CLR(a64, bit)	a64 &= ~(((uint64_t)1) << (bit & 63))
+#define BIT64_TEST(a64, bit)	a64 & (((uint64_t)1) << (bit & 63))
 
 	/* Go once through all received packets and read them.  If
 	   packet has just been modified by another core, the cost of
@@ -530,17 +531,31 @@ static int handle_lat_bulk(struct task_base *tbase, struct rte_mbuf **mbufs, uin
 	for (uint16_t j = 0; j < n_pkts; ++j) {
 		struct rte_mbuf *mbuf = mbufs[j];
 		task->rx_pkt_meta[j].hdr = rte_pktmbuf_mtod(mbuf, uint8_t *);
+
+		// Remember those packets which are too short to hold the values that we expect
+		if (unlikely(rte_pktmbuf_pkt_len(mbuf) < task->min_pkt_len)) {
+			BIT64_SET(pkt_bad_len_sig, j);
+			non_dp_count++;
+		} else
+			BIT64_CLR(pkt_bad_len_sig, j);
 	}
 
-	if (task->sig) {
+	if (task->sig_pos) {
 		for (uint16_t j = 0; j < n_pkts; ++j) {
-			if (*(uint32_t *)(task->rx_pkt_meta[j].hdr + task->sig_pos) == task->sig)
+			if (unlikely(BIT64_TEST(pkt_bad_len_sig, j)))
+				continue;
+			// Remember those packets with bad signature
+			if (likely(*(uint32_t *)(task->rx_pkt_meta[j].hdr + task->sig_pos) == task->sig))
 				task->rx_pkt_meta[j].pkt_tx_time = *(uint32_t *)(task->rx_pkt_meta[j].hdr + task->lat_pos);
-			else
-				task->rx_pkt_meta[j].pkt_tx_time = 0;
+			else {
+				BIT64_SET(pkt_bad_len_sig, j);
+				non_dp_count++;
+			}
 		}
 	} else {
 		for (uint16_t j = 0; j < n_pkts; ++j) {
+			if (unlikely(BIT64_TEST(pkt_bad_len_sig, j)))
+				continue;
 			task->rx_pkt_meta[j].pkt_tx_time = *(uint32_t *)(task->rx_pkt_meta[j].hdr + task->lat_pos);
 		}
 	}
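The BIT64_* macros above keep one flag bit per packet of the burst in a single uint64_t, which works because a burst never holds more than 64 packets (MAX_PKT_BURST). A self-contained sketch of the same mark-then-skip pattern used for pkt_bad_len_sig (packet lengths and the threshold below are invented for illustration):

/* Sketch only: mark "non data-plane" packets in a 64-bit mask, then skip them,
 * mirroring the pkt_bad_len_sig handling in the patch. Values are invented. */
#include <stdint.h>
#include <stdio.h>

#define BIT64_SET(a64, bit)  ((a64) |= (((uint64_t)1) << ((bit) & 63)))
#define BIT64_TEST(a64, bit) ((a64) &  (((uint64_t)1) << ((bit) & 63)))

int main(void)
{
	const uint16_t pkt_len[4] = { 60, 20, 64, 30 };  /* hypothetical burst */
	const uint16_t min_pkt_len = 42;                 /* hypothetical threshold */
	uint64_t bad = 0;
	uint32_t non_dp_count = 0;

	for (uint16_t j = 0; j < 4; ++j)
		if (pkt_len[j] < min_pkt_len) {
			BIT64_SET(bad, j);
			non_dp_count++;
		}

	for (uint16_t j = 0; j < 4; ++j) {
		if (BIT64_TEST(bad, j))
			continue;                        /* bad length: not data plane */
		printf("packet %u is usable\n", (unsigned)j);
	}
	printf("%u packets flagged as non data-plane\n", non_dp_count);
	return 0;
}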
@@ -554,37 +569,51 @@ static int handle_lat_bulk(struct task_base *tbase, struct rte_mbuf **mbufs, uin
 		bytes_total_in_bulk += mbuf_wire_size(mbufs[flipped]);
 	}
 
-	pkt_rx_time = tsc_extrapolate_backward(task->link_speed, rx_tsc, task->rx_pkt_meta[0].bytes_after_in_bulk, task->last_pkts_tsc) >> LATENCY_ACCURACY;
-	if ((uint32_t)((task->begin >> LATENCY_ACCURACY)) > pkt_rx_time) {
+	const uint64_t rx_tsc = tbase->aux->tsc_rx.after;
+
+	uint64_t rx_time_err;
+	uint64_t pkt_rx_time64 = tsc_extrapolate_backward(task, rx_tsc, task->rx_pkt_meta[0].bytes_after_in_bulk, task->last_pkts_tsc) >> LATENCY_ACCURACY;
+	if (unlikely((task->begin >> LATENCY_ACCURACY) > pkt_rx_time64)) {
 		// Extrapolation went up to BEFORE begin => packets were stuck in the NIC but we were not seeing them
-		rx_time_err = pkt_rx_time - (uint32_t)(task->last_pkts_tsc >> LATENCY_ACCURACY);
+		rx_time_err = pkt_rx_time64 - (task->last_pkts_tsc >> LATENCY_ACCURACY);
 	} else {
-		rx_time_err = pkt_rx_time - (uint32_t)(task->begin >> LATENCY_ACCURACY);
+		rx_time_err = pkt_rx_time64 - (task->begin >> LATENCY_ACCURACY);
 	}
 
-	struct unique_id *unique_id = NULL;
-	struct delayed_latency_entry *delayed_latency_entry;
-	uint32_t packet_id, generator_id;
-
+	TASK_STATS_ADD_RX_NON_DP(&tbase->aux->stats, non_dp_count);
 	for (uint16_t j = 0; j < n_pkts; ++j) {
+		// Used to display % of packets within accuracy limit vs. total number of packets (used_col)
+		task->lat_test->tot_all_pkts++;
+
+		// Skip those packets with bad length or bad signature
+		if (unlikely(BIT64_TEST(pkt_bad_len_sig, j)))
+			continue;
+
 		struct rx_pkt_meta_data *rx_pkt_meta = &task->rx_pkt_meta[j];
 		uint8_t *hdr = rx_pkt_meta->hdr;
 
-		pkt_rx_time = tsc_extrapolate_backward(task->link_speed, rx_tsc, rx_pkt_meta->bytes_after_in_bulk, task->last_pkts_tsc) >> LATENCY_ACCURACY;
-		pkt_tx_time = rx_pkt_meta->pkt_tx_time;
+		uint32_t pkt_rx_time = tsc_extrapolate_backward(task, rx_tsc, rx_pkt_meta->bytes_after_in_bulk, task->last_pkts_tsc) >> LATENCY_ACCURACY;
+		uint32_t pkt_tx_time = rx_pkt_meta->pkt_tx_time;
 
+		uint8_t generator_id;
+		uint32_t packet_id;
 		if (task->unique_id_pos) {
-			unique_id = (struct unique_id *)(hdr + task->unique_id_pos);
+			struct unique_id *unique_id = (struct unique_id *)(hdr + task->unique_id_pos);
+			unique_id_get(unique_id, &generator_id, &packet_id);
+
+			if (unlikely(generator_id >= task->generator_count)) {
+				/* No need to remember unexpected packet at this stage
+				BIT64_SET(pkt_bad_len_sig, j);
+				*/
+				// Skip unexpected packet
+				continue;
+			}
 
-			uint32_t n_loss = task_lat_early_loss_detect(task, unique_id);
-			packet_id = unique_id->packet_id;
-			generator_id = unique_id->generator_id;
-			lat_test_add_lost(task->lat_test, n_loss);
+			lat_test_add_lost(task->lat_test, task_lat_early_loss_detect(task, packet_id, generator_id));
 		} else {
-			packet_id = task->rx_packet_index;
 			generator_id = 0;
+			packet_id = task->rx_packet_index;
 		}
-		task->lat_test->tot_all_pkts++;
 
 		/* If accuracy is enabled, latency is reported with a
 		   delay of ACCURACY_BUFFER_SIZE packets since the generator puts the
@@ -592,9 +621,9 @@ static int handle_lat_bulk(struct task_base *tbase, struct rte_mbuf **mbufs, uin
 		   ensures that all reported latencies have both rx
 		   and tx error. */
 		if (task->accur_pos) {
-			tx_time_err = *(uint32_t *)(hdr + task->accur_pos);
+			uint32_t tx_time_err = *(uint32_t *)(hdr + task->accur_pos);
 
-			delayed_latency_entry = delayed_latency_get(task->delayed_latency_entries, generator_id, packet_id - ACCURACY_BUFFER_SIZE);
+			struct delayed_latency_entry *delayed_latency_entry = delayed_latency_get(task->delayed_latency_entries, generator_id, packet_id - ACCURACY_BUFFER_SIZE);
 			if (delayed_latency_entry) {
 				task_lat_store_lat(task,
@@ -617,13 +646,20 @@ static int handle_lat_bulk(struct task_base *tbase, struct rte_mbuf **mbufs, uin
 		} else {
 			task_lat_store_lat(task, task->rx_packet_index, pkt_rx_time, pkt_tx_time, 0, 0, packet_id, generator_id);
 		}
+
+		// Bad/unexpected packets do not need to be indexed
 		task->rx_packet_index++;
 	}
-	int ret;
-	ret = task->base.tx_pkt(&task->base, mbufs, n_pkts, NULL);
-	task->begin = tbase->aux->tsc_rx.before;
+
+	if (n_pkts < MAX_PKT_BURST)
+		task->begin = tbase->aux->tsc_rx.before;
 	task->last_pkts_tsc = tbase->aux->tsc_rx.after;
-	return ret;
+
+	rc = task->base.tx_pkt(&task->base, mbufs, n_pkts, NULL);
+	// non_dp_count should not be drop-handled, as they are all by definition considered as not handled
+	// RX = DISCARDED + HANDLED + NON_DP + (TX - TX_NON_DP) + TX_FAIL
+	TASK_STATS_ADD_DROP_HANDLED(&tbase->aux->stats, -non_dp_count);
+	return rc;
 }
 
 static void init_task_lat_latency_buffer(struct task_lat *task, uint32_t core_id)
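tsc_extrapolate_backward() estimates when each packet of the burst actually arrived by taking the TSC sampled after the whole burst and walking back by the wire time of the bytes that followed that packet; with this patch the wire time comes from the bytes_to_tsc[] table instead of a per-packet division. A rough standalone illustration of the underlying arithmetic (the TSC frequency, link rate and byte counts are assumptions, not values from the patch):

/* Sketch only: estimate each packet's arrival TSC by walking back from the
 * TSC taken after the burst, using the wire time of the trailing bytes.
 * All constants here are assumed example values. */
#include <inttypes.h>
#include <stdint.h>
#include <stdio.h>

int main(void)
{
	const uint64_t tsc_hz = 2000000000ULL;            /* assumed 2 GHz TSC */
	const uint64_t bytes_per_sec = 1250000000ULL;     /* assumed 10 Gbps link */
	const uint64_t rx_tsc = 1000000;                  /* TSC after the whole burst */
	const uint64_t bytes_after[3] = { 128, 64, 0 };   /* wire bytes following each packet */

	for (int j = 0; j < 3; j++) {
		uint64_t pkt_rx_tsc = rx_tsc - (tsc_hz * bytes_after[j]) / bytes_per_sec;
		printf("pkt %d estimated rx tsc: %" PRIu64 "\n", j, pkt_rx_tsc);
	}
	return 0;
}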
@@ -682,12 +718,6 @@ static void lat_start(struct task_base *tbase)
 {
 	struct task_lat *task = (struct task_lat *)tbase;
 
-	if (task->port) {
-		// task->port->link->speed reports the link speed in Mbps e.g. 40k for a 40 Gbps NIC
-		// task->link_speed reported link speed in Bytes per sec.
-		task->link_speed = task->port->link_speed * 125000L;
-		plog_info("\tReceiving at %lu Mbps\n", 8 * task->link_speed / 1000000);
-	}
 }
 
 static void init_task_lat(struct task_base *tbase, struct task_args *targ)
@@ -703,6 +733,19 @@ static void init_task_lat(struct task_base *tbase, struct task_args *targ)
 	task->unique_id_pos = targ->packet_id_pos;
 	task->latency_buffer_size = targ->latency_buffer_size;
 
+	PROX_PANIC(task->lat_pos == 0, "Missing 'lat pos' parameter in config file\n");
+	uint16_t min_pkt_len = task->lat_pos + sizeof(uint32_t);
+	if (task->unique_id_pos && (
+		min_pkt_len < task->unique_id_pos + sizeof(struct unique_id)))
+		min_pkt_len = task->unique_id_pos + sizeof(struct unique_id);
+	if (task->accur_pos && (
+		min_pkt_len < task->accur_pos + sizeof(uint32_t)))
+		min_pkt_len = task->accur_pos + sizeof(uint32_t);
+	if (task->sig_pos && (
+		min_pkt_len < task->sig_pos + sizeof(uint32_t)))
+		min_pkt_len = task->sig_pos + sizeof(uint32_t);
+	task->min_pkt_len = min_pkt_len;
+
 	task_init_generator_count(task);
 
 	if (task->latency_buffer_size) {
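The min_pkt_len computed above is simply the largest of (field offset + field size) over the fields this task is configured to read, so that too-short frames can be flagged before any of those offsets are dereferenced. A hypothetical worked example (the offsets are invented, and struct unique_id_demo only stands in for a 5-byte packed id, not the real struct unique_id):

/* Sketch only: the shortest usable frame is the largest (offset + field size)
 * over the enabled fields. Offsets below are hypothetical, not PROX defaults. */
#include <stdint.h>
#include <stdio.h>

struct unique_id_demo { uint8_t generator_id; uint32_t packet_id; } __attribute__((packed));

int main(void)
{
	uint16_t lat_pos = 42, accur_pos = 46, unique_id_pos = 50, sig_pos = 56;
	uint16_t min_pkt_len = lat_pos + sizeof(uint32_t);                    /* 46 */

	if (unique_id_pos && min_pkt_len < unique_id_pos + sizeof(struct unique_id_demo))
		min_pkt_len = unique_id_pos + sizeof(struct unique_id_demo);  /* 55 */
	if (accur_pos && min_pkt_len < accur_pos + sizeof(uint32_t))
		min_pkt_len = accur_pos + sizeof(uint32_t);
	if (sig_pos && min_pkt_len < sig_pos + sizeof(uint32_t))
		min_pkt_len = sig_pos + sizeof(uint32_t);                      /* 60 */

	printf("min_pkt_len = %u\n", (unsigned)min_pkt_len);
	return 0;
}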
@@ -740,15 +783,32 @@ static void init_task_lat(struct task_base *tbase, struct task_args *targ)
 	task->lat_test = &task->lt[task->using_lt];
 
 	task_lat_set_accuracy_limit(task, targ->accuracy_limit_nsec);
-	task->rx_pkt_meta = prox_zmalloc(MAX_RX_PKT_ALL * sizeof(*task->rx_pkt_meta), socket_id);
+	task->rx_pkt_meta = prox_zmalloc(MAX_PKT_BURST * sizeof(*task->rx_pkt_meta), socket_id);
 	PROX_PANIC(task->rx_pkt_meta == NULL, "unable to allocate memory to store RX packet meta data");
 
-	task->link_speed = UINT64_MAX;
+	uint32_t max_frame_size = MAX_PKT_SIZE;
+	uint64_t bytes_per_hz = UINT64_MAX;
 	if (targ->nb_rxports) {
-		// task->port structure is only used while starting handle_lat to get the link_speed.
-		// link_speed can not be quiried at init as the port has not been initialized yet.
 		struct prox_port_cfg *port = &prox_port_cfg[targ->rx_port_queue[0].port];
-		task->port = port;
+		max_frame_size = port->mtu + ETHER_HDR_LEN + ETHER_CRC_LEN + 2 * PROX_VLAN_TAG_SIZE;
+
+		// port->max_link_speed reports the maximum, non-negotiated link speed in Mbps, e.g. 40k for a 40 Gbps NIC.
+		// It can be UINT32_MAX (virtual devices or not supported by DPDK < 16.04)
+		if (port->max_link_speed != UINT32_MAX) {
+			bytes_per_hz = port->max_link_speed * 125000L;
+			plog_info("\tPort %u: max link speed is %ld Mbps\n",
+				(uint8_t)(port - prox_port_cfg), 8 * bytes_per_hz / 1000000);
+		}
+	}
+	task->bytes_to_tsc = prox_zmalloc(max_frame_size * sizeof(task->bytes_to_tsc[0]) * MAX_PKT_BURST, rte_lcore_to_socket_id(targ->lconf->id));
+	PROX_PANIC(task->bytes_to_tsc == NULL,
+		"Failed to allocate %u bytes (in huge pages) for bytes_to_tsc\n", max_frame_size);
+
+	for (unsigned int i = 0; i < max_frame_size * MAX_PKT_BURST ; i++) {
+		if (bytes_per_hz == UINT64_MAX)
+			task->bytes_to_tsc[i] = 0;
+		else
+			task->bytes_to_tsc[i] = (rte_get_tsc_hz() * i) / bytes_per_hz;
 	}
 }
 
@@ -758,7 +818,7 @@ static struct task_init task_init_lat = {
 	.handle = handle_lat_bulk,
 	.start = lat_start,
 	.stop = lat_stop,
-	.flag_features = TASK_FEATURE_TSC_RX | TASK_FEATURE_RX_ALL | TASK_FEATURE_ZERO_RX | TASK_FEATURE_NEVER_DISCARDS,
+	.flag_features = TASK_FEATURE_TSC_RX | TASK_FEATURE_ZERO_RX | TASK_FEATURE_NEVER_DISCARDS,
 	.size = sizeof(struct task_lat)
 };
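The bytes_to_tsc[] table initialised above trades a multiply-and-divide per packet for a single lookup: the TSC cost of receiving i wire bytes is precomputed once at init from the port's maximum link speed (Mbps * 125000 = bytes per second), and falls back to 0 when the speed is unknown. A minimal sketch of the same idea with assumed numbers (2 GHz TSC, 10 Gbps link), not the PROX allocation path:

/* Sketch only: precompute a bytes -> TSC-cycles table so the fast path does a
 * lookup instead of a 64-bit multiply and divide. The TSC frequency and link
 * rate are assumptions, and plain calloc() stands in for prox_zmalloc(). */
#include <inttypes.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>

int main(void)
{
	const uint64_t tsc_hz = 2000000000ULL;                /* assumed 2 GHz TSC */
	const uint64_t bytes_per_sec = 10000ULL * 125000ULL;  /* 10000 Mbps * 125000 */
	const uint32_t max_bytes = 1522 * 64;                 /* frame size * burst, example */

	uint64_t *bytes_to_tsc = calloc(max_bytes, sizeof(*bytes_to_tsc));
	if (bytes_to_tsc == NULL)
		return 1;

	for (uint32_t i = 0; i < max_bytes; i++)
		bytes_to_tsc[i] = (tsc_hz * i) / bytes_per_sec;

	/* fast path: one load per packet instead of a multiply + divide */
	printf("1500 wire bytes ~ %" PRIu64 " TSC cycles\n", bytes_to_tsc[1500]);
	free(bytes_to_tsc);
	return 0;
}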