f-stack/dpdk/lib/sched/rte_sched.h

588 lines
18 KiB
C
Raw Normal View History

2019-06-25 11:12:58 +00:00
/* SPDX-License-Identifier: BSD-3-Clause
* Copyright(c) 2010-2014 Intel Corporation
2017-04-21 10:43:26 +00:00
*/
#ifndef __INCLUDE_RTE_SCHED_H__
#define __INCLUDE_RTE_SCHED_H__
#ifdef __cplusplus
extern "C" {
#endif
/**
* @file
* RTE Hierarchical Scheduler
*
* The hierarchical scheduler prioritizes the transmission of packets
* from different users and traffic classes according to the Service
* Level Agreements (SLAs) defined for the current network node.
*
* The scheduler supports thousands of packet queues grouped under a
* 5-level hierarchy:
* 1. Port:
* - Typical usage: output Ethernet port;
* - Multiple ports are scheduled in round robin order with
* equal priority;
* 2. Subport:
* - Typical usage: group of users;
* - Traffic shaping using the token bucket algorithm
* (one bucket per subport);
* - Upper limit enforced per traffic class at subport level;
* - Lower priority traffic classes able to reuse subport
* bandwidth currently unused by higher priority traffic
* classes of the same subport;
* - When any subport traffic class is oversubscribed
* (configuration time event), the usage of subport member
2019-06-26 10:17:41 +00:00
* pipes with high demand for that traffic class pipes is
2017-04-21 10:43:26 +00:00
* truncated to a dynamically adjusted value with no
* impact to low demand pipes;
* 3. Pipe:
* - Typical usage: individual user/subscriber;
* - Traffic shaping using the token bucket algorithm
* (one bucket per pipe);
* 4. Traffic class:
* - Traffic classes of the same pipe handled in strict
* priority order;
* - Upper limit enforced per traffic class at the pipe level;
* - Lower priority traffic classes able to reuse pipe
* bandwidth currently unused by higher priority traffic
* classes of the same pipe;
* 5. Queue:
* - Typical usage: queue hosting packets from one or
* multiple connections of same traffic class belonging to
* the same user;
* - Weighted Round Robin (WRR) is used to service the
2020-06-18 16:55:50 +00:00
* queues within same pipe lowest priority traffic class (best-effort).
2017-04-21 10:43:26 +00:00
*
*/
#include <sys/types.h>
2019-06-25 11:12:58 +00:00
#include <rte_compat.h>
2017-04-21 10:43:26 +00:00
#include <rte_mbuf.h>
#include <rte_meter.h>
2022-09-06 04:00:10 +00:00
/** Congestion Management */
2017-04-21 10:43:26 +00:00
#include "rte_red.h"
2022-09-06 04:00:10 +00:00
#include "rte_pie.h"
2017-04-21 10:43:26 +00:00
2020-06-18 16:55:50 +00:00
/** Maximum number of queues per pipe.
* Note that the multiple queues (power of 2) can only be assigned to
* lowest priority (best-effort) traffic class. Other higher priority traffic
* classes can only have one queue.
* Can not change.
*
* @see struct rte_sched_port_params
2017-04-21 10:43:26 +00:00
*/
2020-06-18 16:55:50 +00:00
#define RTE_SCHED_QUEUES_PER_PIPE 16
2017-04-21 10:43:26 +00:00
2020-06-18 16:55:50 +00:00
/** Number of WRR queues for best-effort traffic class per pipe.
*
* @see struct rte_sched_pipe_params
*/
#define RTE_SCHED_BE_QUEUES_PER_PIPE 4
2017-04-21 10:43:26 +00:00
2020-06-18 16:55:50 +00:00
/** Number of traffic classes per pipe (as well as subport).
* @see struct rte_sched_subport_params
* @see struct rte_sched_pipe_params
*/
#define RTE_SCHED_TRAFFIC_CLASSES_PER_PIPE \
(RTE_SCHED_QUEUES_PER_PIPE - RTE_SCHED_BE_QUEUES_PER_PIPE + 1)
2017-04-21 10:43:26 +00:00
2020-06-18 16:55:50 +00:00
/** Best-effort traffic class ID
* Can not change.
2017-04-21 10:43:26 +00:00
*/
2020-06-18 16:55:50 +00:00
#define RTE_SCHED_TRAFFIC_CLASS_BE (RTE_SCHED_TRAFFIC_CLASSES_PER_PIPE - 1)
2017-04-21 10:43:26 +00:00
/*
* Ethernet framing overhead. Overhead fields per Ethernet frame:
* 1. Preamble: 7 bytes;
* 2. Start of Frame Delimiter (SFD): 1 byte;
* 3. Frame Check Sequence (FCS): 4 bytes;
* 4. Inter Frame Gap (IFG): 12 bytes.
*
* The FCS is considered overhead only if not included in the packet
* length (field pkt_len of struct rte_mbuf).
2020-06-18 16:55:50 +00:00
*
* @see struct rte_sched_port_params
2017-04-21 10:43:26 +00:00
*/
#ifndef RTE_SCHED_FRAME_OVERHEAD_DEFAULT
#define RTE_SCHED_FRAME_OVERHEAD_DEFAULT 24
#endif
2022-09-06 04:00:10 +00:00
/**
* Congestion Management (CMAN) mode
*
* This is used for controlling the admission of packets into a packet queue or
* group of packet queues on congestion.
*
* The *Random Early Detection (RED)* algorithm works by proactively dropping
* more and more input packets as the queue occupancy builds up. When the queue
* is full or almost full, RED effectively works as *tail drop*. The *Weighted
* RED* algorithm uses a separate set of RED thresholds for each packet color.
*
* Similar to RED, Proportional Integral Controller Enhanced (PIE) randomly
* drops a packet at the onset of the congestion and tries to control the
* latency around the target value. The congestion detection, however, is based
* on the queueing latency instead of the queue length like RED. For more
* information, refer RFC8033.
*/
enum rte_sched_cman_mode {
RTE_SCHED_CMAN_RED, /**< Random Early Detection (RED) */
RTE_SCHED_CMAN_PIE, /**< Proportional Integral Controller Enhanced (PIE) */
};
2017-04-21 10:43:26 +00:00
/*
2020-06-18 16:55:50 +00:00
* Pipe configuration parameters. The period and credits_per_period
2017-04-21 10:43:26 +00:00
* parameters are measured in bytes, with one byte meaning the time
* duration associated with the transmission of one byte on the
* physical medium of the output port, with pipe or pipe traffic class
* rate (measured as percentage of output port rate) determined as
* credits_per_period divided by period. One credit represents one
* byte.
*/
2020-06-18 16:55:50 +00:00
struct rte_sched_pipe_params {
/** Token bucket rate (measured in bytes per second) */
uint64_t tb_rate;
2017-04-21 10:43:26 +00:00
2020-06-18 16:55:50 +00:00
/** Token bucket size (measured in credits) */
uint64_t tb_size;
2017-04-21 10:43:26 +00:00
2020-06-18 16:55:50 +00:00
/** Traffic class rates (measured in bytes per second) */
uint64_t tc_rate[RTE_SCHED_TRAFFIC_CLASSES_PER_PIPE];
/** Enforcement period (measured in milliseconds) */
uint64_t tc_period;
/** Best-effort traffic class oversubscription weight */
uint8_t tc_ov_weight;
/** WRR weights of best-effort traffic class queues */
uint8_t wrr_weights[RTE_SCHED_BE_QUEUES_PER_PIPE];
2017-04-21 10:43:26 +00:00
};
2022-09-06 04:00:10 +00:00
/*
* Congestion Management configuration parameters.
*/
struct rte_sched_cman_params {
/** Congestion Management mode */
enum rte_sched_cman_mode cman_mode;
union {
/** RED parameters */
struct rte_red_params red_params[RTE_SCHED_TRAFFIC_CLASSES_PER_PIPE][RTE_COLORS];
/** PIE parameters */
struct rte_pie_params pie_params[RTE_SCHED_TRAFFIC_CLASSES_PER_PIPE];
};
};
2017-04-21 10:43:26 +00:00
/*
2020-06-18 16:55:50 +00:00
* Subport configuration parameters. The period and credits_per_period
2017-04-21 10:43:26 +00:00
* parameters are measured in bytes, with one byte meaning the time
* duration associated with the transmission of one byte on the
* physical medium of the output port, with pipe or pipe traffic class
* rate (measured as percentage of output port rate) determined as
* credits_per_period divided by period. One credit represents one
* byte.
*/
2020-06-18 16:55:50 +00:00
struct rte_sched_subport_params {
/** Number of subport pipes.
* The subport can enable/allocate fewer pipes than the maximum
* number set through struct port_params::n_max_pipes_per_subport,
* as needed, to avoid memory allocation for the queues of the
* pipes that are not really needed.
*/
uint32_t n_pipes_per_subport_enabled;
/** Packet queue size for each traffic class.
* All the pipes within the same subport share the similar
* configuration for the queues.
*/
uint16_t qsize[RTE_SCHED_TRAFFIC_CLASSES_PER_PIPE];
/** Pipe profile table.
* Every pipe is configured using one of the profiles from this table.
*/
struct rte_sched_pipe_params *pipe_profiles;
/** Profiles in the pipe profile table */
uint32_t n_pipe_profiles;
/** Max allowed profiles in the pipe profile table */
uint32_t n_max_pipe_profiles;
2022-09-06 04:00:10 +00:00
/** Congestion Management parameters
* If NULL the congestion management is disabled for the subport,
* otherwise proper parameters need to be provided.
*/
struct rte_sched_cman_params *cman_params;
2020-06-18 16:55:50 +00:00
};
2017-04-21 10:43:26 +00:00
2021-02-05 08:48:47 +00:00
struct rte_sched_subport_profile_params {
/** Token bucket rate (measured in bytes per second) */
uint64_t tb_rate;
/** Token bucket size (measured in credits) */
uint64_t tb_size;
/** Traffic class rates (measured in bytes per second) */
uint64_t tc_rate[RTE_SCHED_TRAFFIC_CLASSES_PER_PIPE];
/** Enforcement period for rates (measured in milliseconds) */
uint64_t tc_period;
};
2020-06-18 16:55:50 +00:00
/** Subport statistics */
struct rte_sched_subport_stats {
/** Number of packets successfully written */
uint64_t n_pkts_tc[RTE_SCHED_TRAFFIC_CLASSES_PER_PIPE];
/** Number of packets dropped */
uint64_t n_pkts_tc_dropped[RTE_SCHED_TRAFFIC_CLASSES_PER_PIPE];
/** Number of bytes successfully written for each traffic class */
uint64_t n_bytes_tc[RTE_SCHED_TRAFFIC_CLASSES_PER_PIPE];
/** Number of bytes dropped for each traffic class */
uint64_t n_bytes_tc_dropped[RTE_SCHED_TRAFFIC_CLASSES_PER_PIPE];
2022-09-06 04:00:10 +00:00
/** Number of packets dropped by congestion management scheme */
uint64_t n_pkts_cman_dropped[RTE_SCHED_TRAFFIC_CLASSES_PER_PIPE];
2017-04-21 10:43:26 +00:00
};
/** Queue statistics */
struct rte_sched_queue_stats {
2020-06-18 16:55:50 +00:00
/** Packets successfully written */
uint64_t n_pkts;
/** Packets dropped */
uint64_t n_pkts_dropped;
2022-09-06 04:00:10 +00:00
/** Packets dropped by congestion management scheme */
uint64_t n_pkts_cman_dropped;
2017-04-21 10:43:26 +00:00
2020-06-18 16:55:50 +00:00
/** Bytes successfully written */
uint64_t n_bytes;
/** Bytes dropped */
uint64_t n_bytes_dropped;
2017-04-21 10:43:26 +00:00
};
/** Port configuration parameters. */
struct rte_sched_port_params {
2020-06-18 16:55:50 +00:00
/** Name of the port to be associated */
const char *name;
/** CPU socket ID */
int socket;
/** Output port rate (measured in bytes per second) */
uint64_t rate;
/** Maximum Ethernet frame size (measured in bytes).
* Should not include the framing overhead.
*/
uint32_t mtu;
/** Framing overhead per packet (measured in bytes) */
uint32_t frame_overhead;
/** Number of subports */
uint32_t n_subports_per_port;
2021-02-05 08:48:47 +00:00
/** subport profile table.
* Every pipe is configured using one of the profiles from this table.
*/
struct rte_sched_subport_profile_params *subport_profiles;
/** Profiles in the pipe profile table */
uint32_t n_subport_profiles;
/** Max allowed profiles in the pipe profile table */
uint32_t n_max_subport_profiles;
2020-06-18 16:55:50 +00:00
/** Maximum number of subport pipes.
* This parameter is used to reserve a fixed number of bits
* in struct rte_mbuf::sched.queue_id for the pipe_id for all
* the subports of the same port.
*/
uint32_t n_pipes_per_subport;
2017-04-21 10:43:26 +00:00
};
/*
* Configuration
*
***/
/**
* Hierarchical scheduler port configuration
*
* @param params
* Port scheduler configuration parameter structure
* @return
* Handle to port scheduler instance upon success or NULL otherwise.
*/
struct rte_sched_port *
rte_sched_port_config(struct rte_sched_port_params *params);
/**
* Hierarchical scheduler port free
*
* @param port
* Handle to port scheduler instance
*/
void
rte_sched_port_free(struct rte_sched_port *port);
2019-06-25 11:12:58 +00:00
/**
* Hierarchical scheduler pipe profile add
*
* @param port
* Handle to port scheduler instance
2020-06-18 16:55:50 +00:00
* @param subport_id
* Subport ID
2019-06-25 11:12:58 +00:00
* @param params
* Pipe profile parameters
* @param pipe_profile_id
* Set to valid profile id when profile is added successfully.
* @return
* 0 upon success, error code otherwise
*/
2020-06-18 16:55:50 +00:00
int
rte_sched_subport_pipe_profile_add(struct rte_sched_port *port,
uint32_t subport_id,
2019-06-25 11:12:58 +00:00
struct rte_sched_pipe_params *params,
uint32_t *pipe_profile_id);
2017-04-21 10:43:26 +00:00
/**
2021-02-05 08:48:47 +00:00
* @warning
* @b EXPERIMENTAL: this API may change without prior notice.
2017-04-21 10:43:26 +00:00
*
2021-02-05 08:48:47 +00:00
* Hierarchical scheduler subport bandwidth profile add
* Note that this function is safe to use in runtime for adding new
2022-09-02 04:40:05 +00:00
* subport bandwidth profile as it doesn't have any impact on hierarchical
2021-02-05 08:48:47 +00:00
* structure of the scheduler.
* @param port
* Handle to port scheduler instance
* @param profile
* Subport bandwidth profile
* @param subport_profile_id
* Subport profile id
* @return
* 0 upon success, error code otherwise
*/
__rte_experimental
int
rte_sched_port_subport_profile_add(struct rte_sched_port *port,
struct rte_sched_subport_profile_params *profile,
uint32_t *subport_profile_id);
/**
* Hierarchical scheduler subport configuration
* Note that this function is safe to use at runtime
* to configure subport bandwidth profile.
2017-04-21 10:43:26 +00:00
* @param port
* Handle to port scheduler instance
* @param subport_id
* Subport ID
* @param params
2021-02-05 08:48:47 +00:00
* Subport configuration parameters. Must be non-NULL
* for first invocation (i.e initialization) for a given
* subport. Ignored (recommended value is NULL) for all
* subsequent invocation on the same subport.
* @param subport_profile_id
* ID of subport bandwidth profile
2017-04-21 10:43:26 +00:00
* @return
* 0 upon success, error code otherwise
*/
int
rte_sched_subport_config(struct rte_sched_port *port,
uint32_t subport_id,
2021-02-05 08:48:47 +00:00
struct rte_sched_subport_params *params,
uint32_t subport_profile_id);
2017-04-21 10:43:26 +00:00
/**
* Hierarchical scheduler pipe configuration
*
* @param port
* Handle to port scheduler instance
* @param subport_id
* Subport ID
* @param pipe_id
* Pipe ID within subport
* @param pipe_profile
2020-06-18 16:55:50 +00:00
* ID of subport-level pre-configured pipe profile
2017-04-21 10:43:26 +00:00
* @return
* 0 upon success, error code otherwise
*/
int
rte_sched_pipe_config(struct rte_sched_port *port,
uint32_t subport_id,
uint32_t pipe_id,
int32_t pipe_profile);
/**
* Hierarchical scheduler memory footprint size per port
*
2020-06-18 16:55:50 +00:00
* @param port_params
2017-04-21 10:43:26 +00:00
* Port scheduler configuration parameter structure
2020-06-18 16:55:50 +00:00
* @param subport_params
* Array of subport parameter structures
2017-04-21 10:43:26 +00:00
* @return
* Memory footprint size in bytes upon success, 0 otherwise
*/
uint32_t
2020-06-18 16:55:50 +00:00
rte_sched_port_get_memory_footprint(struct rte_sched_port_params *port_params,
struct rte_sched_subport_params **subport_params);
2017-04-21 10:43:26 +00:00
/*
* Statistics
*
***/
/**
* Hierarchical scheduler subport statistics read
*
* @param port
* Handle to port scheduler instance
* @param subport_id
* Subport ID
* @param stats
* Pointer to pre-allocated subport statistics structure where the statistics
* counters should be stored
* @param tc_ov
2020-06-18 16:55:50 +00:00
* Pointer to pre-allocated RTE_SCHED_TRAFFIC_CLASSES_PER_PIPE-entry array
* where the oversubscription status for each of the subport traffic classes
* should be stored.
2017-04-21 10:43:26 +00:00
* @return
* 0 upon success, error code otherwise
*/
int
rte_sched_subport_read_stats(struct rte_sched_port *port,
uint32_t subport_id,
struct rte_sched_subport_stats *stats,
uint32_t *tc_ov);
/**
* Hierarchical scheduler queue statistics read
*
* @param port
* Handle to port scheduler instance
* @param queue_id
* Queue ID within port scheduler
* @param stats
* Pointer to pre-allocated subport statistics structure where the statistics
* counters should be stored
* @param qlen
* Pointer to pre-allocated variable where the current queue length
* should be stored.
* @return
* 0 upon success, error code otherwise
*/
int
rte_sched_queue_read_stats(struct rte_sched_port *port,
uint32_t queue_id,
struct rte_sched_queue_stats *stats,
uint16_t *qlen);
/**
* Scheduler hierarchy path write to packet descriptor. Typically
* called by the packet classification stage.
*
2020-06-18 16:55:50 +00:00
* @param port
* Handle to port scheduler instance
2017-04-21 10:43:26 +00:00
* @param pkt
* Packet descriptor handle
* @param subport
* Subport ID
* @param pipe
* Pipe ID within subport
* @param traffic_class
2020-06-18 16:55:50 +00:00
* Traffic class ID within pipe (0 .. RTE_SCHED_TRAFFIC_CLASS_BE)
2017-04-21 10:43:26 +00:00
* @param queue
2020-06-18 16:55:50 +00:00
* Queue ID within pipe traffic class, 0 for high priority TCs, and
* 0 .. (RTE_SCHED_BE_QUEUES_PER_PIPE - 1) for best-effort TC
2017-04-21 10:43:26 +00:00
* @param color
* Packet color set
*/
void
2020-06-18 16:55:50 +00:00
rte_sched_port_pkt_write(struct rte_sched_port *port,
struct rte_mbuf *pkt,
2017-04-21 10:43:26 +00:00
uint32_t subport, uint32_t pipe, uint32_t traffic_class,
2020-06-18 16:55:50 +00:00
uint32_t queue, enum rte_color color);
2017-04-21 10:43:26 +00:00
/**
* Scheduler hierarchy path read from packet descriptor (struct
* rte_mbuf). Typically called as part of the hierarchical scheduler
* enqueue operation. The subport, pipe, traffic class and queue
* parameters need to be pre-allocated by the caller.
*
2020-06-18 16:55:50 +00:00
* @param port
* Handle to port scheduler instance
2017-04-21 10:43:26 +00:00
* @param pkt
* Packet descriptor handle
* @param subport
* Subport ID
* @param pipe
* Pipe ID within subport
* @param traffic_class
2020-06-18 16:55:50 +00:00
* Traffic class ID within pipe (0 .. RTE_SCHED_TRAFFIC_CLASS_BE)
2017-04-21 10:43:26 +00:00
* @param queue
2020-06-18 16:55:50 +00:00
* Queue ID within pipe traffic class, 0 for high priority TCs, and
* 0 .. (RTE_SCHED_BE_QUEUES_PER_PIPE - 1) for best-effort TC
2017-04-21 10:43:26 +00:00
*/
void
2020-06-18 16:55:50 +00:00
rte_sched_port_pkt_read_tree_path(struct rte_sched_port *port,
const struct rte_mbuf *pkt,
2017-04-21 10:43:26 +00:00
uint32_t *subport, uint32_t *pipe,
uint32_t *traffic_class, uint32_t *queue);
2020-06-18 16:55:50 +00:00
enum rte_color
2017-04-21 10:43:26 +00:00
rte_sched_port_pkt_read_color(const struct rte_mbuf *pkt);
/**
* Hierarchical scheduler port enqueue. Writes up to n_pkts to port
* scheduler and returns the number of packets actually written. For
* each packet, the port scheduler queue to write the packet to is
* identified by reading the hierarchy path from the packet
* descriptor; if the queue is full or congested and the packet is not
* written to the queue, then the packet is automatically dropped
* without any action required from the caller.
*
* @param port
* Handle to port scheduler instance
* @param pkts
* Array storing the packet descriptor handles
* @param n_pkts
* Number of packets to enqueue from the pkts array into the port scheduler
* @return
* Number of packets successfully enqueued
*/
int
rte_sched_port_enqueue(struct rte_sched_port *port, struct rte_mbuf **pkts, uint32_t n_pkts);
/**
* Hierarchical scheduler port dequeue. Reads up to n_pkts from the
* port scheduler and stores them in the pkts array and returns the
* number of packets actually read. The pkts array needs to be
* pre-allocated by the caller with at least n_pkts entries.
*
* @param port
* Handle to port scheduler instance
* @param pkts
* Pre-allocated packet descriptor array where the packets dequeued
* from the port
* scheduler should be stored
* @param n_pkts
* Number of packets to dequeue from the port scheduler
* @return
* Number of packets successfully dequeued and placed in the pkts array
*/
int
rte_sched_port_dequeue(struct rte_sched_port *port, struct rte_mbuf **pkts, uint32_t n_pkts);
#ifdef __cplusplus
}
#endif
#endif /* __INCLUDE_RTE_SCHED_H__ */