On 1/9/18 8:27 PM, Chris Mi wrote: > Currently in tc batch mode, only one command is read from the batch > file and sent to kernel to process. With this support, at most 128 > commands can be accumulated before sending to kernel. > > Now it only works for the following successive commands: > filter and actions add/delete/change/replace. > > Signed-off-by: Chris Mi <chr...@mellanox.com> > --- > tc/m_action.c | 60 +++++++++++++-------- > tc/tc.c | 165 > ++++++++++++++++++++++++++++++++++++++++++++++++++++----- > tc/tc_common.h | 5 +- > tc/tc_filter.c | 97 +++++++++++++++++++-------------- > 4 files changed, 249 insertions(+), 78 deletions(-) > > diff --git a/tc/m_action.c b/tc/m_action.c > index fc422364..e5c53a80 100644 > --- a/tc/m_action.c > +++ b/tc/m_action.c > @@ -546,40 +546,56 @@ bad_val: > return ret; > } > > +struct tc_action_req { > + struct nlmsghdr n; > + struct tcamsg t; > + char buf[MAX_MSG]; > +}; > + > static int tc_action_modify(int cmd, unsigned int flags, > - int *argc_p, char ***argv_p) > + int *argc_p, char ***argv_p, > + void *buf)
you really need a buflen; you should not make assumptions about the length of buffer passed to these functions. > { > - int argc = *argc_p; > + struct tc_action_req *req, action_req; > char **argv = *argv_p; > + struct rtattr *tail; > + int argc = *argc_p; > + struct iovec iov; > int ret = 0; > - struct { > - struct nlmsghdr n; > - struct tcamsg t; > - char buf[MAX_MSG]; > - } req = { > - .n.nlmsg_len = NLMSG_LENGTH(sizeof(struct tcamsg)), > - .n.nlmsg_flags = NLM_F_REQUEST | flags, > - .n.nlmsg_type = cmd, > - .t.tca_family = AF_UNSPEC, > - }; > - struct rtattr *tail = NLMSG_TAIL(&req.n); > + > + if (buf) > + req = buf; > + else > + req = &action_req; > + And a memset is needed for the !buf path since action_req is not initialized. > + req->n.nlmsg_len = NLMSG_LENGTH(sizeof(struct tcamsg)); > + req->n.nlmsg_flags = NLM_F_REQUEST | flags; > + req->n.nlmsg_type = cmd; > + req->t.tca_family = AF_UNSPEC; > + tail = NLMSG_TAIL(&req->n); > > argc -= 1; > argv += 1; > - if (parse_action(&argc, &argv, TCA_ACT_TAB, &req.n)) { > + if (parse_action(&argc, &argv, TCA_ACT_TAB, &req->n)) { > fprintf(stderr, "Illegal \"action\"\n"); > return -1; > } > - tail->rta_len = (void *) NLMSG_TAIL(&req.n) - (void *) tail; > + tail->rta_len = (void *) NLMSG_TAIL(&req->n) - (void *) tail; > + > + *argc_p = argc; > + *argv_p = argv; > > - if (rtnl_talk(&rth, &req.n, NULL) < 0) { > + iov.iov_base = &req->n; > + iov.iov_len = req->n.nlmsg_len; you can leave that as rtnl_talk; no need to change the !buf case to rtnl_talk_iov. > + > + if (buf) > + return 0; > + > + if (rtnl_talk_iov(&rth, &iov, 1, NULL) < 0) { > fprintf(stderr, "We have an error talking to the kernel\n"); > ret = -1; > } > > - *argc_p = argc; > - *argv_p = argv; > - > return ret; > } > > @@ -679,7 +695,7 @@ bad_val: > return ret; > } > > -int do_action(int argc, char **argv) > +int do_action(int argc, char **argv, void *buf) > { > > int ret = 0; > @@ -689,12 +705,12 @@ int do_action(int argc, char **argv) > if (matches(*argv, "add") == 0) { > ret = tc_action_modify(RTM_NEWACTION, > NLM_F_EXCL | NLM_F_CREATE, > - &argc, &argv); > + &argc, &argv, buf); > } else if (matches(*argv, "change") == 0 || > matches(*argv, "replace") == 0) { > ret = tc_action_modify(RTM_NEWACTION, > NLM_F_CREATE | NLM_F_REPLACE, > - &argc, &argv); > + &argc, &argv, buf); > } else if (matches(*argv, "delete") == 0) { > argc -= 1; > argv += 1; > diff --git a/tc/tc.c b/tc/tc.c > index ad9f07e9..44277405 100644 > --- a/tc/tc.c > +++ b/tc/tc.c > @@ -193,16 +193,16 @@ static void usage(void) > " -nm | -nam[es] | { -cf | -conf } > path } | -j[son]\n"); > } > > -static int do_cmd(int argc, char **argv) > +static int do_cmd(int argc, char **argv, void *buf) > { > if (matches(*argv, "qdisc") == 0) > return do_qdisc(argc-1, argv+1); > if (matches(*argv, "class") == 0) > return do_class(argc-1, argv+1); > if (matches(*argv, "filter") == 0) > - return do_filter(argc-1, argv+1); > + return do_filter(argc-1, argv+1, buf); > if (matches(*argv, "actions") == 0) > - return do_action(argc-1, argv+1); > + return do_action(argc-1, argv+1, buf); > if (matches(*argv, "monitor") == 0) > return do_tcmonitor(argc-1, argv+1); > if (matches(*argv, "exec") == 0) > @@ -217,11 +217,79 @@ static int do_cmd(int argc, char **argv) > return -1; > } > > +static bool batchsize_enabled(int argc, char *argv[]) > +{ > + if (argc < 2) > + return false; > + if ((matches(argv[0], "filter") && matches(argv[0], "actions")) > + || (matches(argv[1], "add") && matches(argv[1], "delete") > + && matches(argv[1], "change") && matches(argv[1], "replace"))) > + return false; That is really hard to follow. It would be better to default the response to false and test for the expected set: if argv[0] is filter or actions && argv[1] is add or delete or change or replace return true; return false; > + return true; > +} > + > +struct batch_buf { > + struct batch_buf *next; > + char buf[16420]; /* sizeof (struct nlmsghdr) + > + sizeof (struct tcmsg) + actions has a different ancillary header -- tcamsg. Use the buflen approach is more robust. > + MAX_MSG */ > +}; > + > +static struct batch_buf *get_batch_buf(struct batch_buf **pool) > +{ > + struct batch_buf *buf; > + > + if (*pool == NULL) > + buf = calloc(1, sizeof (struct batch_buf)); > + else { > + buf = *pool; > + *pool = (*pool)->next; > + memset(buf, 0, sizeof (struct batch_buf)); > + } > + return buf; > +} > + > +static void put_batch_bufs(struct batch_buf **pool, > + struct batch_buf **head, struct batch_buf **tail) > +{ > + if (*head == NULL || *tail == NULL) > + return; > + > + if (*pool == NULL) > + *pool = *head; > + else { > + (*tail)->next = *pool; > + *pool = *head; > + } > + *head = NULL; > + *tail = NULL; > +} > + > +static void free_batch_bufs(struct batch_buf **pool) > +{ > + struct batch_buf *buf; > + > + for (buf = *pool; buf != NULL; buf = *pool) { > + *pool = buf->next; > + free(buf); > + } > + *pool = NULL; > +} > + > static int batch(const char *name) > { > - char *line = NULL; > + struct batch_buf *head = NULL, *tail = NULL, *buf_pool = NULL; > + char *largv[100], *largv_next[100]; > + char *line, *line_next = NULL; > + bool bs_enabled_next = false; > + bool bs_enabled = false; > + bool lastline = false; > + int largc, largc_next; > + bool bs_enabled_saved; > + int batchsize = 0; > size_t len = 0; > int ret = 0; > + bool send; > > batch_mode = 1; > if (name && strcmp(name, "-") != 0) { > @@ -240,25 +308,94 @@ static int batch(const char *name) > } > > cmdlineno = 0; > - while (getcmdline(&line, &len, stdin) != -1) { > - char *largv[100]; > - int largc; > + if (getcmdline(&line, &len, stdin) == -1) > + goto Exit; > + largc = makeargs(line, largv, 100); > + bs_enabled = batchsize_enabled(largc, largv); > + bs_enabled_saved = bs_enabled; > + do { > + if (getcmdline(&line_next, &len, stdin) == -1) > + lastline = true; > + > + largc_next = makeargs(line_next, largv_next, 100); > + bs_enabled_next = batchsize_enabled(largc_next, largv_next); > + if (bs_enabled) { > + struct batch_buf *buf; space between variables and code. > + buf = get_batch_buf(&buf_pool); > + if (!buf) { > + fprintf(stderr, "failed to allocate > batch_buf\n"); > + return -1; > + } > + if (head == NULL) > + head = tail = buf; > + else { > + tail->next = buf; > + tail = buf; > + } > + ++batchsize; > + } > + > + /* > + * In batch mode, if we haven't accumulated enough commands > + * and this is not the last command and this command & next > + * command both support the batchsize feature, don't send the > + * message immediately. > + */ > + if (!lastline && bs_enabled && bs_enabled_next > + && batchsize != MSG_IOV_MAX) > + send = false; > + else > + send = true; > + > + line = line_next; > + line_next = NULL; > + len = 0; > + bs_enabled_saved = bs_enabled; > + bs_enabled = bs_enabled_next; > + bs_enabled_next = false; > > - largc = makeargs(line, largv, 100); > if (largc == 0) > continue; /* blank line */ > > - if (do_cmd(largc, largv)) { > - fprintf(stderr, "Command failed %s:%d\n", name, > cmdlineno); > + ret = do_cmd(largc, largv, tail == NULL ? NULL : tail->buf); > + if (ret != 0) { > + fprintf(stderr, "Command failed %s:%d\n", name, > + cmdlineno - 1); > ret = 1; > if (!force) > break; > } > - } > - if (line) > - free(line); > + largc = largc_next; > + memcpy(largv, largv_next, largc * sizeof(char *)); > + > + if (send && bs_enabled_saved) { > + struct iovec *iov, *iovs; > + struct batch_buf *buf; > + struct nlmsghdr *n; > + iov = iovs = malloc(batchsize * sizeof (struct iovec)); > + for (buf = head; buf != NULL; buf = buf->next, ++iov) { > + n = (struct nlmsghdr *)&buf->buf; > + iov->iov_base = n; > + iov->iov_len = n->nlmsg_len; > + } > + > + ret = rtnl_talk_iov(&rth, iovs, batchsize, NULL); > + if (ret < 0) { > + fprintf(stderr, "Command failed %s:%d\n", name, > + cmdlineno - (batchsize + ret) - 1); > + return 2; > + } > + put_batch_bufs(&buf_pool, &head, &tail); > + batchsize = 0; > + free(iovs); > + } > + } while (!lastline); > > + free_batch_bufs(&buf_pool); > +Exit: > + free(line); > rtnl_close(&rth); > + > return ret; > } > > @@ -341,7 +478,7 @@ int main(int argc, char **argv) > goto Exit; > } > > - ret = do_cmd(argc-1, argv+1); > + ret = do_cmd(argc-1, argv+1, NULL); > Exit: > rtnl_close(&rth); > > diff --git a/tc/tc_common.h b/tc/tc_common.h > index 264fbdac..59018da5 100644 > --- a/tc/tc_common.h > +++ b/tc/tc_common.h > @@ -1,13 +1,14 @@ > /* SPDX-License-Identifier: GPL-2.0 */ > > #define TCA_BUF_MAX (64*1024) > +#define MSG_IOV_MAX 128 > > extern struct rtnl_handle rth; > > extern int do_qdisc(int argc, char **argv); > extern int do_class(int argc, char **argv); > -extern int do_filter(int argc, char **argv); > -extern int do_action(int argc, char **argv); > +extern int do_filter(int argc, char **argv, void *buf); > +extern int do_action(int argc, char **argv, void *buf); > extern int do_tcmonitor(int argc, char **argv); > extern int do_exec(int argc, char **argv); > > diff --git a/tc/tc_filter.c b/tc/tc_filter.c > index 545cc3a1..7db4964b 100644 > --- a/tc/tc_filter.c > +++ b/tc/tc_filter.c > @@ -42,28 +42,38 @@ static void usage(void) > "OPTIONS := ... try tc filter add <desired FILTER_KIND> > help\n"); > } > > -static int tc_filter_modify(int cmd, unsigned int flags, int argc, char > **argv) > +struct tc_filter_req { > + struct nlmsghdr n; > + struct tcmsg t; > + char buf[MAX_MSG]; > +}; > + > +static int tc_filter_modify(int cmd, unsigned int flags, int argc, char > **argv, > + void *buf) > { > - struct { > - struct nlmsghdr n; > - struct tcmsg t; > - char buf[MAX_MSG]; > - } req = { > - .n.nlmsg_len = NLMSG_LENGTH(sizeof(struct tcmsg)), > - .n.nlmsg_flags = NLM_F_REQUEST | flags, > - .n.nlmsg_type = cmd, > - .t.tcm_family = AF_UNSPEC, > - }; > + struct tc_filter_req *req, filter_req; > struct filter_util *q = NULL; > - __u32 prio = 0; > - __u32 protocol = 0; > - int protocol_set = 0; > - __u32 chain_index; > + struct tc_estimator est = {}; > + char k[FILTER_NAMESZ] = {}; > int chain_index_set = 0; > + char d[IFNAMSIZ] = {}; > + int protocol_set = 0; > char *fhandle = NULL; > - char d[IFNAMSIZ] = {}; > - char k[FILTER_NAMESZ] = {}; > - struct tc_estimator est = {}; > + __u32 protocol = 0; > + __u32 chain_index; > + struct iovec iov; > + __u32 prio = 0; > + int ret; > + > + if (buf) > + req = buf; > + else > + req = &filter_req; same comment here about buflen and filter_req initialization. > + > + req->n.nlmsg_len = NLMSG_LENGTH(sizeof(struct tcmsg)); > + req->n.nlmsg_flags = NLM_F_REQUEST | flags; > + req->n.nlmsg_type = cmd; > + req->t.tcm_family = AF_UNSPEC; > > if (cmd == RTM_NEWTFILTER && flags & NLM_F_CREATE) > protocol = htons(ETH_P_ALL); > @@ -75,37 +85,37 @@ static int tc_filter_modify(int cmd, unsigned int flags, > int argc, char **argv) > duparg("dev", *argv); > strncpy(d, *argv, sizeof(d)-1); > } else if (strcmp(*argv, "root") == 0) { > - if (req.t.tcm_parent) { > + if (req->t.tcm_parent) { > fprintf(stderr, > "Error: \"root\" is duplicate parent > ID\n"); > return -1; > } > - req.t.tcm_parent = TC_H_ROOT; > + req->t.tcm_parent = TC_H_ROOT; > } else if (strcmp(*argv, "ingress") == 0) { > - if (req.t.tcm_parent) { > + if (req->t.tcm_parent) { > fprintf(stderr, > "Error: \"ingress\" is duplicate parent > ID\n"); > return -1; > } > - req.t.tcm_parent = TC_H_MAKE(TC_H_CLSACT, > + req->t.tcm_parent = TC_H_MAKE(TC_H_CLSACT, > TC_H_MIN_INGRESS); > } else if (strcmp(*argv, "egress") == 0) { > - if (req.t.tcm_parent) { > + if (req->t.tcm_parent) { > fprintf(stderr, > "Error: \"egress\" is duplicate parent > ID\n"); > return -1; > } > - req.t.tcm_parent = TC_H_MAKE(TC_H_CLSACT, > + req->t.tcm_parent = TC_H_MAKE(TC_H_CLSACT, > TC_H_MIN_EGRESS); > } else if (strcmp(*argv, "parent") == 0) { > __u32 handle; > > NEXT_ARG(); > - if (req.t.tcm_parent) > + if (req->t.tcm_parent) > duparg("parent", *argv); > if (get_tc_classid(&handle, *argv)) > invarg("Invalid parent ID", *argv); > - req.t.tcm_parent = handle; > + req->t.tcm_parent = handle; > } else if (strcmp(*argv, "handle") == 0) { > NEXT_ARG(); > if (fhandle) > @@ -152,26 +162,26 @@ static int tc_filter_modify(int cmd, unsigned int > flags, int argc, char **argv) > argc--; argv++; > } > > - req.t.tcm_info = TC_H_MAKE(prio<<16, protocol); > + req->t.tcm_info = TC_H_MAKE(prio<<16, protocol); > > if (chain_index_set) > - addattr32(&req.n, sizeof(req), TCA_CHAIN, chain_index); > + addattr32(&req->n, sizeof(*req), TCA_CHAIN, chain_index); > > if (k[0]) > - addattr_l(&req.n, sizeof(req), TCA_KIND, k, strlen(k)+1); > + addattr_l(&req->n, sizeof(*req), TCA_KIND, k, strlen(k)+1); > > if (d[0]) { > ll_init_map(&rth); > > - req.t.tcm_ifindex = ll_name_to_index(d); > - if (req.t.tcm_ifindex == 0) { > + req->t.tcm_ifindex = ll_name_to_index(d); > + if (req->t.tcm_ifindex == 0) { > fprintf(stderr, "Cannot find device \"%s\"\n", d); > return 1; > } > } > > if (q) { > - if (q->parse_fopt(q, fhandle, argc, argv, &req.n)) > + if (q->parse_fopt(q, fhandle, argc, argv, &req->n)) > return 1; > } else { > if (fhandle) { > @@ -190,10 +200,17 @@ static int tc_filter_modify(int cmd, unsigned int > flags, int argc, char **argv) > } > > if (est.ewma_log) > - addattr_l(&req.n, sizeof(req), TCA_RATE, &est, sizeof(est)); > + addattr_l(&req->n, sizeof(*req), TCA_RATE, &est, sizeof(est)); > > - if (rtnl_talk(&rth, &req.n, NULL) < 0) { > - fprintf(stderr, "We have an error talking to the kernel\n"); And here, no need to change to iov for the !buf case. > + iov.iov_base = &req->n; > + iov.iov_len = req->n.nlmsg_len; > + > + if (buf) > + return 0; > + > + ret = rtnl_talk_iov(&rth, &iov, 1, NULL); > + if (ret < 0) { > + fprintf(stderr, "We have an error talking to the kernel, %d\n", > ret); > return 2; > } > > @@ -636,20 +653,20 @@ static int tc_filter_list(int argc, char **argv) > return 0; > } > > -int do_filter(int argc, char **argv) > +int do_filter(int argc, char **argv, void *buf) > { > if (argc < 1) > return tc_filter_list(0, NULL); > if (matches(*argv, "add") == 0) > return tc_filter_modify(RTM_NEWTFILTER, NLM_F_EXCL|NLM_F_CREATE, > - argc-1, argv+1); > + argc-1, argv+1, buf); > if (matches(*argv, "change") == 0) > - return tc_filter_modify(RTM_NEWTFILTER, 0, argc-1, argv+1); > + return tc_filter_modify(RTM_NEWTFILTER, 0, argc-1, argv+1, buf); > if (matches(*argv, "replace") == 0) > return tc_filter_modify(RTM_NEWTFILTER, NLM_F_CREATE, argc-1, > - argv+1); > + argv+1, buf); > if (matches(*argv, "delete") == 0) > - return tc_filter_modify(RTM_DELTFILTER, 0, argc-1, argv+1); > + return tc_filter_modify(RTM_DELTFILTER, 0, argc-1, argv+1, buf); > if (matches(*argv, "get") == 0) > return tc_filter_get(RTM_GETTFILTER, 0, argc-1, argv+1); > if (matches(*argv, "list") == 0 || matches(*argv, "show") == 0 >