您的位置:首页 > 其它

TC执行过程解析

2011-05-30 18:45 357 查看
查看iproute2源码文件中的tc文件夹:
先看makefile
# Makefile of the iproute2 tc directory.
# Multi-line assignments and recipes use backslash continuations, and every
# recipe line starts with a TAB, as make requires.

# Objects that make up the tc binary itself.
TCOBJ= tc.o tc_qdisc.o tc_class.o tc_filter.o tc_util.o \
       m_police.o m_estimator.o m_action.o m_ematch.o \
       emp_ematch.yacc.o emp_ematch.lex.o

include ../Config

# Module objects that are appended to TCOBJ below.
TCMODULES :=
TCMODULES += q_fifo.o
TCMODULES += q_sfq.o
TCMODULES += q_red.o
TCMODULES += q_prio.o
TCMODULES += q_tbf.o
TCMODULES += q_cbq.o
TCMODULES += f_rsvp.o
TCMODULES += f_u32.o
TCMODULES += f_route.o
TCMODULES += f_fw.o
TCMODULES += f_basic.o
TCMODULES += q_dsmark.o
TCMODULES += q_gred.o
TCMODULES += f_tcindex.o
TCMODULES += q_ingress.o
TCMODULES += q_hfsc.o
TCMODULES += q_htb.o
TCMODULES += m_gact.o
TCMODULES += m_mirred.o
TCMODULES += m_ipt.o
TCMODULES += m_pedit.o
TCMODULES += p_ip.o
TCMODULES += p_icmp.o
TCMODULES += p_tcp.o
TCMODULES += p_udp.o
TCMODULES += em_nbyte.o
TCMODULES += em_cmp.o
TCMODULES += em_u32.o
TCMODULES += em_meta.o

TCOBJ += $(TCMODULES)

# Objects archived into libtc.a (see the libtc.a rule).
TCLIB := tc_core.o
TCLIB += tc_red.o
TCLIB += tc_cbq.o
TCLIB += tc_estimator.o

CFLAGS += -DCONFIG_GACT -DCONFIG_GACT_PROB

# Modules built as shared objects; q_atm.so only when TC_CONFIG_ATM is y.
TCSO :=
TCSO += q_netem.so
ifeq ($(TC_CONFIG_ATM),y)
  TCSO += q_atm.so
endif

LDLIBS += -L. -ltc -lm -ldl

LDFLAGS += -Wl,-export-dynamic

YACC := bison
LEX := flex

# Generic rule: build a shared object from a single C file.
%.so: %.c
	$(CC) $(CFLAGS) -shared -fpic $< -o $@


all: libtc.a tc $(TCSO)

# No explicit recipe: tc is linked by make's built-in rule.
tc: $(TCOBJ) $(LIBNETLINK) $(LIBUTIL) $(TCLIB)

libtc.a: $(TCLIB)
	$(AR) rcs $@ $(TCLIB)

install: all
	mkdir -p $(DESTDIR)/usr/lib/tc
	install -m 0755 -s tc $(DESTDIR)$(SBINDIR)
	for i in $(TCSO); \
	do install -m 755 -s $$i $(DESTDIR)/usr/lib/tc; \
	done

clean:
	rm -f $(TCOBJ) $(TCLIB) libtc.a tc *.so emp_ematch.yacc.h; \
	rm -f emp_ematch.yacc.output

# q_atm.so additionally links against libatm, so it overrides the generic rule.
q_atm.so: q_atm.c
	$(CC) $(CFLAGS) -shared -fpic -o q_atm.so q_atm.c -latm

%.yacc.c: %.y
	$(YACC) $(YACCFLAGS) -o $@ $<

%.lex.c: %.l
	$(LEX) $(LEXFLAGS) -o$@ $<
 
淡蓝色标记的为我们关注.
为了跟踪程序是如何执行的,以执行下面命令为例:
Code
tc qdisc add dev eth0 root handle 1: htb default 12[cmd1]
 
下面看tc.c中的main函数
int main(int argc, char **argv)
{
/**
*cmd1:argc=11(maybe 12)
*argv:{ `tc` ` qdisc` ` add` ` dev ` `eth0` ` root ` `handle`  1:` `htb`` default` *`12`}
*/
       int ret;
       int do_batching = 0;
       char *batchfile = NULL;
 
       while (argc > 1) {
              if (argv[1][0] != '-')
                     break;
              if (matches(argv[1], "-stats") == 0 ||
                      matches(argv[1], "-statistics") == 0) {
                     ++show_stats;
              } else if (matches(argv[1], "-details") == 0) {
                     ++show_details;
              } else if (matches(argv[1], "-raw") == 0) {
                     ++show_raw;
              } else if (matches(argv[1], "-Version") == 0) {
                     printf("tc utility, iproute2-ss%s/n", SNAPSHOT);
                     return 0;
              } else if (matches(argv[1], "-iec") == 0) {
                     ++use_iec;
              } else if (matches(argv[1], "-help") == 0) {
                     usage();
                     return 0;
              } else if (matches(argv[1], "-force") == 0) {
                     ++force;
              } else   if (matches(argv[1], "-batch") == 0) {
                     do_batching = 1;
                     if (argc > 2)
                            batchfile = argv[2];
                     argc--;  argv++;
              } else {
                     fprintf(stderr, "Option /"%s/" is unknown, try /"tc -help/"./n", argv[1]);
                     return -1;
              }
              argc--;  argv++;
       }
 
       if (do_batching)
              return batch(batchfile);
 
       if (argc <= 1) {
              usage();
              return 0;
       }
 
       tc_core_init();//从系统中读出一些设置参数
       if (rtnl_open(&rth, 0) < 0) {
/**
*用户层和系统内核通信采用的是rtnetlink机制,
*所以需要rtnetlink的支持
*/
              fprintf(stderr, "Cannot open rtnetlink/n");
              exit(1);
       }
/**
*tc的命令形式:tc ……
*所以传递给do_cmd的参数中,去掉了tc这个关键字
*这就是为什么argc-1和argv+1
*argv:{ ` qdisc` ` add` ` dev ` `eth0` ` root ` `handle`  1:` default` *`12`}
*/
       ret = do_cmd(argc-1, argv+1);
       rtnl_close(&rth);
       return ret;
}
do_cmd会根据命令对象的类型调用不同的处理函数。例如,如果对象是qdisc,就会调用do_qdisc;传递给do_qdisc的参数同样会去除关键字qdisc。因此,[cmd1]在do_qdisc中的参数为:
argv:{ `add` `dev` `eth0` `root` `handle` `1:` `htb` `default` `12` }
Code::do_cmd
/*
 * Dispatch on the object keyword ("qdisc", "class", "filter", "actions",
 * "help") found in argv[0].
 *
 * Each handler receives argc-1 / argv+1 so that it does not see the object
 * keyword itself, e.g. do_qdisc() never sees "qdisc".
 *
 * Returns the handler's result, 0 after printing usage for "help", or -1
 * when the object keyword is not recognised.
 */
static int do_cmd(int argc, char **argv)
{
	if (matches(*argv, "qdisc") == 0)
		return do_qdisc(argc-1, argv+1);	/* the path traced in this article */

	if (matches(*argv, "class") == 0)
		return do_class(argc-1, argv+1);

	if (matches(*argv, "filter") == 0)
		return do_filter(argc-1, argv+1);

	if (matches(*argv, "actions") == 0)
		return do_action(argc-1, argv+1);

	if (matches(*argv, "help") == 0) {
		usage();
		return 0;
	}

	fprintf(stderr, "Object \"%s\" is unknown, try \"tc help\".\n",
		*argv);
	return -1;
}
 
下面看看do_qdisc函数:
int do_qdisc(int argc, char **argv)
{
         if (argc < 1)
                   return tc_qdisc_list(0, NULL);//列出系统默认的qdisc和filter等信息
         if (matches(*argv, "add") == 0)
                   return tc_qdisc_modify(RTM_NEWQDISC, NLM_F_EXCL|NLM_F_CREATE, argc-1, argv+1);
         if (matches(*argv, "change") == 0)
                   return tc_qdisc_modify(RTM_NEWQDISC, 0, argc-1, argv+1);
         if (matches(*argv, "replace") == 0)
                   return tc_qdisc_modify(RTM_NEWQDISC, NLM_F_CREATE|NLM_F_REPLACE, argc-1, argv+1);
         if (matches(*argv, "link") == 0)
                   return tc_qdisc_modify(RTM_NEWQDISC, NLM_F_REPLACE, argc-1, argv+1);
         if (matches(*argv, "delete") == 0)
                   return tc_qdisc_modify(RTM_DELQDISC, 0,  argc-1, argv+1);
#if 0
         if (matches(*argv, "get") == 0)
                   return tc_qdisc_get(RTM_GETQDISC, 0,  argc-1, argv+1);
#endif
         if (matches(*argv, "list") == 0 || matches(*argv, "show") == 0
             || matches(*argv, "lst") == 0)
                   return tc_qdisc_list(argc-1, argv+1);
         if (matches(*argv, "help") == 0)
                   usage();
         fprintf(stderr, "Command /"%s/" is unknown, try /"tc qdisc help/"./n", *argv);
         return -1;
}
 
tc_qdisc_modify函数
 
传递给tc_qdisc_modify函数的argv为:
argv:{ `dev` `eth0` `root` `handle` `1:` `htb` `default` `12` }
tc_qdisc_modify(RTM_NEWQDISC, NLM_F_EXCL|NLM_F_CREATE, argc-1, argv+1);
对tc_qdisc_modify函数参数的说明:
1、定义rtnetlink(netlink)消息类型:RTM_NEWQDISC,即新建一个qdisc
2、设置标志flag,flag的有如下几种:
- NLM_F_REPLACE(0x100):覆盖已存在的对象
- NLM_F_EXCL(0x200):如果已存在,则不做改动
- NLM_F_CREATE(0x400):如果不存在,则创建
- NLM_F_APPEND(0x800):添加到列表末尾
Code::flag
/*
 * Netlink request modifier flags passed to tc_qdisc_modify().
 * The Linux kernel headers carry the same definitions.
 */
#define NLM_F_REPLACE	0x100	/* override an existing object */
#define NLM_F_EXCL	0x200	/* leave it untouched if it already exists */
#define NLM_F_CREATE	0x400	/* create it if it does not exist */
#define NLM_F_APPEND	0x800	/* add to the end of the list */
3、设置命令参数的个数和命令参数
Code::tc_qdisc_modify
int tc_qdisc_modify(int cmd, unsigned flags, int argc, char **argv)
{
/**
* argv:{ ` dev ` `eth0` ` root ` `handle`  1:` `htb`` default` *`12`}
*/
       struct qdisc_util *q = NULL;
       struct tc_estimator est;
       char  d[16];
       char  k[16];
       struct {
/**
* nlmsghdr为和系统内核通信的消息结构的头
*tcmsg为tc消息结构
*/
              struct nlmsghdr     n;
              struct tcmsg            t;
              char                        buf[TCA_BUF_MAX];
       } req;
 
       memset(&req, 0, sizeof(req));
       memset(&est, 0, sizeof(est));
       memset(&d, 0, sizeof(d));
       memset(&k, 0, sizeof(k));
 
       req.n.nlmsg_len = NLMSG_LENGTH(sizeof(struct tcmsg));
       req.n.nlmsg_flags = NLM_F_REQUEST|flags;
       req.n.nlmsg_type = cmd;//对应[cmd1],type=rtm_newqdisc
       req.t.tcm_family = AF_UNSPEC;//family
 
       while (argc > 0) {
              if (strcmp(*argv, "dev") == 0) {
                     NEXT_ARG();//point to nextà ethi(i is number)
                     if (d[0])
                            duparg("dev", *argv);
                     strncpy(d, *argv, sizeof(d)-1);//eth0
              } else if (strcmp(*argv, "handle") == 0) {
                     __u32 handle;
                     if (req.t.tcm_handle)
                            duparg("handle", *argv);
                     NEXT_ARG();
                     if (get_qdisc_handle(&handle, *argv))//handle=1
                            invarg(*argv, "invalid qdisc ID");
                     req.t.tcm_handle = handle;
              } else if (strcmp(*argv, "root") == 0) {
                     if (req.t.tcm_parent) {
/**
*如果存在parent, 那么就不能为root
*/
                            fprintf(stderr, "Error: /"root/" is duplicate parent ID/n");
                            return -1;
                     }
                     req.t.tcm_parent = TC_H_ROOT;
#ifdef TC_H_INGRESS
              } else if (strcmp(*argv, "ingress") == 0) {
                     if (req.t.tcm_parent) {
                            fprintf(stderr, "Error: /"ingress/" is a duplicate parent ID/n");
                            return -1;
                     }
                     req.t.tcm_parent = TC_H_INGRESS;
                     strncpy(k, "ingress", sizeof(k)-1);
                     q = get_qdisc_kind(k);
                     req.t.tcm_handle = 0xffff0000;
 
                     argc--; argv++;
                     break;
#endif
              } else if (strcmp(*argv, "parent") == 0) {
                     __u32 handle;
                     NEXT_ARG();
                     if (req.t.tcm_parent)
                            duparg("parent", *argv);
                     if (get_tc_classid(&handle, *argv))
                            invarg(*argv, "invalid parent ID");
                     req.t.tcm_parent = handle;
              } else if (matches(*argv, "estimator") == 0) {
                     if (parse_estimator(&argc, &argv, &est))
                            return -1;
              } else if (matches(*argv, "help") == 0) {
                     usage();
              } else {
                     strncpy(k, *argv, sizeof(k)-1);//k=`htb`
/**
*get_qdisc_kind
*1、首先查看,与要添加的qdisc相关的qdisc_util是否已经存在了
* 如果存在,那么返回
*2、如果qdisc_util 还存在,那么查找系统的动态链接库,看是否存在
*通过函数dlopen打开动态链接库,然后通过函数q = dlsym(dlh, buf)
*得到相应的qdisc_util
*3、如果系统的动态链接也不存在,[cmd1]就是这种能够情况
*那么,就创建一个新的(q = malloc(sizeof(*q));),如果成功
*然后设置一下参数{
*            q->id = strcpy(malloc(strlen(str)+1), str);
*            q->parse_qopt = parse_noqopt;
*            q->print_qopt = print_noqopt; }
*4、最后将找到的qdisc_util,挂载到qdisc_list的上(链表),并返回q
*5、如果不成功,那么返回null(无能为力了)
*/
                     q = get_qdisc_kind(k);
                     argc--; argv++;
                     break;
              }
              argc--; argv++;
       }
/**
*addattr函数设置nlmsghdr中的一些参数,为和内核通信传递参数做准备
*/
       if (k[0])
              addattr_l(&req.n, sizeof(req), TCA_KIND, k, strlen(k)+1);
       if (est.ewma_log)
              addattr_l(&req.n, sizeof(req), TCA_RATE, &est, sizeof(est));
 
       if (q) {
              if (!q->parse_qopt) {
                     fprintf(stderr, "qdisc '%s' does not support option parsing/n", k);
                     return -1;
              }
/**
*在这个例子中,parse_qopt=parse_noqopt, do nothing and return 0
*/
              if (q->parse_qopt(q, argc, argv, &req.n))
                     return 1;
       } else {
              if (argc) {
                     if (matches(*argv, "help") == 0)
                            usage();
 
                     fprintf(stderr, "Garbage instead of arguments /"%s .../". Try /"tc qdisc help/"./n", *argv);
                     return -1;
              }
       }
/**
*根据设备名,找到设备,并设置消息,传递设备信息到内核
*/
       if (d[0])  {
              int idx;
 
             ll_init_map(&rth);
 
              if ((idx = ll_name_to_index(d)) == 0) {
                     fprintf(stderr, "Cannot find device /"%s/"/n", d);
                     return 1;
              }
              req.t.tcm_ifindex = idx;
       }
/**
*rtnl_talk函数,实现和内核通信
*在rtnl_talk函数中,会调用sendmsg函数,将信息传递到内核,
*在内核中,最终会调用tc_modify_qidsc函数来创建qdisc
*在pktsched_init函数中(linux 内核)
*rtnl_register(PF_UNSPEC, RTM_NEWQDISC, tc_modify_qdisc, NULL);
*而消息设定信息:
*  req.n.nlmsg_type = cmd;//对应[cmd1],type=RTM_NEWQDISC
*     req.t.tcm_family = AF_UNSPEC;
*当然rtnl_talk会监听内核返回的消息,并做相应的处理
*/
      if (rtnl_talk(&rth, &req.n, 0, 0, NULL, NULL, NULL) < 0)
              return 2;
 
       return 0;
}
 
内容来自用户分享和网络整理,不保证内容的准确性,如有侵权内容,可联系管理员处理 点击这里给我发消息
标签:  cmd struct null filter list yacc