/*
 * net/sched/sch_sfb.c	  Stochastic Fair Blue
 *
 * Copyright (c) 2008-2011 Juliusz Chroboczek <jch@pps.jussieu.fr>
 * Copyright (c) 2011 Eric Dumazet <eric.dumazet@gmail.com>
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * version 2 as published by the Free Software Foundation.
 *
 * W. Feng, D. Kandlur, D. Saha, K. Shin. Blue:
 * A New Class of Active Queue Management Algorithms.
 * U. Michigan CSE-TR-387-99, April 1999.
 *
 * http://www.thefengs.com/wuchang/blue/CSE-TR-387-99.pdf
 */
#include <linux/module.h>
#include <linux/types.h>
#include <linux/kernel.h>
#include <linux/errno.h>
#include <linux/skbuff.h>
#include <linux/random.h>
#include <linux/siphash.h>
#include <net/ip.h>
#include <net/pkt_sched.h>
#include <net/pkt_cls.h>
#include <net/inet_ecn.h>
/*
 * SFB uses two B[l][n] : L x N arrays of bins (L levels, N bins per level)
 * This implementation uses L = 8 and N = 16
 * This permits us to split one 32bit hash (provided per packet by rxhash or
 * external classifier) into 8 subhashes of 4 bits.
 */
#define SFB_BUCKET_SHIFT 4
#define SFB_NUMBUCKETS	(1 << SFB_BUCKET_SHIFT) /* N bins per Level */
#define SFB_BUCKET_MASK (SFB_NUMBUCKETS - 1)
#define SFB_LEVELS	(32 / SFB_BUCKET_SHIFT) /* L */
#define SFB_MAX_PROB	0xFFFF
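/* Example of the hash split: hash 0xA3F1B2C4 indexes bucket 0x4 at level 0,
 * 0xC at level 1, 0x2 at level 2, ... and 0xA at level 7 (low nibble first,
 * shifting right by SFB_BUCKET_SHIFT per level).
 */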
/* SFB algo uses a virtual queue, named "bin" */
struct sfb_bucket {
	u16		qlen; /* length of virtual queue */
	u16		p_mark; /* marking probability */
};
/* We use a double buffering right before hash change
 * (Section 4.4 of SFB reference : moving hash functions)
 */
struct sfb_bins {
	siphash_key_t	  perturbation; /* siphash key */
	struct sfb_bucket bins[SFB_LEVELS][SFB_NUMBUCKETS];
};
struct sfb_sched_data {
	struct Qdisc	*qdisc;
	struct tcf_proto __rcu *filter_list;
	struct tcf_block *block;
	unsigned long	rehash_interval;
	unsigned long	warmup_time;	/* double buffering warmup time in jiffies */
	u32		max;
	u32		bin_size;	/* maximum queue length per bin */
	u32		increment;	/* d1 */
	u32		decrement;	/* d2 */
	u32		limit;		/* HARD maximal queue length */
	u32		penalty_rate;
	u32		penalty_burst;
	u32		tokens_avail;
	unsigned long	rehash_time;
	unsigned long	token_time;

	u8		slot;		/* current active bins (0 or 1) */
	bool		double_buffering;
	struct sfb_bins bins[2];

	struct {
		u32	earlydrop;
		u32	penaltydrop;
		u32	bucketdrop;
		u32	queuedrop;
		u32	childdrop;	/* drops in child qdisc */
		u32	marked;		/* ECN mark */
	} stats;
};
/*
 * Each queued skb might be hashed on one or two bins
 * We store in skb_cb the two hash values.
 * (A zero value means double buffering was not used)
 */
struct sfb_skb_cb {
	u32 hashes[2];
};

static inline struct sfb_skb_cb *sfb_skb_cb(const struct sk_buff *skb)
{
	qdisc_cb_private_validate(skb, sizeof(struct sfb_skb_cb));
	return (struct sfb_skb_cb *)qdisc_skb_cb(skb)->data;
}
/*
 * If using 'internal' SFB flow classifier, hash comes from skb rxhash
 * If using external classifier, hash comes from the classid.
 */
static u32 sfb_hash(const struct sk_buff *skb, u32 slot)
{
	return sfb_skb_cb(skb)->hashes[slot];
}
/* Probabilities are coded as Q0.16 fixed-point values,
 * with 0xFFFF representing 65535/65536 (almost 1.0)
 * Addition and subtraction are saturating in [0, 65535]
 */
static u32 prob_plus(u32 p1, u32 p2)
{
	u32 res = p1 + p2;

	return min_t(u32, res, SFB_MAX_PROB);
}

static u32 prob_minus(u32 p1, u32 p2)
{
	return p1 > p2 ? p1 - p2 : 0;
}
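/* Worked example in Q0.16: the default increment (SFB_MAX_PROB + 500) / 1000
 * evaluates to 66, i.e. 66/65536 ~ 0.1%, so roughly a thousand "bucket over
 * bin_size" events are needed to drive p_mark from 0 up to SFB_MAX_PROB.
 */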
static void increment_one_qlen(u32 sfbhash, u32 slot, struct sfb_sched_data *q)
{
	int i;
	struct sfb_bucket *b = &q->bins[slot].bins[0][0];

	for (i = 0; i < SFB_LEVELS; i++) {
		u32 hash = sfbhash & SFB_BUCKET_MASK;

		sfbhash >>= SFB_BUCKET_SHIFT;
		if (b[hash].qlen < 0xFFFF)
			b[hash].qlen++;
		b += SFB_NUMBUCKETS; /* next level */
	}
}
static void increment_qlen(const struct sfb_skb_cb *cb, struct sfb_sched_data *q)
{
	u32 sfbhash;

	sfbhash = cb->hashes[0];
	if (sfbhash)
		increment_one_qlen(sfbhash, 0, q);

	sfbhash = cb->hashes[1];
	if (sfbhash)
		increment_one_qlen(sfbhash, 1, q);
}
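/* Accounting note: a packet contributes to one bucket per level (8 buckets
 * per slot it was hashed in).  Since enqueue decisions use the *minimum*
 * qlen/p_mark over all levels, a flow is only penalized when every bucket
 * it maps to is busy, making a full collision with heavy flows unlikely.
 */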
static void decrement_one_qlen(u32 sfbhash, u32 slot,
			       struct sfb_sched_data *q)
{
	int i;
	struct sfb_bucket *b = &q->bins[slot].bins[0][0];

	for (i = 0; i < SFB_LEVELS; i++) {
		u32 hash = sfbhash & SFB_BUCKET_MASK;

		sfbhash >>= SFB_BUCKET_SHIFT;
		if (b[hash].qlen > 0)
			b[hash].qlen--;
		b += SFB_NUMBUCKETS; /* next level */
	}
}
static void decrement_qlen(const struct sk_buff *skb, struct sfb_sched_data *q)
{
	u32 sfbhash;

	sfbhash = sfb_hash(skb, 0);
	if (sfbhash)
		decrement_one_qlen(sfbhash, 0, q);

	sfbhash = sfb_hash(skb, 1);
	if (sfbhash)
		decrement_one_qlen(sfbhash, 1, q);
}
static void decrement_prob(struct sfb_bucket *b, struct sfb_sched_data *q)
{
	b->p_mark = prob_minus(b->p_mark, q->decrement);
}

static void increment_prob(struct sfb_bucket *b, struct sfb_sched_data *q)
{
	b->p_mark = prob_plus(b->p_mark, q->increment);
}
static void sfb_zero_all_buckets(struct sfb_sched_data *q)
{
	memset(&q->bins, 0, sizeof(q->bins));
}
/*
 * compute max qlen, max p_mark, and avg p_mark (over the active slot only)
 */
static u32 sfb_compute_qlen(u32 *prob_r, u32 *avgpm_r, const struct sfb_sched_data *q)
{
	int i;
	u32 qlen = 0, prob = 0, totalpm = 0;
	const struct sfb_bucket *b = &q->bins[q->slot].bins[0][0];

	for (i = 0; i < SFB_LEVELS * SFB_NUMBUCKETS; i++) {
		if (qlen < b->qlen)
			qlen = b->qlen;
		totalpm += b->p_mark;
		if (prob < b->p_mark)
			prob = b->p_mark;
		b++;
	}
	*prob_r = prob;
	*avgpm_r = totalpm / (SFB_LEVELS * SFB_NUMBUCKETS);
	return qlen;
}
static void sfb_init_perturbation(u32 slot, struct sfb_sched_data *q)
{
	get_random_bytes(&q->bins[slot].perturbation,
			 sizeof(q->bins[slot].perturbation));
}
static void sfb_swap_slot(struct sfb_sched_data *q)
{
	sfb_init_perturbation(q->slot, q);
	q->slot ^= 1;
	q->double_buffering = false;
}
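/* Note on the swap: the outgoing slot is re-keyed *before* the flip, so the
 * slot that was warmed up during double buffering goes active while the
 * freshly keyed one becomes the standby buffer for the next warmup period
 * (the "moving hash functions" scheme of Section 4.4 of the SFB paper).
 */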
/* Non elastic flows are allowed to use part of the bandwidth, expressed
 * in "penalty_rate" packets per second, with "penalty_burst" burst
 */
static bool sfb_rate_limit(struct sk_buff *skb, struct sfb_sched_data *q)
{
	if (q->penalty_rate == 0 || q->penalty_burst == 0)
		return true;

	if (q->tokens_avail < 1) {
		unsigned long age = min(10UL * HZ, jiffies - q->token_time);

		q->tokens_avail = (age * q->penalty_rate) / HZ;
		if (q->tokens_avail > q->penalty_burst)
			q->tokens_avail = q->penalty_burst;
		q->token_time = jiffies;
		if (q->tokens_avail < 1)
			return true;
	}

	q->tokens_avail--;
	return false;
}
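/* Token bucket example, assuming the defaults below (penalty_rate = 10,
 * penalty_burst = 20): after 500 ms of silence a non elastic flow has
 * earned (HZ/2 * 10) / HZ = 5 tokens, so 5 packets pass and the 6th is
 * dropped; credit is capped at 20 packets and at 10 seconds of idle age.
 */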
static bool sfb_classify(struct sk_buff *skb, struct tcf_proto *fl,
			 int *qerr, u32 *salt)
{
	struct tcf_result res;
	int result;

	result = tcf_classify(skb, fl, &res, false);
	if (result >= 0) {
#ifdef CONFIG_NET_CLS_ACT
		switch (result) {
		case TC_ACT_STOLEN:
		case TC_ACT_QUEUED:
		case TC_ACT_TRAP:
			*qerr = NET_XMIT_SUCCESS | __NET_XMIT_STOLEN;
			/* fall through */
		case TC_ACT_SHOT:
			return false;
		}
#endif
		*salt = TC_H_MIN(res.classid);
		return true;
	}
	return false;
}
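/* Sketch of the external classifier path (device, match and classid are
 * hypothetical):
 *   tc qdisc add dev eth0 root handle 1: sfb
 *   tc filter add dev eth0 parent 1: protocol ip u32 \
 *      match ip dst 192.0.2.1 flowid 1:42
 * Matching packets are then hashed from the 16-bit minor id (0x2a here)
 * instead of the skb rxhash, steering them all into the same set of bins.
 */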
static int sfb_enqueue(struct sk_buff *skb, struct Qdisc *sch,
		       struct sk_buff **to_free)
{
	struct sfb_sched_data *q = qdisc_priv(sch);
	unsigned int len = qdisc_pkt_len(skb);
	struct Qdisc *child = q->qdisc;
	struct tcf_proto *fl;
	struct sfb_skb_cb cb;
	int i;
	u32 p_min = ~0;
	u32 minqlen = ~0;
	u32 r, sfbhash;
	u32 slot = q->slot;
	int ret = NET_XMIT_SUCCESS | __NET_XMIT_BYPASS;
	if (unlikely(sch->q.qlen >= q->limit)) {
		qdisc_qstats_overlimit(sch);
		q->stats.queuedrop++;
		goto drop;
	}

	if (q->rehash_interval > 0) {
		unsigned long limit = q->rehash_time + q->rehash_interval;

		if (unlikely(time_after(jiffies, limit))) {
			sfb_swap_slot(q);
			q->rehash_time = jiffies;
		} else if (unlikely(!q->double_buffering && q->warmup_time > 0 &&
				    time_after(jiffies, limit - q->warmup_time))) {
			q->double_buffering = true;
		}
	}
	fl = rcu_dereference_bh(q->filter_list);
	if (fl) {
		u32 salt;

		/* If using external classifiers, get result and record it. */
		if (!sfb_classify(skb, fl, &ret, &salt))
			goto other_drop;
		sfbhash = siphash_1u32(salt, &q->bins[slot].perturbation);
	} else {
		sfbhash = skb_get_hash_perturb(skb, &q->bins[slot].perturbation);
	}

	if (!sfbhash)
		sfbhash = 1;
	sfb_skb_cb(skb)->hashes[slot] = sfbhash;
	for (i = 0; i < SFB_LEVELS; i++) {
		u32 hash = sfbhash & SFB_BUCKET_MASK;
		struct sfb_bucket *b = &q->bins[slot].bins[i][hash];

		sfbhash >>= SFB_BUCKET_SHIFT;
		if (b->qlen == 0)
			decrement_prob(b, q);
		else if (b->qlen >= q->bin_size)
			increment_prob(b, q);
		if (minqlen > b->qlen)
			minqlen = b->qlen;
		if (p_min > b->p_mark)
			p_min = b->p_mark;
	}

	slot ^= 1;
	sfb_skb_cb(skb)->hashes[slot] = 0;
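	/* Blue update rule, as applied above: an idle bucket cools its
	 * marking probability by "decrement" (d2), an over-threshold bucket
	 * heats it by "increment" (d1).  The decisions below use the minimum
	 * p_mark and qlen over the 8 levels, i.e. the most optimistic view
	 * of this flow.
	 */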
	if (unlikely(minqlen >= q->max)) {
		qdisc_qstats_overlimit(sch);
		q->stats.bucketdrop++;
		goto drop;
	}

	if (unlikely(p_min >= SFB_MAX_PROB)) {
		/* Inelastic flow */
		if (q->double_buffering) {
			sfbhash = skb_get_hash_perturb(skb,
						       &q->bins[slot].perturbation);
			if (!sfbhash)
				sfbhash = 1;
			sfb_skb_cb(skb)->hashes[slot] = sfbhash;

			for (i = 0; i < SFB_LEVELS; i++) {
				u32 hash = sfbhash & SFB_BUCKET_MASK;
				struct sfb_bucket *b = &q->bins[slot].bins[i][hash];

				sfbhash >>= SFB_BUCKET_SHIFT;
				if (b->qlen == 0)
					decrement_prob(b, q);
				else if (b->qlen >= q->bin_size)
					increment_prob(b, q);
			}
		}
		if (sfb_rate_limit(skb, q)) {
			qdisc_qstats_overlimit(sch);
			q->stats.penaltydrop++;
			goto drop;
		}
		goto enqueue;
	}
	r = prandom_u32() & SFB_MAX_PROB;

	if (unlikely(r < p_min)) {
		if (unlikely(p_min > SFB_MAX_PROB / 2)) {
			/* If we're marking that many packets, then either
			 * this flow is unresponsive, or we're badly congested.
			 * In either case, we want to start dropping packets.
			 */
			if (r < (p_min - SFB_MAX_PROB / 2) * 2) {
				q->stats.earlydrop++;
				goto drop;
			}
		}
		if (INET_ECN_set_ce(skb)) {
			q->stats.marked++;
		} else {
			q->stats.earlydrop++;
			goto drop;
		}
	}
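	/* Net effect for p_min in (1/2, 1]: a packet is dropped with
	 * probability ~(2 * p_min - 1) and ECN-marked with probability
	 * ~(1 - p_min), so drops smoothly replace marks as p_min reaches 1.
	 */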
enqueue:
	memcpy(&cb, sfb_skb_cb(skb), sizeof(cb));
	ret = qdisc_enqueue(skb, child, to_free);
	if (likely(ret == NET_XMIT_SUCCESS)) {
		sch->qstats.backlog += len;
		sch->q.qlen++;
		increment_qlen(&cb, q);
	} else if (net_xmit_drop_count(ret)) {
		q->stats.childdrop++;
		qdisc_qstats_drop(sch);
	}
	return ret;

drop:
	qdisc_drop(skb, sch, to_free);
	return NET_XMIT_CN;
other_drop:
	if (ret & __NET_XMIT_BYPASS)
		qdisc_qstats_drop(sch);
	kfree_skb(skb);
	return ret;
}
static struct sk_buff *sfb_dequeue(struct Qdisc *sch)
{
	struct sfb_sched_data *q = qdisc_priv(sch);
	struct Qdisc *child = q->qdisc;
	struct sk_buff *skb;

	skb = child->dequeue(q->qdisc);

	if (skb) {
		qdisc_bstats_update(sch, skb);
		qdisc_qstats_backlog_dec(sch, skb);
		sch->q.qlen--;
		decrement_qlen(skb, q);
	}

	return skb;
}
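/* The skb still carries its enqueue-time hashes in skb->cb (the child pfifo
 * does not touch that private area), so exactly the buckets incremented at
 * enqueue are decremented here, even if the active slot changed in between.
 */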
static struct sk_buff *sfb_peek(struct Qdisc *sch)
{
	struct sfb_sched_data *q = qdisc_priv(sch);
	struct Qdisc *child = q->qdisc;

	return child->ops->peek(child);
}
/* No sfb_drop -- impossible since the child doesn't return the dropped skb. */
static void sfb_reset(struct Qdisc *sch)
{
	struct sfb_sched_data *q = qdisc_priv(sch);

	qdisc_reset(q->qdisc);
	sch->qstats.backlog = 0;
	sch->q.qlen = 0;
	q->slot = 0;
	q->double_buffering = false;
	sfb_zero_all_buckets(q);
	sfb_init_perturbation(0, q);
}
static void sfb_destroy(struct Qdisc *sch)
{
	struct sfb_sched_data *q = qdisc_priv(sch);

	tcf_block_put(q->block);
	qdisc_put(q->qdisc);
}
static const struct nla_policy sfb_policy[TCA_SFB_MAX + 1] = {
	[TCA_SFB_PARMS]	= { .len = sizeof(struct tc_sfb_qopt) },
};
static const struct tc_sfb_qopt sfb_default_ops = {
	.rehash_interval = 600 * MSEC_PER_SEC,
	.warmup_time = 60 * MSEC_PER_SEC,
	.limit = 0,
	.max = 25,
	.bin_size = 20,
	.increment = (SFB_MAX_PROB + 500) / 1000, /* 0.1 % */
	.decrement = (SFB_MAX_PROB + 3000) / 6000,
	.penalty_rate = 10,
	.penalty_burst = 20,
};
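/* With SFB_MAX_PROB = 0xFFFF these defaults evaluate to increment = 66
 * (~0.1%) and decrement = 11 (~0.017%): p_mark climbs roughly six times
 * faster under congestion than it decays once a bin drains.
 */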
static int sfb_change(struct Qdisc *sch, struct nlattr *opt,
		      struct netlink_ext_ack *extack)
{
	struct sfb_sched_data *q = qdisc_priv(sch);
	struct Qdisc *child;
	struct nlattr *tb[TCA_SFB_MAX + 1];
	const struct tc_sfb_qopt *ctl = &sfb_default_ops;
	u32 limit;
	int err;

	if (opt) {
		err = nla_parse_nested(tb, TCA_SFB_MAX, opt, sfb_policy, NULL);
		if (err < 0)
			return -EINVAL;

		if (tb[TCA_SFB_PARMS] == NULL)
			return -EINVAL;

		ctl = nla_data(tb[TCA_SFB_PARMS]);
	}

	limit = ctl->limit;
	if (limit == 0)
		limit = qdisc_dev(sch)->tx_queue_len;

	child = fifo_create_dflt(sch, &pfifo_qdisc_ops, limit, extack);
	if (IS_ERR(child))
		return PTR_ERR(child);

	if (child != &noop_qdisc)
		qdisc_hash_add(child, true);
	sch_tree_lock(sch);

	qdisc_tree_reduce_backlog(q->qdisc, q->qdisc->q.qlen,
				  q->qdisc->qstats.backlog);
	qdisc_put(q->qdisc);
	q->qdisc = child;

	q->rehash_interval = msecs_to_jiffies(ctl->rehash_interval);
	q->warmup_time = msecs_to_jiffies(ctl->warmup_time);
	q->rehash_time = jiffies;
	q->limit = limit;
	q->increment = ctl->increment;
	q->decrement = ctl->decrement;
	q->max = ctl->max;
	q->bin_size = ctl->bin_size;
	q->penalty_rate = ctl->penalty_rate;
	q->penalty_burst = ctl->penalty_burst;
	q->tokens_avail = ctl->penalty_burst;
	q->token_time = jiffies;

	q->slot = 0;
	q->double_buffering = false;
	sfb_zero_all_buckets(q);
	sfb_init_perturbation(0, q);
	sfb_init_perturbation(1, q);

	sch_tree_unlock(sch);

	return 0;
}
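/* Userspace configuration sketch (iproute2 syntax; the device name is
 * hypothetical):
 *   tc qdisc add dev eth0 root sfb limit 1000 max 25 target 20 \
 *      increment 0.001 decrement 0.0002 penalty_rate 10 penalty_burst 20
 * "target" sets bin_size; tc converts the increment/decrement floats to
 * the Q0.16 values consumed here.
 */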
static int sfb_init(struct Qdisc *sch, struct nlattr *opt,
		    struct netlink_ext_ack *extack)
{
	struct sfb_sched_data *q = qdisc_priv(sch);
	int err;

	err = tcf_block_get(&q->block, &q->filter_list, sch, extack);
	if (err)
		return err;

	q->qdisc = &noop_qdisc;
	return sfb_change(sch, opt, extack);
}
static int sfb_dump(struct Qdisc *sch, struct sk_buff *skb)
{
	struct sfb_sched_data *q = qdisc_priv(sch);
	struct nlattr *opts;
	struct tc_sfb_qopt opt = {
		.rehash_interval = jiffies_to_msecs(q->rehash_interval),
		.warmup_time = jiffies_to_msecs(q->warmup_time),
		.limit = q->limit,
		.max = q->max,
		.bin_size = q->bin_size,
		.increment = q->increment,
		.decrement = q->decrement,
		.penalty_rate = q->penalty_rate,
		.penalty_burst = q->penalty_burst,
	};

	sch->qstats.backlog = q->qdisc->qstats.backlog;
	opts = nla_nest_start(skb, TCA_OPTIONS);
	if (opts == NULL)
		goto nla_put_failure;
	if (nla_put(skb, TCA_SFB_PARMS, sizeof(opt), &opt))
		goto nla_put_failure;
	return nla_nest_end(skb, opts);

nla_put_failure:
	nla_nest_cancel(skb, opts);
	return -EMSGSIZE;
}
static int sfb_dump_stats(struct Qdisc *sch, struct gnet_dump *d)
{
	struct sfb_sched_data *q = qdisc_priv(sch);
	struct tc_sfb_xstats st = {
		.earlydrop = q->stats.earlydrop,
		.penaltydrop = q->stats.penaltydrop,
		.bucketdrop = q->stats.bucketdrop,
		.queuedrop = q->stats.queuedrop,
		.childdrop = q->stats.childdrop,
		.marked = q->stats.marked,
	};

	st.maxqlen = sfb_compute_qlen(&st.maxprob, &st.avgprob, q);

	return gnet_stats_copy_app(d, &st, sizeof(st));
}
static int sfb_dump_class(struct Qdisc *sch, unsigned long cl,
			  struct sk_buff *skb, struct tcmsg *tcm)
{
	return -ENOSYS;
}
static int sfb_graft(struct Qdisc *sch, unsigned long arg, struct Qdisc *new,
		     struct Qdisc **old, struct netlink_ext_ack *extack)
{
	struct sfb_sched_data *q = qdisc_priv(sch);

	if (new == NULL)
		new = &noop_qdisc;

	*old = qdisc_replace(sch, new, &q->qdisc);
	return 0;
}
static struct Qdisc *sfb_leaf(struct Qdisc *sch, unsigned long arg)
{
	struct sfb_sched_data *q = qdisc_priv(sch);

	return q->qdisc;
}
static unsigned long sfb_find(struct Qdisc *sch, u32 classid)
{
	return 1;
}
static void sfb_unbind(struct Qdisc *sch, unsigned long arg)
{
}
static int sfb_change_class(struct Qdisc *sch, u32 classid, u32 parentid,
			    struct nlattr **tca, unsigned long *arg,
			    struct netlink_ext_ack *extack)
{
	return -ENOSYS;
}

static int sfb_delete(struct Qdisc *sch, unsigned long cl)
{
	return -ENOSYS;
}
static void sfb_walk(struct Qdisc *sch, struct qdisc_walker *walker)
{
	if (!walker->stop) {
		if (walker->count >= walker->skip)
			if (walker->fn(sch, 1, walker) < 0) {
				walker->stop = 1;
				return;
			}
		walker->count++;
	}
}
static struct tcf_block *sfb_tcf_block(struct Qdisc *sch, unsigned long cl,
				       struct netlink_ext_ack *extack)
{
	struct sfb_sched_data *q = qdisc_priv(sch);

	if (cl)
		return NULL;
	return q->block;
}
static unsigned long sfb_bind(struct Qdisc *sch, unsigned long parent,
			      u32 classid)
{
	return 0;
}
static const struct Qdisc_class_ops sfb_class_ops = {
	.graft		= sfb_graft,
	.leaf		= sfb_leaf,
	.find		= sfb_find,
	.change		= sfb_change_class,
	.delete		= sfb_delete,
	.walk		= sfb_walk,
	.tcf_block	= sfb_tcf_block,
	.bind_tcf	= sfb_bind,
	.unbind_tcf	= sfb_unbind,
	.dump		= sfb_dump_class,
};
static struct Qdisc_ops sfb_qdisc_ops __read_mostly = {
	.id		= "sfb",
	.priv_size	= sizeof(struct sfb_sched_data),
	.cl_ops		= &sfb_class_ops,
	.enqueue	= sfb_enqueue,
	.dequeue	= sfb_dequeue,
	.peek		= sfb_peek,
	.init		= sfb_init,
	.reset		= sfb_reset,
	.destroy	= sfb_destroy,
	.change		= sfb_change,
	.dump		= sfb_dump,
	.dump_stats	= sfb_dump_stats,
	.owner		= THIS_MODULE,
};
static int __init sfb_module_init(void)
{
	return register_qdisc(&sfb_qdisc_ops);
}

static void __exit sfb_module_exit(void)
{
	unregister_qdisc(&sfb_qdisc_ops);
}
module_init(sfb_module_init)
module_exit(sfb_module_exit)

MODULE_DESCRIPTION("Stochastic Fair Blue queue discipline");
MODULE_AUTHOR("Juliusz Chroboczek");
MODULE_AUTHOR("Eric Dumazet");
MODULE_LICENSE("GPL");