X-Git-Url: http://git.pld-linux.org/?a=blobdiff_plain;f=kernel-imq.patch;h=87ee89ac682277f7f3ceef3ab2c724fcfc049e2f;hb=e9788481c9ff174d00e2fa102dac9e857d3a1840;hp=5847a95fa0bdc2e6dced711bf5c045294cd61606;hpb=7af23471e02083ea9400d58f0b268857b7e806a6;p=packages%2Fkernel.git diff --git a/kernel-imq.patch b/kernel-imq.patch index 5847a95f..87ee89ac 100644 --- a/kernel-imq.patch +++ b/kernel-imq.patch @@ -1,7 +1,7 @@ -diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c ---- linux-2.6.39/drivers/net/imq.c 1970-01-01 02:00:00.000000000 +0200 -+++ linux-2.6.39-imqmq/drivers/net/imq.c 2011-05-19 11:08:03.838522212 +0300 -@@ -0,0 +1,777 @@ +diff -Naupr linux-4.10_orig/drivers/net/imq.c linux-4.10/drivers/net/imq.c +--- linux-4.10_orig/drivers/net/imq.c 1970-01-01 07:00:00.000000000 +0700 ++++ linux-4.10/drivers/net/imq.c 2017-02-28 19:03:58.883221583 +0700 +@@ -0,0 +1,945 @@ +/* + * Pseudo-driver for the intermediate queue device. + * @@ -14,101 +14,7 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c + * + * The first version was written by Martin Devera, + * -+ * Credits: Jan Rafaj -+ * - Update patch to 2.4.21 -+ * Sebastian Strollo -+ * - Fix "Dead-loop on netdevice imq"-issue -+ * Marcel Sebek -+ * - Update to 2.6.2-rc1 -+ * -+ * After some time of inactivity there is a group taking care -+ * of IMQ again: http://www.linuximq.net -+ * -+ * -+ * 2004/06/30 - New version of IMQ patch to kernels <=2.6.7 -+ * including the following changes: -+ * -+ * - Correction of ipv6 support "+"s issue (Hasso Tepper) -+ * - Correction of imq_init_devs() issue that resulted in -+ * kernel OOPS unloading IMQ as module (Norbert Buchmuller) -+ * - Addition of functionality to choose number of IMQ devices -+ * during kernel config (Andre Correa) -+ * - Addition of functionality to choose how IMQ hooks on -+ * PRE and POSTROUTING (after or before NAT) (Andre Correa) -+ * - Cosmetic corrections (Norbert Buchmuller) (Andre Correa) -+ * -+ * -+ * 2005/12/16 - IMQ versions between 2.6.7 and 2.6.13 were -+ * released with almost no problems. 2.6.14-x was released -+ * with some important changes: nfcache was removed; After -+ * some weeks of trouble we figured out that some IMQ fields -+ * in skb were missing in skbuff.c - skb_clone and copy_skb_header. -+ * These functions are correctly patched by this new patch version. -+ * -+ * Thanks for all who helped to figure out all the problems with -+ * 2.6.14.x: Patrick McHardy, Rune Kock, VeNoMouS, Max CtRiX, -+ * Kevin Shanahan, Richard Lucassen, Valery Dachev (hopefully -+ * I didn't forget anybody). I apologize again for my lack of time. -+ * -+ * -+ * 2008/06/17 - 2.6.25 - Changed imq.c to use qdisc_run() instead -+ * of qdisc_restart() and moved qdisc_run() to tasklet to avoid -+ * recursive locking. New initialization routines to fix 'rmmod' not -+ * working anymore. Used code from ifb.c. (Jussi Kivilinna) -+ * -+ * 2008/08/06 - 2.6.26 - (JK) -+ * - Replaced tasklet with 'netif_schedule()'. -+ * - Cleaned up and added comments for imq_nf_queue(). -+ * -+ * 2009/04/12 -+ * - Add skb_save_cb/skb_restore_cb helper functions for backuping -+ * control buffer. This is needed because qdisc-layer on kernels -+ * 2.6.27 and newer overwrite control buffer. (Jussi Kivilinna) -+ * - Add better locking for IMQ device. Hopefully this will solve -+ * SMP issues. (Jussi Kivilinna) -+ * - Port to 2.6.27 -+ * - Port to 2.6.28 -+ * - Port to 2.6.29 + fix rmmod not working -+ * -+ * 2009/04/20 - (Jussi Kivilinna) -+ * - Use netdevice feature flags to avoid extra packet handling -+ * by core networking layer and possibly increase performance. -+ * -+ * 2009/09/26 - (Jussi Kivilinna) -+ * - Add imq_nf_reinject_lockless to fix deadlock with -+ * imq_nf_queue/imq_nf_reinject. -+ * -+ * 2009/12/08 - (Jussi Kivilinna) -+ * - Port to 2.6.32 -+ * - Add check for skb->nf_queue_entry==NULL in imq_dev_xmit() -+ * - Also add better error checking for skb->nf_queue_entry usage -+ * -+ * 2010/02/25 - (Jussi Kivilinna) -+ * - Port to 2.6.33 -+ * -+ * 2010/08/15 - (Jussi Kivilinna) -+ * - Port to 2.6.35 -+ * - Simplify hook registration by using nf_register_hooks. -+ * - nf_reinject doesn't need spinlock around it, therefore remove -+ * imq_nf_reinject function. Other nf_reinject users protect -+ * their own data with spinlock. With IMQ however all data is -+ * needed is stored per skbuff, so no locking is needed. -+ * - Changed IMQ to use 'separate' NF_IMQ_QUEUE instead of -+ * NF_QUEUE, this allows working coexistance of IMQ and other -+ * NF_QUEUE users. -+ * - Make IMQ multi-queue. Number of IMQ device queues can be -+ * increased with 'numqueues' module parameters. Default number -+ * of queues is 1, in other words by default IMQ works as -+ * single-queue device. Multi-queue selection is based on -+ * IFB multi-queue patch by Changli Gao . -+ * -+ * 2011/03/18 - (Jussi Kivilinna) -+ * - Port to 2.6.38 -+ * -+ * Also, many thanks to pablo Sebastian Greco for making the initial -+ * patch and to those who helped the testing. -+ * -+ * More info at: http://www.linuximq.net/ (Andre Correa) ++ * See Credits.txt + */ + +#include @@ -144,7 +50,6 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c + { + /* imq_ingress_ipv4 */ + .hook = imq_nf_hook, -+ .owner = THIS_MODULE, + .pf = PF_INET, + .hooknum = NF_INET_PRE_ROUTING, +#if defined(CONFIG_IMQ_BEHAVIOR_BA) || defined(CONFIG_IMQ_BEHAVIOR_BB) @@ -156,7 +61,6 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c + { + /* imq_egress_ipv4 */ + .hook = imq_nf_hook, -+ .owner = THIS_MODULE, + .pf = PF_INET, + .hooknum = NF_INET_POST_ROUTING, +#if defined(CONFIG_IMQ_BEHAVIOR_AA) || defined(CONFIG_IMQ_BEHAVIOR_BA) @@ -169,7 +73,6 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c + { + /* imq_ingress_ipv6 */ + .hook = imq_nf_hook, -+ .owner = THIS_MODULE, + .pf = PF_INET6, + .hooknum = NF_INET_PRE_ROUTING, +#if defined(CONFIG_IMQ_BEHAVIOR_BA) || defined(CONFIG_IMQ_BEHAVIOR_BB) @@ -181,7 +84,6 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c + { + /* imq_egress_ipv6 */ + .hook = imq_nf_hook, -+ .owner = THIS_MODULE, + .pf = PF_INET6, + .hooknum = NF_INET_POST_ROUTING, +#if defined(CONFIG_IMQ_BEHAVIOR_AA) || defined(CONFIG_IMQ_BEHAVIOR_BA) @@ -199,79 +101,12 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c +static int numdevs = IMQ_MAX_DEVS; +#endif + -+#define IMQ_MAX_QUEUES 32 -+static int numqueues = 1; -+ -+/*static DEFINE_SPINLOCK(imq_nf_queue_lock);*/ -+ +static struct net_device *imq_devs_cache[IMQ_MAX_DEVS]; + -+ -+static struct net_device_stats *imq_get_stats(struct net_device *dev) -+{ -+ return &dev->stats; -+} -+ -+/* called for packets kfree'd in qdiscs at places other than enqueue */ -+static void imq_skb_destructor(struct sk_buff *skb) -+{ -+ struct nf_queue_entry *entry = skb->nf_queue_entry; -+ -+ skb->nf_queue_entry = NULL; -+ -+ if (entry) { -+ nf_queue_entry_release_refs(entry); -+ kfree(entry); -+ } -+ -+ skb_restore_cb(skb); /* kfree backup */ -+} -+ -+static netdev_tx_t imq_dev_xmit(struct sk_buff *skb, struct net_device *dev) -+{ -+ struct nf_queue_entry *entry = skb->nf_queue_entry; -+ -+ skb->nf_queue_entry = NULL; -+ dev->trans_start = jiffies; -+ -+ dev->stats.tx_bytes += skb->len; -+ dev->stats.tx_packets++; -+ -+ if (entry == NULL) { -+ /* We don't know what is going on here.. packet is queued for -+ * imq device, but (probably) not by us. -+ * -+ * If this packet was not send here by imq_nf_queue(), then -+ * skb_save_cb() was not used and skb_free() should not show: -+ * WARNING: IMQ: kfree_skb: skb->cb_next:.. -+ * and/or -+ * WARNING: IMQ: kfree_skb: skb->nf_queue_entry... -+ * -+ * However if this message is shown, then IMQ is somehow broken -+ * and you should report this to linuximq.net. -+ */ -+ -+ /* imq_dev_xmit is black hole that eats all packets, report that -+ * we eat this packet happily and increase dropped counters. -+ */ -+ -+ dev->stats.tx_dropped++; -+ dev_kfree_skb(skb); -+ -+ return NETDEV_TX_OK; -+ } -+ -+ skb_restore_cb(skb); /* restore skb->cb */ -+ -+ skb->imq_flags = 0; -+ skb->destructor = NULL; -+ -+ nf_reinject(entry, NF_ACCEPT); -+ -+ return NETDEV_TX_OK; -+} -+ ++#define IMQ_MAX_QUEUES 32 ++static int numqueues = 1; +static u32 imq_hashrnd; ++static int imq_dev_accurate_stats = 1; + +static inline __be16 pppoe_proto(const struct sk_buff *skb) +{ @@ -335,13 +170,15 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c +#if defined(CONFIG_IPV6) || defined(CONFIG_IPV6_MODULE) + case htons(ETH_P_IPV6): { + const struct ipv6hdr *iph = ipv6_hdr(skb); ++ __be16 fo = 0; + + if (unlikely(!pskb_may_pull(skb, sizeof(struct ipv6hdr)))) + goto other; + + addr1 = iph->daddr.s6_addr32[3]; + addr2 = iph->saddr.s6_addr32[3]; -+ ihl = ipv6_skip_exthdr(skb, sizeof(struct ipv6hdr), &ip_proto); ++ ihl = ipv6_skip_exthdr(skb, sizeof(struct ipv6hdr), &ip_proto, ++ &fo); + if (unlikely(ihl < 0)) + goto other; + @@ -434,54 +271,299 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c + if (unlikely(queue_index >= dev->real_num_tx_queues)) + queue_index = (u16)((u32)queue_index % dev->real_num_tx_queues); + ++ skb_set_queue_mapping(skb, queue_index); + return netdev_get_tx_queue(dev, queue_index); +} + ++static struct net_device_stats *imq_get_stats(struct net_device *dev) ++{ ++ return &dev->stats; ++} ++ ++/* called for packets kfree'd in qdiscs at places other than enqueue */ ++static void imq_skb_destructor(struct sk_buff *skb) ++{ ++ struct nf_queue_entry *entry = skb->nf_queue_entry; ++ ++ skb->nf_queue_entry = NULL; ++ ++ if (entry) { ++ nf_queue_entry_release_refs(entry); ++ kfree(entry); ++ } ++ ++ skb_restore_cb(skb); /* kfree backup */ ++} ++ ++static void imq_done_check_queue_mapping(struct sk_buff *skb, ++ struct net_device *dev) ++{ ++ unsigned int queue_index; ++ ++ /* Don't let queue_mapping be left too large after exiting IMQ */ ++ if (likely(skb->dev != dev && skb->dev != NULL)) { ++ queue_index = skb_get_queue_mapping(skb); ++ if (unlikely(queue_index >= skb->dev->real_num_tx_queues)) { ++ queue_index = (u16)((u32)queue_index % ++ skb->dev->real_num_tx_queues); ++ skb_set_queue_mapping(skb, queue_index); ++ } ++ } else { ++ /* skb->dev was IMQ device itself or NULL, be on safe side and ++ * just clear queue mapping. ++ */ ++ skb_set_queue_mapping(skb, 0); ++ } ++} ++ ++static netdev_tx_t imq_dev_xmit(struct sk_buff *skb, struct net_device *dev) ++{ ++ struct nf_queue_entry *entry = skb->nf_queue_entry; ++ ++ rcu_read_lock(); ++ ++ skb->nf_queue_entry = NULL; ++ netif_trans_update(dev); ++ ++ dev->stats.tx_bytes += skb->len; ++ dev->stats.tx_packets++; ++ ++ if (unlikely(entry == NULL)) { ++ /* We don't know what is going on here.. packet is queued for ++ * imq device, but (probably) not by us. ++ * ++ * If this packet was not send here by imq_nf_queue(), then ++ * skb_save_cb() was not used and skb_free() should not show: ++ * WARNING: IMQ: kfree_skb: skb->cb_next:.. ++ * and/or ++ * WARNING: IMQ: kfree_skb: skb->nf_queue_entry... ++ * ++ * However if this message is shown, then IMQ is somehow broken ++ * and you should report this to linuximq.net. ++ */ ++ ++ /* imq_dev_xmit is black hole that eats all packets, report that ++ * we eat this packet happily and increase dropped counters. ++ */ ++ ++ dev->stats.tx_dropped++; ++ dev_kfree_skb(skb); ++ ++ rcu_read_unlock(); ++ return NETDEV_TX_OK; ++ } ++ ++ skb_restore_cb(skb); /* restore skb->cb */ ++ ++ skb->imq_flags = 0; ++ skb->destructor = NULL; ++ ++ imq_done_check_queue_mapping(skb, dev); ++ ++ nf_reinject(entry, NF_ACCEPT); ++ ++ rcu_read_unlock(); ++ return NETDEV_TX_OK; ++} ++ ++static struct net_device *get_imq_device_by_index(int index) ++{ ++ struct net_device *dev = NULL; ++ struct net *net; ++ char buf[8]; ++ ++ /* get device by name and cache result */ ++ snprintf(buf, sizeof(buf), "imq%d", index); ++ ++ /* Search device from all namespaces. */ ++ for_each_net(net) { ++ dev = dev_get_by_name(net, buf); ++ if (dev) ++ break; ++ } ++ ++ if (WARN_ON_ONCE(dev == NULL)) { ++ /* IMQ device not found. Exotic config? */ ++ return ERR_PTR(-ENODEV); ++ } ++ ++ imq_devs_cache[index] = dev; ++ dev_put(dev); ++ ++ return dev; ++} ++ ++static struct nf_queue_entry *nf_queue_entry_dup(struct nf_queue_entry *e) ++{ ++ struct nf_queue_entry *entry = kmemdup(e, e->size, GFP_ATOMIC); ++ if (entry) { ++ nf_queue_entry_get_refs(entry); ++ return entry; ++ } ++ return NULL; ++} ++ ++#ifdef CONFIG_BRIDGE_NETFILTER ++/* When called from bridge netfilter, skb->data must point to MAC header ++ * before calling skb_gso_segment(). Else, original MAC header is lost ++ * and segmented skbs will be sent to wrong destination. ++ */ ++static void nf_bridge_adjust_skb_data(struct sk_buff *skb) ++{ ++ if (skb->nf_bridge) ++ __skb_push(skb, skb->network_header - skb->mac_header); ++} ++ ++static void nf_bridge_adjust_segmented_data(struct sk_buff *skb) ++{ ++ if (skb->nf_bridge) ++ __skb_pull(skb, skb->network_header - skb->mac_header); ++} ++#else ++#define nf_bridge_adjust_skb_data(s) do {} while (0) ++#define nf_bridge_adjust_segmented_data(s) do {} while (0) ++#endif ++ ++static void free_entry(struct nf_queue_entry *entry) ++{ ++ nf_queue_entry_release_refs(entry); ++ kfree(entry); ++} ++ ++static int __imq_nf_queue(struct nf_queue_entry *entry, struct net_device *dev); ++ ++static int __imq_nf_queue_gso(struct nf_queue_entry *entry, ++ struct net_device *dev, struct sk_buff *skb) ++{ ++ int ret = -ENOMEM; ++ struct nf_queue_entry *entry_seg; ++ ++ nf_bridge_adjust_segmented_data(skb); ++ ++ if (skb->next == NULL) { /* last packet, no need to copy entry */ ++ struct sk_buff *gso_skb = entry->skb; ++ entry->skb = skb; ++ ret = __imq_nf_queue(entry, dev); ++ if (ret) ++ entry->skb = gso_skb; ++ return ret; ++ } ++ ++ skb->next = NULL; ++ ++ entry_seg = nf_queue_entry_dup(entry); ++ if (entry_seg) { ++ entry_seg->skb = skb; ++ ret = __imq_nf_queue(entry_seg, dev); ++ if (ret) ++ free_entry(entry_seg); ++ } ++ return ret; ++} ++ +static int imq_nf_queue(struct nf_queue_entry *entry, unsigned queue_num) +{ ++ struct sk_buff *skb, *segs; + struct net_device *dev; -+ struct sk_buff *skb_orig, *skb, *skb_shared; -+ struct Qdisc *q; -+ struct netdev_queue *txq; -+ spinlock_t *root_lock; -+ int users, index; -+ int retval = -EINVAL; ++ unsigned int queued; ++ int index, retval, err; + + index = entry->skb->imq_flags & IMQ_F_IFMASK; + if (unlikely(index > numdevs - 1)) { + if (net_ratelimit()) -+ printk(KERN_WARNING -+ "IMQ: invalid device specified, highest is %u\n", -+ numdevs - 1); ++ pr_warn("IMQ: invalid device specified, highest is %u\n", ++ numdevs - 1); + retval = -EINVAL; -+ goto out; ++ goto out_no_dev; + } + + /* check for imq device by index from cache */ + dev = imq_devs_cache[index]; + if (unlikely(!dev)) { -+ char buf[8]; -+ -+ /* get device by name and cache result */ -+ snprintf(buf, sizeof(buf), "imq%d", index); -+ dev = dev_get_by_name(&init_net, buf); -+ if (unlikely(!dev)) { -+ /* not found ?!*/ -+ BUG(); -+ retval = -ENODEV; -+ goto out; ++ dev = get_imq_device_by_index(index); ++ if (IS_ERR(dev)) { ++ retval = PTR_ERR(dev); ++ goto out_no_dev; + } -+ -+ imq_devs_cache[index] = dev; -+ dev_put(dev); + } + + if (unlikely(!(dev->flags & IFF_UP))) { + entry->skb->imq_flags = 0; -+ nf_reinject(entry, NF_ACCEPT); -+ retval = 0; -+ goto out; ++ retval = -ECANCELED; ++ goto out_no_dev; + } ++ ++ /* Since 3.10.x, GSO handling moved here as result of upstream commit ++ * a5fedd43d5f6c94c71053a66e4c3d2e35f1731a2 (netfilter: move ++ * skb_gso_segment into nfnetlink_queue module). ++ * ++ * Following code replicates the gso handling from ++ * 'net/netfilter/nfnetlink_queue_core.c':nfqnl_enqueue_packet(). ++ */ ++ ++ skb = entry->skb; ++ ++ switch (entry->state.pf) { ++ case NFPROTO_IPV4: ++ skb->protocol = htons(ETH_P_IP); ++ break; ++ case NFPROTO_IPV6: ++ skb->protocol = htons(ETH_P_IPV6); ++ break; ++ } ++ ++ if (!skb_is_gso(entry->skb)) ++ return __imq_nf_queue(entry, dev); ++ ++ nf_bridge_adjust_skb_data(skb); ++ segs = skb_gso_segment(skb, 0); ++ /* Does not use PTR_ERR to limit the number of error codes that can be ++ * returned by nf_queue. For instance, callers rely on -ECANCELED to ++ * mean 'ignore this hook'. ++ */ ++ err = -ENOBUFS; ++ if (IS_ERR(segs)) ++ goto out_err; ++ queued = 0; ++ err = 0; ++ do { ++ struct sk_buff *nskb = segs->next; ++ if (nskb && nskb->next) ++ nskb->cb_next = NULL; ++ if (err == 0) ++ err = __imq_nf_queue_gso(entry, dev, segs); ++ if (err == 0) ++ queued++; ++ else ++ kfree_skb(segs); ++ segs = nskb; ++ } while (segs); ++ ++ if (queued) { ++ if (err) /* some segments are already queued */ ++ free_entry(entry); ++ kfree_skb(skb); ++ return 0; ++ } ++ ++out_err: ++ nf_bridge_adjust_segmented_data(skb); ++ retval = err; ++out_no_dev: ++ return retval; ++} ++ ++static int __imq_nf_queue(struct nf_queue_entry *entry, struct net_device *dev) ++{ ++ struct sk_buff *skb_orig, *skb, *skb_shared, *skb_popd; ++ struct Qdisc *q; ++ struct sk_buff *to_free = NULL; ++ struct netdev_queue *txq; ++ spinlock_t *root_lock; ++ int users; ++ int retval = -EINVAL; ++ unsigned int orig_queue_index; ++ + dev->last_rx = jiffies; + + skb = entry->skb; @@ -495,62 +577,113 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c + retval = -ENOMEM; + goto out; + } ++ skb->cb_next = NULL; + entry->skb = skb; + } + -+ skb->nf_queue_entry = entry; -+ + dev->stats.rx_bytes += skb->len; + dev->stats.rx_packets++; + ++ if (!skb->dev) { ++ /* skb->dev == NULL causes problems, try the find cause. */ ++ if (net_ratelimit()) { ++ dev_warn(&dev->dev, ++ "received packet with skb->dev == NULL\n"); ++ dump_stack(); ++ } ++ ++ skb->dev = dev; ++ } ++ + /* Disables softirqs for lock below */ + rcu_read_lock_bh(); + + /* Multi-queue selection */ ++ orig_queue_index = skb_get_queue_mapping(skb); + txq = imq_select_queue(dev, skb); + + q = rcu_dereference(txq->qdisc); + if (unlikely(!q->enqueue)) + goto packet_not_eaten_by_imq_dev; + ++ skb->nf_queue_entry = entry; + root_lock = qdisc_lock(q); + spin_lock(root_lock); + + users = atomic_read(&skb->users); + + skb_shared = skb_get(skb); /* increase reference count by one */ -+ skb_save_cb(skb_shared); /* backup skb->cb, as qdisc layer will -+ overwrite it */ -+ qdisc_enqueue_root(skb_shared, q); /* might kfree_skb */ + ++ /* backup skb->cb, as qdisc layer will overwrite it */ ++ skb_save_cb(skb_shared); ++ qdisc_enqueue_root(skb_shared, q, &to_free); /* might kfree_skb */ + if (likely(atomic_read(&skb_shared->users) == users + 1)) { ++ bool validate; ++ + kfree_skb(skb_shared); /* decrease reference count by one */ + + skb->destructor = &imq_skb_destructor; + ++ skb_popd = qdisc_dequeue_skb(q, &validate); ++ + /* cloned? */ + if (unlikely(skb_orig)) + kfree_skb(skb_orig); /* free original */ + + spin_unlock(root_lock); -+ rcu_read_unlock_bh(); + ++#if 0 + /* schedule qdisc dequeue */ + __netif_schedule(q); -+ ++#else ++ if (likely(skb_popd)) { ++ /* Note that we validate skb (GSO, checksum, ...) outside of locks */ ++ if (validate) ++ skb_popd = validate_xmit_skb_list(skb_popd, dev); ++ ++ if (skb_popd) { ++ int dummy_ret; ++ int cpu = smp_processor_id(); /* ok because BHs are off */ ++ ++ txq = skb_get_tx_queue(dev, skb_popd); ++ /* ++ IMQ device will not be frozen or stoped, and it always be successful. ++ So we need not check its status and return value to accelerate. ++ */ ++ if (imq_dev_accurate_stats && txq->xmit_lock_owner != cpu) { ++ HARD_TX_LOCK(dev, txq, cpu); ++ if (!netif_xmit_frozen_or_stopped(txq)) { ++ dev_hard_start_xmit(skb_popd, dev, txq, &dummy_ret); ++ } ++ HARD_TX_UNLOCK(dev, txq); ++ } else { ++ if (!netif_xmit_frozen_or_stopped(txq)) { ++ dev_hard_start_xmit(skb_popd, dev, txq, &dummy_ret); ++ } ++ } ++ } ++ } else { ++ /* No ready skb, then schedule it */ ++ __netif_schedule(q); ++ } ++#endif ++ rcu_read_unlock_bh(); + retval = 0; + goto out; + } else { + skb_restore_cb(skb_shared); /* restore skb->cb */ + skb->nf_queue_entry = NULL; -+ /* qdisc dropped packet and decreased skb reference count of ++ /* ++ * qdisc dropped packet and decreased skb reference count of + * skb, so we don't really want to and try refree as that would -+ * actually destroy the skb. */ ++ * actually destroy the skb. ++ */ + spin_unlock(root_lock); + goto packet_not_eaten_by_imq_dev; + } + +packet_not_eaten_by_imq_dev: ++ skb_set_queue_mapping(skb, orig_queue_index); + rcu_read_unlock_bh(); + + /* cloned? restore original */ @@ -560,15 +693,16 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c + } + retval = -1; +out: ++ if (unlikely(to_free)) { ++ kfree_skb_list(to_free); ++ } + return retval; +} -+ -+static unsigned int imq_nf_hook(unsigned int hook, struct sk_buff *pskb, -+ const struct net_device *indev, -+ const struct net_device *outdev, -+ int (*okfn)(struct sk_buff *)) ++static unsigned int imq_nf_hook(void *priv, ++ struct sk_buff *skb, ++ const struct nf_hook_state *state) +{ -+ return (pskb->imq_flags & IMQ_F_ENQUEUE) ? NF_IMQ_QUEUE : NF_ACCEPT; ++ return (skb->imq_flags & IMQ_F_ENQUEUE) ? NF_IMQ_QUEUE : NF_ACCEPT; +} + +static int imq_close(struct net_device *dev) @@ -583,6 +717,10 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c + return 0; +} + ++static struct device_type imq_device_type = { ++ .name = "imq", ++}; ++ +static const struct net_device_ops imq_netdev_ops = { + .ndo_open = imq_open, + .ndo_stop = imq_close, @@ -593,14 +731,15 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c +static void imq_setup(struct net_device *dev) +{ + dev->netdev_ops = &imq_netdev_ops; -+ dev->type = ARPHRD_VOID; -+ dev->mtu = 16000; -+ dev->tx_queue_len = 11000; -+ dev->flags = IFF_NOARP; -+ dev->features = NETIF_F_SG | NETIF_F_FRAGLIST | ++ dev->type = ARPHRD_VOID; ++ dev->mtu = 16000; /* too small? */ ++ dev->tx_queue_len = 11000; /* too big? */ ++ dev->flags = IFF_NOARP; ++ dev->features = NETIF_F_SG | NETIF_F_FRAGLIST | + NETIF_F_GSO | NETIF_F_HW_CSUM | + NETIF_F_HIGHDMA; -+ dev->priv_flags &= ~IFF_XMIT_DST_RELEASE; ++ dev->priv_flags &= ~(IFF_XMIT_DST_RELEASE | ++ IFF_TX_SKB_SHARING); +} + +static int imq_validate(struct nlattr *tb[], struct nlattr *data[]) @@ -619,7 +758,7 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c + } + return 0; +end: -+ printk(KERN_WARNING "IMQ: imq_validate failed (%d)\n", ret); ++ pr_warn("IMQ: imq_validate failed (%d)\n", ret); + return ret; +} + @@ -631,7 +770,6 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c +}; + +static const struct nf_queue_handler imq_nfqh = { -+ .name = "imq", + .outfn = imq_nf_queue, +}; + @@ -648,12 +786,39 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c + return ret; +} + ++#ifdef CONFIG_LOCKDEP ++ static struct lock_class_key imq_netdev_addr_lock_key; ++ ++ static void __init imq_dev_set_lockdep_one(struct net_device *dev, ++ struct netdev_queue *txq, void *arg) ++ { ++ /* ++ * the IMQ transmit locks can be taken recursively, ++ * for example with one IMQ rule for input- and one for ++ * output network devices in iptables! ++ * until we find a better solution ignore them. ++ */ ++ lockdep_set_novalidate_class(&txq->_xmit_lock); ++ } ++ ++ static void imq_dev_set_lockdep_class(struct net_device *dev) ++ { ++ lockdep_set_class_and_name(&dev->addr_list_lock, ++ &imq_netdev_addr_lock_key, "_xmit_addr_IMQ"); ++ netdev_for_each_tx_queue(dev, imq_dev_set_lockdep_one, NULL); ++} ++#else ++ static inline void imq_dev_set_lockdep_class(struct net_device *dev) ++ { ++ } ++#endif ++ +static int __init imq_init_one(int index) +{ + struct net_device *dev; + int ret; + -+ dev = alloc_netdev_mq(0, "imq%d", imq_setup, numqueues); ++ dev = alloc_netdev_mq(0, "imq%d", NET_NAME_UNKNOWN, imq_setup, numqueues); + if (!dev) + return -ENOMEM; + @@ -662,10 +827,13 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c + goto fail; + + dev->rtnl_link_ops = &imq_link_ops; ++ SET_NETDEV_DEVTYPE(dev, &imq_device_type); + ret = register_netdevice(dev); + if (ret < 0) + goto fail; + ++ imq_dev_set_lockdep_class(dev); ++ + return 0; +fail: + free_netdev(dev); @@ -677,13 +845,13 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c + int err, i; + + if (numdevs < 1 || numdevs > IMQ_MAX_DEVS) { -+ printk(KERN_ERR "IMQ: numdevs has to be betweed 1 and %u\n", ++ pr_err("IMQ: numdevs has to be betweed 1 and %u\n", + IMQ_MAX_DEVS); + return -EINVAL; + } + + if (numqueues < 1 || numqueues > IMQ_MAX_QUEUES) { -+ printk(KERN_ERR "IMQ: numqueues has to be betweed 1 and %u\n", ++ pr_err("IMQ: numqueues has to be betweed 1 and %u\n", + IMQ_MAX_QUEUES); + return -EINVAL; + } @@ -717,30 +885,30 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c + + err = imq_init_devs(); + if (err) { -+ printk(KERN_ERR "IMQ: Error trying imq_init_devs(net)\n"); ++ pr_err("IMQ: Error trying imq_init_devs(net)\n"); + return err; + } + + err = imq_init_hooks(); + if (err) { -+ printk(KERN_ERR "IMQ: Error trying imq_init_hooks()\n"); ++ pr_err(KERN_ERR "IMQ: Error trying imq_init_hooks()\n"); + rtnl_link_unregister(&imq_link_ops); + memset(imq_devs_cache, 0, sizeof(imq_devs_cache)); + return err; + } + -+ printk(KERN_INFO "IMQ driver loaded successfully. " -+ "(numdevs = %d, numqueues = %d)\n", numdevs, numqueues); ++ pr_info("IMQ driver loaded successfully. (numdevs = %d, numqueues = %d, imq_dev_accurate_stats = %d)\n", ++ numdevs, numqueues, imq_dev_accurate_stats); + +#if defined(CONFIG_IMQ_BEHAVIOR_BA) || defined(CONFIG_IMQ_BEHAVIOR_BB) -+ printk(KERN_INFO "\tHooking IMQ before NAT on PREROUTING.\n"); ++ pr_info("\tHooking IMQ before NAT on PREROUTING.\n"); +#else -+ printk(KERN_INFO "\tHooking IMQ after NAT on PREROUTING.\n"); ++ pr_info("\tHooking IMQ after NAT on PREROUTING.\n"); +#endif +#if defined(CONFIG_IMQ_BEHAVIOR_AB) || defined(CONFIG_IMQ_BEHAVIOR_BB) -+ printk(KERN_INFO "\tHooking IMQ before NAT on POSTROUTING.\n"); ++ pr_info("\tHooking IMQ before NAT on POSTROUTING.\n"); +#else -+ printk(KERN_INFO "\tHooking IMQ after NAT on POSTROUTING.\n"); ++ pr_info("\tHooking IMQ after NAT on POSTROUTING.\n"); +#endif + + return 0; @@ -762,7 +930,7 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c +{ + imq_unhook(); + imq_cleanup_devs(); -+ printk(KERN_INFO "IMQ driver unloaded successfully.\n"); ++ pr_info("IMQ driver unloaded successfully.\n"); +} + +module_init(imq_init_module); @@ -770,21 +938,21 @@ diff -uNr linux-2.6.39/drivers/net/imq.c linux-2.6.39-imqmq/drivers/net/imq.c + +module_param(numdevs, int, 0); +module_param(numqueues, int, 0); -+MODULE_PARM_DESC(numdevs, "number of IMQ devices (how many imq* devices will " -+ "be created)"); ++module_param(imq_dev_accurate_stats, int, 0); ++MODULE_PARM_DESC(numdevs, "number of IMQ devices (how many imq* devices will be created)"); +MODULE_PARM_DESC(numqueues, "number of queues per IMQ device"); -+MODULE_AUTHOR("http://www.linuximq.net"); -+MODULE_DESCRIPTION("Pseudo-driver for the intermediate queue device. See " -+ "http://www.linuximq.net/ for more information."); ++MODULE_PARM_DESC(imq_dev_accurate_stats, "Notify if need the accurate imq device stats"); ++ ++MODULE_AUTHOR("https://github.com/imq/linuximq"); ++MODULE_DESCRIPTION("Pseudo-driver for the intermediate queue device. See https://github.com/imq/linuximq/wiki for more information."); +MODULE_LICENSE("GPL"); +MODULE_ALIAS_RTNL_LINK("imq"); -+ -diff -uNr linux-2.6.39/drivers/net/Kconfig linux-2.6.39-imqmq/drivers/net/Kconfig ---- linux-2.6.39/drivers/net/Kconfig 2011-05-19 07:06:34.000000000 +0300 -+++ linux-2.6.39-imqmq/drivers/net/Kconfig 2011-05-19 11:08:04.281864473 +0300 -@@ -124,6 +124,129 @@ - To compile this driver as a module, choose M here: the module - will be called eql. If unsure, say N. +diff -Naupr linux-4.10_orig/drivers/net/Kconfig linux-4.10/drivers/net/Kconfig +--- linux-4.10_orig/drivers/net/Kconfig 2017-02-20 05:34:00.000000000 +0700 ++++ linux-4.10/drivers/net/Kconfig 2017-02-28 18:44:55.978280593 +0700 +@@ -260,6 +260,125 @@ config RIONET_RX_SIZE + depends on RIONET + default "128" +config IMQ + tristate "IMQ (intermediate queueing device) support" @@ -797,7 +965,7 @@ diff -uNr linux-2.6.39/drivers/net/Kconfig linux-2.6.39-imqmq/drivers/net/Kconfi + and distribute bandwidth among them. Iptables is used to specify + through which IMQ device, if any, packets travel. + -+ More information at: http://www.linuximq.net/ ++ More information at: https://github.com/imq/linuximq + + To compile this driver as a module, choose M here: the module + will be called imq. If unsure, say N. @@ -807,125 +975,121 @@ diff -uNr linux-2.6.39/drivers/net/Kconfig linux-2.6.39-imqmq/drivers/net/Kconfi + depends on IMQ + default IMQ_BEHAVIOR_AB + help ++ This setting defines how IMQ behaves in respect to its ++ hooking in PREROUTING and POSTROUTING. + -+ This settings defines how IMQ behaves in respect to its -+ hooking in PREROUTING and POSTROUTING. -+ -+ IMQ can work in any of the following ways: ++ IMQ can work in any of the following ways: + -+ PREROUTING | POSTROUTING -+ -----------------|------------------- -+ #1 After NAT | After NAT -+ #2 After NAT | Before NAT -+ #3 Before NAT | After NAT -+ #4 Before NAT | Before NAT ++ PREROUTING | POSTROUTING ++ -----------------|------------------- ++ #1 After NAT | After NAT ++ #2 After NAT | Before NAT ++ #3 Before NAT | After NAT ++ #4 Before NAT | Before NAT + -+ The default behavior is to hook before NAT on PREROUTING -+ and after NAT on POSTROUTING (#3). ++ The default behavior is to hook before NAT on PREROUTING ++ and after NAT on POSTROUTING (#3). + -+ This settings are specially usefull when trying to use IMQ -+ to shape NATed clients. ++ This settings are specially usefull when trying to use IMQ ++ to shape NATed clients. + -+ More information can be found at: www.linuximq.net ++ More information can be found at: https://github.com/imq/linuximq + -+ If not sure leave the default settings alone. ++ If not sure leave the default settings alone. + +config IMQ_BEHAVIOR_AA + bool "IMQ AA" + help -+ This settings defines how IMQ behaves in respect to its -+ hooking in PREROUTING and POSTROUTING. ++ This setting defines how IMQ behaves in respect to its ++ hooking in PREROUTING and POSTROUTING. + -+ Choosing this option will make IMQ hook like this: ++ Choosing this option will make IMQ hook like this: + -+ PREROUTING: After NAT -+ POSTROUTING: After NAT ++ PREROUTING: After NAT ++ POSTROUTING: After NAT + -+ More information can be found at: www.linuximq.net ++ More information can be found at: https://github.com/imq/linuximq + -+ If not sure leave the default settings alone. ++ If not sure leave the default settings alone. + +config IMQ_BEHAVIOR_AB + bool "IMQ AB" + help -+ This settings defines how IMQ behaves in respect to its -+ hooking in PREROUTING and POSTROUTING. ++ This setting defines how IMQ behaves in respect to its ++ hooking in PREROUTING and POSTROUTING. + -+ Choosing this option will make IMQ hook like this: ++ Choosing this option will make IMQ hook like this: + -+ PREROUTING: After NAT -+ POSTROUTING: Before NAT ++ PREROUTING: After NAT ++ POSTROUTING: Before NAT + -+ More information can be found at: www.linuximq.net ++ More information can be found at: https://github.com/imq/linuximq + -+ If not sure leave the default settings alone. ++ If not sure leave the default settings alone. + +config IMQ_BEHAVIOR_BA + bool "IMQ BA" + help -+ This settings defines how IMQ behaves in respect to its -+ hooking in PREROUTING and POSTROUTING. ++ This setting defines how IMQ behaves in respect to its ++ hooking in PREROUTING and POSTROUTING. + -+ Choosing this option will make IMQ hook like this: ++ Choosing this option will make IMQ hook like this: + -+ PREROUTING: Before NAT -+ POSTROUTING: After NAT ++ PREROUTING: Before NAT ++ POSTROUTING: After NAT + -+ More information can be found at: www.linuximq.net ++ More information can be found at: https://github.com/imq/linuximq + -+ If not sure leave the default settings alone. ++ If not sure leave the default settings alone. + +config IMQ_BEHAVIOR_BB + bool "IMQ BB" + help -+ This settings defines how IMQ behaves in respect to its -+ hooking in PREROUTING and POSTROUTING. ++ This setting defines how IMQ behaves in respect to its ++ hooking in PREROUTING and POSTROUTING. + -+ Choosing this option will make IMQ hook like this: ++ Choosing this option will make IMQ hook like this: + -+ PREROUTING: Before NAT -+ POSTROUTING: Before NAT ++ PREROUTING: Before NAT ++ POSTROUTING: Before NAT + -+ More information can be found at: www.linuximq.net ++ More information can be found at: https://github.com/imq/linuximq + -+ If not sure leave the default settings alone. ++ If not sure leave the default settings alone. + +endchoice + +config IMQ_NUM_DEVS -+ + int "Number of IMQ devices" + range 2 16 + depends on IMQ + default "16" + help ++ This setting defines how many IMQ devices will be created. + -+ This settings defines how many IMQ devices will be -+ created. -+ -+ The default value is 16. ++ The default value is 16. + -+ More information can be found at: www.linuximq.net ++ More information can be found at: https://github.com/imq/linuximq + -+ If not sure leave the default settings alone. ++ If not sure leave the default settings alone. + config TUN tristate "Universal TUN/TAP device driver support" - select CRC32 -diff -uNr linux-2.6.39/drivers/net/Makefile linux-2.6.39-imqmq/drivers/net/Makefile ---- linux-2.6.39/drivers/net/Makefile 2011-05-19 07:06:34.000000000 +0300 -+++ linux-2.6.39-imqmq/drivers/net/Makefile 2011-05-19 11:08:04.281864473 +0300 -@@ -175,6 +175,7 @@ - obj-$(CONFIG_XEN_NETDEV_BACKEND) += xen-netback/ - - obj-$(CONFIG_DUMMY) += dummy.o -+obj-$(CONFIG_IMQ) += imq.o + depends on INET +diff -Naupr linux-4.10_orig/drivers/net/Makefile linux-4.10/drivers/net/Makefile +--- linux-4.10_orig/drivers/net/Makefile 2017-02-20 05:34:00.000000000 +0700 ++++ linux-4.10/drivers/net/Makefile 2017-02-28 18:44:55.978280593 +0700 +@@ -11,6 +11,7 @@ obj-$(CONFIG_DUMMY) += dummy.o + obj-$(CONFIG_EQUALIZER) += eql.o obj-$(CONFIG_IFB) += ifb.o + obj-$(CONFIG_MACSEC) += macsec.o ++obj-$(CONFIG_IMQ) += imq.o obj-$(CONFIG_MACVLAN) += macvlan.o obj-$(CONFIG_MACVTAP) += macvtap.o -diff -uNr linux-2.6.39/include/linux/imq.h linux-2.6.39-imqmq/include/linux/imq.h ---- linux-2.6.39/include/linux/imq.h 1970-01-01 02:00:00.000000000 +0200 -+++ linux-2.6.39-imqmq/include/linux/imq.h 2011-05-19 11:08:04.281864473 +0300 + obj-$(CONFIG_MII) += mii.o +diff -Naupr linux-4.10_orig/include/linux/imq.h linux-4.10/include/linux/imq.h +--- linux-4.10_orig/include/linux/imq.h 1970-01-01 07:00:00.000000000 +0700 ++++ linux-4.10/include/linux/imq.h 2017-02-28 18:44:55.978280593 +0700 @@ -0,0 +1,13 @@ +#ifndef _IMQ_H +#define _IMQ_H @@ -940,9 +1104,32 @@ diff -uNr linux-2.6.39/include/linux/imq.h linux-2.6.39-imqmq/include/linux/imq. + +#endif /* _IMQ_H */ + -diff -uNr linux-2.6.39/include/linux/netfilter/xt_IMQ.h linux-2.6.39-imqmq/include/linux/netfilter/xt_IMQ.h ---- linux-2.6.39/include/linux/netfilter/xt_IMQ.h 1970-01-01 02:00:00.000000000 +0200 -+++ linux-2.6.39-imqmq/include/linux/netfilter/xt_IMQ.h 2011-05-19 11:08:04.281864473 +0300 +diff -Naupr linux-4.10_orig/include/linux/netdevice.h linux-4.10/include/linux/netdevice.h +--- linux-4.10_orig/include/linux/netdevice.h 2017-02-20 05:34:00.000000000 +0700 ++++ linux-4.10/include/linux/netdevice.h 2017-02-28 18:44:55.978280593 +0700 +@@ -3604,6 +3604,19 @@ static inline void netif_tx_unlock_bh(st + } \ + } + ++#define HARD_TX_LOCK_BH(dev, txq) { \ ++ if ((dev->features & NETIF_F_LLTX) == 0) { \ ++ __netif_tx_lock_bh(txq); \ ++ } \ ++} ++ ++#define HARD_TX_UNLOCK_BH(dev, txq) { \ ++ if ((dev->features & NETIF_F_LLTX) == 0) { \ ++ __netif_tx_unlock_bh(txq); \ ++ } \ ++} ++ ++ + static inline void netif_tx_disable(struct net_device *dev) + { + unsigned int i; +diff -Naupr linux-4.10_orig/include/linux/netfilter/xt_IMQ.h linux-4.10/include/linux/netfilter/xt_IMQ.h +--- linux-4.10_orig/include/linux/netfilter/xt_IMQ.h 1970-01-01 07:00:00.000000000 +0700 ++++ linux-4.10/include/linux/netfilter/xt_IMQ.h 2017-02-28 18:44:55.981613941 +0700 @@ -0,0 +1,9 @@ +#ifndef _XT_IMQ_H +#define _XT_IMQ_H @@ -953,22 +1140,9 @@ diff -uNr linux-2.6.39/include/linux/netfilter/xt_IMQ.h linux-2.6.39-imqmq/inclu + +#endif /* _XT_IMQ_H */ + -diff -uNr linux-2.6.39/include/linux/netfilter.h linux-2.6.39-imqmq/include/linux/netfilter.h ---- linux-2.6.39/include/linux/netfilter.h 2011-05-19 07:06:34.000000000 +0300 -+++ linux-2.6.39-imqmq/include/linux/netfilter.h 2011-05-19 11:08:04.285197874 +0300 -@@ -21,7 +21,8 @@ - #define NF_QUEUE 3 - #define NF_REPEAT 4 - #define NF_STOP 5 --#define NF_MAX_VERDICT NF_STOP -+#define NF_IMQ_QUEUE 6 -+#define NF_MAX_VERDICT NF_IMQ_QUEUE - - /* we overload the higher bits for encoding auxiliary data such as the queue - * number or errno values. Not nice, but better than additional function -diff -uNr linux-2.6.39/include/linux/netfilter_ipv4/ipt_IMQ.h linux-2.6.39-imqmq/include/linux/netfilter_ipv4/ipt_IMQ.h ---- linux-2.6.39/include/linux/netfilter_ipv4/ipt_IMQ.h 1970-01-01 02:00:00.000000000 +0200 -+++ linux-2.6.39-imqmq/include/linux/netfilter_ipv4/ipt_IMQ.h 2011-05-19 11:08:04.285197874 +0300 +diff -Naupr linux-4.10_orig/include/linux/netfilter_ipv4/ipt_IMQ.h linux-4.10/include/linux/netfilter_ipv4/ipt_IMQ.h +--- linux-4.10_orig/include/linux/netfilter_ipv4/ipt_IMQ.h 1970-01-01 07:00:00.000000000 +0700 ++++ linux-4.10/include/linux/netfilter_ipv4/ipt_IMQ.h 2017-02-28 18:44:55.981613941 +0700 @@ -0,0 +1,10 @@ +#ifndef _IPT_IMQ_H +#define _IPT_IMQ_H @@ -980,9 +1154,9 @@ diff -uNr linux-2.6.39/include/linux/netfilter_ipv4/ipt_IMQ.h linux-2.6.39-imqmq + +#endif /* _IPT_IMQ_H */ + -diff -uNr linux-2.6.39/include/linux/netfilter_ipv6/ip6t_IMQ.h linux-2.6.39-imqmq/include/linux/netfilter_ipv6/ip6t_IMQ.h ---- linux-2.6.39/include/linux/netfilter_ipv6/ip6t_IMQ.h 1970-01-01 02:00:00.000000000 +0200 -+++ linux-2.6.39-imqmq/include/linux/netfilter_ipv6/ip6t_IMQ.h 2011-05-19 11:08:04.285197874 +0300 +diff -Naupr linux-4.10_orig/include/linux/netfilter_ipv6/ip6t_IMQ.h linux-4.10/include/linux/netfilter_ipv6/ip6t_IMQ.h +--- linux-4.10_orig/include/linux/netfilter_ipv6/ip6t_IMQ.h 1970-01-01 07:00:00.000000000 +0700 ++++ linux-4.10/include/linux/netfilter_ipv6/ip6t_IMQ.h 2017-02-28 18:44:55.981613941 +0700 @@ -0,0 +1,10 @@ +#ifndef _IP6T_IMQ_H +#define _IP6T_IMQ_H @@ -994,20 +1168,21 @@ diff -uNr linux-2.6.39/include/linux/netfilter_ipv6/ip6t_IMQ.h linux-2.6.39-imqm + +#endif /* _IP6T_IMQ_H */ + -diff -uNr linux-2.6.39/include/linux/skbuff.h linux-2.6.39-imqmq/include/linux/skbuff.h ---- linux-2.6.39/include/linux/skbuff.h 2011-05-19 07:06:34.000000000 +0300 -+++ linux-2.6.39-imqmq/include/linux/skbuff.h 2011-05-19 11:08:04.288531274 +0300 -@@ -29,6 +29,9 @@ - #include - #include - #include +diff -Naupr linux-4.10_orig/include/linux/skbuff.h linux-4.10/include/linux/skbuff.h +--- linux-4.10_orig/include/linux/skbuff.h 2017-02-20 05:34:00.000000000 +0700 ++++ linux-4.10/include/linux/skbuff.h 2017-02-28 18:44:55.981613941 +0700 +@@ -39,6 +39,10 @@ + #include + #include + #include +#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) +#include +#endif ++ - /* Don't change this without changing skb_csum_unnecessary! */ - #define CHECKSUM_NONE 0 -@@ -339,6 +342,9 @@ + /* The interface for checksum offload between the stack and networking drivers + * is as follows... +@@ -661,6 +665,9 @@ struct sk_buff { * first. This is owned by whoever has the skb queued ATM. */ char cb[48] __aligned(8); @@ -1016,129 +1191,155 @@ diff -uNr linux-2.6.39/include/linux/skbuff.h linux-2.6.39-imqmq/include/linux/s +#endif unsigned long _skb_refdst; - #ifdef CONFIG_XFRM -@@ -377,6 +383,9 @@ - #ifdef NET_SKBUFF_NF_DEFRAG_NEEDED - struct sk_buff *nfct_reasm; + void (*destructor)(struct sk_buff *skb); +@@ -670,6 +677,9 @@ struct sk_buff { + #if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE) + struct nf_conntrack *nfct; #endif +#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) -+ struct nf_queue_entry *nf_queue_entry; ++ struct nf_queue_entry *nf_queue_entry; +#endif - #ifdef CONFIG_BRIDGE_NETFILTER + #if IS_ENABLED(CONFIG_BRIDGE_NETFILTER) struct nf_bridge_info *nf_bridge; #endif -@@ -401,6 +410,10 @@ - - /* 0/13 bit hole */ - +@@ -750,6 +760,9 @@ struct sk_buff { + __u8 offload_fwd_mark:1; + #endif + /* 2, 4 or 5 bit hole */ +#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) + __u8 imq_flags:IMQ_F_BITS; +#endif -+ - #ifdef CONFIG_NET_DMA - dma_cookie_t dma_cookie; - #endif -@@ -487,6 +500,12 @@ - return (struct rtable *)skb_dst(skb); - } + #ifdef CONFIG_NET_SCHED + __u16 tc_index; /* traffic control index */ +@@ -910,6 +923,12 @@ void kfree_skb_list(struct sk_buff *segs + void skb_tx_error(struct sk_buff *skb); + void consume_skb(struct sk_buff *skb); + void __kfree_skb(struct sk_buff *skb); + +#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) -+extern int skb_save_cb(struct sk_buff *skb); -+extern int skb_restore_cb(struct sk_buff *skb); ++int skb_save_cb(struct sk_buff *skb); ++int skb_restore_cb(struct sk_buff *skb); +#endif + - extern void kfree_skb(struct sk_buff *skb); - extern void consume_skb(struct sk_buff *skb); - extern void __kfree_skb(struct sk_buff *skb); -@@ -2129,6 +2148,10 @@ - dst->nfct_reasm = src->nfct_reasm; - nf_conntrack_get_reasm(src->nfct_reasm); + extern struct kmem_cache *skbuff_head_cache; + + void kfree_skb_partial(struct sk_buff *skb, bool head_stolen); +@@ -3607,6 +3626,10 @@ static inline void __nf_copy(struct sk_b + if (copy) + dst->nfctinfo = src->nfctinfo; #endif +#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) -+ dst->imq_flags = src->imq_flags; -+ dst->nf_queue_entry = src->nf_queue_entry; ++ dst->imq_flags = src->imq_flags; ++ dst->nf_queue_entry = src->nf_queue_entry; +#endif - #ifdef CONFIG_BRIDGE_NETFILTER + #if IS_ENABLED(CONFIG_BRIDGE_NETFILTER) dst->nf_bridge = src->nf_bridge; nf_bridge_get(src->nf_bridge); -diff -uNr linux-2.6.39/include/net/netfilter/nf_queue.h linux-2.6.39-imqmq/include/net/netfilter/nf_queue.h ---- linux-2.6.39/include/net/netfilter/nf_queue.h 2011-05-19 07:06:34.000000000 +0300 -+++ linux-2.6.39-imqmq/include/net/netfilter/nf_queue.h 2011-05-19 11:08:04.288531274 +0300 -@@ -30,5 +30,11 @@ - const struct nf_queue_handler *qh); - extern void nf_unregister_queue_handlers(const struct nf_queue_handler *qh); - extern void nf_reinject(struct nf_queue_entry *entry, unsigned int verdict); -+extern void nf_queue_entry_release_refs(struct nf_queue_entry *entry); +diff -Naupr linux-4.10_orig/include/net/netfilter/nf_queue.h linux-4.10/include/net/netfilter/nf_queue.h +--- linux-4.10_orig/include/net/netfilter/nf_queue.h 2017-02-20 05:34:00.000000000 +0700 ++++ linux-4.10/include/net/netfilter/nf_queue.h 2017-02-28 18:44:55.981613941 +0700 +@@ -31,6 +31,12 @@ struct nf_queue_handler { + void nf_register_queue_handler(struct net *net, const struct nf_queue_handler *qh); + void nf_unregister_queue_handler(struct net *net); + void nf_reinject(struct nf_queue_entry *entry, unsigned int verdict); ++void nf_queue_entry_release_refs(struct nf_queue_entry *entry); + +#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) -+extern void nf_register_queue_imq_handler(const struct nf_queue_handler *qh); -+extern void nf_unregister_queue_imq_handler(void); ++void nf_register_queue_imq_handler(const struct nf_queue_handler *qh); ++void nf_unregister_queue_imq_handler(void); +#endif - #endif /* _NF_QUEUE_H */ -diff -uNr linux-2.6.39/net/core/dev.c linux-2.6.39-imqmq/net/core/dev.c ---- linux-2.6.39/net/core/dev.c 2011-05-19 07:06:34.000000000 +0300 -+++ linux-2.6.39-imqmq/net/core/dev.c 2011-05-19 11:08:04.288531274 +0300 -@@ -98,6 +98,9 @@ - #include - #include - #include + void nf_queue_entry_get_refs(struct nf_queue_entry *entry); + void nf_queue_entry_release_refs(struct nf_queue_entry *entry); +diff -Naupr linux-4.10_orig/include/net/pkt_sched.h linux-4.10/include/net/pkt_sched.h +--- linux-4.10_orig/include/net/pkt_sched.h 2017-02-20 05:34:00.000000000 +0700 ++++ linux-4.10/include/net/pkt_sched.h 2017-02-28 18:44:55.981613941 +0700 +@@ -107,6 +107,8 @@ int sch_direct_xmit(struct sk_buff *skb, + + void __qdisc_run(struct Qdisc *q); + ++struct sk_buff *qdisc_dequeue_skb(struct Qdisc *q, bool *validate); ++ + static inline void qdisc_run(struct Qdisc *q) + { + if (qdisc_run_begin(q)) +diff -Naupr linux-4.10_orig/include/net/sch_generic.h linux-4.10/include/net/sch_generic.h +--- linux-4.10_orig/include/net/sch_generic.h 2017-02-20 05:34:00.000000000 +0700 ++++ linux-4.10/include/net/sch_generic.h 2017-02-28 18:44:55.981613941 +0700 +@@ -518,6 +518,13 @@ static inline int qdisc_enqueue(struct s + return sch->enqueue(skb, sch, to_free); + } + ++static inline int qdisc_enqueue_root(struct sk_buff *skb, struct Qdisc *sch, ++ struct sk_buff **to_free) ++{ ++ qdisc_skb_cb(skb)->pkt_len = skb->len; ++ return qdisc_enqueue(skb, sch, to_free) & NET_XMIT_MASK; ++} ++ + static inline bool qdisc_is_percpu_stats(const struct Qdisc *q) + { + return q->flags & TCQ_F_CPUSTATS; +diff -Naupr linux-4.10_orig/include/uapi/linux/netfilter.h linux-4.10/include/uapi/linux/netfilter.h +--- linux-4.10_orig/include/uapi/linux/netfilter.h 2017-02-20 05:34:00.000000000 +0700 ++++ linux-4.10/include/uapi/linux/netfilter.h 2017-02-28 18:44:55.981613941 +0700 +@@ -14,7 +14,8 @@ + #define NF_QUEUE 3 + #define NF_REPEAT 4 + #define NF_STOP 5 /* Deprecated, for userspace nf_queue compatibility. */ +-#define NF_MAX_VERDICT NF_STOP ++#define NF_IMQ_QUEUE 6 ++#define NF_MAX_VERDICT NF_IMQ_QUEUE + + /* we overload the higher bits for encoding auxiliary data such as the queue + * number or errno values. Not nice, but better than additional function +diff -Naupr linux-4.10_orig/net/core/dev.c linux-4.10/net/core/dev.c +--- linux-4.10_orig/net/core/dev.c 2017-02-20 05:34:00.000000000 +0700 ++++ linux-4.10/net/core/dev.c 2017-02-28 18:44:55.984947288 +0700 +@@ -140,6 +140,9 @@ + #include + #include + #include +#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) +#include +#endif - #include - #include - #include -@@ -2099,12 +2102,21 @@ - if (dev->priv_flags & IFF_XMIT_DST_RELEASE) - skb_dst_drop(skb); -+#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) -+ if (!list_empty(&ptype_all) && -+ !(skb->imq_flags & IMQ_F_ENQUEUE)) -+#else - if (!list_empty(&ptype_all)) -+#endif - dev_queue_xmit_nit(skb, dev); + #include "net-sysfs.h" - skb_orphan_try(skb); +@@ -2881,7 +2884,12 @@ static int xmit_one(struct sk_buff *skb, + unsigned int len; + int rc; +#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) -+ features = skb->dev ? netif_skb_features(skb) : dev->features; ++ if ((!list_empty(&ptype_all) || !list_empty(&dev->ptype_all)) && ++ !(skb->imq_flags & IMQ_F_ENQUEUE)) +#else - features = netif_skb_features(skb); + if (!list_empty(&ptype_all) || !list_empty(&dev->ptype_all)) +#endif + dev_queue_xmit_nit(skb, dev); - if (vlan_tx_tag_present(skb) && - !(features & NETIF_F_HW_VLAN_TX)) { -@@ -2269,8 +2281,7 @@ - #endif + len = skb->len; +@@ -2920,6 +2928,8 @@ out: + return skb; } --static struct netdev_queue *dev_pick_tx(struct net_device *dev, -- struct sk_buff *skb) -+static struct netdev_queue *dev_pick_tx(struct net_device *dev, struct sk_buff *skb) ++EXPORT_SYMBOL_GPL(dev_hard_start_xmit); ++ + static struct sk_buff *validate_xmit_vlan(struct sk_buff *skb, + netdev_features_t features) { - int queue_index; - const struct net_device_ops *ops = dev->netdev_ops; -diff -uNr linux-2.6.39/net/core/skbuff.c linux-2.6.39-imqmq/net/core/skbuff.c ---- linux-2.6.39/net/core/skbuff.c 2011-05-19 07:06:34.000000000 +0300 -+++ linux-2.6.39-imqmq/net/core/skbuff.c 2011-05-19 11:08:04.288531274 +0300 -@@ -72,6 +72,9 @@ - - static struct kmem_cache *skbuff_head_cache __read_mostly; +diff -Naupr linux-4.10_orig/net/core/skbuff.c linux-4.10/net/core/skbuff.c +--- linux-4.10_orig/net/core/skbuff.c 2017-02-20 05:34:00.000000000 +0700 ++++ linux-4.10/net/core/skbuff.c 2017-02-28 18:44:55.984947288 +0700 +@@ -82,6 +82,87 @@ struct kmem_cache *skbuff_head_cache __r static struct kmem_cache *skbuff_fclone_cache __read_mostly; + int sysctl_max_skb_frags __read_mostly = MAX_SKB_FRAGS; + EXPORT_SYMBOL(sysctl_max_skb_frags); +#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) +static struct kmem_cache *skbuff_cb_store_cache __read_mostly; +#endif - - static void sock_pipe_buf_release(struct pipe_inode_info *pipe, - struct pipe_buffer *buf) -@@ -91,6 +94,82 @@ - return 1; - } - ++ +#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) +/* Control buffer save/restore for IMQ devices */ +struct skb_cb_table { @@ -1194,6 +1395,7 @@ diff -uNr linux-2.6.39/net/core/skbuff.c linux-2.6.39-imqmq/net/core/skbuff.c +} +EXPORT_SYMBOL(skb_restore_cb); + ++static void skb_copy_stored_cb(struct sk_buff * , const struct sk_buff * ) __attribute__ ((unused)); +static void skb_copy_stored_cb(struct sk_buff *new, const struct sk_buff *__old) +{ + struct skb_cb_table *next; @@ -1216,46 +1418,49 @@ diff -uNr linux-2.6.39/net/core/skbuff.c linux-2.6.39-imqmq/net/core/skbuff.c +} +#endif - /* Pipe buffer operations for a socket. */ - static const struct pipe_buf_operations sock_pipe_buf_ops = { -@@ -379,6 +458,26 @@ + /** + * skb_panic - private function for out-of-line support +@@ -654,6 +735,28 @@ static void skb_release_head_state(struc WARN_ON(in_irq()); skb->destructor(skb); } +#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) -+ /* This should not happen. When it does, avoid memleak by restoring -+ the chain of cb-backups. */ ++ /* ++ * This should not happen. When it does, avoid memleak by restoring ++ * the chain of cb-backups. ++ */ + while (skb->cb_next != NULL) { + if (net_ratelimit()) -+ printk(KERN_WARNING "IMQ: kfree_skb: skb->cb_next: " -+ "%08x\n", (unsigned int)skb->cb_next); ++ pr_warn("IMQ: kfree_skb: skb->cb_next: %08x\n", ++ (unsigned int)(uintptr_t)skb->cb_next); + + skb_restore_cb(skb); + } -+ /* This should not happen either, nf_queue_entry is nullified in ++ /* ++ * This should not happen either, nf_queue_entry is nullified in + * imq_dev_xmit(). If we have non-NULL nf_queue_entry then we are + * leaking entry pointers, maybe memory. We don't know if this is + * pointer to already freed memory, or should this be freed. + * If this happens we need to add refcounting, etc for nf_queue_entry. + */ + if (skb->nf_queue_entry && net_ratelimit()) -+ printk(KERN_WARNING -+ "IMQ: kfree_skb: skb->nf_queue_entry != NULL"); ++ pr_warn("%s\n", "IMQ: kfree_skb: skb->nf_queue_entry != NULL"); +#endif - #if defined(CONFIG_NF_CONNTRACK) || defined(CONFIG_NF_CONNTRACK_MODULE) + #if IS_ENABLED(CONFIG_NF_CONNTRACK) nf_conntrack_put(skb->nfct); #endif -@@ -517,6 +616,9 @@ +@@ -843,6 +946,10 @@ static void __copy_skb_header(struct sk_ new->sp = secpath_get(old->sp); #endif - memcpy(new->cb, old->cb, sizeof(old->cb)); + __nf_copy(new, old, false); +#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) -+ skb_copy_stored_cb(new, old); ++ new->cb_next = NULL; ++ /*skb_copy_stored_cb(new, old);*/ +#endif - new->csum = old->csum; - new->local_df = old->local_df; - new->pkt_type = old->pkt_type; -@@ -2780,6 +2882,13 @@ + + /* Note : this field could be in headers_start/headers_end section + * It is not yet because we do not want to have a 16 bit hole +@@ -3465,6 +3572,13 @@ void __init skb_init(void) 0, SLAB_HWCACHE_ALIGN|SLAB_PANIC, NULL); @@ -1269,36 +1474,54 @@ diff -uNr linux-2.6.39/net/core/skbuff.c linux-2.6.39-imqmq/net/core/skbuff.c } /** -diff -uNr linux-2.6.39/net/netfilter/core.c linux-2.6.39-imqmq/net/netfilter/core.c ---- linux-2.6.39/net/netfilter/core.c 2011-05-19 07:06:34.000000000 +0300 -+++ linux-2.6.39-imqmq/net/netfilter/core.c 2011-05-19 11:13:19.891558119 +0300 -@@ -191,6 +191,20 @@ - kfree_skb(skb); - } - ret = 0; -+#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) -+ } else if ((verdict & NF_VERDICT_MASK) == NF_IMQ_QUEUE) { -+ ret = nf_imq_queue(skb, elem, pf, hook, indev, outdev, okfn, -+ verdict >> NF_VERDICT_QBITS); -+ if (ret < 0) { -+ if (ret == -ECANCELED) -+ goto next_hook; -+ if (ret == -ESRCH && -+ (verdict & NF_VERDICT_FLAG_QUEUE_BYPASS)) -+ goto next_hook; -+ kfree_skb(skb); -+ } -+ ret = 0; -+#endif +diff -Naupr linux-4.10_orig/net/ipv6/ip6_output.c linux-4.10/net/ipv6/ip6_output.c +--- linux-4.10_orig/net/ipv6/ip6_output.c 2017-02-20 05:34:00.000000000 +0700 ++++ linux-4.10/net/ipv6/ip6_output.c 2017-02-28 18:44:55.988280636 +0700 +@@ -67,9 +67,6 @@ static int ip6_finish_output2(struct net + struct in6_addr *nexthop; + int ret; + +- skb->protocol = htons(ETH_P_IPV6); +- skb->dev = dev; +- + if (ipv6_addr_is_multicast(&ipv6_hdr(skb)->daddr)) { + struct inet6_dev *idev = ip6_dst_idev(skb_dst(skb)); + +@@ -159,6 +156,13 @@ int ip6_output(struct net *net, struct s + return 0; } - rcu_read_unlock(); - return ret; -diff -uNr linux-2.6.39/net/netfilter/Kconfig linux-2.6.39-imqmq/net/netfilter/Kconfig ---- linux-2.6.39/net/netfilter/Kconfig 2011-05-19 07:06:34.000000000 +0300 -+++ linux-2.6.39-imqmq/net/netfilter/Kconfig 2011-05-19 11:08:04.288531274 +0300 -@@ -507,6 +507,18 @@ - For more information on the LEDs available on your system, see - Documentation/leds-class.txt + ++ /* ++ * IMQ-patch: moved setting skb->dev and skb->protocol from ++ * ip6_finish_output2 to fix crashing at netif_skb_features(). ++ */ ++ skb->protocol = htons(ETH_P_IPV6); ++ skb->dev = dev; ++ + return NF_HOOK_COND(NFPROTO_IPV6, NF_INET_POST_ROUTING, + net, sk, skb, NULL, dev, + ip6_finish_output, +diff -Naupr linux-4.10_orig/net/netfilter/core.c linux-4.10/net/netfilter/core.c +--- linux-4.10_orig/net/netfilter/core.c 2017-02-20 05:34:00.000000000 +0700 ++++ linux-4.10/net/netfilter/core.c 2017-02-28 18:44:55.988280636 +0700 +@@ -318,6 +318,11 @@ int nf_hook_slow(struct sk_buff *skb, st + if (ret == 0) + ret = -EPERM; + return ret; ++ case NF_IMQ_QUEUE: ++ ret = nf_queue(skb, state, &entry, verdict); ++ if (ret == -ECANCELED) ++ continue; ++ return ret; + case NF_QUEUE: + ret = nf_queue(skb, state, &entry, verdict); + if (ret == 1 && entry) +diff -Naupr linux-4.10_orig/net/netfilter/Kconfig linux-4.10/net/netfilter/Kconfig +--- linux-4.10_orig/net/netfilter/Kconfig 2017-02-20 05:34:00.000000000 +0700 ++++ linux-4.10/net/netfilter/Kconfig 2017-02-28 18:44:55.988280636 +0700 +@@ -852,6 +852,18 @@ config NETFILTER_XT_TARGET_LOG + + To compile it as a module, choose M here. If unsure, say N. +config NETFILTER_XT_TARGET_IMQ + tristate '"IMQ" target support' @@ -1315,217 +1538,106 @@ diff -uNr linux-2.6.39/net/netfilter/Kconfig linux-2.6.39-imqmq/net/netfilter/Kc config NETFILTER_XT_TARGET_MARK tristate '"MARK" target support' depends on NETFILTER_ADVANCED -diff -uNr linux-2.6.39/net/netfilter/Makefile linux-2.6.39-imqmq/net/netfilter/Makefile ---- linux-2.6.39/net/netfilter/Makefile 2011-05-19 07:06:34.000000000 +0300 -+++ linux-2.6.39-imqmq/net/netfilter/Makefile 2011-05-19 11:08:04.291864674 +0300 -@@ -56,6 +56,7 @@ - obj-$(CONFIG_NETFILTER_XT_TARGET_CT) += xt_CT.o +diff -Naupr linux-4.10_orig/net/netfilter/Makefile linux-4.10/net/netfilter/Makefile +--- linux-4.10_orig/net/netfilter/Makefile 2017-02-20 05:34:00.000000000 +0700 ++++ linux-4.10/net/netfilter/Makefile 2017-02-28 18:44:55.988280636 +0700 +@@ -125,6 +125,7 @@ obj-$(CONFIG_NETFILTER_XT_TARGET_CT) += obj-$(CONFIG_NETFILTER_XT_TARGET_DSCP) += xt_DSCP.o obj-$(CONFIG_NETFILTER_XT_TARGET_HL) += xt_HL.o + obj-$(CONFIG_NETFILTER_XT_TARGET_HMARK) += xt_HMARK.o +obj-$(CONFIG_NETFILTER_XT_TARGET_IMQ) += xt_IMQ.o obj-$(CONFIG_NETFILTER_XT_TARGET_LED) += xt_LED.o - obj-$(CONFIG_NETFILTER_XT_TARGET_NFLOG) += xt_NFLOG.o - obj-$(CONFIG_NETFILTER_XT_TARGET_NFQUEUE) += xt_NFQUEUE.o -diff -uNr linux-2.6.39/net/netfilter/nf_internals.h linux-2.6.39-imqmq/net/netfilter/nf_internals.h ---- linux-2.6.39/net/netfilter/nf_internals.h 2011-05-19 07:06:34.000000000 +0300 -+++ linux-2.6.39-imqmq/net/netfilter/nf_internals.h 2011-05-19 11:08:04.291864674 +0300 -@@ -30,6 +30,15 @@ - struct net_device *outdev, - int (*okfn)(struct sk_buff *), - unsigned int queuenum); -+#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) -+extern int nf_imq_queue(struct sk_buff *skb, -+ struct list_head *elem, -+ u_int8_t pf, unsigned int hook, -+ struct net_device *indev, -+ struct net_device *outdev, -+ int (*okfn)(struct sk_buff *), -+ unsigned int queuenum); -+#endif - extern int __init netfilter_queue_init(void); - - /* nf_log.c */ -diff -uNr linux-2.6.39/net/netfilter/nf_queue.c linux-2.6.39-imqmq/net/netfilter/nf_queue.c ---- linux-2.6.39/net/netfilter/nf_queue.c 2011-05-19 07:06:34.000000000 +0300 -+++ linux-2.6.39-imqmq/net/netfilter/nf_queue.c 2011-05-19 11:22:38.189467462 +0300 -@@ -22,6 +22,26 @@ - - static DEFINE_MUTEX(queue_handler_mutex); + obj-$(CONFIG_NETFILTER_XT_TARGET_LOG) += xt_LOG.o + obj-$(CONFIG_NETFILTER_XT_TARGET_NETMAP) += xt_NETMAP.o +diff -Naupr linux-4.10_orig/net/netfilter/nf_queue.c linux-4.10/net/netfilter/nf_queue.c +--- linux-4.10_orig/net/netfilter/nf_queue.c 2017-02-20 05:34:00.000000000 +0700 ++++ linux-4.10/net/netfilter/nf_queue.c 2017-02-28 18:44:55.988280636 +0700 +@@ -27,6 +27,23 @@ + * receives, no matter what. + */ +#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) -+static const struct nf_queue_handler *queue_imq_handler; ++static const struct nf_queue_handler __rcu *queue_imq_handler __read_mostly; + +void nf_register_queue_imq_handler(const struct nf_queue_handler *qh) +{ -+ mutex_lock(&queue_handler_mutex); + rcu_assign_pointer(queue_imq_handler, qh); -+ mutex_unlock(&queue_handler_mutex); +} +EXPORT_SYMBOL_GPL(nf_register_queue_imq_handler); + +void nf_unregister_queue_imq_handler(void) +{ -+ mutex_lock(&queue_handler_mutex); -+ rcu_assign_pointer(queue_imq_handler, NULL); -+ mutex_unlock(&queue_handler_mutex); ++ RCU_INIT_POINTER(queue_imq_handler, NULL); ++ synchronize_rcu(); +} +EXPORT_SYMBOL_GPL(nf_unregister_queue_imq_handler); +#endif + /* return EBUSY when somebody else is registered, return EEXIST if the * same handler is registered, return 0 in case of success. */ - int nf_register_queue_handler(u_int8_t pf, const struct nf_queue_handler *qh) -@@ -92,7 +112,7 @@ - } - EXPORT_SYMBOL_GPL(nf_unregister_queue_handlers); - --static void nf_queue_entry_release_refs(struct nf_queue_entry *entry) -+void nf_queue_entry_release_refs(struct nf_queue_entry *entry) - { - /* Release those devices we held, or Alexey will kill me. */ - if (entry->indev) -@@ -112,6 +132,7 @@ - /* Drop reference to owner of hook which queued us. */ - module_put(entry->elem->owner); + void nf_register_queue_handler(struct net *net, const struct nf_queue_handler *qh) +@@ -108,16 +125,28 @@ void nf_queue_nf_hook_drop(struct net *n } -+EXPORT_SYMBOL_GPL(nf_queue_entry_release_refs); - /* - * Any packet that leaves via this function must come back -@@ -123,7 +144,8 @@ - struct net_device *indev, - struct net_device *outdev, - int (*okfn)(struct sk_buff *), -- unsigned int queuenum) -+ unsigned int queuenum, -+ bool imq_queue) + static int __nf_queue(struct sk_buff *skb, const struct nf_hook_state *state, +- struct nf_hook_entry *hook_entry, unsigned int queuenum) ++ struct nf_hook_entry *hook_entry, unsigned int verdict) { int status = -ENOENT; struct nf_queue_entry *entry = NULL; -@@ -137,7 +159,14 @@ - /* QUEUE == DROP if no one is waiting, to be safe. */ - rcu_read_lock(); + const struct nf_afinfo *afinfo; + const struct nf_queue_handler *qh; + struct net *net = state->net; ++ unsigned int queuetype = verdict & NF_VERDICT_MASK; ++ unsigned int queuenum = verdict >> NF_VERDICT_QBITS; -- qh = rcu_dereference(queue_handler[pf]); + /* QUEUE == DROP if no one is waiting, to be safe. */ +- qh = rcu_dereference(net->nf.queue_handler); ++ if (queuetype == NF_IMQ_QUEUE) { +#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) -+ if (imq_queue) -+ qh = rcu_dereference(queue_imq_handler); -+ else -+ qh = rcu_dereference(queue_handler[pf]); ++ qh = rcu_dereference(queue_imq_handler); +#else -+ qh = rcu_dereference(queue_handler[pf]); ++ BUG(); ++ goto err_unlock; +#endif ++ } else { ++ qh = rcu_dereference(net->nf.queue_handler); ++ } ++ if (!qh) { status = -ESRCH; - goto err_unlock; -@@ -203,13 +232,14 @@ - return status; - } + goto err; +@@ -164,8 +193,17 @@ int nf_queue(struct sk_buff *skb, struct + struct nf_hook_entry *entry = *entryp; + int ret; --int nf_queue(struct sk_buff *skb, -- struct list_head *elem, -- u_int8_t pf, unsigned int hook, -- struct net_device *indev, -- struct net_device *outdev, -- int (*okfn)(struct sk_buff *), -- unsigned int queuenum) -+static int _nf_queue(struct sk_buff *skb, -+ struct list_head *elem, -+ u_int8_t pf, unsigned int hook, -+ struct net_device *indev, -+ struct net_device *outdev, -+ int (*okfn)(struct sk_buff *), -+ unsigned int queuenum, -+ bool imq_queue) - { - struct sk_buff *segs; - int err; -@@ -217,7 +247,7 @@ - - if (!skb_is_gso(skb)) - return __nf_queue(skb, elem, pf, hook, indev, outdev, okfn, -- queuenum); -+ queuenum, imq_queue); - - switch (pf) { - case NFPROTO_IPV4: -@@ -244,7 +274,7 @@ - segs->next = NULL; - if (err == 0) - err = __nf_queue(segs, elem, pf, hook, indev, -- outdev, okfn, queuenum); -+ outdev, okfn, queuenum, imq_queue); - if (err == 0) - queued++; - else -@@ -260,6 +290,32 @@ - return err; - } - -+int nf_queue(struct sk_buff *skb, -+ struct list_head *elem, -+ u_int8_t pf, unsigned int hook, -+ struct net_device *indev, -+ struct net_device *outdev, -+ int (*okfn)(struct sk_buff *), -+ unsigned int queuenum) -+{ -+ return _nf_queue(skb, elem, pf, hook, indev, outdev, okfn, queuenum, -+ false); -+} +- ret = __nf_queue(skb, state, entry, verdict >> NF_VERDICT_QBITS); ++ ret = __nf_queue(skb, state, entry, verdict); + if (ret < 0) { + +#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) -+int nf_imq_queue(struct sk_buff *skb, -+ struct list_head *elem, -+ u_int8_t pf, unsigned int hook, -+ struct net_device *indev, -+ struct net_device *outdev, -+ int (*okfn)(struct sk_buff *), -+ unsigned int queuenum) -+{ -+ return _nf_queue(skb, elem, pf, hook, indev, outdev, okfn, queuenum, -+ true); -+} ++ /* IMQ Bypass */ ++ if (ret == -ECANCELED && skb->imq_flags == 0) { ++ *entryp = rcu_dereference(entry->next); ++ return 1; ++ } +#endif + - void nf_reinject(struct nf_queue_entry *entry, unsigned int verdict) - { - struct sk_buff *skb = entry->skb; -@@ -301,7 +357,7 @@ - case NF_QUEUE: - err = __nf_queue(skb, elem, entry->pf, entry->hook, - entry->indev, entry->outdev, entry->okfn, -- verdict >> NF_VERDICT_QBITS); -+ verdict >> NF_VERDICT_QBITS, false); - if (err < 0) { - if (err == -ECANCELED) - goto next_hook; -@@ -311,6 +367,21 @@ - kfree_skb(skb); - } + if (ret == -ESRCH && + (verdict & NF_VERDICT_FLAG_QUEUE_BYPASS)) { + *entryp = rcu_dereference(entry->next); +@@ -232,6 +270,7 @@ okfn: + local_bh_enable(); break; -+#if defined(CONFIG_IMQ) || defined(CONFIG_IMQ_MODULE) + case NF_QUEUE: + case NF_IMQ_QUEUE: -+ err = __nf_queue(skb, elem, entry->pf, entry->hook, -+ entry->indev, entry->outdev, entry->okfn, -+ verdict >> NF_VERDICT_QBITS, true); -+ if (err < 0) { -+ if (err == -ECANCELED) -+ goto next_hook; -+ if (err == -ESRCH && -+ (verdict & NF_VERDICT_FLAG_QUEUE_BYPASS)) -+ goto next_hook; -+ kfree_skb(skb); -+ } -+ break; -+#endif - case NF_STOLEN: - default: - kfree_skb(skb); -diff -uNr linux-2.6.39/net/netfilter/xt_IMQ.c linux-2.6.39-imqmq/net/netfilter/xt_IMQ.c ---- linux-2.6.39/net/netfilter/xt_IMQ.c 1970-01-01 02:00:00.000000000 +0200 -+++ linux-2.6.39-imqmq/net/netfilter/xt_IMQ.c 2011-05-19 11:08:04.308531677 +0300 -@@ -0,0 +1,74 @@ + err = nf_queue(skb, &entry->state, &hook_entry, verdict); + if (err == 1) { + if (hook_entry) +diff -Naupr linux-4.10_orig/net/netfilter/xt_IMQ.c linux-4.10/net/netfilter/xt_IMQ.c +--- linux-4.10_orig/net/netfilter/xt_IMQ.c 1970-01-01 07:00:00.000000000 +0700 ++++ linux-4.10/net/netfilter/xt_IMQ.c 2017-02-28 18:44:55.988280636 +0700 +@@ -0,0 +1,72 @@ +/* + * This target marks packets to be enqueued to an imq device + */ @@ -1550,9 +1662,8 @@ diff -uNr linux-2.6.39/net/netfilter/xt_IMQ.c linux-2.6.39-imqmq/net/netfilter/x + struct xt_imq_info *mr = par->targinfo; + + if (mr->todev > IMQ_MAX_DEVS - 1) { -+ printk(KERN_WARNING -+ "IMQ: invalid device specified, highest is %u\n", -+ IMQ_MAX_DEVS - 1); ++ pr_warn("IMQ: invalid device specified, highest is %u\n", ++ IMQ_MAX_DEVS - 1); + return -EINVAL; + } + @@ -1593,10 +1704,27 @@ diff -uNr linux-2.6.39/net/netfilter/xt_IMQ.c linux-2.6.39-imqmq/net/netfilter/x +module_init(imq_init); +module_exit(imq_fini); + -+MODULE_AUTHOR("http://www.linuximq.net"); -+MODULE_DESCRIPTION("Pseudo-driver for the intermediate queue device. " -+ "See http://www.linuximq.net/ for more information."); ++MODULE_AUTHOR("https://github.com/imq/linuximq"); ++MODULE_DESCRIPTION("Pseudo-driver for the intermediate queue device. See https://github.com/imq/linuximq/wiki for more information."); +MODULE_LICENSE("GPL"); +MODULE_ALIAS("ipt_IMQ"); +MODULE_ALIAS("ip6t_IMQ"); + +diff -Naupr linux-4.10_orig/net/sched/sch_generic.c linux-4.10/net/sched/sch_generic.c +--- linux-4.10_orig/net/sched/sch_generic.c 2017-02-20 05:34:00.000000000 +0700 ++++ linux-4.10/net/sched/sch_generic.c 2017-02-28 18:44:55.988280636 +0700 +@@ -154,6 +154,14 @@ bulk: + return skb; + } + ++struct sk_buff *qdisc_dequeue_skb(struct Qdisc *q, bool *validate) ++{ ++ int packets; ++ ++ return dequeue_skb(q, validate, &packets); ++} ++EXPORT_SYMBOL(qdisc_dequeue_skb); ++ + /* + * Transmit possibly several skbs, and handle the return status as + * required. Owning running seqcount bit guarantees that