mac80211: fix regression in skb resizing optimization in monitor mode (FS#2254)
[openwrt/staging/ldir.git] / package / kernel / mac80211 / patches / subsys / 357-mac80211-optimize-skb-resizing.patch
1 From: Felix Fietkau <nbd@nbd.name>
2 Date: Sun, 17 Mar 2019 18:11:30 +0100
3 Subject: [PATCH] mac80211: optimize skb resizing
4
5 When forwarding unicast packets from ethernet to batman-adv over 802.11s
6 (with forwarding disabled), the typical required headroom to transmit
7 encrypted packets on mt76 is 32 (802.11) + 6 (802.11s) + 8 (CCMP) +
8 2 (padding) + 6 (LLC) + 18 (batman-adv) - 14 (old ethernet header) = 58 bytes.
9
10 On systems where NET_SKB_PAD is 64, this leads to a call to pskb_expand_head()
11 for every packet, since mac80211 also tries to allocate 16 bytes of status
12 headroom for radiotap headers.
13
14 This patch fixes these unnecessary reallocations by only requiring the extra
15 status headroom in ieee80211_tx_monitor().
16 If, however, a reallocation happens before that call, the status headroom gets
17 added there as well, in order to avoid double reallocation.
18
19 The patch also cleans up the code by moving the headroom calculation to
20 ieee80211_skb_resize.
21
22 Signed-off-by: Felix Fietkau <nbd@nbd.name>
23 ---
24
25 --- a/net/mac80211/ieee80211_i.h
26 +++ b/net/mac80211/ieee80211_i.h
27 @@ -1761,6 +1761,9 @@ void ieee80211_clear_fast_xmit(struct st
28 int ieee80211_tx_control_port(struct wiphy *wiphy, struct net_device *dev,
29 const u8 *buf, size_t len,
30 const u8 *dest, __be16 proto, bool unencrypted);
31 +int ieee80211_skb_resize(struct ieee80211_local *local,
32 + struct ieee80211_sub_if_data *sdata,
33 + struct sk_buff *skb, int hdrlen, int hdr_add);
34
35 /* HT */
36 void ieee80211_apply_htcap_overrides(struct ieee80211_sub_if_data *sdata,
37 --- a/net/mac80211/status.c
38 +++ b/net/mac80211/status.c
39 @@ -672,6 +672,11 @@ void ieee80211_tx_monitor(struct ieee802
40 }
41 }
42
43 + if (ieee80211_skb_resize(local, NULL, skb, 0, 0)) {
44 + dev_kfree_skb(skb);
45 + return;
46 + }
47 +
48 /* send frame to monitor interfaces now */
49 rtap_len = ieee80211_tx_radiotap_len(info);
50 if (WARN_ON_ONCE(skb_headroom(skb) < rtap_len)) {
51 --- a/net/mac80211/tx.c
52 +++ b/net/mac80211/tx.c
53 @@ -1914,37 +1914,53 @@ static bool ieee80211_tx(struct ieee8021
54 }
55
56 /* device xmit handlers */
57 -
58 -static int ieee80211_skb_resize(struct ieee80211_sub_if_data *sdata,
59 - struct sk_buff *skb,
60 - int head_need, bool may_encrypt)
61 +int ieee80211_skb_resize(struct ieee80211_local *local,
62 + struct ieee80211_sub_if_data *sdata,
63 + struct sk_buff *skb, int hdr_len, int hdr_extra)
64 {
65 - struct ieee80211_local *local = sdata->local;
66 + struct ieee80211_tx_info *info = IEEE80211_SKB_CB(skb);
67 struct ieee80211_hdr *hdr;
68 - bool enc_tailroom;
69 - int tail_need = 0;
70 + int head_need, head_max;
71 + int tail_need, tail_max;
72 + bool enc_tailroom = false;
73
74 - hdr = (struct ieee80211_hdr *) skb->data;
75 - enc_tailroom = may_encrypt &&
76 - (sdata->crypto_tx_tailroom_needed_cnt ||
77 - ieee80211_is_mgmt(hdr->frame_control));
78 + if (sdata && !hdr_len &&
79 + !(info->flags & IEEE80211_TX_INTFL_DONT_ENCRYPT)) {
80 + hdr = (struct ieee80211_hdr *) skb->data;
81 + enc_tailroom = (sdata->crypto_tx_tailroom_needed_cnt ||
82 + ieee80211_is_mgmt(hdr->frame_control));
83 + hdr_len += sdata->encrypt_headroom;
84 + }
85
86 - if (enc_tailroom) {
87 - tail_need = IEEE80211_ENCRYPT_TAILROOM;
88 - tail_need -= skb_tailroom(skb);
89 - tail_need = max_t(int, tail_need, 0);
90 + head_need = head_max = hdr_len;
91 + tail_need = tail_max = 0;
92 + if (!sdata) {
93 + head_need = head_max = local->tx_headroom;
94 + } else {
95 + head_max += hdr_extra;
96 + head_max += max_t(int, local->tx_headroom,
97 + local->hw.extra_tx_headroom);
98 + head_need += local->hw.extra_tx_headroom;
99 +
100 + tail_max = IEEE80211_ENCRYPT_TAILROOM;
101 + if (enc_tailroom)
102 + tail_need = tail_max;
103 }
104
105 if (skb_cloned(skb) &&
106 (!ieee80211_hw_check(&local->hw, SUPPORTS_CLONED_SKBS) ||
107 !skb_clone_writable(skb, ETH_HLEN) || enc_tailroom))
108 I802_DEBUG_INC(local->tx_expand_skb_head_cloned);
109 - else if (head_need || tail_need)
110 + else if (head_need > skb_headroom(skb) ||
111 + tail_need > skb_tailroom(skb))
112 I802_DEBUG_INC(local->tx_expand_skb_head);
113 else
114 return 0;
115
116 - if (pskb_expand_head(skb, head_need, tail_need, GFP_ATOMIC)) {
117 + head_max = max_t(int, 0, head_max - skb_headroom(skb));
118 + tail_max = max_t(int, 0, tail_max - skb_tailroom(skb));
119 +
120 + if (pskb_expand_head(skb, head_max, tail_max, GFP_ATOMIC)) {
121 wiphy_debug(local->hw.wiphy,
122 "failed to reallocate TX buffer\n");
123 return -ENOMEM;
124 @@ -1960,18 +1976,8 @@ void ieee80211_xmit(struct ieee80211_sub
125 struct ieee80211_local *local = sdata->local;
126 struct ieee80211_tx_info *info = IEEE80211_SKB_CB(skb);
127 struct ieee80211_hdr *hdr;
128 - int headroom;
129 - bool may_encrypt;
130 -
131 - may_encrypt = !(info->flags & IEEE80211_TX_INTFL_DONT_ENCRYPT);
132 -
133 - headroom = local->tx_headroom;
134 - if (may_encrypt)
135 - headroom += sdata->encrypt_headroom;
136 - headroom -= skb_headroom(skb);
137 - headroom = max_t(int, 0, headroom);
138
139 - if (ieee80211_skb_resize(sdata, skb, headroom, may_encrypt)) {
140 + if (ieee80211_skb_resize(local, sdata, skb, 0, 0)) {
141 ieee80211_free_txskb(&local->hw, skb);
142 return;
143 }
144 @@ -2740,30 +2746,14 @@ static struct sk_buff *ieee80211_build_h
145
146 skb_pull(skb, skip_header_bytes);
147 padsize = ieee80211_hdr_padsize(&local->hw, hdrlen);
148 - head_need = hdrlen + encaps_len + meshhdrlen - skb_headroom(skb);
149 + head_need = hdrlen + encaps_len + meshhdrlen;
150 head_need += padsize;
151
152 - /*
153 - * So we need to modify the skb header and hence need a copy of
154 - * that. The head_need variable above doesn't, so far, include
155 - * the needed header space that we don't need right away. If we
156 - * can, then we don't reallocate right now but only after the
157 - * frame arrives at the master device (if it does...)
158 - *
159 - * If we cannot, however, then we will reallocate to include all
160 - * the ever needed space. Also, if we need to reallocate it anyway,
161 - * make it big enough for everything we may ever need.
162 - */
163 -
164 - if (head_need > 0 || skb_cloned(skb)) {
165 - head_need += sdata->encrypt_headroom;
166 - head_need += local->tx_headroom;
167 - head_need = max_t(int, 0, head_need);
168 - if (ieee80211_skb_resize(sdata, skb, head_need, true)) {
169 - ieee80211_free_txskb(&local->hw, skb);
170 - skb = NULL;
171 - return ERR_PTR(-ENOMEM);
172 - }
173 + if (ieee80211_skb_resize(local, sdata, skb, head_need,
174 + sdata->encrypt_headroom)) {
175 + ieee80211_free_txskb(&local->hw, skb);
176 + skb = NULL;
177 + return ERR_PTR(-ENOMEM);
178 }
179
180 if (encaps_data)
181 @@ -3377,7 +3367,6 @@ static bool ieee80211_xmit_fast(struct i
182 struct ieee80211_local *local = sdata->local;
183 u16 ethertype = (skb->data[12] << 8) | skb->data[13];
184 int extra_head = fast_tx->hdr_len - (ETH_HLEN - 2);
185 - int hw_headroom = sdata->local->hw.extra_tx_headroom;
186 struct ethhdr eth;
187 struct ieee80211_tx_info *info;
188 struct ieee80211_hdr *hdr = (void *)fast_tx->hdr;
189 @@ -3429,10 +3418,7 @@ static bool ieee80211_xmit_fast(struct i
190 * as the may-encrypt argument for the resize to not account for
191 * more room than we already have in 'extra_head'
192 */
193 - if (unlikely(ieee80211_skb_resize(sdata, skb,
194 - max_t(int, extra_head + hw_headroom -
195 - skb_headroom(skb), 0),
196 - false))) {
197 + if (unlikely(ieee80211_skb_resize(local, sdata, skb, extra_head, 0))) {
198 kfree_skb(skb);
199 return true;
200 }