Commit 4bd437ea authored by Christian Lamparter, committed by John W. Linville

carl9170: revamp carl9170_tx_prepare

David Miller complained about the driver's excessive use
of variables in __packed structs. While I did not fully
agree with his sole "performance" argument on all accounts,
I do see some room for improvement in hot-paths on
architectures without efficient access to unaligned
elements.

This first patch (dare I say?) optimizes an important tx
hot-path in the driver: carl9170_tx_prepare.
Signed-off-by: Christian Lamparter <chunkeey@googlemail.com>
Signed-off-by: John W. Linville <linville@tuxdriver.com>
parent 9c655c8b
...@@ -760,8 +760,8 @@ static int carl9170_tx_prepare(struct ar9170 *ar, struct sk_buff *skb) ...@@ -760,8 +760,8 @@ static int carl9170_tx_prepare(struct ar9170 *ar, struct sk_buff *skb)
struct carl9170_tx_info *arinfo; struct carl9170_tx_info *arinfo;
unsigned int hw_queue; unsigned int hw_queue;
int i; int i;
u16 keytype = 0; __le16 mac_tmp;
u16 len, icv = 0; u16 len;
bool ampdu, no_ack; bool ampdu, no_ack;
BUILD_BUG_ON(sizeof(*arinfo) > sizeof(info->rate_driver_data)); BUILD_BUG_ON(sizeof(*arinfo) > sizeof(info->rate_driver_data));
...@@ -773,6 +773,10 @@ static int carl9170_tx_prepare(struct ar9170 *ar, struct sk_buff *skb) ...@@ -773,6 +773,10 @@ static int carl9170_tx_prepare(struct ar9170 *ar, struct sk_buff *skb)
BUILD_BUG_ON(IEEE80211_TX_MAX_RATES < CARL9170_TX_MAX_RATES); BUILD_BUG_ON(IEEE80211_TX_MAX_RATES < CARL9170_TX_MAX_RATES);
BUILD_BUG_ON(AR9170_MAX_VIRTUAL_MAC >
((CARL9170_TX_SUPER_MISC_VIF_ID >>
CARL9170_TX_SUPER_MISC_VIF_ID_S) + 1));
hw_queue = ar9170_qmap[carl9170_get_queue(ar, skb)]; hw_queue = ar9170_qmap[carl9170_get_queue(ar, skb)];
hdr = (void *)skb->data; hdr = (void *)skb->data;
...@@ -793,20 +797,37 @@ static int carl9170_tx_prepare(struct ar9170 *ar, struct sk_buff *skb) ...@@ -793,20 +797,37 @@ static int carl9170_tx_prepare(struct ar9170 *ar, struct sk_buff *skb)
txc = (void *)skb_push(skb, sizeof(*txc)); txc = (void *)skb_push(skb, sizeof(*txc));
memset(txc, 0, sizeof(*txc)); memset(txc, 0, sizeof(*txc));
ampdu = !!(info->flags & IEEE80211_TX_CTL_AMPDU); SET_VAL(CARL9170_TX_SUPER_MISC_QUEUE, txc->s.misc, hw_queue);
if (likely(cvif))
SET_VAL(CARL9170_TX_SUPER_MISC_VIF_ID, txc->s.misc, cvif->id);
if (unlikely(info->flags & IEEE80211_TX_CTL_SEND_AFTER_DTIM))
txc->s.misc |= CARL9170_TX_SUPER_MISC_CAB;
if (unlikely(ieee80211_is_probe_resp(hdr->frame_control)))
txc->s.misc |= CARL9170_TX_SUPER_MISC_FILL_IN_TSF;
mac_tmp = cpu_to_le16(AR9170_TX_MAC_HW_DURATION |
AR9170_TX_MAC_BACKOFF);
mac_tmp |= cpu_to_le16((hw_queue << AR9170_TX_MAC_QOS_S) &&
AR9170_TX_MAC_QOS);
no_ack = !!(info->flags & IEEE80211_TX_CTL_NO_ACK); no_ack = !!(info->flags & IEEE80211_TX_CTL_NO_ACK);
if (unlikely(no_ack))
mac_tmp |= cpu_to_le16(AR9170_TX_MAC_NO_ACK);
if (info->control.hw_key) { if (info->control.hw_key) {
icv = info->control.hw_key->icv_len; len += info->control.hw_key->icv_len;
switch (info->control.hw_key->cipher) { switch (info->control.hw_key->cipher) {
case WLAN_CIPHER_SUITE_WEP40: case WLAN_CIPHER_SUITE_WEP40:
case WLAN_CIPHER_SUITE_WEP104: case WLAN_CIPHER_SUITE_WEP104:
case WLAN_CIPHER_SUITE_TKIP: case WLAN_CIPHER_SUITE_TKIP:
keytype = AR9170_TX_MAC_ENCR_RC4; mac_tmp |= cpu_to_le16(AR9170_TX_MAC_ENCR_RC4);
break; break;
case WLAN_CIPHER_SUITE_CCMP: case WLAN_CIPHER_SUITE_CCMP:
keytype = AR9170_TX_MAC_ENCR_AES; mac_tmp |= cpu_to_le16(AR9170_TX_MAC_ENCR_AES);
break; break;
default: default:
WARN_ON(1); WARN_ON(1);
...@@ -814,48 +835,58 @@ static int carl9170_tx_prepare(struct ar9170 *ar, struct sk_buff *skb) ...@@ -814,48 +835,58 @@ static int carl9170_tx_prepare(struct ar9170 *ar, struct sk_buff *skb)
} }
} }
BUILD_BUG_ON(AR9170_MAX_VIRTUAL_MAC > ampdu = !!(info->flags & IEEE80211_TX_CTL_AMPDU);
((CARL9170_TX_SUPER_MISC_VIF_ID >> if (ampdu) {
CARL9170_TX_SUPER_MISC_VIF_ID_S) + 1)); unsigned int density, factor;
txc->s.len = cpu_to_le16(len + sizeof(*txc));
txc->f.length = cpu_to_le16(len + icv + 4);
SET_VAL(CARL9170_TX_SUPER_MISC_VIF_ID, txc->s.misc,
cvif ? cvif->id : 0);
txc->f.mac_control = cpu_to_le16(AR9170_TX_MAC_HW_DURATION | if (unlikely(!sta || !cvif))
AR9170_TX_MAC_BACKOFF); goto err_out;
SET_VAL(CARL9170_TX_SUPER_MISC_QUEUE, txc->s.misc, hw_queue); factor = min_t(unsigned int, 1u,
info->control.sta->ht_cap.ampdu_factor);
txc->f.mac_control |= cpu_to_le16(hw_queue << AR9170_TX_MAC_QOS_S); density = info->control.sta->ht_cap.ampdu_density;
txc->f.mac_control |= cpu_to_le16(keytype);
txc->f.phy_control = cpu_to_le32(0);
if (no_ack) if (density) {
txc->f.mac_control |= cpu_to_le16(AR9170_TX_MAC_NO_ACK); /*
* Watch out!
*
* Otus uses slightly different density values than
* those from the 802.11n spec.
*/
if (info->flags & IEEE80211_TX_CTL_SEND_AFTER_DTIM) density = max_t(unsigned int, density + 1, 7u);
txc->s.misc |= CARL9170_TX_SUPER_MISC_CAB; }
txrate = &info->control.rates[0]; SET_VAL(CARL9170_TX_SUPER_AMPDU_DENSITY,
if (carl9170_tx_rts_check(ar, txrate, ampdu, no_ack)) txc->s.ampdu_settings, density);
txc->f.mac_control |= cpu_to_le16(AR9170_TX_MAC_PROT_RTS);
else if (carl9170_tx_cts_check(ar, txrate))
txc->f.mac_control |= cpu_to_le16(AR9170_TX_MAC_PROT_CTS);
SET_VAL(CARL9170_TX_SUPER_RI_TRIES, txc->s.ri[0], txrate->count); SET_VAL(CARL9170_TX_SUPER_AMPDU_FACTOR,
txc->f.phy_control |= carl9170_tx_physet(ar, info, txrate); txc->s.ampdu_settings, factor);
if (info->flags & IEEE80211_TX_CTL_AMPDU) { for (i = 0; i < CARL9170_TX_MAX_RATES; i++) {
for (i = 1; i < CARL9170_TX_MAX_RATES; i++) {
txrate = &info->control.rates[i]; txrate = &info->control.rates[i];
if (txrate->idx >= 0) if (txrate->idx >= 0) {
txc->s.ri[i] =
CARL9170_TX_SUPER_RI_AMPDU;
if (WARN_ON(!(txrate->flags &
IEEE80211_TX_RC_MCS))) {
/*
* Not sure if it's even possible
* to aggregate non-ht rates with
* this HW.
*/
goto err_out;
}
continue; continue;
}
txrate->idx = 0; txrate->idx = 0;
txrate->count = ar->hw->max_rate_tries; txrate->count = ar->hw->max_rate_tries;
} }
mac_tmp |= cpu_to_le16(AR9170_TX_MAC_AGGR);
} }
/* /*
...@@ -878,57 +909,21 @@ static int carl9170_tx_prepare(struct ar9170 *ar, struct sk_buff *skb) ...@@ -878,57 +909,21 @@ static int carl9170_tx_prepare(struct ar9170 *ar, struct sk_buff *skb)
txc->s.ri[i] |= (AR9170_TX_MAC_PROT_CTS << txc->s.ri[i] |= (AR9170_TX_MAC_PROT_CTS <<
CARL9170_TX_SUPER_RI_ERP_PROT_S); CARL9170_TX_SUPER_RI_ERP_PROT_S);
/*
* unaggregated fallback, in case aggregation
* proves to be unsuccessful and unreliable.
*/
if (ampdu && i < 3)
txc->s.ri[i] |= CARL9170_TX_SUPER_RI_AMPDU;
txc->s.rr[i - 1] = carl9170_tx_physet(ar, info, txrate); txc->s.rr[i - 1] = carl9170_tx_physet(ar, info, txrate);
} }
if (ieee80211_is_probe_resp(hdr->frame_control)) txrate = &info->control.rates[0];
txc->s.misc |= CARL9170_TX_SUPER_MISC_FILL_IN_TSF; SET_VAL(CARL9170_TX_SUPER_RI_TRIES, txc->s.ri[0], txrate->count);
if (ampdu) {
unsigned int density, factor;
if (unlikely(!sta || !cvif))
goto err_out;
density = info->control.sta->ht_cap.ampdu_density;
factor = info->control.sta->ht_cap.ampdu_factor;
if (density) {
/*
* Watch out!
*
* Otus uses slightly different density values than
* those from the 802.11n spec.
*/
density = max_t(unsigned int, density + 1, 7u);
}
factor = min_t(unsigned int, 1u, factor);
SET_VAL(CARL9170_TX_SUPER_AMPDU_DENSITY,
txc->s.ampdu_settings, density);
SET_VAL(CARL9170_TX_SUPER_AMPDU_FACTOR, if (carl9170_tx_rts_check(ar, txrate, ampdu, no_ack))
txc->s.ampdu_settings, factor); mac_tmp |= cpu_to_le16(AR9170_TX_MAC_PROT_RTS);
else if (carl9170_tx_cts_check(ar, txrate))
mac_tmp |= cpu_to_le16(AR9170_TX_MAC_PROT_CTS);
if (info->control.rates[0].flags & IEEE80211_TX_RC_MCS) { txc->s.len = cpu_to_le16(skb->len);
txc->f.mac_control |= cpu_to_le16(AR9170_TX_MAC_AGGR); txc->f.length = cpu_to_le16(len + FCS_LEN);
} else { txc->f.mac_control = mac_tmp;
/* txc->f.phy_control = carl9170_tx_physet(ar, info, txrate);
* Not sure if it's even possible to aggregate
* non-ht rates with this HW.
*/
WARN_ON_ONCE(1);
}
}
arinfo = (void *)info->rate_driver_data; arinfo = (void *)info->rate_driver_data;
arinfo->timeout = jiffies; arinfo->timeout = jiffies;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment