1 /******************************************************************************
3 * Copyright(c) 2003 - 2014 Intel Corporation. All rights reserved.
5 * Portions of this file are derived from the ipw3945 project, as well
6 * as portions of the ieee80211 subsystem header files.
8 * This program is free software; you can redistribute it and/or modify it
9 * under the terms of version 2 of the GNU General Public License as
10 * published by the Free Software Foundation.
12 * This program is distributed in the hope that it will be useful, but WITHOUT
13 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
14 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
17 * You should have received a copy of the GNU General Public License along with
18 * this program; if not, write to the Free Software Foundation, Inc.,
19 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA
21 * The full GNU General Public License is included in this distribution in the
22 * file called LICENSE.
24 * Contact Information:
25 * Intel Linux Wireless <ilw@linux.intel.com>
26 * Intel Corporation, 5200 N.E. Elam Young Parkway, Hillsboro, OR 97124-6497
28 *****************************************************************************/
29 #include <linux/etherdevice.h>
30 #include <linux/slab.h>
31 #include <linux/sched.h>
33 #include "iwl-debug.h"
37 #include "iwl-op-mode.h"
39 /* FIXME: need to abstract out TX command (once we know what it looks like) */
40 #include "dvm/commands.h"
42 #define IWL_TX_CRC_SIZE 4
43 #define IWL_TX_DELIMITER_SIZE 4
45 /*************** DMA-QUEUE-GENERAL-FUNCTIONS *****
50 * A Tx or Rx queue resides in host DRAM, and is comprised of a circular buffer
51 * of buffer descriptors, each of which points to one or more data buffers for
52 * the device to read from or fill. Driver and device exchange status of each
53 * queue via "read" and "write" pointers. Driver keeps minimum of 2 empty
54 * entries in each circular buffer, to protect against confusing empty and full queue states.
57 * The device reads or writes the data in the queues via the device's several
58 * DMA/FIFO channels. Each queue is mapped to a single DMA channel.
60 * For Tx queues there are low-mark and high-mark limits. If, after queuing
61 * a packet for Tx, free space becomes < low mark, the Tx queue is stopped. When
62 * reclaiming packets (on the 'tx done' IRQ), free space > high mark resumes the queue.
65 ***************************************************/
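/*
 * Illustrative sketch (editor's note, not driver code): with n_bd = 256
 * the occupancy math below reduces to power-of-two masking. For example,
 * read_ptr = 250 and write_ptr = 4 give
 *	used = (4 - 250) & 255 = 10
 * so 10 TFDs are in flight and, keeping slots reserved to distinguish a
 * full ring from an empty one, roughly 245 more entries may be queued.
 */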
66 static int iwl_queue_space(const struct iwl_queue *q)
72 * To avoid ambiguity between empty and completely full queues, there
73 * should always be less than q->n_bd elements in the queue.
74 * If q->n_window is smaller than q->n_bd, there is no need to reserve
75 * any queue entries for this purpose.
77 if (q->n_window < q->n_bd)
83 * q->n_bd is a power of 2, so the following is equivalent to modulo by
84 * q->n_bd and is well defined for negative dividends.
86 used = (q->write_ptr - q->read_ptr) & (q->n_bd - 1);
88 if (WARN_ON(used > max))
95 * iwl_queue_init - Initialize queue's high/low-water and read/write indexes
97 static int iwl_queue_init(struct iwl_queue *q, int count, int slots_num, u32 id)
100 q->n_window = slots_num;
103 /* count must be power-of-two size, otherwise iwl_queue_inc_wrap
104 * and iwl_queue_dec_wrap are broken. */
105 if (WARN_ON(!is_power_of_2(count)))
108 /* slots_num must be power-of-two size, otherwise
109 * get_cmd_index is broken. */
110 if (WARN_ON(!is_power_of_2(slots_num)))
113 q->low_mark = q->n_window / 4;
117 q->high_mark = q->n_window / 8;
118 if (q->high_mark < 2)
127 static int iwl_pcie_alloc_dma_ptr(struct iwl_trans *trans,
128 struct iwl_dma_ptr *ptr, size_t size)
130 if (WARN_ON(ptr->addr))
133 ptr->addr = dma_alloc_coherent(trans->dev, size,
134 &ptr->dma, GFP_KERNEL);
141 static void iwl_pcie_free_dma_ptr(struct iwl_trans *trans,
142 struct iwl_dma_ptr *ptr)
144 if (unlikely(!ptr->addr))
147 dma_free_coherent(trans->dev, ptr->size, ptr->addr, ptr->dma);
148 memset(ptr, 0, sizeof(*ptr));
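/*
 * Usage note (sketch): this alloc/free pair backs the keep-warm buffer and
 * the scheduler byte-count tables used later in this file, e.g.
 * iwl_pcie_alloc_dma_ptr(trans, &trans_pcie->kw, IWL_KW_SIZE) at init time
 * and iwl_pcie_free_dma_ptr(trans, &trans_pcie->kw) in iwl_pcie_tx_free();
 * the allocator is assumed to record ptr->size so the matching
 * dma_free_coherent() above sees the same length.
 */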
151 static void iwl_pcie_txq_stuck_timer(unsigned long data)
153 struct iwl_txq *txq = (void *)data;
154 struct iwl_queue *q = &txq->q;
155 struct iwl_trans_pcie *trans_pcie = txq->trans_pcie;
156 struct iwl_trans *trans = iwl_trans_pcie_get_trans(trans_pcie);
157 u32 scd_sram_addr = trans_pcie->scd_base_addr +
158 SCD_TX_STTS_QUEUE_OFFSET(txq->q.id);
162 spin_lock(&txq->lock);
163 /* check if triggered erroneously */
164 if (txq->q.read_ptr == txq->q.write_ptr) {
165 spin_unlock(&txq->lock);
168 spin_unlock(&txq->lock);
170 IWL_ERR(trans, "Queue %d stuck for %u ms.\n", txq->q.id,
171 jiffies_to_msecs(trans_pcie->wd_timeout));
172 IWL_ERR(trans, "Current SW read_ptr %d write_ptr %d\n",
173 txq->q.read_ptr, txq->q.write_ptr);
175 iwl_trans_read_mem_bytes(trans, scd_sram_addr, buf, sizeof(buf));
177 iwl_print_hex_error(trans, buf, sizeof(buf));
179 for (i = 0; i < FH_TCSR_CHNL_NUM; i++)
180 IWL_ERR(trans, "FH TRBs(%d) = 0x%08x\n", i,
181 iwl_read_direct32(trans, FH_TX_TRB_REG(i)));
183 for (i = 0; i < trans->cfg->base_params->num_of_queues; i++) {
184 u32 status = iwl_read_prph(trans, SCD_QUEUE_STATUS_BITS(i));
185 u8 fifo = (status >> SCD_QUEUE_STTS_REG_POS_TXF) & 0x7;
186 bool active = !!(status & BIT(SCD_QUEUE_STTS_REG_POS_ACTIVE));
188 iwl_trans_read_mem32(trans,
189 trans_pcie->scd_base_addr +
190 SCD_TRANS_TBL_OFFSET_QUEUE(i));
193 tbl_dw = (tbl_dw & 0xFFFF0000) >> 16;
195 tbl_dw = tbl_dw & 0x0000FFFF;
198 "Q %d is %sactive and mapped to fifo %d ra_tid 0x%04x [%d,%d]\n",
199 i, active ? "" : "in", fifo, tbl_dw,
201 SCD_QUEUE_RDPTR(i)) & (txq->q.n_bd - 1),
202 iwl_read_prph(trans, SCD_QUEUE_WRPTR(i)));
205 for (i = q->read_ptr; i != q->write_ptr;
206 i = iwl_queue_inc_wrap(i, q->n_bd))
207 IWL_ERR(trans, "scratch %d = 0x%08x\n", i,
208 le32_to_cpu(txq->scratchbufs[i].scratch));
210 iwl_trans_fw_error(trans);
214 * iwl_pcie_txq_update_byte_cnt_tbl - Set up entry in Tx byte-count array
216 static void iwl_pcie_txq_update_byte_cnt_tbl(struct iwl_trans *trans,
217 struct iwl_txq *txq, u16 byte_cnt)
219 struct iwlagn_scd_bc_tbl *scd_bc_tbl;
220 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
221 int write_ptr = txq->q.write_ptr;
222 int txq_id = txq->q.id;
225 u16 len = byte_cnt + IWL_TX_CRC_SIZE + IWL_TX_DELIMITER_SIZE;
227 struct iwl_tx_cmd *tx_cmd =
228 (void *) txq->entries[txq->q.write_ptr].cmd->payload;
230 scd_bc_tbl = trans_pcie->scd_bc_tbls.addr;
232 WARN_ON(len > 0xFFF || write_ptr >= TFD_QUEUE_SIZE_MAX);
234 sta_id = tx_cmd->sta_id;
235 sec_ctl = tx_cmd->sec_ctl;
237 switch (sec_ctl & TX_CMD_SEC_MSK) {
239 len += IEEE80211_CCMP_MIC_LEN;
241 case TX_CMD_SEC_TKIP:
242 len += IEEE80211_TKIP_ICV_LEN;
245 len += IEEE80211_WEP_IV_LEN + IEEE80211_WEP_ICV_LEN;
249 if (trans_pcie->bc_table_dword)
250 len = DIV_ROUND_UP(len, 4);
252 bc_ent = cpu_to_le16(len | (sta_id << 12));
254 scd_bc_tbl[txq_id].tfd_offset[write_ptr] = bc_ent;
256 if (write_ptr < TFD_QUEUE_SIZE_BC_DUP)
258 tfd_offset[TFD_QUEUE_SIZE_MAX + write_ptr] = bc_ent;
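/*
 * Worked example (illustrative only): a 200-byte frame for sta_id 3,
 * unencrypted and with bc_table_dword clear, gives
 *	len = 200 + IWL_TX_CRC_SIZE + IWL_TX_DELIMITER_SIZE = 208
 *	bc_ent = cpu_to_le16(208 | (3 << 12)) = cpu_to_le16(0x30d0)
 * and entries below TFD_QUEUE_SIZE_BC_DUP are mirrored at
 * TFD_QUEUE_SIZE_MAX + write_ptr, as done above, so the scheduler can read
 * past the wrap point.
 */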
261 static void iwl_pcie_txq_inval_byte_cnt_tbl(struct iwl_trans *trans,
264 struct iwl_trans_pcie *trans_pcie =
265 IWL_TRANS_GET_PCIE_TRANS(trans);
266 struct iwlagn_scd_bc_tbl *scd_bc_tbl = trans_pcie->scd_bc_tbls.addr;
267 int txq_id = txq->q.id;
268 int read_ptr = txq->q.read_ptr;
271 struct iwl_tx_cmd *tx_cmd =
272 (void *)txq->entries[txq->q.read_ptr].cmd->payload;
274 WARN_ON(read_ptr >= TFD_QUEUE_SIZE_MAX);
276 if (txq_id != trans_pcie->cmd_queue)
277 sta_id = tx_cmd->sta_id;
279 bc_ent = cpu_to_le16(1 | (sta_id << 12));
280 scd_bc_tbl[txq_id].tfd_offset[read_ptr] = bc_ent;
282 if (read_ptr < TFD_QUEUE_SIZE_BC_DUP)
284 tfd_offset[TFD_QUEUE_SIZE_MAX + read_ptr] = bc_ent;
288 * iwl_pcie_txq_inc_wr_ptr - Send new write index to hardware
290 void iwl_pcie_txq_inc_wr_ptr(struct iwl_trans *trans, struct iwl_txq *txq)
293 int txq_id = txq->q.id;
295 if (txq->need_update == 0)
298 if (trans->cfg->base_params->shadow_reg_enable) {
299 /* shadow register enabled */
300 iwl_write32(trans, HBUS_TARG_WRPTR,
301 txq->q.write_ptr | (txq_id << 8));
303 /* if we're trying to save power */
304 if (test_bit(STATUS_TPOWER_PMI, &trans->status)) {
305 /* wake up nic if it's powered down ...
306 * uCode will wake up, and interrupt us again, so next
307 * time we'll skip this part. */
308 reg = iwl_read32(trans, CSR_UCODE_DRV_GP1);
310 if (reg & CSR_UCODE_DRV_GP1_BIT_MAC_SLEEP) {
311 IWL_DEBUG_INFO(trans,
312 "Tx queue %d requesting wakeup,"
313 " GP1 = 0x%x\n", txq_id, reg);
314 iwl_set_bit(trans, CSR_GP_CNTRL,
315 CSR_GP_CNTRL_REG_FLAG_MAC_ACCESS_REQ);
319 IWL_DEBUG_TX(trans, "Q:%d WR: 0x%x\n", txq_id,
322 iwl_write_direct32(trans, HBUS_TARG_WRPTR,
323 txq->q.write_ptr | (txq_id << 8));
326 * else not in power-save mode,
327 * uCode will never sleep when we're
328 * trying to tx (during RFKILL, we're not trying to tx).
331 iwl_write32(trans, HBUS_TARG_WRPTR,
332 txq->q.write_ptr | (txq_id << 8));
334 txq->need_update = 0;
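/*
 * Illustrative example: for txq_id 5 and write_ptr 42 the value written to
 * HBUS_TARG_WRPTR above is 42 | (5 << 8) = 0x052a, i.e. the queue id sits
 * in bits 8 and up and the TFD index in the low byte.
 */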
337 static inline dma_addr_t iwl_pcie_tfd_tb_get_addr(struct iwl_tfd *tfd, u8 idx)
339 struct iwl_tfd_tb *tb = &tfd->tbs[idx];
341 dma_addr_t addr = get_unaligned_le32(&tb->lo);
342 if (sizeof(dma_addr_t) > sizeof(u32))
344 addr |= ((dma_addr_t)(le16_to_cpu(tb->hi_n_len) & 0xF) << 16) << 16;
349 static inline u16 iwl_pcie_tfd_tb_get_len(struct iwl_tfd *tfd, u8 idx)
351 struct iwl_tfd_tb *tb = &tfd->tbs[idx];
353 return le16_to_cpu(tb->hi_n_len) >> 4;
356 static inline void iwl_pcie_tfd_set_tb(struct iwl_tfd *tfd, u8 idx,
357 dma_addr_t addr, u16 len)
359 struct iwl_tfd_tb *tb = &tfd->tbs[idx];
360 u16 hi_n_len = len << 4;
362 put_unaligned_le32(addr, &tb->lo);
363 if (sizeof(dma_addr_t) > sizeof(u32))
364 hi_n_len |= ((addr >> 16) >> 16) & 0xF;
366 tb->hi_n_len = cpu_to_le16(hi_n_len);
368 tfd->num_tbs = idx + 1;
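/*
 * Worked example (sketch): storing a 36-bit DMA address 0x812345678 with a
 * 64-byte chunk yields lo = 0x12345678 and
 *	hi_n_len = (64 << 4) | ((0x812345678 >> 32) & 0xF) = 0x0408
 * i.e. 12 bits of length above a 4-bit address extension, which is exactly
 * what iwl_pcie_tfd_tb_get_addr()/iwl_pcie_tfd_tb_get_len() decode above.
 */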
371 static inline u8 iwl_pcie_tfd_get_num_tbs(struct iwl_tfd *tfd)
373 return tfd->num_tbs & 0x1f;
376 static void iwl_pcie_tfd_unmap(struct iwl_trans *trans,
377 struct iwl_cmd_meta *meta,
383 /* Sanity check on number of chunks */
384 num_tbs = iwl_pcie_tfd_get_num_tbs(tfd);
386 if (num_tbs >= IWL_NUM_OF_TBS) {
387 IWL_ERR(trans, "Too many chunks: %i\n", num_tbs);
388 /* @todo issue fatal error, it is quite a serious situation */
392 /* first TB is never freed - it's the scratchbuf data */
394 for (i = 1; i < num_tbs; i++)
395 dma_unmap_single(trans->dev, iwl_pcie_tfd_tb_get_addr(tfd, i),
396 iwl_pcie_tfd_tb_get_len(tfd, i),
403 * iwl_pcie_txq_free_tfd - Free all chunks referenced by TFD [txq->q.read_ptr]
404 * @trans - transport private data
408 * Does NOT advance any TFD circular buffer read/write indexes
409 * Does NOT free the TFD itself (which is within circular buffer)
411 static void iwl_pcie_txq_free_tfd(struct iwl_trans *trans, struct iwl_txq *txq)
413 struct iwl_tfd *tfd_tmp = txq->tfds;
415 /* rd_ptr is bounded by n_bd and idx is bounded by n_window */
416 int rd_ptr = txq->q.read_ptr;
417 int idx = get_cmd_index(&txq->q, rd_ptr);
419 lockdep_assert_held(&txq->lock);
421 /* We have only q->n_window txq->entries, but we use q->n_bd tfds */
422 iwl_pcie_tfd_unmap(trans, &txq->entries[idx].meta, &tfd_tmp[rd_ptr]);
428 skb = txq->entries[idx].skb;
430 /* Can be called from irqs-disabled context
431 * If skb is not NULL, it means that the whole queue is being
432 * freed and that the queue is not empty - free the skb
435 iwl_op_mode_free_skb(trans->op_mode, skb);
436 txq->entries[idx].skb = NULL;
441 static int iwl_pcie_txq_build_tfd(struct iwl_trans *trans, struct iwl_txq *txq,
442 dma_addr_t addr, u16 len, u8 reset)
445 struct iwl_tfd *tfd, *tfd_tmp;
450 tfd = &tfd_tmp[q->write_ptr];
453 memset(tfd, 0, sizeof(*tfd));
455 num_tbs = iwl_pcie_tfd_get_num_tbs(tfd);
457 /* Each TFD can point to a maximum of 20 Tx buffers */
458 if (num_tbs >= IWL_NUM_OF_TBS) {
459 IWL_ERR(trans, "Error can not send more than %d chunks\n",
464 if (WARN(addr & ~IWL_TX_DMA_MASK,
465 "Unaligned address = %llx\n", (unsigned long long)addr))
468 iwl_pcie_tfd_set_tb(tfd, num_tbs, addr, len);
473 static int iwl_pcie_txq_alloc(struct iwl_trans *trans,
474 struct iwl_txq *txq, int slots_num,
477 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
478 size_t tfd_sz = sizeof(struct iwl_tfd) * TFD_QUEUE_SIZE_MAX;
479 size_t scratchbuf_sz;
482 if (WARN_ON(txq->entries || txq->tfds))
485 setup_timer(&txq->stuck_timer, iwl_pcie_txq_stuck_timer,
487 txq->trans_pcie = trans_pcie;
489 txq->q.n_window = slots_num;
491 txq->entries = kcalloc(slots_num,
492 sizeof(struct iwl_pcie_txq_entry),
498 if (txq_id == trans_pcie->cmd_queue)
499 for (i = 0; i < slots_num; i++) {
500 txq->entries[i].cmd =
501 kmalloc(sizeof(struct iwl_device_cmd),
503 if (!txq->entries[i].cmd)
507 /* Circular buffer of transmit frame descriptors (TFDs),
508 * shared with device */
509 txq->tfds = dma_alloc_coherent(trans->dev, tfd_sz,
510 &txq->q.dma_addr, GFP_KERNEL);
514 BUILD_BUG_ON(IWL_HCMD_SCRATCHBUF_SIZE != sizeof(*txq->scratchbufs));
515 BUILD_BUG_ON(offsetof(struct iwl_pcie_txq_scratch_buf, scratch) !=
516 sizeof(struct iwl_cmd_header) +
517 offsetof(struct iwl_tx_cmd, scratch));
519 scratchbuf_sz = sizeof(*txq->scratchbufs) * slots_num;
521 txq->scratchbufs = dma_alloc_coherent(trans->dev, scratchbuf_sz,
522 &txq->scratchbufs_dma,
524 if (!txq->scratchbufs)
531 dma_free_coherent(trans->dev, tfd_sz, txq->tfds, txq->q.dma_addr);
533 if (txq->entries && txq_id == trans_pcie->cmd_queue)
534 for (i = 0; i < slots_num; i++)
535 kfree(txq->entries[i].cmd);
543 static int iwl_pcie_txq_init(struct iwl_trans *trans, struct iwl_txq *txq,
544 int slots_num, u32 txq_id)
548 txq->need_update = 0;
550 /* TFD_QUEUE_SIZE_MAX must be power-of-two size, otherwise
551 * iwl_queue_inc_wrap and iwl_queue_dec_wrap are broken. */
552 BUILD_BUG_ON(TFD_QUEUE_SIZE_MAX & (TFD_QUEUE_SIZE_MAX - 1));
554 /* Initialize queue's high/low-water marks, and head/tail indexes */
555 ret = iwl_queue_init(&txq->q, TFD_QUEUE_SIZE_MAX, slots_num,
560 spin_lock_init(&txq->lock);
563 * Tell nic where to find circular buffer of Tx Frame Descriptors for
564 * given Tx queue, and enable the DMA channel used for that queue.
565 * Circular buffer (TFD queue in DRAM) physical base address */
566 iwl_write_direct32(trans, FH_MEM_CBBC_QUEUE(txq_id),
567 txq->q.dma_addr >> 8);
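/*
 * Note (illustrative): FH_MEM_CBBC_QUEUE() takes the TFD ring base in
 * 256-byte units, hence the ">> 8"; e.g. a ring at bus address 0x1fa45600
 * is programmed as 0x001fa456. This assumes the coherent allocation is at
 * least 256-byte aligned, which dma_alloc_coherent() provides in practice.
 */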
573 * iwl_pcie_txq_unmap - Unmap any remaining DMA mappings and free skb's
575 static void iwl_pcie_txq_unmap(struct iwl_trans *trans, int txq_id)
577 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
578 struct iwl_txq *txq = &trans_pcie->txq[txq_id];
579 struct iwl_queue *q = &txq->q;
584 spin_lock_bh(&txq->lock);
585 while (q->write_ptr != q->read_ptr) {
586 IWL_DEBUG_TX_REPLY(trans, "Q %d Free %d\n",
587 txq_id, q->read_ptr);
588 iwl_pcie_txq_free_tfd(trans, txq);
589 q->read_ptr = iwl_queue_inc_wrap(q->read_ptr, q->n_bd);
592 spin_unlock_bh(&txq->lock);
594 /* just in case - this queue may have been stopped */
595 iwl_wake_queue(trans, txq);
599 * iwl_pcie_txq_free - Deallocate DMA queue.
600 * @txq: Transmit queue to deallocate.
602 * Empty queue by removing and destroying all BD's.
604 * 0-fill, but do not free "txq" descriptor structure.
606 static void iwl_pcie_txq_free(struct iwl_trans *trans, int txq_id)
608 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
609 struct iwl_txq *txq = &trans_pcie->txq[txq_id];
610 struct device *dev = trans->dev;
616 iwl_pcie_txq_unmap(trans, txq_id);
618 /* De-alloc array of command/tx buffers */
619 if (txq_id == trans_pcie->cmd_queue)
620 for (i = 0; i < txq->q.n_window; i++) {
621 kfree(txq->entries[i].cmd);
622 kfree(txq->entries[i].free_buf);
625 /* De-alloc circular buffer of TFDs */
627 dma_free_coherent(dev, sizeof(struct iwl_tfd) *
628 txq->q.n_bd, txq->tfds, txq->q.dma_addr);
631 dma_free_coherent(dev,
632 sizeof(*txq->scratchbufs) * txq->q.n_window,
633 txq->scratchbufs, txq->scratchbufs_dma);
639 del_timer_sync(&txq->stuck_timer);
641 /* 0-fill queue descriptor structure */
642 memset(txq, 0, sizeof(*txq));
646 * Activate/Deactivate Tx DMA/FIFO channels according tx fifos mask
648 static void iwl_pcie_txq_set_sched(struct iwl_trans *trans, u32 mask)
650 struct iwl_trans_pcie __maybe_unused *trans_pcie =
651 IWL_TRANS_GET_PCIE_TRANS(trans);
653 iwl_write_prph(trans, SCD_TXFACT, mask);
656 void iwl_pcie_tx_start(struct iwl_trans *trans, u32 scd_base_addr)
658 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
659 int nq = trans->cfg->base_params->num_of_queues;
662 int clear_dwords = (SCD_TRANS_TBL_OFFSET_QUEUE(nq) -
663 SCD_CONTEXT_MEM_LOWER_BOUND) / sizeof(u32);
665 /* make sure all queues are not stopped/used */
666 memset(trans_pcie->queue_stopped, 0, sizeof(trans_pcie->queue_stopped));
667 memset(trans_pcie->queue_used, 0, sizeof(trans_pcie->queue_used));
669 trans_pcie->scd_base_addr =
670 iwl_read_prph(trans, SCD_SRAM_BASE_ADDR);
672 WARN_ON(scd_base_addr != 0 &&
673 scd_base_addr != trans_pcie->scd_base_addr);
675 /* reset context data, TX status and translation data */
676 iwl_trans_write_mem(trans, trans_pcie->scd_base_addr +
677 SCD_CONTEXT_MEM_LOWER_BOUND,
680 iwl_write_prph(trans, SCD_DRAM_BASE_ADDR,
681 trans_pcie->scd_bc_tbls.dma >> 10);
683 /* The chain extension of the SCD doesn't work well. This feature is
684 * enabled by default by the HW, so we need to disable it manually.
686 iwl_write_prph(trans, SCD_CHAINEXT_EN, 0);
688 iwl_trans_ac_txq_enable(trans, trans_pcie->cmd_queue,
689 trans_pcie->cmd_fifo);
691 /* Activate all Tx DMA/FIFO channels */
692 iwl_pcie_txq_set_sched(trans, IWL_MASK(0, 7));
694 /* Enable DMA channel */
695 for (chan = 0; chan < FH_TCSR_CHNL_NUM; chan++)
696 iwl_write_direct32(trans, FH_TCSR_CHNL_TX_CONFIG_REG(chan),
697 FH_TCSR_TX_CONFIG_REG_VAL_DMA_CHNL_ENABLE |
698 FH_TCSR_TX_CONFIG_REG_VAL_DMA_CREDIT_ENABLE);
700 /* Update FH chicken bits */
701 reg_val = iwl_read_direct32(trans, FH_TX_CHICKEN_BITS_REG);
702 iwl_write_direct32(trans, FH_TX_CHICKEN_BITS_REG,
703 reg_val | FH_TX_CHICKEN_BITS_SCD_AUTO_RETRY_EN);
705 /* Enable L1-Active */
706 iwl_clear_bits_prph(trans, APMG_PCIDEV_STT_REG,
707 APMG_PCIDEV_STT_VAL_L1_ACT_DIS);
710 void iwl_trans_pcie_tx_reset(struct iwl_trans *trans)
712 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
715 for (txq_id = 0; txq_id < trans->cfg->base_params->num_of_queues;
717 struct iwl_txq *txq = &trans_pcie->txq[txq_id];
719 iwl_write_direct32(trans, FH_MEM_CBBC_QUEUE(txq_id),
720 txq->q.dma_addr >> 8);
721 iwl_pcie_txq_unmap(trans, txq_id);
723 txq->q.write_ptr = 0;
726 /* Tell NIC where to find the "keep warm" buffer */
727 iwl_write_direct32(trans, FH_KW_MEM_ADDR_REG,
728 trans_pcie->kw.dma >> 4);
730 iwl_pcie_tx_start(trans, trans_pcie->scd_base_addr);
734 * iwl_pcie_tx_stop - Stop all Tx DMA channels
736 int iwl_pcie_tx_stop(struct iwl_trans *trans)
738 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
741 /* Turn off all Tx DMA fifos */
742 spin_lock(&trans_pcie->irq_lock);
744 iwl_pcie_txq_set_sched(trans, 0);
746 /* Stop each Tx DMA channel, and wait for it to be idle */
747 for (ch = 0; ch < FH_TCSR_CHNL_NUM; ch++) {
748 iwl_write_direct32(trans,
749 FH_TCSR_CHNL_TX_CONFIG_REG(ch), 0x0);
750 ret = iwl_poll_direct_bit(trans, FH_TSSR_TX_STATUS_REG,
751 FH_TSSR_TX_STATUS_REG_MSK_CHNL_IDLE(ch), 1000);
754 "Failing on timeout while stopping DMA channel %d [0x%08x]\n",
756 iwl_read_direct32(trans,
757 FH_TSSR_TX_STATUS_REG));
759 spin_unlock(&trans_pcie->irq_lock);
762 * This function can be called before the op_mode disabled the
763 * queues. This happens when we have an rfkill interrupt.
764 * Since we stop Tx altogether - mark the queues as stopped.
766 memset(trans_pcie->queue_stopped, 0, sizeof(trans_pcie->queue_stopped));
767 memset(trans_pcie->queue_used, 0, sizeof(trans_pcie->queue_used));
769 /* This can happen: start_hw, stop_device */
770 if (!trans_pcie->txq)
773 /* Unmap DMA from host system and free skb's */
774 for (txq_id = 0; txq_id < trans->cfg->base_params->num_of_queues;
776 iwl_pcie_txq_unmap(trans, txq_id);
782 * iwl_trans_tx_free - Free TXQ Context
784 * Destroy all TX DMA queues and structures
786 void iwl_pcie_tx_free(struct iwl_trans *trans)
789 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
792 if (trans_pcie->txq) {
794 txq_id < trans->cfg->base_params->num_of_queues; txq_id++)
795 iwl_pcie_txq_free(trans, txq_id);
798 kfree(trans_pcie->txq);
799 trans_pcie->txq = NULL;
801 iwl_pcie_free_dma_ptr(trans, &trans_pcie->kw);
803 iwl_pcie_free_dma_ptr(trans, &trans_pcie->scd_bc_tbls);
807 * iwl_pcie_tx_alloc - allocate TX context
808 * Allocate all Tx DMA structures and initialize them
810 static int iwl_pcie_tx_alloc(struct iwl_trans *trans)
813 int txq_id, slots_num;
814 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
816 u16 scd_bc_tbls_size = trans->cfg->base_params->num_of_queues *
817 sizeof(struct iwlagn_scd_bc_tbl);
819 /* It is not allowed to alloc twice, so warn when this happens.
820 * We cannot rely on the previous allocation, so free and fail. */
821 if (WARN_ON(trans_pcie->txq)) {
826 ret = iwl_pcie_alloc_dma_ptr(trans, &trans_pcie->scd_bc_tbls,
829 IWL_ERR(trans, "Scheduler BC Table allocation failed\n");
833 /* Alloc keep-warm buffer */
834 ret = iwl_pcie_alloc_dma_ptr(trans, &trans_pcie->kw, IWL_KW_SIZE);
836 IWL_ERR(trans, "Keep Warm allocation failed\n");
840 trans_pcie->txq = kcalloc(trans->cfg->base_params->num_of_queues,
841 sizeof(struct iwl_txq), GFP_KERNEL);
842 if (!trans_pcie->txq) {
843 IWL_ERR(trans, "Not enough memory for txq\n");
848 /* Alloc and init all Tx queues, including the command queue (#4/#9) */
849 for (txq_id = 0; txq_id < trans->cfg->base_params->num_of_queues;
851 slots_num = (txq_id == trans_pcie->cmd_queue) ?
852 TFD_CMD_SLOTS : TFD_TX_CMD_SLOTS;
853 ret = iwl_pcie_txq_alloc(trans, &trans_pcie->txq[txq_id],
856 IWL_ERR(trans, "Tx %d queue alloc failed\n", txq_id);
864 iwl_pcie_tx_free(trans);
868 int iwl_pcie_tx_init(struct iwl_trans *trans)
870 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
872 int txq_id, slots_num;
875 if (!trans_pcie->txq) {
876 ret = iwl_pcie_tx_alloc(trans);
882 spin_lock(&trans_pcie->irq_lock);
884 /* Turn off all Tx DMA fifos */
885 iwl_write_prph(trans, SCD_TXFACT, 0);
887 /* Tell NIC where to find the "keep warm" buffer */
888 iwl_write_direct32(trans, FH_KW_MEM_ADDR_REG,
889 trans_pcie->kw.dma >> 4);
891 spin_unlock(&trans_pcie->irq_lock);
893 /* Alloc and init all Tx queues, including the command queue (#4/#9) */
894 for (txq_id = 0; txq_id < trans->cfg->base_params->num_of_queues;
896 slots_num = (txq_id == trans_pcie->cmd_queue) ?
897 TFD_CMD_SLOTS : TFD_TX_CMD_SLOTS;
898 ret = iwl_pcie_txq_init(trans, &trans_pcie->txq[txq_id],
901 IWL_ERR(trans, "Tx %d queue init failed\n", txq_id);
908 /* Upon error, free only if we allocated something */
910 iwl_pcie_tx_free(trans);
914 static inline void iwl_pcie_txq_progress(struct iwl_trans_pcie *trans_pcie,
917 if (!trans_pcie->wd_timeout)
921 * if empty delete timer, otherwise move timer forward
922 * since we're making progress on this queue
924 if (txq->q.read_ptr == txq->q.write_ptr)
925 del_timer(&txq->stuck_timer);
927 mod_timer(&txq->stuck_timer, jiffies + trans_pcie->wd_timeout);
930 /* Frees buffers until index _not_ inclusive */
931 void iwl_trans_pcie_reclaim(struct iwl_trans *trans, int txq_id, int ssn,
932 struct sk_buff_head *skbs)
934 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
935 struct iwl_txq *txq = &trans_pcie->txq[txq_id];
936 /* n_bd is usually 256 => n_bd - 1 = 0xff */
937 int tfd_num = ssn & (txq->q.n_bd - 1);
938 struct iwl_queue *q = &txq->q;
941 /* This function is not meant to release cmd queue*/
942 if (WARN_ON(txq_id == trans_pcie->cmd_queue))
945 spin_lock_bh(&txq->lock);
948 IWL_DEBUG_TX_QUEUES(trans, "Q %d inactive - ignoring idx %d\n",
953 if (txq->q.read_ptr == tfd_num)
956 IWL_DEBUG_TX_REPLY(trans, "[Q %d] %d -> %d (%d)\n",
957 txq_id, txq->q.read_ptr, tfd_num, ssn);
959 /* Since we free until index _not_ inclusive, the entry before index is
960 * the last we will free; that entry must be in use. */
961 last_to_free = iwl_queue_dec_wrap(tfd_num, q->n_bd);
963 if (!iwl_queue_used(q, last_to_free)) {
965 "%s: Read index for DMA queue txq id (%d), last_to_free %d is out of range [0-%d] %d %d.\n",
966 __func__, txq_id, last_to_free, q->n_bd,
967 q->write_ptr, q->read_ptr);
971 if (WARN_ON(!skb_queue_empty(skbs)))
975 q->read_ptr != tfd_num;
976 q->read_ptr = iwl_queue_inc_wrap(q->read_ptr, q->n_bd)) {
978 if (WARN_ON_ONCE(txq->entries[txq->q.read_ptr].skb == NULL))
981 __skb_queue_tail(skbs, txq->entries[txq->q.read_ptr].skb);
983 txq->entries[txq->q.read_ptr].skb = NULL;
985 iwl_pcie_txq_inval_byte_cnt_tbl(trans, txq);
987 iwl_pcie_txq_free_tfd(trans, txq);
990 iwl_pcie_txq_progress(trans_pcie, txq);
992 if (iwl_queue_space(&txq->q) > txq->q.low_mark)
993 iwl_wake_queue(trans, txq);
995 spin_unlock_bh(&txq->lock);
999 * iwl_pcie_cmdq_reclaim - Reclaim TX command queue entries already Tx'd
1001 * When FW advances 'R' index, all entries between old and new 'R' index
1002 * need to be reclaimed. As a result, some free space forms. If there is
1003 * enough free space (> low mark), wake the stack that feeds us.
1005 static void iwl_pcie_cmdq_reclaim(struct iwl_trans *trans, int txq_id, int idx)
1007 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
1008 struct iwl_txq *txq = &trans_pcie->txq[txq_id];
1009 struct iwl_queue *q = &txq->q;
1010 unsigned long flags;
1013 lockdep_assert_held(&txq->lock);
1015 if ((idx >= q->n_bd) || (!iwl_queue_used(q, idx))) {
1017 "%s: Read index for DMA queue txq id (%d), index %d is out of range [0-%d] %d %d.\n",
1018 __func__, txq_id, idx, q->n_bd,
1019 q->write_ptr, q->read_ptr);
1023 for (idx = iwl_queue_inc_wrap(idx, q->n_bd); q->read_ptr != idx;
1024 q->read_ptr = iwl_queue_inc_wrap(q->read_ptr, q->n_bd)) {
1027 IWL_ERR(trans, "HCMD skipped: index (%d) %d %d\n",
1028 idx, q->write_ptr, q->read_ptr);
1029 iwl_trans_fw_error(trans);
1033 if (q->read_ptr == q->write_ptr) {
1034 spin_lock_irqsave(&trans_pcie->reg_lock, flags);
1035 WARN_ON(!trans_pcie->cmd_in_flight);
1036 trans_pcie->cmd_in_flight = false;
1037 __iwl_trans_pcie_clear_bit(trans,
1039 CSR_GP_CNTRL_REG_FLAG_MAC_ACCESS_REQ);
1040 spin_unlock_irqrestore(&trans_pcie->reg_lock, flags);
1043 iwl_pcie_txq_progress(trans_pcie, txq);
1046 static int iwl_pcie_txq_set_ratid_map(struct iwl_trans *trans, u16 ra_tid,
1049 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
1054 scd_q2ratid = ra_tid & SCD_QUEUE_RA_TID_MAP_RATID_MSK;
1056 tbl_dw_addr = trans_pcie->scd_base_addr +
1057 SCD_TRANS_TBL_OFFSET_QUEUE(txq_id);
1059 tbl_dw = iwl_trans_read_mem32(trans, tbl_dw_addr);
1062 tbl_dw = (scd_q2ratid << 16) | (tbl_dw & 0x0000FFFF);
1064 tbl_dw = scd_q2ratid | (tbl_dw & 0xFFFF0000);
1066 iwl_trans_write_mem32(trans, tbl_dw_addr, tbl_dw);
1071 static inline void iwl_pcie_txq_set_inactive(struct iwl_trans *trans,
1074 /* Simply stop the queue, but don't change any configuration;
1075 * the SCD_ACT_EN bit is the write-enable mask for the ACTIVE bit. */
1076 iwl_write_prph(trans,
1077 SCD_QUEUE_STATUS_BITS(txq_id),
1078 (0 << SCD_QUEUE_STTS_REG_POS_ACTIVE)|
1079 (1 << SCD_QUEUE_STTS_REG_POS_SCD_ACT_EN));
1082 /* Receiver address (actually, Rx station's index into station table),
1083 * combined with Traffic ID (QOS priority), in format used by Tx Scheduler */
1084 #define BUILD_RAxTID(sta_id, tid) (((sta_id) << 4) + (tid))
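/* Example: BUILD_RAxTID(5, 2) == 0x52 - station index in the upper nibble,
 * TID in the lower nibble of the value handed to
 * iwl_pcie_txq_set_ratid_map() below. */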
1086 void iwl_trans_pcie_txq_enable(struct iwl_trans *trans, int txq_id, int fifo,
1087 int sta_id, int tid, int frame_limit, u16 ssn)
1089 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
1091 if (test_and_set_bit(txq_id, trans_pcie->queue_used))
1092 WARN_ONCE(1, "queue %d already used - expect issues", txq_id);
1094 /* Stop this Tx queue before configuring it */
1095 iwl_pcie_txq_set_inactive(trans, txq_id);
1097 /* Set this queue as a chain-building queue unless it is CMD queue */
1098 if (txq_id != trans_pcie->cmd_queue)
1099 iwl_set_bits_prph(trans, SCD_QUEUECHAIN_SEL, BIT(txq_id));
1101 /* If this queue is mapped to a certain station: it is an AGG queue */
1103 u16 ra_tid = BUILD_RAxTID(sta_id, tid);
1105 /* Map receiver-address / traffic-ID to this queue */
1106 iwl_pcie_txq_set_ratid_map(trans, ra_tid, txq_id);
1108 /* enable aggregations for the queue */
1109 iwl_set_bits_prph(trans, SCD_AGGR_SEL, BIT(txq_id));
1110 trans_pcie->txq[txq_id].ampdu = true;
1113 * disable aggregations for the queue, this will also make the
1114 * ra_tid mapping configuration irrelevant since it is now a non-AGG queue.
1117 iwl_clear_bits_prph(trans, SCD_AGGR_SEL, BIT(txq_id));
1119 ssn = trans_pcie->txq[txq_id].q.read_ptr;
1122 /* Place first TFD at index corresponding to start sequence number.
1123 * Assumes that ssn_idx is valid (!= 0xFFF) */
1124 trans_pcie->txq[txq_id].q.read_ptr = (ssn & 0xff);
1125 trans_pcie->txq[txq_id].q.write_ptr = (ssn & 0xff);
1127 iwl_write_direct32(trans, HBUS_TARG_WRPTR,
1128 (ssn & 0xff) | (txq_id << 8));
1129 iwl_write_prph(trans, SCD_QUEUE_RDPTR(txq_id), ssn);
1131 /* Set up Tx window size and frame limit for this queue */
1132 iwl_trans_write_mem32(trans, trans_pcie->scd_base_addr +
1133 SCD_CONTEXT_QUEUE_OFFSET(txq_id), 0);
1134 iwl_trans_write_mem32(trans, trans_pcie->scd_base_addr +
1135 SCD_CONTEXT_QUEUE_OFFSET(txq_id) + sizeof(u32),
1136 ((frame_limit << SCD_QUEUE_CTX_REG2_WIN_SIZE_POS) &
1137 SCD_QUEUE_CTX_REG2_WIN_SIZE_MSK) |
1138 ((frame_limit << SCD_QUEUE_CTX_REG2_FRAME_LIMIT_POS) &
1139 SCD_QUEUE_CTX_REG2_FRAME_LIMIT_MSK));
1141 /* Set up Status area in SRAM, map to Tx DMA/FIFO, activate the queue */
1142 iwl_write_prph(trans, SCD_QUEUE_STATUS_BITS(txq_id),
1143 (1 << SCD_QUEUE_STTS_REG_POS_ACTIVE) |
1144 (fifo << SCD_QUEUE_STTS_REG_POS_TXF) |
1145 (1 << SCD_QUEUE_STTS_REG_POS_WSL) |
1146 SCD_QUEUE_STTS_REG_MSK);
1147 trans_pcie->txq[txq_id].active = true;
1148 IWL_DEBUG_TX_QUEUES(trans, "Activate queue %d on FIFO %d WrPtr: %d\n",
1149 txq_id, fifo, ssn & 0xff);
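/*
 * Illustrative example (register layout assumed from the SCD definitions):
 * with frame_limit = 64 the second context dword written above packs the
 * same value into both fields, roughly
 *	(64 << SCD_QUEUE_CTX_REG2_WIN_SIZE_POS) |
 *	(64 << SCD_QUEUE_CTX_REG2_FRAME_LIMIT_POS)
 * after masking, so the aggregation window and the frame limit are kept
 * equal for this queue.
 */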
1152 void iwl_trans_pcie_txq_disable(struct iwl_trans *trans, int txq_id)
1154 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
1155 u32 stts_addr = trans_pcie->scd_base_addr +
1156 SCD_TX_STTS_QUEUE_OFFSET(txq_id);
1157 static const u32 zero_val[4] = {};
1160 * Upon HW Rfkill - we stop the device, and then stop the queues
1161 * in the op_mode. Just for the sake of the simplicity of the op_mode,
1162 * allow the op_mode to call txq_disable after it already called stop_device.
1165 if (!test_and_clear_bit(txq_id, trans_pcie->queue_used)) {
1166 WARN_ONCE(test_bit(STATUS_DEVICE_ENABLED, &trans->status),
1167 "queue %d not used", txq_id);
1171 iwl_pcie_txq_set_inactive(trans, txq_id);
1173 iwl_trans_write_mem(trans, stts_addr, (void *)zero_val,
1174 ARRAY_SIZE(zero_val));
1176 iwl_pcie_txq_unmap(trans, txq_id);
1177 trans_pcie->txq[txq_id].ampdu = false;
1179 IWL_DEBUG_TX_QUEUES(trans, "Deactivate queue %d\n", txq_id);
1182 /*************** HOST COMMAND QUEUE FUNCTIONS *****/
1185 * iwl_pcie_enqueue_hcmd - enqueue a uCode command
1186 * @priv: device private data pointer
1187 * @cmd: a pointer to the ucode command structure
1189 * The function returns < 0 values to indicate that the operation
1190 * failed. On success, it returns the index (>= 0) of the command in the command queue.
1193 static int iwl_pcie_enqueue_hcmd(struct iwl_trans *trans,
1194 struct iwl_host_cmd *cmd)
1196 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
1197 struct iwl_txq *txq = &trans_pcie->txq[trans_pcie->cmd_queue];
1198 struct iwl_queue *q = &txq->q;
1199 struct iwl_device_cmd *out_cmd;
1200 struct iwl_cmd_meta *out_meta;
1201 unsigned long flags;
1202 void *dup_buf = NULL;
1203 dma_addr_t phys_addr;
1205 u16 copy_size, cmd_size, scratch_size;
1206 bool had_nocopy = false;
1209 const u8 *cmddata[IWL_MAX_CMD_TBS_PER_TFD];
1210 u16 cmdlen[IWL_MAX_CMD_TBS_PER_TFD];
1212 copy_size = sizeof(out_cmd->hdr);
1213 cmd_size = sizeof(out_cmd->hdr);
1215 /* need one for the header if the first is NOCOPY */
1216 BUILD_BUG_ON(IWL_MAX_CMD_TBS_PER_TFD > IWL_NUM_OF_TBS - 1);
1218 for (i = 0; i < IWL_MAX_CMD_TBS_PER_TFD; i++) {
1219 cmddata[i] = cmd->data[i];
1220 cmdlen[i] = cmd->len[i];
1225 /* need at least IWL_HCMD_SCRATCHBUF_SIZE copied */
1226 if (copy_size < IWL_HCMD_SCRATCHBUF_SIZE) {
1227 int copy = IWL_HCMD_SCRATCHBUF_SIZE - copy_size;
1229 if (copy > cmdlen[i])
1236 if (cmd->dataflags[i] & IWL_HCMD_DFL_NOCOPY) {
1238 if (WARN_ON(cmd->dataflags[i] & IWL_HCMD_DFL_DUP)) {
1242 } else if (cmd->dataflags[i] & IWL_HCMD_DFL_DUP) {
1244 * This is also a chunk that isn't copied
1245 * to the static buffer so set had_nocopy.
1249 /* only allowed once */
1250 if (WARN_ON(dup_buf)) {
1255 dup_buf = kmemdup(cmddata[i], cmdlen[i],
1260 /* NOCOPY must not be followed by normal! */
1261 if (WARN_ON(had_nocopy)) {
1265 copy_size += cmdlen[i];
1267 cmd_size += cmd->len[i];
1271 * If any of the command structures end up being larger than
1272 * the TFD_MAX_PAYLOAD_SIZE and they aren't dynamically
1273 * allocated into separate TFDs, then we will need to
1274 * increase the size of the buffers.
1276 if (WARN(copy_size > TFD_MAX_PAYLOAD_SIZE,
1277 "Command %s (%#x) is too large (%d bytes)\n",
1278 get_cmd_string(trans_pcie, cmd->id), cmd->id, copy_size)) {
1283 spin_lock_bh(&txq->lock);
1285 if (iwl_queue_space(q) < ((cmd->flags & CMD_ASYNC) ? 2 : 1)) {
1286 spin_unlock_bh(&txq->lock);
1288 IWL_ERR(trans, "No space in command queue\n");
1289 iwl_op_mode_cmd_queue_full(trans->op_mode);
1294 idx = get_cmd_index(q, q->write_ptr);
1295 out_cmd = txq->entries[idx].cmd;
1296 out_meta = &txq->entries[idx].meta;
1298 memset(out_meta, 0, sizeof(*out_meta)); /* re-initialize to NULL */
1299 if (cmd->flags & CMD_WANT_SKB)
1300 out_meta->source = cmd;
1302 /* set up the header */
1304 out_cmd->hdr.cmd = cmd->id;
1305 out_cmd->hdr.flags = 0;
1306 out_cmd->hdr.sequence =
1307 cpu_to_le16(QUEUE_TO_SEQ(trans_pcie->cmd_queue) |
1308 INDEX_TO_SEQ(q->write_ptr));
1310 /* and copy the data that needs to be copied */
1311 cmd_pos = offsetof(struct iwl_device_cmd, payload);
1312 copy_size = sizeof(out_cmd->hdr);
1313 for (i = 0; i < IWL_MAX_CMD_TBS_PER_TFD; i++) {
1319 /* need at least IWL_HCMD_SCRATCHBUF_SIZE copied */
1320 if (copy_size < IWL_HCMD_SCRATCHBUF_SIZE) {
1321 copy = IWL_HCMD_SCRATCHBUF_SIZE - copy_size;
1323 if (copy > cmd->len[i])
1327 /* copy everything if not nocopy/dup */
1328 if (!(cmd->dataflags[i] & (IWL_HCMD_DFL_NOCOPY |
1333 memcpy((u8 *)out_cmd + cmd_pos, cmd->data[i], copy);
1340 "Sending command %s (#%x), seq: 0x%04X, %d bytes at %d[%d]:%d\n",
1341 get_cmd_string(trans_pcie, out_cmd->hdr.cmd),
1342 out_cmd->hdr.cmd, le16_to_cpu(out_cmd->hdr.sequence),
1343 cmd_size, q->write_ptr, idx, trans_pcie->cmd_queue);
1345 /* start the TFD with the scratchbuf */
1346 scratch_size = min_t(int, copy_size, IWL_HCMD_SCRATCHBUF_SIZE);
1347 memcpy(&txq->scratchbufs[q->write_ptr], &out_cmd->hdr, scratch_size);
1348 iwl_pcie_txq_build_tfd(trans, txq,
1349 iwl_pcie_get_scratchbuf_dma(txq, q->write_ptr),
1352 /* map first command fragment, if any remains */
1353 if (copy_size > scratch_size) {
1354 phys_addr = dma_map_single(trans->dev,
1355 ((u8 *)&out_cmd->hdr) + scratch_size,
1356 copy_size - scratch_size,
1358 if (dma_mapping_error(trans->dev, phys_addr)) {
1359 iwl_pcie_tfd_unmap(trans, out_meta,
1360 &txq->tfds[q->write_ptr]);
1365 iwl_pcie_txq_build_tfd(trans, txq, phys_addr,
1366 copy_size - scratch_size, 0);
1369 /* map the remaining (adjusted) nocopy/dup fragments */
1370 for (i = 0; i < IWL_MAX_CMD_TBS_PER_TFD; i++) {
1371 const void *data = cmddata[i];
1375 if (!(cmd->dataflags[i] & (IWL_HCMD_DFL_NOCOPY |
1378 if (cmd->dataflags[i] & IWL_HCMD_DFL_DUP)
1380 phys_addr = dma_map_single(trans->dev, (void *)data,
1381 cmdlen[i], DMA_TO_DEVICE);
1382 if (dma_mapping_error(trans->dev, phys_addr)) {
1383 iwl_pcie_tfd_unmap(trans, out_meta,
1384 &txq->tfds[q->write_ptr]);
1389 iwl_pcie_txq_build_tfd(trans, txq, phys_addr, cmdlen[i], 0);
1392 out_meta->flags = cmd->flags;
1393 if (WARN_ON_ONCE(txq->entries[idx].free_buf))
1394 kfree(txq->entries[idx].free_buf);
1395 txq->entries[idx].free_buf = dup_buf;
1397 txq->need_update = 1;
1399 trace_iwlwifi_dev_hcmd(trans->dev, cmd, cmd_size, &out_cmd->hdr);
1401 /* start timer if queue currently empty */
1402 if (q->read_ptr == q->write_ptr && trans_pcie->wd_timeout)
1403 mod_timer(&txq->stuck_timer, jiffies + trans_pcie->wd_timeout);
1405 spin_lock_irqsave(&trans_pcie->reg_lock, flags);
1408 * wake up the NIC to make sure that the firmware will see the host
1409 * command - we will let the NIC sleep once all the host commands returned.
1412 if (!trans_pcie->cmd_in_flight) {
1413 trans_pcie->cmd_in_flight = true;
1414 __iwl_trans_pcie_set_bit(trans, CSR_GP_CNTRL,
1415 CSR_GP_CNTRL_REG_FLAG_MAC_ACCESS_REQ);
1416 ret = iwl_poll_bit(trans, CSR_GP_CNTRL,
1417 CSR_GP_CNTRL_REG_VAL_MAC_ACCESS_EN,
1418 (CSR_GP_CNTRL_REG_FLAG_MAC_CLOCK_READY |
1419 CSR_GP_CNTRL_REG_FLAG_GOING_TO_SLEEP),
1422 __iwl_trans_pcie_clear_bit(trans, CSR_GP_CNTRL,
1423 CSR_GP_CNTRL_REG_FLAG_MAC_ACCESS_REQ);
1424 spin_unlock_irqrestore(&trans_pcie->reg_lock, flags);
1425 trans_pcie->cmd_in_flight = false;
1431 /* Increment and update queue's write index */
1432 q->write_ptr = iwl_queue_inc_wrap(q->write_ptr, q->n_bd);
1433 iwl_pcie_txq_inc_wr_ptr(trans, txq);
1435 spin_unlock_irqrestore(&trans_pcie->reg_lock, flags);
1438 spin_unlock_bh(&txq->lock);
1446 * iwl_pcie_hcmd_complete - Pull unused buffers off the queue and reclaim them
1447 * @rxb: Rx buffer to reclaim
1448 * @handler_status: return value of the handler of the command
1449 * (put in setup_rx_handlers)
1451 * If an Rx buffer has an async callback associated with it the callback
1452 * will be executed. The attached skb (if present) will only be freed
1453 * if the callback returns 1
1455 void iwl_pcie_hcmd_complete(struct iwl_trans *trans,
1456 struct iwl_rx_cmd_buffer *rxb, int handler_status)
1458 struct iwl_rx_packet *pkt = rxb_addr(rxb);
1459 u16 sequence = le16_to_cpu(pkt->hdr.sequence);
1460 int txq_id = SEQ_TO_QUEUE(sequence);
1461 int index = SEQ_TO_INDEX(sequence);
1463 struct iwl_device_cmd *cmd;
1464 struct iwl_cmd_meta *meta;
1465 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
1466 struct iwl_txq *txq = &trans_pcie->txq[trans_pcie->cmd_queue];
1468 /* If a Tx command is being handled and it isn't in the actual
1469 * command queue then a command routing bug has been introduced
1470 * in the queue management code. */
1471 if (WARN(txq_id != trans_pcie->cmd_queue,
1472 "wrong command queue %d (should be %d), sequence 0x%X readp=%d writep=%d\n",
1473 txq_id, trans_pcie->cmd_queue, sequence,
1474 trans_pcie->txq[trans_pcie->cmd_queue].q.read_ptr,
1475 trans_pcie->txq[trans_pcie->cmd_queue].q.write_ptr)) {
1476 iwl_print_hex_error(trans, pkt, 32);
1480 spin_lock_bh(&txq->lock);
1482 cmd_index = get_cmd_index(&txq->q, index);
1483 cmd = txq->entries[cmd_index].cmd;
1484 meta = &txq->entries[cmd_index].meta;
1486 iwl_pcie_tfd_unmap(trans, meta, &txq->tfds[index]);
1488 /* Input error checking is done when commands are added to queue. */
1489 if (meta->flags & CMD_WANT_SKB) {
1490 struct page *p = rxb_steal_page(rxb);
1492 meta->source->resp_pkt = pkt;
1493 meta->source->_rx_page_addr = (unsigned long)page_address(p);
1494 meta->source->_rx_page_order = trans_pcie->rx_page_order;
1495 meta->source->handler_status = handler_status;
1498 iwl_pcie_cmdq_reclaim(trans, txq_id, index);
1500 if (!(meta->flags & CMD_ASYNC)) {
1501 if (!test_bit(STATUS_SYNC_HCMD_ACTIVE, &trans->status)) {
1503 "HCMD_ACTIVE already clear for command %s\n",
1504 get_cmd_string(trans_pcie, cmd->hdr.cmd));
1506 clear_bit(STATUS_SYNC_HCMD_ACTIVE, &trans->status);
1507 IWL_DEBUG_INFO(trans, "Clearing HCMD_ACTIVE for command %s\n",
1508 get_cmd_string(trans_pcie, cmd->hdr.cmd));
1509 wake_up(&trans_pcie->wait_command_queue);
1514 spin_unlock_bh(&txq->lock);
1517 #define HOST_COMPLETE_TIMEOUT (2 * HZ)
1519 static int iwl_pcie_send_hcmd_async(struct iwl_trans *trans,
1520 struct iwl_host_cmd *cmd)
1522 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
1525 /* An asynchronous command can not expect an SKB to be set. */
1526 if (WARN_ON(cmd->flags & CMD_WANT_SKB))
1529 ret = iwl_pcie_enqueue_hcmd(trans, cmd);
1532 "Error sending %s: enqueue_hcmd failed: %d\n",
1533 get_cmd_string(trans_pcie, cmd->id), ret);
1539 static int iwl_pcie_send_hcmd_sync(struct iwl_trans *trans,
1540 struct iwl_host_cmd *cmd)
1542 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
1546 IWL_DEBUG_INFO(trans, "Attempting to send sync command %s\n",
1547 get_cmd_string(trans_pcie, cmd->id));
1549 if (WARN(test_and_set_bit(STATUS_SYNC_HCMD_ACTIVE,
1551 "Command %s: a command is already active!\n",
1552 get_cmd_string(trans_pcie, cmd->id)))
1555 IWL_DEBUG_INFO(trans, "Setting HCMD_ACTIVE for command %s\n",
1556 get_cmd_string(trans_pcie, cmd->id));
1558 cmd_idx = iwl_pcie_enqueue_hcmd(trans, cmd);
1561 clear_bit(STATUS_SYNC_HCMD_ACTIVE, &trans->status);
1563 "Error sending %s: enqueue_hcmd failed: %d\n",
1564 get_cmd_string(trans_pcie, cmd->id), ret);
1568 ret = wait_event_timeout(trans_pcie->wait_command_queue,
1569 !test_bit(STATUS_SYNC_HCMD_ACTIVE,
1571 HOST_COMPLETE_TIMEOUT);
1573 struct iwl_txq *txq = &trans_pcie->txq[trans_pcie->cmd_queue];
1574 struct iwl_queue *q = &txq->q;
1576 IWL_ERR(trans, "Error sending %s: time out after %dms.\n",
1577 get_cmd_string(trans_pcie, cmd->id),
1578 jiffies_to_msecs(HOST_COMPLETE_TIMEOUT));
1580 IWL_ERR(trans, "Current CMD queue read_ptr %d write_ptr %d\n",
1581 q->read_ptr, q->write_ptr);
1583 clear_bit(STATUS_SYNC_HCMD_ACTIVE, &trans->status);
1584 IWL_DEBUG_INFO(trans, "Clearing HCMD_ACTIVE for command %s\n",
1585 get_cmd_string(trans_pcie, cmd->id));
1588 iwl_trans_fw_error(trans);
1593 if (test_bit(STATUS_FW_ERROR, &trans->status)) {
1594 IWL_ERR(trans, "FW error in SYNC CMD %s\n",
1595 get_cmd_string(trans_pcie, cmd->id));
1601 if (!(cmd->flags & CMD_SEND_IN_RFKILL) &&
1602 test_bit(STATUS_RFKILL, &trans->status)) {
1603 IWL_DEBUG_RF_KILL(trans, "RFKILL in SYNC CMD... no rsp\n");
1608 if ((cmd->flags & CMD_WANT_SKB) && !cmd->resp_pkt) {
1609 IWL_ERR(trans, "Error: Response NULL in '%s'\n",
1610 get_cmd_string(trans_pcie, cmd->id));
1618 if (cmd->flags & CMD_WANT_SKB) {
1620 * Cancel the CMD_WANT_SKB flag for the cmd in the
1621 * TX cmd queue. Otherwise in case the cmd comes
1622 * in later, it will possibly set an invalid
1623 * address (cmd->meta.source).
1625 trans_pcie->txq[trans_pcie->cmd_queue].
1626 entries[cmd_idx].meta.flags &= ~CMD_WANT_SKB;
1629 if (cmd->resp_pkt) {
1631 cmd->resp_pkt = NULL;
1637 int iwl_trans_pcie_send_hcmd(struct iwl_trans *trans, struct iwl_host_cmd *cmd)
1639 if (!(cmd->flags & CMD_SEND_IN_RFKILL) &&
1640 test_bit(STATUS_RFKILL, &trans->status)) {
1641 IWL_DEBUG_RF_KILL(trans, "Dropping CMD 0x%x: RF KILL\n",
1646 if (cmd->flags & CMD_ASYNC)
1647 return iwl_pcie_send_hcmd_async(trans, cmd);
1649 /* We still can fail on RFKILL that can be asserted while we wait */
1650 return iwl_pcie_send_hcmd_sync(trans, cmd);
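/*
 * Usage sketch (hypothetical caller, for illustration only): an op_mode
 * typically reaches this entry point through the transport ops, e.g.
 *
 *	struct iwl_host_cmd cmd = {
 *		.id = REPLY_EXAMPLE,	(hypothetical command id)
 *		.flags = CMD_WANT_SKB,
 *		.data = { &payload, },
 *		.len = { sizeof(payload), },
 *		.dataflags = { IWL_HCMD_DFL_NOCOPY, },
 *	};
 *	ret = iwl_trans_send_cmd(trans, &cmd);
 *
 * CMD_ASYNC selects the fire-and-forget path above, otherwise the call
 * blocks until iwl_pcie_hcmd_complete() wakes wait_command_queue or
 * HOST_COMPLETE_TIMEOUT expires.
 */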
1653 int iwl_trans_pcie_tx(struct iwl_trans *trans, struct sk_buff *skb,
1654 struct iwl_device_cmd *dev_cmd, int txq_id)
1656 struct iwl_trans_pcie *trans_pcie = IWL_TRANS_GET_PCIE_TRANS(trans);
1657 struct ieee80211_hdr *hdr = (struct ieee80211_hdr *)skb->data;
1658 struct iwl_tx_cmd *tx_cmd = (struct iwl_tx_cmd *)dev_cmd->payload;
1659 struct iwl_cmd_meta *out_meta;
1660 struct iwl_txq *txq;
1661 struct iwl_queue *q;
1662 dma_addr_t tb0_phys, tb1_phys, scratch_phys;
1664 u16 len, tb1_len, tb2_len;
1665 u8 wait_write_ptr = 0;
1666 __le16 fc = hdr->frame_control;
1667 u8 hdr_len = ieee80211_hdrlen(fc);
1670 txq = &trans_pcie->txq[txq_id];
1673 if (WARN_ONCE(!test_bit(txq_id, trans_pcie->queue_used),
1674 "TX on unused queue %d\n", txq_id))
1677 spin_lock(&txq->lock);
1679 /* In AGG mode, the index in the ring must correspond to the WiFi
1680 * sequence number. This is a HW requirement to help the SCD to parse the BA.
1682 * Check here that the packets are in the right place on the ring.
1684 wifi_seq = IEEE80211_SEQ_TO_SN(le16_to_cpu(hdr->seq_ctrl));
1685 WARN_ONCE(txq->ampdu &&
1686 (wifi_seq & 0xff) != q->write_ptr,
1687 "Q: %d WiFi Seq %d tfdNum %d",
1688 txq_id, wifi_seq, q->write_ptr);
1690 /* Set up driver data for this TFD */
1691 txq->entries[q->write_ptr].skb = skb;
1692 txq->entries[q->write_ptr].cmd = dev_cmd;
1694 dev_cmd->hdr.sequence =
1695 cpu_to_le16((u16)(QUEUE_TO_SEQ(txq_id) |
1696 INDEX_TO_SEQ(q->write_ptr)));
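/*
 * Illustrative example: for txq_id 10 and write_ptr 7 the sequence field
 * above becomes (10 << 8) | 7 = 0x0a07, assuming the usual
 * QUEUE_TO_SEQ()/INDEX_TO_SEQ() layout; SEQ_TO_QUEUE() and SEQ_TO_INDEX()
 * in iwl_pcie_hcmd_complete() undo this packing.
 */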
1698 tb0_phys = iwl_pcie_get_scratchbuf_dma(txq, q->write_ptr);
1699 scratch_phys = tb0_phys + sizeof(struct iwl_cmd_header) +
1700 offsetof(struct iwl_tx_cmd, scratch);
1702 tx_cmd->dram_lsb_ptr = cpu_to_le32(scratch_phys);
1703 tx_cmd->dram_msb_ptr = iwl_get_dma_hi_addr(scratch_phys);
1705 /* Set up first empty entry in queue's array of Tx/cmd buffers */
1706 out_meta = &txq->entries[q->write_ptr].meta;
1709 * The second TB (tb1) points to the remainder of the TX command
1710 * and the 802.11 header - dword aligned size
1711 * (This calculation modifies the TX command, so do it before the
1712 * setup of the first TB)
1714 len = sizeof(struct iwl_tx_cmd) + sizeof(struct iwl_cmd_header) +
1715 hdr_len - IWL_HCMD_SCRATCHBUF_SIZE;
1716 tb1_len = ALIGN(len, 4);
1718 /* Tell NIC about any 2-byte padding after MAC header */
1720 tx_cmd->tx_flags |= TX_CMD_FLG_MH_PAD_MSK;
1722 /* The first TB points to the scratchbuf data - min_copy bytes */
1723 memcpy(&txq->scratchbufs[q->write_ptr], &dev_cmd->hdr,
1724 IWL_HCMD_SCRATCHBUF_SIZE);
1725 iwl_pcie_txq_build_tfd(trans, txq, tb0_phys,
1726 IWL_HCMD_SCRATCHBUF_SIZE, 1);
1728 /* there must be data left over for TB1 or this code must be changed */
1729 BUILD_BUG_ON(sizeof(struct iwl_tx_cmd) < IWL_HCMD_SCRATCHBUF_SIZE);
1731 /* map the data for TB1 */
1732 tb1_addr = ((u8 *)&dev_cmd->hdr) + IWL_HCMD_SCRATCHBUF_SIZE;
1733 tb1_phys = dma_map_single(trans->dev, tb1_addr, tb1_len, DMA_TO_DEVICE);
1734 if (unlikely(dma_mapping_error(trans->dev, tb1_phys)))
1736 iwl_pcie_txq_build_tfd(trans, txq, tb1_phys, tb1_len, 0);
1739 * Set up TFD's third entry to point directly to remainder
1740 * of skb, if any (802.11 null frames have no payload).
1742 tb2_len = skb->len - hdr_len;
1744 dma_addr_t tb2_phys = dma_map_single(trans->dev,
1745 skb->data + hdr_len,
1746 tb2_len, DMA_TO_DEVICE);
1747 if (unlikely(dma_mapping_error(trans->dev, tb2_phys))) {
1748 iwl_pcie_tfd_unmap(trans, out_meta,
1749 &txq->tfds[q->write_ptr]);
1752 iwl_pcie_txq_build_tfd(trans, txq, tb2_phys, tb2_len, 0);
1755 /* Set up entry for this TFD in Tx byte-count array */
1756 iwl_pcie_txq_update_byte_cnt_tbl(trans, txq, le16_to_cpu(tx_cmd->len));
1758 trace_iwlwifi_dev_tx(trans->dev, skb,
1759 &txq->tfds[txq->q.write_ptr],
1760 sizeof(struct iwl_tfd),
1761 &dev_cmd->hdr, IWL_HCMD_SCRATCHBUF_SIZE + tb1_len,
1762 skb->data + hdr_len, tb2_len);
1763 trace_iwlwifi_dev_tx_data(trans->dev, skb,
1764 skb->data + hdr_len, tb2_len);
1766 if (!ieee80211_has_morefrags(fc)) {
1767 txq->need_update = 1;
1770 txq->need_update = 0;
1773 /* start timer if queue currently empty */
1774 if (txq->need_update && q->read_ptr == q->write_ptr &&
1775 trans_pcie->wd_timeout)
1776 mod_timer(&txq->stuck_timer, jiffies + trans_pcie->wd_timeout);
1778 /* Tell device the write index *just past* this latest filled TFD */
1779 q->write_ptr = iwl_queue_inc_wrap(q->write_ptr, q->n_bd);
1780 iwl_pcie_txq_inc_wr_ptr(trans, txq);
1783 * At this point the frame is "transmitted" successfully
1784 * and we will get a TX status notification eventually,
1785 * regardless of the value of ret. "ret" only indicates
1786 * whether or not we should update the write pointer.
1788 if (iwl_queue_space(q) < q->high_mark) {
1789 if (wait_write_ptr) {
1790 txq->need_update = 1;
1791 iwl_pcie_txq_inc_wr_ptr(trans, txq);
1793 iwl_stop_queue(trans, txq);
1796 spin_unlock(&txq->lock);
1799 spin_unlock(&txq->lock);