/* * TUSB6010 USB 2.0 OTG Dual Role controller OMAP DMA interface * * Copyright (C) 2006 Nokia Corporation * Tony Lindgren * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License version 2 as * published by the Free Software Foundation. */ #include #include #include #include #include #include #include #include #include #include "musbdefs.h" /* * REVISIT: With TUSB2.0 only one dmareq line can be used at a time. * This should get fixed in hardware at some point. */ #define BROKEN_DMAREQ #ifdef BROKEN_DMAREQ #define dmareq_works() 0 #else #define dmareq_works() 1 #endif #define to_chdat(c) (struct tusb_omap_dma_ch *)(c)->pPrivateData #define MAX_DMAREQ 5 /* REVISIT: Really 6, but req5 not OK */ struct tusb_omap_dma_ch { struct musb *musb; void __iomem *tusb_base; unsigned long phys_offset; int epnum; u8 tx; struct musb_hw_ep *hw_ep; int ch; s8 dmareq; s8 sync_dev; struct tusb_omap_dma *tusb_dma; void __iomem *dma_addr; u32 len; u16 packet_sz; u16 transfer_packet_sz; u32 transfer_len; u32 completed_len; }; struct tusb_omap_dma { struct dma_controller controller; struct musb *musb; void __iomem *tusb_base; int ch; s8 dmareq; s8 sync_dev; }; static int tusb_omap_dma_start(struct dma_controller *c) { struct tusb_omap_dma *tusb_dma; tusb_dma = container_of(c, struct tusb_omap_dma, controller); // DBG(3, "ep%i ch: %i\n", chdat->epnum, chdat->ch); return 0; } static int tusb_omap_dma_stop(struct dma_controller *c) { struct tusb_omap_dma *tusb_dma; tusb_dma = container_of(c, struct tusb_omap_dma, controller); // DBG(3, "ep%i ch: %i\n", chdat->epnum, chdat->ch); return 0; } #ifdef BROKEN_DMAREQ /* * Allocate dmareq0 to the current channel unless it's already taken */ static inline int tusb_omap_use_shared_dmareq(struct tusb_omap_dma_ch *chdat) { u32 reg = musb_readl(chdat->tusb_base, TUSB_DMA_EP_MAP); if (reg != 0) { DBG(3, "ep%i dmareq0 is busy for ep%i\n", chdat->epnum, reg & 0xf); return -EAGAIN; } if (chdat->tx) reg = (1 << 4) | chdat->epnum; else reg = chdat->epnum; musb_writel(chdat->tusb_base, TUSB_DMA_EP_MAP, reg); return 0; } static inline void tusb_omap_free_shared_dmareq(struct tusb_omap_dma_ch *chdat) { u32 reg = musb_readl(chdat->tusb_base, TUSB_DMA_EP_MAP); if ((reg & 0xf) != chdat->epnum) { printk(KERN_ERR "ep%i trying to release dmareq0 for ep%i\n", chdat->epnum, reg & 0xf); return; } musb_writel(chdat->tusb_base, TUSB_DMA_EP_MAP, 0); } #else #define tusb_omap_use_shared_dmareq(x, y) do {} while (0) #define tusb_omap_free_shared_dmareq(x, y) do {} while (0) #endif /* * See also musb_dma_completion in plat_uds.c and musb_g_[tx|rx]() in * musb_gadget.c. */ static void tusb_omap_dma_cb(int lch, u16 ch_status, void *data) { struct dma_channel *channel = (struct dma_channel *)data; struct tusb_omap_dma_ch *chdat = to_chdat(channel); struct tusb_omap_dma *tusb_dma = chdat->tusb_dma; struct musb *musb = chdat->musb; struct musb_hw_ep *hw_ep = chdat->hw_ep; void __iomem *ep_conf = hw_ep->conf; void __iomem *musb_base = musb->pRegs; unsigned long remaining, flags; int ch; spin_lock_irqsave(&musb->Lock, flags); if (dmareq_works()) ch = chdat->ch; else ch = tusb_dma->ch; if (ch_status != OMAP_DMA_BLOCK_IRQ) printk(KERN_ERR "TUSB DMA error status: %i\n", ch_status); DBG(2, "ep%i %s dma callback ch: %i status: %x\n", chdat->epnum, chdat->tx ? "tx" : "rx", ch, ch_status); if (chdat->tx) remaining = musb_readl(ep_conf, TUSB_EP_TX_OFFSET); else remaining = musb_readl(ep_conf, TUSB_EP_RX_OFFSET); remaining = TUSB_EP_CONFIG_XFR_SIZE(remaining); channel->dwActualLength = chdat->transfer_len - remaining; DBG(2, "remaining %lu/%u\n", remaining, chdat->transfer_len); if (!dmareq_works()) tusb_omap_free_shared_dmareq(chdat); channel->bStatus = MGC_DMA_STATUS_FREE; /* Handle only RX callbacks here. TX callbacks musb be handled based * on the TUSB DMA status interrupt. * REVISIT: Use both TUSB DMA status interrupt and OMAP DMA callback * interrupt for RX and TX. */ if (!chdat->tx) musb_dma_completion(musb, chdat->epnum, chdat->tx); /* We musb terminate short tx transfers manually by setting TXPKTRDY. * REVISIT: This same problem may occur with other MUSB dma as well. * Easy to test with g_ether by pinging the MUSB board with ping -s54. */ if ((chdat->transfer_len < chdat->packet_sz) || (chdat->transfer_len % chdat->packet_sz != 0)) { u16 csr; if (chdat->tx) { DBG(2, "terminating short tx packet\n"); MGC_SelectEnd(musb_base, chdat->epnum); csr = musb_readw(hw_ep->regs, MGC_O_HDRC_TXCSR); csr |= MGC_M_TXCSR_MODE | MGC_M_TXCSR_TXPKTRDY | MGC_M_TXCSR_P_WZC_BITS; musb_writew(hw_ep->regs, MGC_O_HDRC_TXCSR, csr); } } spin_unlock_irqrestore(&musb->Lock, flags); } static int tusb_omap_dma_program(struct dma_channel *channel, u16 packet_sz, u8 rndis_mode, dma_addr_t dma_addr, u32 len) { struct tusb_omap_dma_ch *chdat = to_chdat(channel); struct tusb_omap_dma *tusb_dma = chdat->tusb_dma; struct musb *musb = chdat->musb; struct musb_hw_ep *hw_ep = chdat->hw_ep; void __iomem *musb_base = musb->pRegs; void __iomem *ep_conf = hw_ep->conf; dma_addr_t fifo = hw_ep->fifo_sync; struct omap_dma_channel_params dma_params; int src_burst, dst_burst; u16 csr; int ch; s8 dmareq; s8 sync_dev; if (unlikely(dma_addr & 0x1)) return FALSE; if (len < 32) return FALSE; if ((len % 32 != 0)) return FALSE; else chdat->transfer_len = len; if (len < packet_sz) chdat->transfer_packet_sz = chdat->transfer_len; else chdat->transfer_packet_sz = packet_sz; if (dmareq_works()) { ch = chdat->ch; dmareq = chdat->dmareq; sync_dev = chdat->sync_dev; } else { if (tusb_omap_use_shared_dmareq(chdat) != 0) { DBG(3, "could not get dma for ep%i\n", chdat->epnum); return FALSE; } if (tusb_dma->ch < 0) { /* REVISIT: This should get blocked earlier, happens * with MSC ErrorRecoveryTest */ WARN_ON(1); return FALSE; } ch = tusb_dma->ch; dmareq = tusb_dma->dmareq; sync_dev = tusb_dma->sync_dev; omap_set_dma_callback(ch, tusb_omap_dma_cb, channel); } chdat->packet_sz = packet_sz; chdat->len = len; channel->dwActualLength = 0; chdat->dma_addr = (void __iomem *)dma_addr; channel->bStatus = MGC_DMA_STATUS_BUSY; /* Since we're recycling dma areas, we need to clean or invalidate */ if (chdat->tx) { consistent_sync(phys_to_virt(dma_addr), len, DMA_TO_DEVICE); } else consistent_sync(phys_to_virt(dma_addr), len, DMA_FROM_DEVICE); /* Use 16-bit transfer if dma_addr is not 32-bit aligned */ if ((dma_addr & 0x3) == 0) { dma_params.data_type = OMAP_DMA_DATA_TYPE_S32; dma_params.elem_count = 8; /* Elements in frame */ } else { dma_params.data_type = OMAP_DMA_DATA_TYPE_S16; dma_params.elem_count = 16; /* Elements in frame */ fifo = hw_ep->fifo_async; } dma_params.frame_count = chdat->transfer_len / 32; /* Burst sz frame */ DBG(2, "ep%i %s dma ch%i dma: %08x len: %u(%u) packet_sz: %i(%i)\n", chdat->epnum, chdat->tx ? "tx" : "rx", ch, dma_addr, chdat->transfer_len, len, chdat->transfer_packet_sz, packet_sz); /* * Prepare omap DMA for transfer */ if (chdat->tx) { dma_params.src_amode = OMAP_DMA_AMODE_POST_INC; dma_params.src_start = (unsigned long)dma_addr; dma_params.src_ei = 0; dma_params.src_fi = 0; dma_params.dst_amode = OMAP_DMA_AMODE_DOUBLE_IDX; dma_params.dst_start = (unsigned long)fifo; dma_params.dst_ei = 1; dma_params.dst_fi = -31; /* Loop 32 byte window */ dma_params.trigger = sync_dev; dma_params.sync_mode = OMAP_DMA_SYNC_FRAME; dma_params.src_or_dst_synch = 0; /* Dest sync */ src_burst = OMAP_DMA_DATA_BURST_16; /* 16x32 read */ dst_burst = OMAP_DMA_DATA_BURST_8; /* 8x32 write */ } else { dma_params.src_amode = OMAP_DMA_AMODE_DOUBLE_IDX; dma_params.src_start = (unsigned long)fifo; dma_params.src_ei = 1; dma_params.src_fi = -31; /* Loop 32 byte window */ dma_params.dst_amode = OMAP_DMA_AMODE_POST_INC; dma_params.dst_start = (unsigned long)dma_addr; dma_params.dst_ei = 0; dma_params.dst_fi = 0; dma_params.trigger = sync_dev; dma_params.sync_mode = OMAP_DMA_SYNC_FRAME; dma_params.src_or_dst_synch = 1; /* Source sync */ src_burst = OMAP_DMA_DATA_BURST_8; /* 8x32 read */ dst_burst = OMAP_DMA_DATA_BURST_16; /* 16x32 write */ } DBG(2, "ep%i %s using %i-bit %s dma from 0x%08lx to 0x%08lx\n", chdat->epnum, chdat->tx ? "tx" : "rx", (dma_params.data_type == OMAP_DMA_DATA_TYPE_S32) ? 32 : 16, ((dma_addr & 0x3) == 0) ? "sync" : "async", dma_params.src_start, dma_params.dst_start); omap_set_dma_params(ch, &dma_params); omap_set_dma_src_burst_mode(ch, src_burst); omap_set_dma_dest_burst_mode(ch, dst_burst); omap_set_dma_write_mode(ch, OMAP_DMA_WRITE_LAST_NON_POSTED); /* * Prepare MUSB for DMA transfer */ if (chdat->tx) { MGC_SelectEnd(musb_base, chdat->epnum); csr = musb_readw(hw_ep->regs, MGC_O_HDRC_TXCSR); csr |= (MGC_M_TXCSR_AUTOSET | MGC_M_TXCSR_DMAENAB | MGC_M_TXCSR_DMAMODE | MGC_M_TXCSR_MODE); csr &= ~MGC_M_TXCSR_P_UNDERRUN; musb_writew(hw_ep->regs, MGC_O_HDRC_TXCSR, csr); } else { MGC_SelectEnd(musb_base, chdat->epnum); csr = musb_readw(hw_ep->regs, MGC_O_HDRC_RXCSR); csr |= MGC_M_RXCSR_DMAENAB; csr &= ~(MGC_M_RXCSR_AUTOCLEAR | MGC_M_RXCSR_DMAMODE); musb_writew(hw_ep->regs, MGC_O_HDRC_RXCSR, csr | MGC_M_RXCSR_P_WZC_BITS); } /* * Start DMA transfer */ omap_start_dma(ch); if (chdat->tx) { /* Send transfer_packet_sz packets at a time */ musb_writel(ep_conf, TUSB_EP_MAX_PACKET_SIZE_OFFSET, chdat->transfer_packet_sz); musb_writel(ep_conf, TUSB_EP_TX_OFFSET, TUSB_EP_CONFIG_XFR_SIZE(chdat->transfer_len)); } else { /* Receive transfer_packet_sz packets at a time */ musb_writel(ep_conf, TUSB_EP_MAX_PACKET_SIZE_OFFSET, chdat->transfer_packet_sz << 16); musb_writel(ep_conf, TUSB_EP_RX_OFFSET, TUSB_EP_CONFIG_XFR_SIZE(chdat->transfer_len)); } return TRUE; } static int tusb_omap_dma_abort(struct dma_channel *channel) { struct tusb_omap_dma_ch *chdat = to_chdat(channel); struct tusb_omap_dma *tusb_dma = chdat->tusb_dma; if (!dmareq_works()) { if (tusb_dma->ch >= 0) { omap_stop_dma(tusb_dma->ch); omap_free_dma(tusb_dma->ch); tusb_dma->ch = -1; } tusb_dma->dmareq = -1; tusb_dma->sync_dev = -1; } channel->bStatus = MGC_DMA_STATUS_FREE; return 0; } static inline int tusb_omap_dma_allocate_dmareq(struct tusb_omap_dma_ch *chdat) { u32 reg = musb_readl(chdat->tusb_base, TUSB_DMA_EP_MAP); int i, dmareq_nr = -1; const int sync_dev[6] = { OMAP24XX_DMA_EXT_DMAREQ0, OMAP24XX_DMA_EXT_DMAREQ1, OMAP24XX_DMA_EXT_DMAREQ2, OMAP24XX_DMA_EXT_DMAREQ3, OMAP24XX_DMA_EXT_DMAREQ4, OMAP24XX_DMA_EXT_DMAREQ5, }; for (i = 0; i < MAX_DMAREQ; i++) { int cur = (reg & (0xf << (i * 5))) >> (i * 5); if (cur == 0) { dmareq_nr = i; break; } } if (dmareq_nr == -1) return -EAGAIN; reg |= (chdat->epnum << (dmareq_nr * 5)); if (chdat->tx) reg |= ((1 << 4) << (dmareq_nr * 5)); musb_writel(chdat->tusb_base, TUSB_DMA_EP_MAP, reg); chdat->dmareq = dmareq_nr; chdat->sync_dev = sync_dev[chdat->dmareq]; return 0; } static inline void tusb_omap_dma_free_dmareq(struct tusb_omap_dma_ch *chdat) { u32 reg; if (!chdat || chdat->dmareq < 0) return; reg = musb_readl(chdat->tusb_base, TUSB_DMA_EP_MAP); reg &= ~(0x1f << (chdat->dmareq * 5)); musb_writel(chdat->tusb_base, TUSB_DMA_EP_MAP, reg); chdat->dmareq = -1; chdat->sync_dev = -1; } static struct dma_channel *dma_channel_pool[MAX_DMAREQ]; static struct dma_channel * tusb_omap_dma_allocate(struct dma_controller *c, struct musb_hw_ep *hw_ep, u8 tx) { int ret, i; const char *dev_name; struct tusb_omap_dma *tusb_dma; struct musb *musb; void __iomem *tusb_base; struct dma_channel *channel = NULL; struct tusb_omap_dma_ch *chdat = NULL; u32 reg; tusb_dma = container_of(c, struct tusb_omap_dma, controller); musb = tusb_dma->musb; tusb_base = musb->ctrl_base; reg = musb_readl(tusb_base, TUSB_DMA_INT_MASK); if (tx) reg &= ~(1 << hw_ep->bLocalEnd); else reg &= ~(1 << (hw_ep->bLocalEnd + 15)); musb_writel(tusb_base, TUSB_DMA_INT_MASK, reg); /* REVISIT: Why does dmareq5 not work? */ if (hw_ep->bLocalEnd == 0) { DBG(3, "Not allowing DMA for ep0 %s\n", tx ? "tx" : "rx"); return NULL; } for (i = 0; i < MAX_DMAREQ; i++) { struct dma_channel *ch = dma_channel_pool[i]; if (ch->bStatus == MGC_DMA_STATUS_UNKNOWN) { ch->bStatus = MGC_DMA_STATUS_FREE; channel = ch; chdat = ch->pPrivateData; break; } } if (!channel) return NULL; if (tx) { chdat->tx = 1; dev_name = "TUSB transmit"; } else { chdat->tx = 0; dev_name = "TUSB receive"; } chdat->musb = tusb_dma->musb; chdat->tusb_base = tusb_dma->tusb_base; chdat->hw_ep = hw_ep; chdat->epnum = hw_ep->bLocalEnd; chdat->dmareq = -1; chdat->completed_len = 0; chdat->tusb_dma = tusb_dma; channel->dwMaxLength = 0x7fffffff; channel->bDesiredMode = 0; channel->dwActualLength = 0; if (dmareq_works()) { ret = tusb_omap_dma_allocate_dmareq(chdat); if (ret != 0) goto free_dmareq; ret = omap_request_dma(chdat->sync_dev, dev_name, tusb_omap_dma_cb, channel, &chdat->ch); if (ret != 0) goto free_dmareq; } else if (tusb_dma->ch == -1) { tusb_dma->dmareq = 0; tusb_dma->sync_dev = OMAP24XX_DMA_EXT_DMAREQ0; /* Callback data gets set later in the shared dmareq case */ ret = omap_request_dma(tusb_dma->sync_dev, "TUSB shared", tusb_omap_dma_cb, NULL, &tusb_dma->ch); if (ret != 0) goto free_dmareq; chdat->dmareq = -1; chdat->ch = -1; } DBG(3, "ep%i %s dma: %s dma%i dmareq%i sync%i\n", chdat->epnum, chdat->tx ? "tx" : "rx", chdat->ch >=0 ? "dedicated" : "shared", chdat->ch >= 0 ? chdat->ch : tusb_dma->ch, chdat->dmareq >= 0 ? chdat->dmareq : tusb_dma->dmareq, chdat->sync_dev >= 0 ? chdat->sync_dev : tusb_dma->sync_dev); return channel; free_dmareq: tusb_omap_dma_free_dmareq(chdat); DBG(3, "ep%i: Could not get a DMA channel\n", chdat->epnum); channel->bStatus = MGC_DMA_STATUS_UNKNOWN; return NULL; } static void tusb_omap_dma_release(struct dma_channel *channel) { struct tusb_omap_dma_ch *chdat = to_chdat(channel); struct musb *musb = chdat->musb; void __iomem *tusb_base = musb->ctrl_base; u32 reg; DBG(3, "ep%i ch%i\n", chdat->epnum, chdat->ch); reg = musb_readl(tusb_base, TUSB_DMA_INT_MASK); if (chdat->tx) reg |= (1 << chdat->epnum); else reg |= (1 << (chdat->epnum + 15)); musb_writel(tusb_base, TUSB_DMA_INT_MASK, reg); reg = musb_readl(tusb_base, TUSB_DMA_INT_CLEAR); if (chdat->tx) reg |= (1 << chdat->epnum); else reg |= (1 << (chdat->epnum + 15)); musb_writel(tusb_base, TUSB_DMA_INT_CLEAR, reg); channel->bStatus = MGC_DMA_STATUS_UNKNOWN; if (chdat->ch >= 0) { omap_stop_dma(chdat->ch); omap_free_dma(chdat->ch); chdat->ch = -1; } if (chdat->dmareq >= 0) tusb_omap_dma_free_dmareq(chdat); channel = NULL; } static void tusb_omap_dma_cleanup(struct dma_controller *c) { struct tusb_omap_dma *tusb_dma; int i; tusb_dma = container_of(c, struct tusb_omap_dma, controller); for (i = 0; i < MAX_DMAREQ; i++) { struct dma_channel *ch = dma_channel_pool[i]; if (ch) { if (ch->pPrivateData) kfree(ch->pPrivateData); kfree(ch); } } if (!dmareq_works() && tusb_dma && tusb_dma->ch >= 0) omap_free_dma(tusb_dma->ch); kfree(tusb_dma); } static struct dma_controller * tusb_omap_dma_init(struct musb *musb, void __iomem *base) { void __iomem *tusb_base = musb->ctrl_base; struct tusb_omap_dma *tusb_dma; int i; /* REVISIT: Get dmareq lines used from board-*.c */ #ifdef CONFIG_ARCH_OMAP2 omap_cfg_reg(AA10_242X_DMAREQ0); omap_cfg_reg(AA6_242X_DMAREQ1); omap_cfg_reg(E4_242X_DMAREQ2); omap_cfg_reg(G4_242X_DMAREQ3); omap_cfg_reg(D3_242X_DMAREQ4); omap_cfg_reg(E3_242X_DMAREQ5); #endif musb_writel(musb->ctrl_base, TUSB_DMA_INT_MASK, 0x7fffffff); musb_writel(musb->ctrl_base, TUSB_DMA_EP_MAP, 0); musb_writel(tusb_base, TUSB_DMA_REQ_CONF, TUSB_DMA_REQ_CONF_BURST_SIZE(2) | TUSB_DMA_REQ_CONF_DMA_REQ_EN(0x3f) | TUSB_DMA_REQ_CONF_DMA_REQ_ASSER(2)); tusb_dma = kzalloc(sizeof(struct tusb_omap_dma), GFP_KERNEL); if (!tusb_dma) goto cleanup; tusb_dma->musb = musb; tusb_dma->tusb_base = musb->ctrl_base; tusb_dma->ch = -1; tusb_dma->dmareq = -1; tusb_dma->sync_dev = -1; tusb_dma->controller.start = tusb_omap_dma_start; tusb_dma->controller.stop = tusb_omap_dma_stop; tusb_dma->controller.channel_alloc = tusb_omap_dma_allocate; tusb_dma->controller.channel_release = tusb_omap_dma_release; tusb_dma->controller.channel_program = tusb_omap_dma_program; tusb_dma->controller.channel_abort = tusb_omap_dma_abort; tusb_dma->controller.pPrivateData = tusb_dma; for (i = 0; i < MAX_DMAREQ; i++) { struct dma_channel *ch; struct tusb_omap_dma_ch *chdat; ch = kzalloc(sizeof(struct dma_channel), GFP_KERNEL); if (!ch) goto cleanup; dma_channel_pool[i] = ch; chdat = kzalloc(sizeof(struct tusb_omap_dma_ch), GFP_KERNEL); if (!chdat) goto cleanup; ch->bStatus = MGC_DMA_STATUS_UNKNOWN; ch->pPrivateData = chdat; } return &tusb_dma->controller; cleanup: tusb_omap_dma_cleanup(&tusb_dma->controller); return NULL; } const struct dma_controller_factory dma_controller_factory = { .create = tusb_omap_dma_init, .destroy = tusb_omap_dma_cleanup, };