kernel: usb: dwc2 DMA alignment fixes
Add two patches submitted for upstream review that significantly improve the dwc2 driver on openwrt from kernel stability and performance perspectives. Fixes: FS#1367 Signed-off-by: Antti Seppälä <a.seppala@gmail.com>
This commit is contained in:
parent
c79ef6fbe3
commit
9f451ec698
2 changed files with 176 additions and 0 deletions
|
@ -0,0 +1,126 @@
|
|||
From 028c9191bdf88f120f65626920a6a679170fcc3e Mon Sep 17 00:00:00 2001
|
||||
From: =?UTF-8?q?Antti=20Sepp=C3=A4l=C3=A4?= <a.seppala@gmail.com>
|
||||
Date: Thu, 5 Jul 2018 11:37:03 +0300
|
||||
Subject: [PATCH 1/2] usb: dwc2: Fix DMA alignment to start at allocated
|
||||
boundary
|
||||
MIME-Version: 1.0
|
||||
Content-Type: text/plain; charset=UTF-8
|
||||
Content-Transfer-Encoding: 8bit
|
||||
|
||||
The commit 3bc04e28a030 ("usb: dwc2: host: Get aligned DMA in a more
|
||||
supported way") introduced a common way to align DMA allocations.
|
||||
The code in the commit aligns the struct dma_aligned_buffer but the
|
||||
actual DMA address pointed by data[0] gets aligned to an offset from
|
||||
the allocated boundary by the kmalloc_ptr and the old_xfer_buffer
|
||||
pointers.
|
||||
|
||||
This is against the recommendation in Documentation/DMA-API.txt which
|
||||
states:
|
||||
|
||||
Therefore, it is recommended that driver writers who don't take
|
||||
special care to determine the cache line size at run time only map
|
||||
virtual regions that begin and end on page boundaries (which are
|
||||
guaranteed also to be cache line boundaries).
|
||||
|
||||
The effect of this is that architectures with non-coherent DMA caches
|
||||
may run into memory corruption or kernel crashes with Unhandled
|
||||
kernel unaligned accesses exceptions.
|
||||
|
||||
Fix the alignment by positioning the DMA area in front of the allocation
|
||||
and use memory at the end of the area for storing the orginal
|
||||
transfer_buffer pointer. This may have the added benefit of increased
|
||||
performance as the DMA area is now fully aligned on all architectures.
|
||||
|
||||
Tested with Lantiq xRX200 (MIPS) and RPi Model B Rev 2 (ARM).
|
||||
|
||||
Fixes: 3bc04e28a030 ("usb: dwc2: host: Get aligned DMA in a more
|
||||
supported way")
|
||||
|
||||
Signed-off-by: Antti Seppälä <a.seppala@gmail.com>
|
||||
---
|
||||
drivers/usb/dwc2/hcd.c | 44 +++++++++++++++++++++++---------------------
|
||||
1 file changed, 23 insertions(+), 21 deletions(-)
|
||||
|
||||
--- a/drivers/usb/dwc2/hcd.c
|
||||
+++ b/drivers/usb/dwc2/hcd.c
|
||||
@@ -2628,34 +2628,29 @@ static void dwc2_hc_init_xfer(struct dwc
|
||||
|
||||
#define DWC2_USB_DMA_ALIGN 4
|
||||
|
||||
-struct dma_aligned_buffer {
|
||||
- void *kmalloc_ptr;
|
||||
- void *old_xfer_buffer;
|
||||
- u8 data[0];
|
||||
-};
|
||||
-
|
||||
static void dwc2_free_dma_aligned_buffer(struct urb *urb)
|
||||
{
|
||||
- struct dma_aligned_buffer *temp;
|
||||
+ void *stored_xfer_buffer;
|
||||
|
||||
if (!(urb->transfer_flags & URB_ALIGNED_TEMP_BUFFER))
|
||||
return;
|
||||
|
||||
- temp = container_of(urb->transfer_buffer,
|
||||
- struct dma_aligned_buffer, data);
|
||||
+ /* Restore urb->transfer_buffer from the end of the allocated area */
|
||||
+ memcpy(&stored_xfer_buffer, urb->transfer_buffer +
|
||||
+ urb->transfer_buffer_length, sizeof(urb->transfer_buffer));
|
||||
|
||||
if (usb_urb_dir_in(urb))
|
||||
- memcpy(temp->old_xfer_buffer, temp->data,
|
||||
+ memcpy(stored_xfer_buffer, urb->transfer_buffer,
|
||||
urb->transfer_buffer_length);
|
||||
- urb->transfer_buffer = temp->old_xfer_buffer;
|
||||
- kfree(temp->kmalloc_ptr);
|
||||
+ kfree(urb->transfer_buffer);
|
||||
+ urb->transfer_buffer = stored_xfer_buffer;
|
||||
|
||||
urb->transfer_flags &= ~URB_ALIGNED_TEMP_BUFFER;
|
||||
}
|
||||
|
||||
static int dwc2_alloc_dma_aligned_buffer(struct urb *urb, gfp_t mem_flags)
|
||||
{
|
||||
- struct dma_aligned_buffer *temp, *kmalloc_ptr;
|
||||
+ void *kmalloc_ptr;
|
||||
size_t kmalloc_size;
|
||||
|
||||
if (urb->num_sgs || urb->sg ||
|
||||
@@ -2663,22 +2658,29 @@ static int dwc2_alloc_dma_aligned_buffer
|
||||
!((uintptr_t)urb->transfer_buffer & (DWC2_USB_DMA_ALIGN - 1)))
|
||||
return 0;
|
||||
|
||||
- /* Allocate a buffer with enough padding for alignment */
|
||||
+ /*
|
||||
+ * Allocate a buffer with enough padding for original transfer_buffer
|
||||
+ * pointer. This allocation is guaranteed to be aligned properly for
|
||||
+ * DMA
|
||||
+ */
|
||||
kmalloc_size = urb->transfer_buffer_length +
|
||||
- sizeof(struct dma_aligned_buffer) + DWC2_USB_DMA_ALIGN - 1;
|
||||
+ sizeof(urb->transfer_buffer);
|
||||
|
||||
kmalloc_ptr = kmalloc(kmalloc_size, mem_flags);
|
||||
if (!kmalloc_ptr)
|
||||
return -ENOMEM;
|
||||
|
||||
- /* Position our struct dma_aligned_buffer such that data is aligned */
|
||||
- temp = PTR_ALIGN(kmalloc_ptr + 1, DWC2_USB_DMA_ALIGN) - 1;
|
||||
- temp->kmalloc_ptr = kmalloc_ptr;
|
||||
- temp->old_xfer_buffer = urb->transfer_buffer;
|
||||
+ /*
|
||||
+ * Position value of original urb->transfer_buffer pointer to the end
|
||||
+ * of allocation for later referencing
|
||||
+ */
|
||||
+ memcpy(kmalloc_ptr + urb->transfer_buffer_length,
|
||||
+ &urb->transfer_buffer, sizeof(urb->transfer_buffer));
|
||||
+
|
||||
if (usb_urb_dir_out(urb))
|
||||
- memcpy(temp->data, urb->transfer_buffer,
|
||||
+ memcpy(kmalloc_ptr, urb->transfer_buffer,
|
||||
urb->transfer_buffer_length);
|
||||
- urb->transfer_buffer = temp->data;
|
||||
+ urb->transfer_buffer = kmalloc_ptr;
|
||||
|
||||
urb->transfer_flags |= URB_ALIGNED_TEMP_BUFFER;
|
||||
|
|
@ -0,0 +1,50 @@
|
|||
From 81da1738eee68f1961e03bdeb2d60cf0eb4dd713 Mon Sep 17 00:00:00 2001
|
||||
From: =?UTF-8?q?Antti=20Sepp=C3=A4l=C3=A4?= <a.seppala@gmail.com>
|
||||
Date: Thu, 5 Jul 2018 12:06:18 +0300
|
||||
Subject: [PATCH 2/2] usb: dwc2: Fix inefficient copy of unaligned buffers
|
||||
MIME-Version: 1.0
|
||||
Content-Type: text/plain; charset=UTF-8
|
||||
Content-Transfer-Encoding: 8bit
|
||||
|
||||
Make sure only to copy any actual data rather than the whole buffer,
|
||||
when releasing the temporary buffer used for unaligned non-isochronous
|
||||
transfers.
|
||||
|
||||
Taken directly from commit 0efd937e27d5e ("USB: ehci-tegra: fix inefficient
|
||||
copy of unaligned buffers")
|
||||
|
||||
Tested with Lantiq xRX200 (MIPS) and RPi Model B Rev 2 (ARM)
|
||||
|
||||
Signed-off-by: Antti Seppälä <a.seppala@gmail.com>
|
||||
---
|
||||
drivers/usb/dwc2/hcd.c | 12 +++++++++---
|
||||
1 file changed, 9 insertions(+), 3 deletions(-)
|
||||
|
||||
--- a/drivers/usb/dwc2/hcd.c
|
||||
+++ b/drivers/usb/dwc2/hcd.c
|
||||
@@ -2631,6 +2631,7 @@ static void dwc2_hc_init_xfer(struct dwc
|
||||
static void dwc2_free_dma_aligned_buffer(struct urb *urb)
|
||||
{
|
||||
void *stored_xfer_buffer;
|
||||
+ size_t length;
|
||||
|
||||
if (!(urb->transfer_flags & URB_ALIGNED_TEMP_BUFFER))
|
||||
return;
|
||||
@@ -2639,9 +2640,14 @@ static void dwc2_free_dma_aligned_buffer
|
||||
memcpy(&stored_xfer_buffer, urb->transfer_buffer +
|
||||
urb->transfer_buffer_length, sizeof(urb->transfer_buffer));
|
||||
|
||||
- if (usb_urb_dir_in(urb))
|
||||
- memcpy(stored_xfer_buffer, urb->transfer_buffer,
|
||||
- urb->transfer_buffer_length);
|
||||
+ if (usb_urb_dir_in(urb)) {
|
||||
+ if (usb_pipeisoc(urb->pipe))
|
||||
+ length = urb->transfer_buffer_length;
|
||||
+ else
|
||||
+ length = urb->actual_length;
|
||||
+
|
||||
+ memcpy(stored_xfer_buffer, urb->transfer_buffer, length);
|
||||
+ }
|
||||
kfree(urb->transfer_buffer);
|
||||
urb->transfer_buffer = stored_xfer_buffer;
|
||||
|
Loading…
Reference in a new issue