[PATCH v8 13/19] swiotlb-xen: use xen_dma_map/unmap_page, xen_dma_sync_single_for_cpu/device
Konrad Rzeszutek Wilk
konrad.wilk at oracle.com
Wed Oct 23 15:51:54 EDT 2013
On Wed, Oct 23, 2013 at 06:20:25PM +0100, Stefano Stabellini wrote:
> On Wed, 23 Oct 2013, Konrad Rzeszutek Wilk wrote:
> > On Thu, Oct 17, 2013 at 06:43:28PM +0100, Stefano Stabellini wrote:
> > > Call xen_dma_map_page, xen_dma_unmap_page, xen_dma_sync_single_for_cpu,
> > > xen_dma_sync_single_for_device from swiotlb-xen to ensure cpu/device
> > > coherency of the pages used for DMA, including the ones belonging to the
> > > swiotlb buffer.
> >
> > You lost me.
> >
> > Isn't it the driver's responsibility to do this?
> >
> > Looking at what 'xen_dma_map_page()' does for x86, it looks like it adds an extra
> > call - page_to_phys - and we ignore its return value here.
>
> map_page on arm performs the cache flushes needed to communicate with
> the device. Same with unmap_page.
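So on ARM I take it this just forwards to the generic dma_map_ops, which
do the cache maintenance - roughly like this (my sketch from reading the
series, not necessarily your exact code):

	/* arch/arm/include/asm/xen/page-coherent.h - rough sketch */
	static inline dma_addr_t xen_dma_map_page(struct device *hwdev,
			struct page *page, unsigned long offset, size_t size,
			enum dma_data_direction dir, struct dma_attrs *attrs)
	{
		/* Dispatches to the native ARM dma_map_ops, which perform
		 * the cache maintenance the device needs. */
		return __generic_dma_ops(hwdev)->map_page(hwdev, page, offset,
							  size, dir, attrs);
	}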
If this is flushing the cache, then I think it makes more sense to do
that without this fancy 'dma_map_page'.
Just call it 'xen_flush_dma_page' and make it a nop on all platforms
except ARM.
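Something along these lines - a hypothetical helper just to illustrate
what I mean; 'xen_flush_dma_page' does not exist anywhere today:

	/* Hypothetical: a flush-only hook instead of a full map_page. */
	static inline void xen_flush_dma_page(struct device *hwdev,
			struct page *page, unsigned long offset, size_t size,
			enum dma_data_direction dir)
	{
		/* nop here on x86; the ARM version would carry the cache
		 * maintenance that xen_dma_map_page does in this series. */
	}

That way the name says what it does, and there is no pretend "mapping"
whose result gets thrown away.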
> On x86 they are basically a nop.

It calls page_to_phys in your patch. That is hardly a nop.
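For reference, the x86 stub in this series looks roughly like this
(quoting from memory, so the exact signature may differ):

	/* arch/x86/include/asm/xen/page-coherent.h - as I read it */
	static inline dma_addr_t xen_dma_map_page(struct device *hwdev,
			struct page *page, unsigned long offset, size_t size,
			enum dma_data_direction dir, struct dma_attrs *attrs)
	{
		/* No cache maintenance on x86, but we still pay for
		 * page_to_phys() even though swiotlb-xen discards the
		 * returned address. */
		return page_to_phys(page) + offset;
	}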
> Only map_page and unmap_page know exactly what needs to be done to
> map a page for dma, this is why we need to call them here.
>
>
> > > Signed-off-by: Stefano Stabellini <stefano.stabellini at eu.citrix.com>
> > > ---
> > > drivers/xen/swiotlb-xen.c | 39 +++++++++++++++++++++++++++++++--------
> > > 1 files changed, 31 insertions(+), 8 deletions(-)
> > >
> > > diff --git a/drivers/xen/swiotlb-xen.c b/drivers/xen/swiotlb-xen.c
> > > index 189b8db..4221cb5 100644
> > > --- a/drivers/xen/swiotlb-xen.c
> > > +++ b/drivers/xen/swiotlb-xen.c
> > > @@ -378,8 +378,13 @@ dma_addr_t xen_swiotlb_map_page(struct device *dev, struct page *page,
> > > * buffering it.
> > > */
> > > if (dma_capable(dev, dev_addr, size) &&
> > > - !range_straddles_page_boundary(phys, size) && !swiotlb_force)
> > > + !range_straddles_page_boundary(phys, size) && !swiotlb_force) {
> > > + /* we are not interested in the dma_addr returned by
> > > + * xen_dma_map_page, only in the potential cache flushes executed
> > > + * by the function. */
> > > + xen_dma_map_page(dev, page, offset, size, dir, attrs);
> > > return dev_addr;
> > > + }
> > >
> > > /*
> > > * Oh well, have to allocate and map a bounce buffer.
> > > @@ -388,6 +393,8 @@ dma_addr_t xen_swiotlb_map_page(struct device *dev, struct page *page,
> > > if (map == SWIOTLB_MAP_ERROR)
> > > return DMA_ERROR_CODE;
> > >
> > > + xen_dma_map_page(dev, pfn_to_page(map >> PAGE_SHIFT),
> > > + map & ~PAGE_MASK, size, dir, attrs);
> > > dev_addr = xen_phys_to_bus(map);
> > >
> > > /*
> > > @@ -410,12 +417,15 @@ EXPORT_SYMBOL_GPL(xen_swiotlb_map_page);
> > > * whatever the device wrote there.
> > > */
> > > static void xen_unmap_single(struct device *hwdev, dma_addr_t dev_addr,
> > > - size_t size, enum dma_data_direction dir)
> > > + size_t size, enum dma_data_direction dir,
> > > + struct dma_attrs *attrs)
> > > {
> > > phys_addr_t paddr = xen_bus_to_phys(dev_addr);
> > >
> > > BUG_ON(dir == DMA_NONE);
> > >
> > > + xen_dma_unmap_page(hwdev, paddr, size, dir, attrs);
> > > +
> > > /* NOTE: We use dev_addr here, not paddr! */
> > > if (is_xen_swiotlb_buffer(dev_addr)) {
> > > swiotlb_tbl_unmap_single(hwdev, paddr, size, dir);
> > > @@ -438,7 +448,7 @@ void xen_swiotlb_unmap_page(struct device *hwdev, dma_addr_t dev_addr,
> > > size_t size, enum dma_data_direction dir,
> > > struct dma_attrs *attrs)
> > > {
> > > - xen_unmap_single(hwdev, dev_addr, size, dir);
> > > + xen_unmap_single(hwdev, dev_addr, size, dir, attrs);
> > > }
> > > EXPORT_SYMBOL_GPL(xen_swiotlb_unmap_page);
> > >
> > > @@ -461,11 +471,15 @@ xen_swiotlb_sync_single(struct device *hwdev, dma_addr_t dev_addr,
> > >
> > > BUG_ON(dir == DMA_NONE);
> > >
> > > + if (target == SYNC_FOR_CPU)
> > > + xen_dma_sync_single_for_cpu(hwdev, paddr, size, dir);
> > > +
> > > /* NOTE: We use dev_addr here, not paddr! */
> > > - if (is_xen_swiotlb_buffer(dev_addr)) {
> > > + if (is_xen_swiotlb_buffer(dev_addr))
> > > swiotlb_tbl_sync_single(hwdev, paddr, size, dir, target);
> > > - return;
> > > - }
> > > +
> > > + if (target == SYNC_FOR_DEVICE)
> > > + xen_dma_sync_single_for_device(hwdev, paddr, size, dir);
> > >
> > > if (dir != DMA_FROM_DEVICE)
> > > return;
> > > @@ -536,8 +550,17 @@ xen_swiotlb_map_sg_attrs(struct device *hwdev, struct scatterlist *sgl,
> > > return DMA_ERROR_CODE;
> > > }
> > > sg->dma_address = xen_phys_to_bus(map);
> > > - } else
> > > + } else {
> > > + /* we are not interested in the dma_addr returned by
> > > + * xen_dma_map_page, only in the potential cache flushes executed
> > > + * by the function. */
> > > + xen_dma_map_page(hwdev, pfn_to_page(paddr >> PAGE_SHIFT),
> > > + paddr & ~PAGE_MASK,
> > > + sg->length,
> > > + dir,
> > > + attrs);
> > > sg->dma_address = dev_addr;
> > > + }
> > > sg_dma_len(sg) = sg->length;
> > > }
> > > return nelems;
> > > @@ -559,7 +582,7 @@ xen_swiotlb_unmap_sg_attrs(struct device *hwdev, struct scatterlist *sgl,
> > > BUG_ON(dir == DMA_NONE);
> > >
> > > for_each_sg(sgl, sg, nelems, i)
> > > - xen_unmap_single(hwdev, sg->dma_address, sg_dma_len(sg), dir);
> > > + xen_unmap_single(hwdev, sg->dma_address, sg_dma_len(sg), dir, attrs);
> > >
> > > }
> > > EXPORT_SYMBOL_GPL(xen_swiotlb_unmap_sg_attrs);
> > > --
> > > 1.7.2.5
> > >
> >