2 * arch/arm/common/dmabounce.c
4 * Special dma_{map/unmap/dma_sync}_* routines for systems that have
5 * limited DMA windows. These functions utilize bounce buffers to
6 * copy data to/from buffers located outside the DMA region. This
7 * only works for systems in which DMA memory is at the bottom of
8 * RAM, the remainder of memory is at the top and the DMA memory
9 * can be marked as ZONE_DMA. Anything beyond that such as discontigous
10 * DMA windows will require custom implementations that reserve memory
11 * areas at early bootup.
13 * Original version by Brad Parker (brad@heeltoe.com)
14 * Re-written by Christopher Hoover <ch@murgatroid.com>
15 * Made generic by Deepak Saxena <dsaxena@plexity.net>
17 * Copyright (C) 2002 Hewlett Packard Company.
18 * Copyright (C) 2004 MontaVista Software, Inc.
20 * This program is free software; you can redistribute it and/or
21 * modify it under the terms of the GNU General Public License
22 * version 2 as published by the Free Software Foundation.
25 #include <linux/module.h>
26 #include <linux/init.h>
27 #include <linux/slab.h>
28 #include <linux/device.h>
29 #include <linux/dma-mapping.h>
30 #include <linux/dmapool.h>
31 #include <linux/list.h>
33 #include <asm/cacheflush.h>
39 #define DO_STATS(X) do { X ; } while (0)
41 #define DO_STATS(X) do { } while (0)
44 /* ************************************************** */
47 struct list_head node;
49 /* original request */
54 /* safe buffer info */
55 struct dmabounce_pool *pool;
57 dma_addr_t safe_dma_addr;
60 struct dmabounce_pool {
62 struct dma_pool *pool;
68 struct dmabounce_device_info {
69 struct list_head node;
72 struct list_head safe_buffers;
74 unsigned long total_allocs;
75 unsigned long map_op_count;
76 unsigned long bounce_count;
78 struct dmabounce_pool small;
79 struct dmabounce_pool large;
84 static LIST_HEAD(dmabounce_devs);
87 static void print_alloc_stats(struct dmabounce_device_info *device_info)
90 "%s: dmabounce: sbp: %lu, lbp: %lu, other: %lu, total: %lu\n",
91 device_info->dev->bus_id,
92 device_info->small.allocs, device_info->large.allocs,
93 device_info->total_allocs - device_info->small.allocs -
94 device_info->large.allocs,
95 device_info->total_allocs);
99 /* find the given device in the dmabounce device list */
100 static inline struct dmabounce_device_info *
101 find_dmabounce_dev(struct device *dev)
103 struct dmabounce_device_info *d;
105 list_for_each_entry(d, &dmabounce_devs, node)
113 /* allocate a 'safe' buffer and keep track of it */
114 static inline struct safe_buffer *
115 alloc_safe_buffer(struct dmabounce_device_info *device_info, void *ptr,
116 size_t size, enum dma_data_direction dir)
118 struct safe_buffer *buf;
119 struct dmabounce_pool *pool;
120 struct device *dev = device_info->dev;
123 dev_dbg(dev, "%s(ptr=%p, size=%d, dir=%d)\n",
124 __func__, ptr, size, dir);
126 if (size <= device_info->small.size) {
127 pool = &device_info->small;
128 } else if (size <= device_info->large.size) {
129 pool = &device_info->large;
134 buf = kmalloc(sizeof(struct safe_buffer), GFP_ATOMIC);
136 dev_warn(dev, "%s: kmalloc failed\n", __func__);
142 buf->direction = dir;
146 buf->safe = dma_pool_alloc(pool->pool, GFP_ATOMIC,
147 &buf->safe_dma_addr);
149 buf->safe = dma_alloc_coherent(dev, size, &buf->safe_dma_addr,
153 if (buf->safe == NULL) {
155 "%s: could not alloc dma memory (size=%d)\n",
164 device_info->total_allocs++;
165 if (device_info->total_allocs % 1000 == 0)
166 print_alloc_stats(device_info);
169 write_lock_irqsave(&device_info->lock, flags);
171 list_add(&buf->node, &device_info->safe_buffers);
173 write_unlock_irqrestore(&device_info->lock, flags);
178 /* determine if a buffer is from our "safe" pool */
179 static inline struct safe_buffer *
180 find_safe_buffer(struct dmabounce_device_info *device_info, dma_addr_t safe_dma_addr)
182 struct safe_buffer *b, *rb = NULL;
185 read_lock_irqsave(&device_info->lock, flags);
187 list_for_each_entry(b, &device_info->safe_buffers, node)
188 if (b->safe_dma_addr == safe_dma_addr) {
193 read_unlock_irqrestore(&device_info->lock, flags);
198 free_safe_buffer(struct dmabounce_device_info *device_info, struct safe_buffer *buf)
202 dev_dbg(device_info->dev, "%s(buf=%p)\n", __func__, buf);
204 write_lock_irqsave(&device_info->lock, flags);
206 list_del(&buf->node);
208 write_unlock_irqrestore(&device_info->lock, flags);
211 dma_pool_free(buf->pool->pool, buf->safe, buf->safe_dma_addr);
213 dma_free_coherent(device_info->dev, buf->size, buf->safe,
219 /* ************************************************** */
222 static void print_map_stats(struct dmabounce_device_info *device_info)
224 dev_info(device_info->dev,
225 "dmabounce: map_op_count=%lu, bounce_count=%lu\n",
226 device_info->map_op_count, device_info->bounce_count);
230 static inline dma_addr_t
231 map_single(struct device *dev, void *ptr, size_t size,
232 enum dma_data_direction dir)
234 struct dmabounce_device_info *device_info = find_dmabounce_dev(dev);
236 int needs_bounce = 0;
239 DO_STATS ( device_info->map_op_count++ );
241 dma_addr = virt_to_dma(dev, ptr);
244 unsigned long mask = *dev->dma_mask;
247 limit = (mask + 1) & ~mask;
248 if (limit && size > limit) {
249 dev_err(dev, "DMA mapping too big (requested %#x "
250 "mask %#Lx)\n", size, *dev->dma_mask);
255 * Figure out if we need to bounce from the DMA mask.
257 needs_bounce = (dma_addr | (dma_addr + size - 1)) & ~mask;
260 if (device_info && (needs_bounce || dma_needs_bounce(dev, dma_addr, size))) {
261 struct safe_buffer *buf;
263 buf = alloc_safe_buffer(device_info, ptr, size, dir);
265 dev_err(dev, "%s: unable to map unsafe buffer %p!\n",
271 "%s: unsafe buffer %p (phy=%p) mapped to %p (phy=%p)\n",
272 __func__, buf->ptr, (void *) virt_to_dma(dev, buf->ptr),
273 buf->safe, (void *) buf->safe_dma_addr);
275 if ((dir == DMA_TO_DEVICE) ||
276 (dir == DMA_BIDIRECTIONAL)) {
277 dev_dbg(dev, "%s: copy unsafe %p to safe %p, size %d\n",
278 __func__, ptr, buf->safe, size);
279 memcpy(buf->safe, ptr, size);
283 dma_addr = buf->safe_dma_addr;
286 * We don't need to sync the DMA buffer since
287 * it was allocated via the coherent allocators.
289 consistent_sync(ptr, size, dir);
296 unmap_single(struct device *dev, dma_addr_t dma_addr, size_t size,
297 enum dma_data_direction dir)
299 struct dmabounce_device_info *device_info = find_dmabounce_dev(dev);
300 struct safe_buffer *buf = NULL;
303 * Trying to unmap an invalid mapping
305 if (dma_mapping_error(dma_addr)) {
306 dev_err(dev, "Trying to unmap invalid mapping\n");
311 buf = find_safe_buffer(device_info, dma_addr);
314 BUG_ON(buf->size != size);
317 "%s: unsafe buffer %p (phy=%p) mapped to %p (phy=%p)\n",
318 __func__, buf->ptr, (void *) virt_to_dma(dev, buf->ptr),
319 buf->safe, (void *) buf->safe_dma_addr);
321 DO_STATS ( device_info->bounce_count++ );
323 if (dir == DMA_FROM_DEVICE || dir == DMA_BIDIRECTIONAL) {
327 "%s: copy back safe %p to unsafe %p size %d\n",
328 __func__, buf->safe, buf->ptr, size);
329 memcpy(buf->ptr, buf->safe, size);
332 * DMA buffers must have the same cache properties
333 * as if they were really used for DMA - which means
334 * data must be written back to RAM. Note that
335 * we don't use dmac_flush_range() here for the
336 * bidirectional case because we know the cache
337 * lines will be coherent with the data written.
339 ptr = (unsigned long)buf->ptr;
340 dmac_clean_range(ptr, ptr + size);
342 free_safe_buffer(device_info, buf);
347 sync_single(struct device *dev, dma_addr_t dma_addr, size_t size,
348 enum dma_data_direction dir)
350 struct dmabounce_device_info *device_info = find_dmabounce_dev(dev);
351 struct safe_buffer *buf = NULL;
354 buf = find_safe_buffer(device_info, dma_addr);
358 * Both of these checks from original code need to be
359 * commented out b/c some drivers rely on the following:
361 * 1) Drivers may map a large chunk of memory into DMA space
362 * but only sync a small portion of it. Good example is
363 * allocating a large buffer, mapping it, and then
364 * breaking it up into small descriptors. No point
365 * in syncing the whole buffer if you only have to
366 * touch one descriptor.
368 * 2) Buffers that are mapped as DMA_BIDIRECTIONAL are
369 * usually only synced in one dir at a time.
371 * See drivers/net/eepro100.c for examples of both cases.
375 * BUG_ON(buf->size != size);
376 * BUG_ON(buf->direction != dir);
380 "%s: unsafe buffer %p (phy=%p) mapped to %p (phy=%p)\n",
381 __func__, buf->ptr, (void *) virt_to_dma(dev, buf->ptr),
382 buf->safe, (void *) buf->safe_dma_addr);
384 DO_STATS ( device_info->bounce_count++ );
387 case DMA_FROM_DEVICE:
389 "%s: copy back safe %p to unsafe %p size %d\n",
390 __func__, buf->safe, buf->ptr, size);
391 memcpy(buf->ptr, buf->safe, size);
395 "%s: copy out unsafe %p to safe %p, size %d\n",
396 __func__,buf->ptr, buf->safe, size);
397 memcpy(buf->safe, buf->ptr, size);
399 case DMA_BIDIRECTIONAL:
400 BUG(); /* is this allowed? what does it mean? */
405 * No need to sync the safe buffer - it was allocated
406 * via the coherent allocators.
409 consistent_sync(dma_to_virt(dev, dma_addr), size, dir);
413 /* ************************************************** */
416 * see if a buffer address is in an 'unsafe' range. if it is
417 * allocate a 'safe' buffer and copy the unsafe buffer into it.
418 * substitute the safe buffer for the unsafe one.
419 * (basically move the buffer from an unsafe area to a safe one)
422 dma_map_single(struct device *dev, void *ptr, size_t size,
423 enum dma_data_direction dir)
427 dev_dbg(dev, "%s(ptr=%p,size=%d,dir=%x)\n",
428 __func__, ptr, size, dir);
430 BUG_ON(dir == DMA_NONE);
432 dma_addr = map_single(dev, ptr, size, dir);
438 * see if a mapped address was really a "safe" buffer and if so, copy
439 * the data from the safe buffer back to the unsafe buffer and free up
440 * the safe buffer. (basically return things back to the way they
445 dma_unmap_single(struct device *dev, dma_addr_t dma_addr, size_t size,
446 enum dma_data_direction dir)
448 dev_dbg(dev, "%s(ptr=%p,size=%d,dir=%x)\n",
449 __func__, (void *) dma_addr, size, dir);
451 BUG_ON(dir == DMA_NONE);
453 unmap_single(dev, dma_addr, size, dir);
457 dma_map_sg(struct device *dev, struct scatterlist *sg, int nents,
458 enum dma_data_direction dir)
462 dev_dbg(dev, "%s(sg=%p,nents=%d,dir=%x)\n",
463 __func__, sg, nents, dir);
465 BUG_ON(dir == DMA_NONE);
467 for (i = 0; i < nents; i++, sg++) {
468 struct page *page = sg->page;
469 unsigned int offset = sg->offset;
470 unsigned int length = sg->length;
471 void *ptr = page_address(page) + offset;
474 map_single(dev, ptr, length, dir);
481 dma_unmap_sg(struct device *dev, struct scatterlist *sg, int nents,
482 enum dma_data_direction dir)
486 dev_dbg(dev, "%s(sg=%p,nents=%d,dir=%x)\n",
487 __func__, sg, nents, dir);
489 BUG_ON(dir == DMA_NONE);
491 for (i = 0; i < nents; i++, sg++) {
492 dma_addr_t dma_addr = sg->dma_address;
493 unsigned int length = sg->length;
495 unmap_single(dev, dma_addr, length, dir);
500 dma_sync_single_for_cpu(struct device *dev, dma_addr_t dma_addr, size_t size,
501 enum dma_data_direction dir)
503 dev_dbg(dev, "%s(ptr=%p,size=%d,dir=%x)\n",
504 __func__, (void *) dma_addr, size, dir);
506 sync_single(dev, dma_addr, size, dir);
510 dma_sync_single_for_device(struct device *dev, dma_addr_t dma_addr, size_t size,
511 enum dma_data_direction dir)
513 dev_dbg(dev, "%s(ptr=%p,size=%d,dir=%x)\n",
514 __func__, (void *) dma_addr, size, dir);
516 sync_single(dev, dma_addr, size, dir);
520 dma_sync_sg_for_cpu(struct device *dev, struct scatterlist *sg, int nents,
521 enum dma_data_direction dir)
525 dev_dbg(dev, "%s(sg=%p,nents=%d,dir=%x)\n",
526 __func__, sg, nents, dir);
528 BUG_ON(dir == DMA_NONE);
530 for (i = 0; i < nents; i++, sg++) {
531 dma_addr_t dma_addr = sg->dma_address;
532 unsigned int length = sg->length;
534 sync_single(dev, dma_addr, length, dir);
539 dma_sync_sg_for_device(struct device *dev, struct scatterlist *sg, int nents,
540 enum dma_data_direction dir)
544 dev_dbg(dev, "%s(sg=%p,nents=%d,dir=%x)\n",
545 __func__, sg, nents, dir);
547 BUG_ON(dir == DMA_NONE);
549 for (i = 0; i < nents; i++, sg++) {
550 dma_addr_t dma_addr = sg->dma_address;
551 unsigned int length = sg->length;
553 sync_single(dev, dma_addr, length, dir);
558 dmabounce_init_pool(struct dmabounce_pool *pool, struct device *dev, const char *name,
562 DO_STATS(pool->allocs = 0);
563 pool->pool = dma_pool_create(name, dev, size,
564 0 /* byte alignment */,
565 0 /* no page-crossing issues */);
567 return pool->pool ? 0 : -ENOMEM;
571 dmabounce_register_dev(struct device *dev, unsigned long small_buffer_size,
572 unsigned long large_buffer_size)
574 struct dmabounce_device_info *device_info;
577 device_info = kmalloc(sizeof(struct dmabounce_device_info), GFP_ATOMIC);
580 "Could not allocated dmabounce_device_info for %s",
585 ret = dmabounce_init_pool(&device_info->small, dev,
586 "small_dmabounce_pool", small_buffer_size);
589 "dmabounce: could not allocate DMA pool for %ld byte objects\n",
594 if (large_buffer_size) {
595 ret = dmabounce_init_pool(&device_info->large, dev,
596 "large_dmabounce_pool",
600 "dmabounce: could not allocate DMA pool for %ld byte objects\n",
606 device_info->dev = dev;
607 INIT_LIST_HEAD(&device_info->safe_buffers);
608 rwlock_init(&device_info->lock);
611 device_info->total_allocs = 0;
612 device_info->map_op_count = 0;
613 device_info->bounce_count = 0;
616 list_add(&device_info->node, &dmabounce_devs);
618 printk(KERN_INFO "dmabounce: registered device %s on %s bus\n",
619 dev->bus_id, dev->bus->name);
624 dma_pool_destroy(device_info->small.pool);
631 dmabounce_unregister_dev(struct device *dev)
633 struct dmabounce_device_info *device_info = find_dmabounce_dev(dev);
637 "%s: Never registered with dmabounce but attempting" \
638 "to unregister!\n", dev->bus_id);
642 if (!list_empty(&device_info->safe_buffers)) {
644 "%s: Removing from dmabounce with pending buffers!\n",
649 if (device_info->small.pool)
650 dma_pool_destroy(device_info->small.pool);
651 if (device_info->large.pool)
652 dma_pool_destroy(device_info->large.pool);
655 print_alloc_stats(device_info);
656 print_map_stats(device_info);
659 list_del(&device_info->node);
663 printk(KERN_INFO "dmabounce: device %s on %s bus unregistered\n",
664 dev->bus_id, dev->bus->name);
668 EXPORT_SYMBOL(dma_map_single);
669 EXPORT_SYMBOL(dma_unmap_single);
670 EXPORT_SYMBOL(dma_map_sg);
671 EXPORT_SYMBOL(dma_unmap_sg);
672 EXPORT_SYMBOL(dma_sync_single_for_cpu);
673 EXPORT_SYMBOL(dma_sync_single_for_device);
674 EXPORT_SYMBOL(dma_sync_sg);
675 EXPORT_SYMBOL(dmabounce_register_dev);
676 EXPORT_SYMBOL(dmabounce_unregister_dev);
678 MODULE_AUTHOR("Christopher Hoover <ch@hpl.hp.com>, Deepak Saxena <dsaxena@plexity.net>");
679 MODULE_DESCRIPTION("Special dma_{map/unmap/dma_sync}_* routines for systems with limited DMA windows");
680 MODULE_LICENSE("GPL");