mirror of
https://git.planet-casio.com/Lephenixnoir/gint.git
synced 2025-01-01 06:23:35 +01:00
dma: finalize dma_memset() and dma_memcpy()
Adds support for dma_memcpy(), and uses a proper ILRAM allocation scheme (static linking here) for the temporary buffer in dma_memset().
This commit is contained in:
parent
15558c8fb3
commit
fc7aab6eba
3 changed files with 37 additions and 5 deletions
|
@ -83,16 +83,31 @@ void dma_transfer_noint(int channel, dma_size_t size, uint blocks,
|
|||
//---
|
||||
|
||||
/* dma_memset(): Fast 32-aligned memset
|
||||
This function is your typical memset, except that the destination and size
|
||||
|
||||
This function is your typical memset(), except that the destination and size
|
||||
must be 32-aligned, and that the pattern is 4 bytes instead of one. It is
|
||||
replicated to 32 bytes then used to fill the destination area. This 4-byte
|
||||
fixed size may be lifted in future versions.
|
||||
|
||||
This function cannot be used with virtualized (P0) addresses.
|
||||
|
||||
@dst Destination address (32-aligned)
|
||||
@pattern 4-byte pattern to fill @dst
|
||||
@size Sie of destination area (32-aligned) */
|
||||
void *dma_memset(void *dst, uint32_t pattern, size_t size);
|
||||
|
||||
/* dma_memcpy(): Fast 32-aligned memcpy
|
||||
|
||||
This function works exactly like memcpy(), but it expects 32-aligned source,
|
||||
destination, and size, and uses the DMA to efficiently copy.
|
||||
|
||||
This function cannot be used with virtualized (P0) addresses.
|
||||
|
||||
@dst Destination address (32-aligned)
|
||||
@dst Source addresss (32-aligned)
|
||||
@size Size of region (32-aligned) */
|
||||
void *dma_memcpy(void * restrict dst, const void * restrict src, size_t size);
|
||||
|
||||
#endif /* FXCG50 */
|
||||
|
||||
#endif /* GINT_DMA */
|
||||
|
|
10
src/dma/memcpy.c
Normal file
10
src/dma/memcpy.c
Normal file
|
@ -0,0 +1,10 @@
|
|||
#include <gint/dma.h>
|
||||
|
||||
/* dma_memcpy(): Fast 32-aligned memcpy */
|
||||
void *dma_memcpy(void * restrict dst, const void * restrict src, size_t size)
|
||||
{
|
||||
dma_transfer(1, DMA_32B, size >> 5, src, DMA_INC, dst, DMA_INC);
|
||||
dma_transfer_wait(1);
|
||||
|
||||
return dst;
|
||||
}
|
|
@ -1,13 +1,20 @@
|
|||
#include <gint/dma.h>
|
||||
|
||||
/* Allocate a 32-byte buffer in ILRAM */
|
||||
GALIGNED(32) GILRAM static uint32_t ILbuf[8];
|
||||
|
||||
/* dma_memset(): Fast 32-aligned memset */
|
||||
void *dma_memset(void *dst, uint32_t l, size_t size)
|
||||
{
|
||||
/* TODO: Use a proper IL memory allocation scheme */
|
||||
uint32_t *IL = (void *)0xe5200000;
|
||||
for(int i = 0; i < 8; i++) IL[i] = l;
|
||||
/* Prepare the ILRAM buffer. We need to use ILRAM because the DMA will
|
||||
have to read the operand once per block, as opposed to an assembler
|
||||
routine that would hold it in a register. If we place it in RAM, the
|
||||
DMA will perform twice as many RAM accesses as the handwritten
|
||||
assembler, which would be very slow. By using ILRAM we use two
|
||||
different memory regions, making the DMA faster than the CPU. */
|
||||
for(int i = 0; i < 8; i++) ILbuf[i] = l;
|
||||
|
||||
dma_transfer(1, DMA_32B, size >> 5, IL, DMA_FIXED, dst, DMA_INC);
|
||||
dma_transfer(1, DMA_32B, size >> 5, ILbuf, DMA_FIXED, dst, DMA_INC);
|
||||
dma_transfer_wait(1);
|
||||
return dst;
|
||||
}
|
||||
|
|
Loading…
Reference in a new issue