|  | /* | 
|  | * Copyright (C) 2008-2009 Michal Simek <monstr@monstr.eu> | 
|  | * Copyright (C) 2008-2009 PetaLogix | 
|  | * Copyright (C) 2007 John Williams | 
|  | * | 
|  | * Reasonably optimised generic C-code for memmove on Microblaze | 
|  | * This is generic C code to do efficient, alignment-aware memmove. | 
|  | * | 
|  | * It is based on demo code originally Copyright 2001 by Intel Corp, taken from | 
|  | * http://www.embedded.com/showArticle.jhtml?articleID=19205567 | 
|  | * | 
|  | * Attempts were made, unsuccessfully, to contact the original | 
|  | * author of this code (Michael Morrow, Intel).  Below is the original | 
|  | * copyright notice. | 
|  | * | 
|  | * This software has been developed by Intel Corporation. | 
|  | * Intel specifically disclaims all warranties, express or | 
|  | * implied, and all liability, including consequential and | 
|  | * other indirect damages, for the use of this program, including | 
|  | * liability for infringement of any proprietary rights, | 
|  | * and including the warranties of merchantability and fitness | 
|  | * for a particular purpose. Intel does not assume any | 
|  | * responsibility for and errors which may appear in this program | 
|  | * not any responsibility to update it. | 
|  | */ | 
|  |  | 
|  | #include <linux/export.h> | 
|  | #include <linux/types.h> | 
|  | #include <linux/stddef.h> | 
|  | #include <linux/compiler.h> | 
|  | #include <linux/string.h> | 
|  |  | 
|  | #ifdef __HAVE_ARCH_MEMMOVE | 
|  | #ifndef CONFIG_OPT_LIB_FUNCTION | 
/*
 * memmove - copy c bytes from v_src to v_dst; the regions may overlap.
 * @v_dst: start of the destination region
 * @v_src: start of the source region
 * @c: number of bytes to copy
 *
 * Plain byte-at-a-time variant.  Returns v_dst.
 */
void *memmove(void *v_dst, const void *v_src, __kernel_size_t c)
{
	const char *from;
	char *to;
	__kernel_size_t left;

	/* An empty request touches nothing. */
	if (c == 0)
		return v_dst;

	/*
	 * Destination at or below the source: hand the job to memcpy().
	 * NOTE(review): for overlapping regions this relies on memcpy()
	 * copying in ascending address order - confirm against the
	 * memcpy() implementation in use.
	 */
	if (!(v_dst > v_src))
		return memcpy(v_dst, v_src, c);

	/*
	 * Destination above the source: start one past the last byte of
	 * each region and walk downwards, so every source byte is read
	 * before the copy can overwrite it.
	 */
	from = (const char *)v_src + c;
	to = (char *)v_dst + c;

	for (left = c; left != 0; left--) {
		to--;
		from--;
		*to = *from;
	}

	return v_dst;
}
|  | #else /* CONFIG_OPT_LIB_FUNCTION */ | 
/*
 * memmove - copy c bytes from v_src to v_dst; the regions may overlap.
 * @v_dst: start of the destination region
 * @v_src: start of the source region
 * @c: number of bytes to copy
 *
 * Returns v_dst.
 *
 * When the destination does not lie above the source the copy is delegated
 * to memcpy().  NOTE(review): for overlapping regions this relies on
 * memcpy() copying in ascending address order - confirm against the memcpy()
 * implementation in use.
 *
 * Otherwise the copy runs downwards from the end of both regions.  For
 * copies of four bytes or more the destination is first brought to a word
 * boundary with byte copies, then whole 32-bit words are stored.  If the
 * source is not word aligned at that point, every stored word is assembled
 * from two neighbouring aligned source words using shifts.  Leftover bytes
 * are copied one at a time.
 */
void *memmove(void *v_dst, const void *v_src, __kernel_size_t c)
{
	const char *src = v_src;
	char *dst = v_dst;
	const uint32_t *i_src;
	uint32_t *i_dst;

	if (!c)
		return v_dst;

	/* Use memcpy when the destination is not above the source */
	if (v_dst <= v_src)
		return memcpy(v_dst, v_src, c);

	/* The following code tries to optimize the copy by using word
	 * accesses. This will work fine if both source and destination are
	 * aligned on the same boundary. However, if they are aligned on
	 * different boundaries shifts will be necessary. This might result in
	 * bad performance on MicroBlaze systems without a barrel shifter.
	 */
	/* FIXME this part needs more test */
	/* Do a descending copy: src/dst point one past the next byte */
	dst += c;
	src += c;

	if (c >= 4) {
		uint32_t value, buf_hold;

		/*
		 * Align the destination to a word boundary with byte copies
		 * (endian independent).  At most three bytes are consumed,
		 * so c cannot underflow here.
		 */
		switch ((unsigned long)dst & 3) {
		case 3:
			*--dst = *--src;
			--c;
			/* fall through */
		case 2:
			*--dst = *--src;
			--c;
			/* fall through */
		case 1:
			*--dst = *--src;
			--c;
			break;
		default:
			break;
		}

		i_dst = (void *)dst;

		/*
		 * Choose a copy scheme based on the source alignment
		 * relative to the (now word aligned) destination.
		 *
		 * In the unaligned cases the source pointer is rounded up to
		 * the next word boundary and aligned words are read
		 * downwards.  buf_hold carries the bytes of the previously
		 * read (higher) word that belong at the high-address end of
		 * the next destination word; the remaining bytes come from
		 * the word read in the current iteration.
		 */
		switch ((unsigned long)src & 3) {
		case 0x0:	/* Both byte offsets are aligned */
			i_src = (const void *)src;

			for (; c >= 4; c -= 4)
				*--i_dst = *--i_src;

			src = (const void *)i_src;
			break;
		case 0x1:	/* Unaligned - Off by 1 */
			/* Word align the source */
			i_src = (const void *)
				(((unsigned long)src + 4) & ~3UL);
#ifndef __MICROBLAZEEL__
			/* Big endian: held byte is the least significant */
			buf_hold = *--i_src >> 24;

			for (; c >= 4; c -= 4) {
				value = *--i_src;
				*--i_dst = value << 8 | buf_hold;
				buf_hold = value >> 24;
			}
#else
			/* Little endian: held byte is the most significant */
			buf_hold = (*--i_src & 0xFF) << 24;

			for (; c >= 4; c -= 4) {
				value = *--i_src;
				*--i_dst = buf_hold |
						((value & 0xFFFFFF00) >> 8);
				buf_hold = (value & 0xFF) << 24;
			}
#endif
			/* Realign the source: one byte of *i_src is still due */
			src = (const void *)i_src;
			src += 1;
			break;
		case 0x2:	/* Unaligned - Off by 2 */
			/* Word align the source */
			i_src = (const void *)
				(((unsigned long)src + 4) & ~3UL);
#ifndef __MICROBLAZEEL__
			/* Big endian: held bytes form the low half-word */
			buf_hold = *--i_src >> 16;

			for (; c >= 4; c -= 4) {
				value = *--i_src;
				*--i_dst = value << 16 | buf_hold;
				buf_hold = value >> 16;
			}
#else
			/* Little endian: held bytes form the high half-word */
			buf_hold = (*--i_src & 0xFFFF) << 16;

			for (; c >= 4; c -= 4) {
				value = *--i_src;
				*--i_dst = buf_hold |
						((value & 0xFFFF0000) >> 16);
				buf_hold = (value & 0xFFFF) << 16;
			}
#endif
			/* Realign the source: two bytes of *i_src are still due */
			src = (const void *)i_src;
			src += 2;
			break;
		case 0x3:	/* Unaligned - Off by 3 */
			/* Word align the source */
			i_src = (const void *)
				(((unsigned long)src + 4) & ~3UL);
#ifndef __MICROBLAZEEL__
			/* Big endian: held bytes are the low three bytes */
			buf_hold = *--i_src >> 8;

			for (; c >= 4; c -= 4) {
				value = *--i_src;
				*--i_dst = value << 24 | buf_hold;
				buf_hold = value >> 8;
			}
#else
			/* Little endian: held bytes are the high three bytes */
			buf_hold = (*--i_src & 0xFFFFFF) << 8;

			for (; c >= 4; c -= 4) {
				value = *--i_src;
				*--i_dst = buf_hold |
						((value & 0xFF000000) >> 24);
				buf_hold = (value & 0xFFFFFF) << 8;
			}
#endif
			/* Realign the source: three bytes of *i_src are still due */
			src = (const void *)i_src;
			src += 3;
			break;
		}
		dst = (void *)i_dst;
	}

	/* Finish off the remaining (at most three) bytes */
	while (c--)
		*--dst = *--src;

	return v_dst;
}
|  | #endif /* CONFIG_OPT_LIB_FUNCTION */ | 
|  | EXPORT_SYMBOL(memmove); | 
|  | #endif /* __HAVE_ARCH_MEMMOVE */ |