*/
void *memcpy(void *Dest, const void *Src, size_t Num)
{
+// Debug("\nmemcpy:Num=0x%x by %p", Num, __builtin_return_address(0));
if( ((Uint)Dest & 3) || ((Uint)Src & 3) )
__asm__ __volatile__ ("rep movsb" :: "D" (Dest), "S" (Src), "c" (Num));
else {