| /* |
| * Copyright (C) 2004, 2007-2010, 2011-2012 Synopsys, Inc. (www.synopsys.com) |
| * |
| * This program is free software; you can redistribute it and/or modify |
| * it under the terms of the GNU General Public License version 2 as |
| * published by the Free Software Foundation. |
| * |
| * vineetg: May 2011 |
| * -Support single cycle endian-swap insn in ARC700 4.10 |
| * |
| * vineetg: June 2009 |
| * -Better htonl implementation (5 instead of 9 ALU instructions) |
| * -Hardware assisted single cycle bswap (Use Case of ARC custom instrn) |
| */ |
| |
| #ifndef __ASM_ARC_SWAB_H |
| #define __ASM_ARC_SWAB_H |
| |
| #include <linux/types.h> |
| |
| /* Native single cycle endian swap insn */ |
| #ifdef CONFIG_ARC_HAS_SWAPE |
| |
| #define __arch_swab32(x) \ |
| ({ \ |
| unsigned int tmp=x; \ |
| __asm__ ( \ |
| "swape %0, %1\n\t" \ |
| :"=r" (tmp) \ |
| :"r" (tmp)); \ |
| tmp; \ |
| }) |
| |
| #else |
| |
| /* Several ways of Endian-Swap Emulation for ARC |
| * 0: kernel generic |
| * 1: ARC optimised "C" |
| * 2: ARC Custom instruction |
| */ |
| #define ARC_BSWAP_TYPE 1 |
| |
| #if (ARC_BSWAP_TYPE == 1) /******* Software only ********/ |
| |
| /* The kernel default implementation of htonl is |
| * return x<<24 | x>>24 | |
| * (x & (__u32)0x0000ff00UL)<<8 | (x & (__u32)0x00ff0000UL)>>8; |
| * |
| * This generates 9 instructions on ARC (excluding the ld/st) |
| * |
| * 8051fd8c: ld r3,[r7,20] ; Mem op : Get the value to be swapped |
| * 8051fd98: asl r5,r3,24 ; get 3rd Byte |
| * 8051fd9c: lsr r2,r3,24 ; get 0th Byte |
| * 8051fda0: and r4,r3,0xff00 |
| * 8051fda8: asl r4,r4,8 ; get 1st Byte |
| * 8051fdac: and r3,r3,0x00ff0000 |
| * 8051fdb4: or r2,r2,r5 ; combine 0th and 3rd Bytes |
| * 8051fdb8: lsr r3,r3,8 ; 2nd Byte at correct place in Dst Reg |
| * 8051fdbc: or r2,r2,r4 ; combine 0th and 3rd Bytes with 1st Byte |
| * 8051fdc0: or r2,r2,r3 ; combine 0th, 3rd, 1st Bytes with 2nd Byte |
| * 8051fdc4: st r2,[r1,20] ; Mem op : save result back to mem |
| * |
| * Joern suggested a better "C" algorithm which is great since |
| * (1) It is portable to any architecure |
| * (2) At the same time it takes advantage of ARC ISA (rotate intrns) |
| */ |
| |
| #define __arch_swab32(x) __extension__ \ |
| ({ unsigned long __swab32_in = (x), __swab32_tmp; \ |
| __swab32_tmp = __swab32_in << 8 | __swab32_in >> 24; /* ror tmp,in,24 */\ |
| __swab32_in = __swab32_in << 24 | __swab32_in >> 8; /* ror in,in,8 */ \ |
| __swab32_tmp ^= __swab32_in; \ |
| __swab32_tmp &= 0xff00ff; \ |
| __swab32_tmp ^ __swab32_in; \ |
| }) |
| |
| #elif (ARC_BSWAP_TYPE == 2) /* Custom single cycle bwap instruction */ |
| |
| #define __arch_swab32(x) \ |
| ({ \ |
| unsigned int tmp=x; \ |
| __asm__ ( \ |
| ".extInstruction bswap, 7, 0x00, SUFFIX_NONE, SYNTAX_2OP \n\t" \ |
| "bswap %0, %1\n\t" \ |
| :"=r" (tmp) \ |
| :"r" (tmp)); \ |
| tmp; \ |
| }) |
| |
| #endif /* ARC_BSWAP_TYPE=zzz */ |
| |
| #endif /* CONFIG_ARC_HAS_SWAPE */ |
| |
| #if !defined(__STRICT_ANSI__) || defined(__KERNEL__) |
| # define __BYTEORDER_HAS_U64__ |
| # define __SWAB_64_THRU_32__ |
| #endif |
| |
| |
| #endif |