Changeset 3933 for trunk/lib_ir/s2p.h


Ignore:
Timestamp:
Jul 28, 2014, 1:03:33 PM (5 years ago)
Author:
linmengl
Message:

Implement s2p_bytepack inline in IR; it now gets the same performance results as the SSE2 version.

File:
1 edited

Legend:

Unmodified
Added
Removed
  • trunk/lib_ir/s2p.h

    r3922 r3933  
    2020  BitBlock slli_16(BitBlock a, BitBlock shift_mask);
    2121
    22   BitBlock s2p_step_ir(BitBlock s0, BitBlock s1, BitBlock hi_mask, BitBlock shift_mask, BitBlock *p0, BitBlock *p1);
     22  void s2p_step_ir(BitBlock s0, BitBlock s1, BitBlock hi_mask, BitBlock shift_mask, BitBlock *p0, BitBlock *p1);
     23
     24  void s2p_bytepack_ir(BitBlock s0, BitBlock s1, BitBlock s2, BitBlock s3, BitBlock s4, BitBlock s5, BitBlock s6, BitBlock s7, BitBlock* p0, BitBlock* p1, BitBlock* p2, BitBlock* p3, BitBlock* p4, BitBlock* p5, BitBlock* p6, BitBlock* p7);
    2325
    2426  BitBlock const16_1();
     
    3133}
    3234
    33 #define S2P_ALGORITHM s2p_bytepack
     35//S2P_ALGORITHM: s2p_bytepack_inline, written in pure IR in order to use
     36//immediate constants in shifting.
     37#define S2P_ALGORITHM s2p_bytepack_inline
    3438
     39#define s2p_bytepack_inline(s0, s1, s2, s3, s4, s5, s6, s7, p0, p1, p2, p3, p4, p5, p6, p7) \
     40  s2p_bytepack_ir(s0, s1, s2, s3, s4, s5, s6, s7, &p0, &p1, &p2, &p3, &p4, &p5, &p6, &p7)
     41
     42//This macro is deprecated. Use the inline version (s2p_bytepack_inline) instead.
    3543#define s2p_bytepack(s0, s1, s2, s3, s4, s5, s6, s7, p0, p1, p2, p3, p4, p5, p6, p7) \
    3644  do {\
Note: See TracChangeset for help on using the changeset viewer.