/*
 * path: root/src/gallium/drivers/cell/spu/spu_shuffle.h
 * blob: 74f2a0b6d2eab008601ab94ef28ff71e134a04f5
 */
#ifndef SPU_SHUFFLE_H
#define SPU_SHUFFLE_H

/*
 * Generate shuffle patterns with minimal fuss.
 *
 * Based on ideas from 
 * http://www.insomniacgames.com/tech/articles/0408/files/shuffles.pdf
 *
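 * A-P select elements 0-15 of the first vector
 * a-p select elements 0-15 of the second vector
 * (the 4-element macros accept only A-D/a-d, the 8-element macros only
 * A-H/a-h, matching the lane rows in the diagram below)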
 *
 * +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
 * |00|01|02|03|04|05|06|07|08|09|0a|0b|0c|0d|0e|0f|
 * +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
 * |          A|          B|          C|          D|
 * +-----+-----+-----+-----+-----+-----+-----+-----+
 * |    A|    B|    C|    D|    E|    F|    G|    H|
 * +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
 * | A| B| C| D| E| F| G| H| I| J| K| L| M| N| O| P|
 * +--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+
 *
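 * x or X produces 0xff in the result (emitted as control byte 0xc0)
 * 8 produces 0x80 in the result (emitted as control byte 0xe0)
 * 0 produces 0x00 in the result (emitted as control byte 0x80)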
 *
 * The macros SHUFFLE4() SHUFFLE8() and SHUFFLE16() provide a const vector 
 * unsigned char literal suitable for use with spu_shuffle().
 *
 * The macros SHUFB4() SHUFB8() and SHUFB16() provide a const qword vector 
 * literal suitable for use with si_shufb().
 *
 *
 * For example :
 * SHUFB4(A,A,A,A)
 * expands to :
 * ((const qword){0,1,2,3,0,1,2,3,0,1,2,3,0,1,2,3})
 * 
 * SHUFFLE8(A,B,a,b,C,c,8,8)
 * expands to :
 * ((const vector unsigned char){0x00,0x01,0x02,0x03,0x10,0x11,0x12,0x13,
 *				 0x04,0x05,0x14,0x15,0xe0,0xe0,0xe0,0xe0})
 *
 */

#include <spu_intrinsics.h>

/*
 * Selectors for the 4-lane macros: every name expands to the four control
 * bytes that fill one 4-byte lane of the shuffle mask.
 */

/* Lanes A-D: bytes 0x00-0x0f, i.e. the first vector. */
#define SHUFFLE_PATTERN_4_A__   0x00, 0x01, 0x02, 0x03
#define SHUFFLE_PATTERN_4_B__   0x04, 0x05, 0x06, 0x07
#define SHUFFLE_PATTERN_4_C__   0x08, 0x09, 0x0a, 0x0b
#define SHUFFLE_PATTERN_4_D__   0x0c, 0x0d, 0x0e, 0x0f

/* Lanes a-d: bytes 0x10-0x1f, i.e. the second vector. */
#define SHUFFLE_PATTERN_4_a__   0x10, 0x11, 0x12, 0x13
#define SHUFFLE_PATTERN_4_b__   0x14, 0x15, 0x16, 0x17
#define SHUFFLE_PATTERN_4_c__   0x18, 0x19, 0x1a, 0x1b
#define SHUFFLE_PATTERN_4_d__   0x1c, 0x1d, 0x1e, 0x1f

/* Constant fills: X and x are synonyms; see the file header for 0 and 8. */
#define SHUFFLE_PATTERN_4_X__   0xc0, 0xc0, 0xc0, 0xc0
#define SHUFFLE_PATTERN_4_x__   0xc0, 0xc0, 0xc0, 0xc0
#define SHUFFLE_PATTERN_4_0__   0x80, 0x80, 0x80, 0x80
#define SHUFFLE_PATTERN_4_8__   0xe0, 0xe0, 0xe0, 0xe0

/*
 * Internal helper: pastes each of the four selector tokens into
 * SHUFFLE_PATTERN_4_<token>__ and joins the results, in argument order,
 * into one comma-separated initializer list.
 */
#define SHUFFLE_VECTOR_4__(w0, w1, w2, w3) \
   SHUFFLE_PATTERN_4_##w0##__, SHUFFLE_PATTERN_4_##w1##__, \
   SHUFFLE_PATTERN_4_##w2##__, SHUFFLE_PATTERN_4_##w3##__

/*
 * SHUFFLE4(w0, w1, w2, w3): const `vector unsigned char` shuffle mask built
 * from four 4-byte lane selectors (A-D, a-d, X/x, 0 or 8), intended for
 * spu_shuffle().
 */
#define SHUFFLE4(w0, w1, w2, w3) \
   ((const vector unsigned char){ SHUFFLE_VECTOR_4__(w0, w1, w2, w3) })

/*
 * SHUFB4(w0, w1, w2, w3): const `qword` shuffle mask built from four 4-byte
 * lane selectors (A-D, a-d, X/x, 0 or 8), intended for si_shufb().
 */
#define SHUFB4(w0, w1, w2, w3) \
   ((const qword){ SHUFFLE_VECTOR_4__(w0, w1, w2, w3) })


/*
 * Selectors for the 8-lane macros: every name expands to the two control
 * bytes that fill one 2-byte lane of the shuffle mask.
 */

/* Lanes A-H: bytes 0x00-0x0f, i.e. the first vector. */
#define SHUFFLE_PATTERN_8_A__   0x00, 0x01
#define SHUFFLE_PATTERN_8_B__   0x02, 0x03
#define SHUFFLE_PATTERN_8_C__   0x04, 0x05
#define SHUFFLE_PATTERN_8_D__   0x06, 0x07
#define SHUFFLE_PATTERN_8_E__   0x08, 0x09
#define SHUFFLE_PATTERN_8_F__   0x0a, 0x0b
#define SHUFFLE_PATTERN_8_G__   0x0c, 0x0d
#define SHUFFLE_PATTERN_8_H__   0x0e, 0x0f

/* Lanes a-h: bytes 0x10-0x1f, i.e. the second vector. */
#define SHUFFLE_PATTERN_8_a__   0x10, 0x11
#define SHUFFLE_PATTERN_8_b__   0x12, 0x13
#define SHUFFLE_PATTERN_8_c__   0x14, 0x15
#define SHUFFLE_PATTERN_8_d__   0x16, 0x17
#define SHUFFLE_PATTERN_8_e__   0x18, 0x19
#define SHUFFLE_PATTERN_8_f__   0x1a, 0x1b
#define SHUFFLE_PATTERN_8_g__   0x1c, 0x1d
#define SHUFFLE_PATTERN_8_h__   0x1e, 0x1f

/* Constant fills: X and x are synonyms; see the file header for 0 and 8. */
#define SHUFFLE_PATTERN_8_X__   0xc0, 0xc0
#define SHUFFLE_PATTERN_8_x__   0xc0, 0xc0
#define SHUFFLE_PATTERN_8_0__   0x80, 0x80
#define SHUFFLE_PATTERN_8_8__   0xe0, 0xe0


/*
 * Internal helper: pastes each of the eight selector tokens into
 * SHUFFLE_PATTERN_8_<token>__ and joins the results, in argument order,
 * into one comma-separated initializer list.
 */
#define SHUFFLE_VECTOR_8__(h0, h1, h2, h3, h4, h5, h6, h7) \
   SHUFFLE_PATTERN_8_##h0##__, SHUFFLE_PATTERN_8_##h1##__, \
   SHUFFLE_PATTERN_8_##h2##__, SHUFFLE_PATTERN_8_##h3##__, \
   SHUFFLE_PATTERN_8_##h4##__, SHUFFLE_PATTERN_8_##h5##__, \
   SHUFFLE_PATTERN_8_##h6##__, SHUFFLE_PATTERN_8_##h7##__

/*
 * SHUFFLE8(h0 .. h7): const `vector unsigned char` shuffle mask built from
 * eight 2-byte lane selectors (A-H, a-h, X/x, 0 or 8), intended for
 * spu_shuffle().
 */
#define SHUFFLE8(h0, h1, h2, h3, h4, h5, h6, h7) \
   ((const vector unsigned char){ \
      SHUFFLE_VECTOR_8__(h0, h1, h2, h3, h4, h5, h6, h7) })

/*
 * SHUFB8(h0 .. h7): const `qword` shuffle mask built from eight 2-byte lane
 * selectors (A-H, a-h, X/x, 0 or 8), intended for si_shufb().
 */
#define SHUFB8(h0, h1, h2, h3, h4, h5, h6, h7) \
   ((const qword){ SHUFFLE_VECTOR_8__(h0, h1, h2, h3, h4, h5, h6, h7) })


/*
 * Selectors for the 16-lane macros: every name expands to the single
 * control byte for one byte of the shuffle mask.
 */

/* Bytes A-P: 0x00-0x0f, i.e. the first vector. */
#define SHUFFLE_PATTERN_16_A__   0x00
#define SHUFFLE_PATTERN_16_B__   0x01
#define SHUFFLE_PATTERN_16_C__   0x02
#define SHUFFLE_PATTERN_16_D__   0x03
#define SHUFFLE_PATTERN_16_E__   0x04
#define SHUFFLE_PATTERN_16_F__   0x05
#define SHUFFLE_PATTERN_16_G__   0x06
#define SHUFFLE_PATTERN_16_H__   0x07
#define SHUFFLE_PATTERN_16_I__   0x08
#define SHUFFLE_PATTERN_16_J__   0x09
#define SHUFFLE_PATTERN_16_K__   0x0a
#define SHUFFLE_PATTERN_16_L__   0x0b
#define SHUFFLE_PATTERN_16_M__   0x0c
#define SHUFFLE_PATTERN_16_N__   0x0d
#define SHUFFLE_PATTERN_16_O__   0x0e
#define SHUFFLE_PATTERN_16_P__   0x0f

/* Bytes a-p: 0x10-0x1f, i.e. the second vector. */
#define SHUFFLE_PATTERN_16_a__   0x10
#define SHUFFLE_PATTERN_16_b__   0x11
#define SHUFFLE_PATTERN_16_c__   0x12
#define SHUFFLE_PATTERN_16_d__   0x13
#define SHUFFLE_PATTERN_16_e__   0x14
#define SHUFFLE_PATTERN_16_f__   0x15
#define SHUFFLE_PATTERN_16_g__   0x16
#define SHUFFLE_PATTERN_16_h__   0x17
#define SHUFFLE_PATTERN_16_i__   0x18
#define SHUFFLE_PATTERN_16_j__   0x19
#define SHUFFLE_PATTERN_16_k__   0x1a
#define SHUFFLE_PATTERN_16_l__   0x1b
#define SHUFFLE_PATTERN_16_m__   0x1c
#define SHUFFLE_PATTERN_16_n__   0x1d
#define SHUFFLE_PATTERN_16_o__   0x1e
#define SHUFFLE_PATTERN_16_p__   0x1f

/* Constant fills: X and x are synonyms; see the file header for 0 and 8. */
#define SHUFFLE_PATTERN_16_X__   0xc0
#define SHUFFLE_PATTERN_16_x__   0xc0
#define SHUFFLE_PATTERN_16_0__   0x80
#define SHUFFLE_PATTERN_16_8__   0xe0

/*
 * Internal helper: pastes each of the sixteen selector tokens into
 * SHUFFLE_PATTERN_16_<token>__ and joins the results, in argument order,
 * into one comma-separated initializer list.
 */
#define SHUFFLE_VECTOR_16__(b0, b1, b2, b3, b4, b5, b6, b7, \
                            b8, b9, b10, b11, b12, b13, b14, b15) \
   SHUFFLE_PATTERN_16_##b0##__,  SHUFFLE_PATTERN_16_##b1##__, \
   SHUFFLE_PATTERN_16_##b2##__,  SHUFFLE_PATTERN_16_##b3##__, \
   SHUFFLE_PATTERN_16_##b4##__,  SHUFFLE_PATTERN_16_##b5##__, \
   SHUFFLE_PATTERN_16_##b6##__,  SHUFFLE_PATTERN_16_##b7##__, \
   SHUFFLE_PATTERN_16_##b8##__,  SHUFFLE_PATTERN_16_##b9##__, \
   SHUFFLE_PATTERN_16_##b10##__, SHUFFLE_PATTERN_16_##b11##__, \
   SHUFFLE_PATTERN_16_##b12##__, SHUFFLE_PATTERN_16_##b13##__, \
   SHUFFLE_PATTERN_16_##b14##__, SHUFFLE_PATTERN_16_##b15##__

/*
 * SHUFFLE16(b0 .. b15): const `vector unsigned char` shuffle mask built from
 * sixteen single-byte selectors (A-P, a-p, X/x, 0 or 8), intended for
 * spu_shuffle().
 */
#define SHUFFLE16(b0, b1, b2, b3, b4, b5, b6, b7, \
                  b8, b9, b10, b11, b12, b13, b14, b15) \
   ((const vector unsigned char){ \
      SHUFFLE_VECTOR_16__(b0, b1, b2, b3, b4, b5, b6, b7, \
                          b8, b9, b10, b11, b12, b13, b14, b15) })

/*
 * SHUFB16(b0 .. b15): const `qword` shuffle mask built from sixteen
 * single-byte selectors (A-P, a-p, X/x, 0 or 8), intended for si_shufb().
 */
#define SHUFB16(b0, b1, b2, b3, b4, b5, b6, b7, \
                b8, b9, b10, b11, b12, b13, b14, b15) \
   ((const qword){ \
      SHUFFLE_VECTOR_16__(b0, b1, b2, b3, b4, b5, b6, b7, \
                          b8, b9, b10, b11, b12, b13, b14, b15) })

#endif