1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
|
#!/usr/bin/env python
#
# Copyright 2011 Free Software Foundation, Inc.
#
# This file is part of GNU Radio
#
# GNU Radio is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 3, or (at your option)
# any later version.
#
# GNU Radio is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with GNU Radio; see the file COPYING. If not, write to
# the Free Software Foundation, Inc., 51 Franklin Street,
# Boston, MA 02110-1301, USA.
#
from xml.dom import minidom
# C preamble that make_cpuid_c() places at the very start of the file it
# generates.  The text below is C, not Python:
#   * includes the volk CPU headers and defines the global `volk_cpu` struct;
#   * defines VOLK_CPU_x86 when an x86/x86_64 compiler macro is present;
#   * on x86, maps cpuid_x86()/__xgetbv() onto the GCC (__get_cpuid, inline
#     asm xgetbv for GCC >= 4.4) or MSVC (__cpuid, _xgetbv) primitives and
#     raises #error for any other compiler;
#   * provides cpuid_eax/ebx/ecx/edx(op) helpers returning one register each,
#     and xgetbv(), which returns 0 unless bit 27 of cpuid_ecx(1) is set.
# The leading backslash after the opening quotes suppresses the first newline.
HEADER_TEMPL = """\
/*this file is auto_generated by volk_register.py*/
#include <volk/volk_cpu.h>
#include <volk/volk_config_fixed.h>
struct VOLK_CPU volk_cpu;
#if defined(__i386__) || defined(__x86_64__) || defined(_M_IX86) || defined(_M_X64)
# define VOLK_CPU_x86
#endif
#if defined(VOLK_CPU_x86)
//implement get cpuid for gcc compilers using a copy of cpuid.h
#if defined(__GNUC__)
#include <gcc_x86_cpuid.h>
#define cpuid_x86(op, r) __get_cpuid(op, (unsigned int *)r+0, (unsigned int *)r+1, (unsigned int *)r+2, (unsigned int *)r+3)
/* Return Intel AVX extended CPU capabilities register.
* This function will bomb on non-AVX-capable machines, so
* check for AVX capability before executing.
*/
#if __GNUC__ > 4 || __GNUC__ == 4 && __GNUC_MINOR__ >= 4
static inline unsigned long long _xgetbv(unsigned int index){
unsigned int eax, edx;
__asm__ __volatile__("xgetbv" : "=a"(eax), "=d"(edx) : "c"(index));
return ((unsigned long long)edx << 32) | eax;
}
#define __xgetbv() _xgetbv(0)
#else
#define __xgetbv() 0
#endif
//implement get cpuid for MSVC compilers using __cpuid intrinsic
#elif defined(_MSC_VER)
#include <intrin.h>
#define cpuid_x86(op, r) __cpuid(r, op)
#if defined(_XCR_XFEATURE_ENABLED_MASK)
#define __xgetbv() _xgetbv(_XCR_XFEATURE_ENABLED_MASK)
#else
#define __xgetbv() 0
#endif
#else
#error "A get cpuid for volk is not available on this compiler..."
#endif
static inline unsigned int cpuid_eax(unsigned int op) {
int regs[4];
cpuid_x86 (op, regs);
return regs[0];
}
static inline unsigned int cpuid_ebx(unsigned int op) {
int regs[4];
cpuid_x86 (op, regs);
return regs[1];
}
static inline unsigned int cpuid_ecx(unsigned int op) {
int regs[4];
cpuid_x86 (op, regs);
return regs[2];
}
static inline unsigned int cpuid_edx(unsigned int op) {
int regs[4];
cpuid_x86 (op, regs);
return regs[3];
}
static inline unsigned int xgetbv(void) {
//check to make sure that xgetbv is enabled in OS
int xgetbv_enabled = cpuid_ecx(1) >> 27 & 0x01;
if(xgetbv_enabled == 0) return 0;
return __xgetbv();
}
#endif
"""
def _first_child_text(node, tag):
    """Return the text of the first ``<tag>`` element found under ``node``.

    Returns None when ``node`` has no such descendant element.
    """
    matches = node.getElementsByTagName(tag)
    if not matches:
        return None
    return str(matches[0].firstChild.data)


def make_cpuid_c(dom) :
    """Build the C source text that implements the volk CPU feature probes.

    ``dom`` is an iterable of DOM elements, each carrying a ``name`` and a
    ``type`` attribute.  It is walked exactly once, so a one-shot iterator is
    acceptable.  For every element an ``int i_can_has_<name> ()`` C function
    is generated according to ``type``:

    * ``x86``: always-true on x86 when the ``no_test`` attribute is
      ``"true"``; otherwise a cpuid bit test built from the ``<op>``,
      ``<reg>``, ``<shift>`` and ``<val>`` child elements (plus an optional
      ``<check>``/``<checkval>`` function comparison when ``<op>`` is ``1``).
    * ``powerpc``: true when ``__PPC__`` is defined.
    * ``arm``: scans ``/proc/self/auxv`` for the NEON hardware capability
      (ARM Linux only).
    * ``all``: always true.
    * anything else: always false.

    After the probes, ``volk_cpu_init()`` (stores every probe in
    ``volk_cpu.has_<name>``) and ``volk_get_lvarch()`` (ORs together
    ``has_<name>() << LV_<NAME>``, the name being ``swapcase``d) are
    appended.

    Returns the complete file content as one string, starting with
    ``HEADER_TEMPL``.  Raises ``KeyError`` when an element lacks the
    ``name`` or ``type`` attribute.
    """
    pieces = [HEADER_TEMPL]
    arch_names = []

    for domarch in dom:
        attrs = domarch.attributes
        arch_type = str(attrs["type"].value)
        arch = str(attrs["name"].value)
        arch_names.append(arch)

        if arch_type == "x86":
            no_test = ("no_test" in attrs.keys()
                       and str(attrs["no_test"].value) == "true")
            op = _first_child_text(domarch, "op")
            reg = _first_child_text(domarch, "reg")
            shift = _first_child_text(domarch, "shift")
            val = _first_child_text(domarch, "val")
            check = _first_child_text(domarch, "check")
            checkval = _first_child_text(domarch, "checkval")

            if no_test:
                pieces.append("""\
int i_can_has_%s () {
#if defined(VOLK_CPU_x86)
return 1;
#else
return 0;
#endif
}
""" % (arch))
            elif op == "1":
                pieces.append("""\
int i_can_has_%s () {
#if defined(VOLK_CPU_x86)
unsigned int e%sx = cpuid_e%sx (%s);
int hwcap = (((e%sx >> %s) & 1) == %s);
""" % (arch, reg, reg, op, reg, shift, val))
                # Optional second condition: a C function whose result must
                # equal checkval (only evaluated when the cpuid bit matched).
                if check and checkval:
                    pieces.append("""\
if (hwcap == 0) return 0;
hwcap &= (%s() == %s);
""" % (check, checkval))
                pieces.append("""\
return hwcap;
#else
return 0;
#endif
}
""")
            elif op == "0x80000001":
                # Extended leaf: when the CPU does not implement it the
                # feature bit is treated as 0, hence "val^1".
                pieces.append("""\
int i_can_has_%s () {
#if defined(VOLK_CPU_x86)
unsigned int extended_fct_count = cpuid_eax(0x80000000);
if (extended_fct_count < 0x80000001)
return %s^1;
unsigned int extended_features = cpuid_e%sx (%s);
return ((extended_features >> %s) & 1) == %s;
#else
return 0;
#endif
}
""" % (arch, val, reg, op, shift, val))
            # NOTE: an x86 arch with any other <op> gets no probe function
            # here, although volk_cpu_init() below still references it.
        elif arch_type == "powerpc":
            pieces.append("""\
int i_can_has_%s () {
#ifdef __PPC__
return 1;
#else
return 0;
#endif
}
""" % (arch))
        elif arch_type == "arm":
            # The read loop must stop on a short fread (end of file or
            # error); testing the FILE pointer alone never terminates on a
            # CPU without NEON and re-tests stale buffer contents.
            pieces.append("""\
#if defined(__arm__) && defined(__linux__)
#include <asm/hwcap.h>
#include <linux/auxvec.h>
#include <stdio.h>
#define LOOK_FOR_NEON
#endif
int i_can_has_%s () {
//it's linux-specific, but if you're compiling libvolk for NEON
//on Windows you have other problems
#ifdef LOOK_FOR_NEON
FILE *auxvec_f;
unsigned long auxvec[2];
unsigned int found_neon = 0;
size_t nread = 2;
auxvec_f = fopen("/proc/self/auxv", "rb");
if(!auxvec_f) return 0;
//so auxv is basically 32b of ID and 32b of value
//so it goes like this
while(!found_neon && (nread == 2)) {
nread = fread(auxvec, sizeof(unsigned long), 2, auxvec_f);
if((nread == 2) && (auxvec[0] == AT_HWCAP) && (auxvec[1] & HWCAP_NEON))
found_neon = 1;
}
fclose(auxvec_f);
return found_neon;
#else
return 0;
#endif
}
""" % (arch))
        elif arch_type == "all":
            pieces.append("""\
int i_can_has_%s () {
return 1;
}
""" % (arch))
        else:
            pieces.append("""\
int i_can_has_%s () {
return 0;
}
""" % (arch))

    # volk_cpu_init(): register every probe in the volk_cpu struct.
    pieces.append("void volk_cpu_init() {\n")
    for arch in arch_names:
        pieces.append(" volk_cpu.has_" + arch + " = &i_can_has_" + arch + ";\n")
    pieces.append("}\n\n")

    # volk_get_lvarch(): fold all probe results into one bit mask.
    pieces.append("unsigned int volk_get_lvarch() {\n")
    pieces.append(" unsigned int retval = 0;\n")
    pieces.append(" volk_cpu_init();\n")
    for arch in arch_names:
        pieces.append(" retval += volk_cpu.has_" + arch + "() << LV_" + arch.swapcase() + ";\n")
    pieces.append(" return retval;\n")
    pieces.append("}\n\n")

    return "".join(pieces)
|