1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
|
#
# Copyright 2010 Free Software Foundation, Inc.
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
#
from volk_regexp import *
import string
from emit_omnilog import *
#ok todo list:
#put n_archs into the info struct so it doesn't have to be arch_defs[0].
def make_c(machines, archs, functions, arched_arglist, my_arglist):
tempstring = r"""
// This file is automatically generated by make_c.py.
// Do not edit this file.
"""
tempstring += """
#include <volk/volk_common.h>
#include <volk/volk_machines.h>
#include <volk/volk_registry.h>
#include <volk/volk_typedefs.h>
#include <volk/volk_cpu.h>
#include "volk_rank_archs.h"
#include <volk/volk.h>
#include <stdio.h>
#include <string.h>
"""
tempstring += emit_prolog();
#OK here's the deal. the .h prototypes the functions. the .c impls them as fptrs, can use p_whatever.
#also .c impls the get_machine call
#also .c impls the default call for each fn
#here do static fn get arch
tempstring += r"""
struct volk_machine *get_machine(void) {
extern struct volk_machine volk_machines[];
extern unsigned int n_volk_machines;
static struct volk_machine *machine = NULL;
if(machine != NULL) return machine;
else {
unsigned int max_score = 0;
int i;
for(i=0; i<n_volk_machines; i++) {
if(!(volk_machines[i].caps & (~volk_get_lvarch()))) {
if(volk_machines[i].caps > max_score) {
max_score = volk_machines[i].caps;
machine = &(volk_machines[i]);
}
}
}
printf("Using Volk machine: %s\n", machine->name);
return machine;
}
}
static unsigned int get_index(const char *indices[], unsigned int n_archs, const char *arch_name) {
int i;
for(i=0; i<n_archs; i++) {
if(!strncmp(indices[i], arch_name, 20)) {
return i;
}
}
//something terrible should happen here
printf("Volk warning: no arch found, returning generic impl\n");
return get_index(indices, n_archs, "generic"); //but we'll fake it for now
}
"""
for i in range(len(functions)):
tempstring += "void get_" + functions[i] + replace_arch.sub("", arched_arglist[i]) + "\n"
tempstring += " %s = get_machine()->%s_archs[volk_rank_archs(get_machine()->%s_desc.arch_defs, get_machine()->%s_desc.n_archs, volk_get_lvarch())];\n" % (functions[i], functions[i], functions[i], functions[i])
tempstring += " %s(%s);\n}\n\n" % (functions[i], my_arglist[i])
tempstring += replace_volk.sub("p", functions[i]) + " " + functions[i] + " = &get_" + functions[i] + ";\n\n"
tempstring += "void %s_manual%s\n" % (functions[i], arched_arglist[i])
tempstring += " get_machine()->%s_archs[get_index(get_machine()->%s_desc.indices, get_machine()->%s_desc.n_archs, arch)](%s);\n}\n" % (functions[i], functions[i], functions[i], my_arglist[i])
tempstring += "struct volk_func_desc %s_get_func_desc(void) {\n" % (functions[i])
tempstring += " return get_machine()->%s_desc;\n}\n" % (functions[i])
tempstring += emit_epilog();
return tempstring
|