1 |
1244 |
hpanther |
/* cuc.c -- OpenRISC Custom Unit Compiler
|
2 |
|
|
* Copyright (C) 2002 Marko Mlinar, markom@opencores.org
|
3 |
|
|
*
|
4 |
|
|
* This file is part of OpenRISC 1000 Architectural Simulator.
|
5 |
|
|
*
|
6 |
|
|
* This program is free software; you can redistribute it and/or modify
|
7 |
|
|
* it under the terms of the GNU General Public License as published by
|
8 |
|
|
* the Free Software Foundation; either version 2 of the License, or
|
9 |
|
|
* (at your option) any later version.
|
10 |
|
|
*
|
11 |
|
|
* This program is distributed in the hope that it will be useful,
|
12 |
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
13 |
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
14 |
|
|
* GNU General Public License for more details.
|
15 |
|
|
*
|
16 |
|
|
* You should have received a copy of the GNU General Public License
|
17 |
|
|
* along with this program; if not, write to the Free Software
|
18 |
|
|
* Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. */
|
19 |
|
|
|
20 |
|
|
/* Main file, including code optimization and command prompt */
|
21 |
|
|
|
22 |
|
|
#include <stdio.h>
|
23 |
|
|
#include <stdlib.h>
|
24 |
|
|
#include <stdarg.h>
|
25 |
|
|
#include <assert.h>
|
26 |
|
|
#include <ctype.h>
|
27 |
1308 |
phoenix |
#include <string.h>
|
28 |
|
|
#include <unistd.h>
|
29 |
|
|
|
30 |
1350 |
nogj |
#include "config.h"
|
31 |
|
|
|
32 |
|
|
#ifdef HAVE_INTTYPES_H
|
33 |
|
|
#include <inttypes.h>
|
34 |
|
|
#endif
|
35 |
|
|
|
36 |
|
|
#include "port.h"
|
37 |
|
|
#include "arch.h"
|
38 |
1308 |
phoenix |
#include "abstract.h"
|
39 |
1244 |
hpanther |
#include "sim-config.h"
|
40 |
|
|
#include "cuc.h"
|
41 |
|
|
#include "insn.h"
|
42 |
|
|
#include "profiler.h"
|
43 |
|
|
#include "opcode/or32.h"
|
44 |
|
|
#include "parse.h"
|
45 |
1308 |
phoenix |
#include "debug.h"
|
46 |
1244 |
hpanther |
|
47 |
|
|
FILE *flog;
|
48 |
|
|
int cuc_debug = 0;
|
49 |
|
|
|
50 |
|
|
/* Last used registers by software convention */
|
51 |
|
|
/* Note that r11 is caller saved register, and we can destroy it.
|
52 |
|
|
Due to CUC architecture we must always return something, even garbage (so that
|
53 |
|
|
caller knows, we are finished, when we send acknowledge).
|
54 |
|
|
In case r11 was not used (trivial register assignment) we will remove it later,
|
55 |
|
|
but if we assigned a value to it, it must not be removed, so caller_saved[11] = 0 */
|
56 |
|
|
const int caller_saved[MAX_REGS] = {
|
57 |
|
|
0, 0, 0, 1, 1, 1, 1, 1,
|
58 |
|
|
1, 1, 0, 0, 0, 1, 0, 1,
|
59 |
|
|
0, 1, 0, 1, 0, 1, 0, 1,
|
60 |
|
|
0, 1, 0, 1, 0, 1, 0, 1,
|
61 |
|
|
1, 1};
|
62 |
|
|
|
63 |
|
|
/* returns log2(x) */
|
64 |
|
|
/* Call this log2_int, because there is a library function named log2 */
|
65 |
|
|
int log2_int (unsigned long x)
|
66 |
|
|
{
|
67 |
|
|
int c = 0;
|
68 |
|
|
assert (x >= 0);
|
69 |
|
|
if (!x) return 0; /* not by the book, but practical */
|
70 |
|
|
while (x != 1) x >>= 1, c++;
|
71 |
|
|
return c;
|
72 |
|
|
}
|
73 |
|
|
|
74 |
|
|
/* Does all known instruction optimizations */
|
75 |
|
|
void cuc_optimize (cuc_func *func)
|
76 |
|
|
{
|
77 |
|
|
int modified = 0;
|
78 |
|
|
int first = 1;
|
79 |
|
|
log ("Optimizing.\n");
|
80 |
|
|
do {
|
81 |
|
|
modified = 0;
|
82 |
|
|
clean_deps (func);
|
83 |
|
|
if (cuc_debug >= 6) print_cuc_bb (func, "AFTER_CLEAN_DEPS");
|
84 |
|
|
if (optimize_cmovs (func)) {
|
85 |
|
|
if (cuc_debug >= 6) print_cuc_bb (func, "AFTER_OPT_CMOVS");
|
86 |
|
|
modified = 1;
|
87 |
|
|
}
|
88 |
|
|
if (cuc_debug) cuc_check (func);
|
89 |
|
|
if (optimize_tree (func)) {
|
90 |
|
|
if (cuc_debug >= 6) print_cuc_bb (func, "AFTER_OPT_TREE1");
|
91 |
|
|
modified = 1;
|
92 |
|
|
}
|
93 |
|
|
if (remove_nops (func)) {
|
94 |
|
|
if (cuc_debug >= 6) print_cuc_bb (func, "NO_NOPS");
|
95 |
|
|
modified = 1;
|
96 |
|
|
}
|
97 |
|
|
if (cuc_debug) cuc_check (func);
|
98 |
|
|
if (remove_dead (func)) {
|
99 |
|
|
if (cuc_debug >= 5) print_cuc_bb (func, "AFTER_DEAD");
|
100 |
|
|
modified = 1;
|
101 |
|
|
}
|
102 |
|
|
if (cuc_debug) cuc_check (func);
|
103 |
|
|
if (cse (func)) {
|
104 |
|
|
log ("Common subexpression elimination.\n");
|
105 |
|
|
if (cuc_debug >= 3) print_cuc_bb (func, "AFTER_CSE");
|
106 |
|
|
modified = 1;
|
107 |
|
|
}
|
108 |
|
|
if (first) {
|
109 |
|
|
insert_conditional_facts (func);
|
110 |
|
|
if (cuc_debug >= 3) print_cuc_bb (func, "AFTER_COND_FACT");
|
111 |
|
|
if (cuc_debug) cuc_check (func);
|
112 |
|
|
first = 0;
|
113 |
|
|
}
|
114 |
|
|
if (optimize_bb (func)) {
|
115 |
|
|
if (cuc_debug >= 5) print_cuc_bb (func, "AFTER_OPT_BB");
|
116 |
|
|
modified = 1;
|
117 |
|
|
}
|
118 |
|
|
if (cuc_debug) cuc_check (func);
|
119 |
|
|
if (remove_nops (func)) {
|
120 |
|
|
if (cuc_debug >= 6) print_cuc_bb (func, "NO_NOPS");
|
121 |
|
|
modified = 1;
|
122 |
|
|
}
|
123 |
|
|
if (remove_dead_bb (func)) {
|
124 |
|
|
if (cuc_debug >= 5) print_cuc_bb (func, "AFTER_DEAD_BB");
|
125 |
|
|
modified = 1;
|
126 |
|
|
}
|
127 |
|
|
if (remove_trivial_regs (func)) {
|
128 |
|
|
if (cuc_debug >= 2) print_cuc_bb (func, "AFTER_TRIVIAL");
|
129 |
|
|
modified = 1;
|
130 |
|
|
}
|
131 |
|
|
if (remove_nops (func)) {
|
132 |
|
|
if (cuc_debug >= 6) print_cuc_bb (func, "NO_NOPS");
|
133 |
|
|
modified = 1;
|
134 |
|
|
}
|
135 |
|
|
add_memory_dep (func, func->memory_order);
|
136 |
|
|
if (cuc_debug >= 7) print_cuc_bb (func, "AFTER_MEMORY_DEP");
|
137 |
|
|
add_data_dep (func);
|
138 |
|
|
if (cuc_debug >= 8) print_cuc_bb (func, "AFTER_DATA_DEP");
|
139 |
|
|
if (schedule_memory (func, func->memory_order)) {
|
140 |
|
|
if (cuc_debug >= 7) print_cuc_bb (func, "AFTER_SCHEDULE_MEM");
|
141 |
|
|
modified = 1;
|
142 |
|
|
}
|
143 |
|
|
} while (modified);
|
144 |
|
|
set_io (func);
|
145 |
|
|
#if 0
|
146 |
|
|
detect_max_values (func);
|
147 |
|
|
if (cuc_debug >= 5) print_cuc_bb (func, "AFTER_MAX_VALUES");
|
148 |
|
|
#endif
|
149 |
|
|
}
|
150 |
|
|
|
151 |
|
|
/* Pre/unrolls basic block and optimizes it */
|
152 |
|
|
cuc_timings *preunroll_bb (char *bb_filename, cuc_func *f, cuc_timings *timings, int b, int i, int j)
|
153 |
|
|
{
|
154 |
|
|
cuc_func *func;
|
155 |
|
|
cucdebug (2, "BB%i unroll %i times preroll %i times\n", b, j, i);
|
156 |
|
|
log ("BB%i unroll %i times preroll %i times\n", b, j, i);
|
157 |
|
|
func = preunroll_loop (f, b, i, j, bb_filename);
|
158 |
|
|
if (cuc_debug >= 2) print_cuc_bb (func, "AFTER_PREUNROLL");
|
159 |
|
|
cuc_optimize (func);
|
160 |
|
|
analyse_timings (func, timings);
|
161 |
|
|
|
162 |
|
|
cucdebug (2, "new_time = %i, old_time = %i, size = %f\n",
|
163 |
|
|
timings->new_time, func->orig_time, timings->size);
|
164 |
|
|
log ("new time = %icyc, old_time = %icyc, size = %.0f gates\n",
|
165 |
|
|
timings->new_time, func->orig_time, timings->size);
|
166 |
|
|
//output_verilog (func, argv[1]);
|
167 |
|
|
free_func (func);
|
168 |
|
|
timings->b = b;
|
169 |
|
|
timings->unroll = j;
|
170 |
|
|
timings->preroll = i;
|
171 |
|
|
timings->nshared = 0;
|
172 |
|
|
return timings;
|
173 |
|
|
}
|
174 |
|
|
|
175 |
|
|
/* Simple comparison function */
|
176 |
|
|
int tim_comp (cuc_timings *a, cuc_timings *b)
|
177 |
|
|
{
|
178 |
|
|
if (a->new_time < b->new_time) return -1;
|
179 |
|
|
else if (a->new_time > b->new_time) return 1;
|
180 |
|
|
else return 0;
|
181 |
|
|
}
|
182 |
|
|
|
183 |
|
|
/* Analyses function; done when cuc command is entered in (sim) prompt */
|
184 |
|
|
cuc_func *analyse_function (char *module_name, long orig_time,
|
185 |
|
|
unsigned long start_addr, unsigned long end_addr,
|
186 |
|
|
int memory_order, int num_runs)
|
187 |
|
|
{
|
188 |
|
|
cuc_timings timings;
|
189 |
|
|
cuc_func *func = (cuc_func *) malloc (sizeof (cuc_func));
|
190 |
|
|
cuc_func *saved;
|
191 |
|
|
int b, i, j;
|
192 |
|
|
char tmp1[256];
|
193 |
|
|
char tmp2[256];
|
194 |
|
|
|
195 |
|
|
func->orig_time = orig_time;
|
196 |
|
|
func->start_addr = start_addr;
|
197 |
|
|
func->end_addr = end_addr;
|
198 |
|
|
func->memory_order = memory_order;
|
199 |
|
|
func->nfdeps = 0;
|
200 |
|
|
func->fdeps = NULL;
|
201 |
|
|
func->num_runs = num_runs;
|
202 |
|
|
|
203 |
|
|
sprintf (tmp1, "%s.bin", module_name);
|
204 |
|
|
cucdebug (2, "Loading %s.bin\n", module_name);
|
205 |
|
|
if (cuc_load (tmp1)) {
|
206 |
|
|
free (func);
|
207 |
|
|
return NULL;
|
208 |
|
|
}
|
209 |
|
|
|
210 |
|
|
log ("Detecting basic blocks\n");
|
211 |
|
|
detect_bb (func);
|
212 |
|
|
if (cuc_debug >= 2) print_cuc_insns ("WITH_BB_LIMITS", 0);
|
213 |
|
|
|
214 |
|
|
//sprintf (tmp1, "%s.bin.mp", module_name);
|
215 |
|
|
sprintf (tmp2, "%s.bin.bb", module_name);
|
216 |
|
|
generate_bb_seq (func, config.sim.mprof_fn, tmp2);
|
217 |
|
|
log ("Assuming %i clk cycle load (%i cyc burst)\n", runtime.cuc.mdelay[0], runtime.cuc.mdelay[2]);
|
218 |
|
|
log ("Assuming %i clk cycle store (%i cyc burst)\n", runtime.cuc.mdelay[1], runtime.cuc.mdelay[3]);
|
219 |
|
|
|
220 |
|
|
build_bb (func);
|
221 |
|
|
if (cuc_debug >= 5) print_cuc_bb (func, "AFTER_BUILD_BB");
|
222 |
|
|
reg_dep (func);
|
223 |
|
|
|
224 |
|
|
log ("Detecting dependencies\n");
|
225 |
|
|
if (cuc_debug >= 2) print_cuc_bb (func, "AFTER_REG_DEP");
|
226 |
|
|
cuc_optimize (func);
|
227 |
|
|
|
228 |
|
|
#if 0
|
229 |
|
|
csm (func);
|
230 |
|
|
#endif
|
231 |
|
|
assert (saved = dup_func (func));
|
232 |
|
|
|
233 |
|
|
timings.preroll = timings.unroll = 1;
|
234 |
|
|
timings.nshared = 0;
|
235 |
|
|
|
236 |
|
|
add_latches (func);
|
237 |
|
|
if (cuc_debug >= 1) print_cuc_bb (func, "AFTER_LATCHES");
|
238 |
|
|
analyse_timings (func, &timings);
|
239 |
|
|
|
240 |
|
|
free_func (func);
|
241 |
|
|
log ("Base option: pre%i,un%i,sha%i: %icyc %.1f\n",
|
242 |
|
|
timings.preroll, timings.unroll, timings.nshared, timings.new_time, timings.size);
|
243 |
|
|
saved->timings = timings;
|
244 |
|
|
|
245 |
|
|
#if 1
|
246 |
|
|
/* detect and unroll simple loops */
|
247 |
|
|
for (b = 0; b < saved->num_bb; b++) {
|
248 |
|
|
cuc_timings t[MAX_UNROLL * MAX_PREROLL];
|
249 |
|
|
cuc_timings *ut;
|
250 |
|
|
cuc_timings *cut = &t[0];
|
251 |
|
|
int nt = 1;
|
252 |
|
|
double csize;
|
253 |
|
|
saved->bb[b].selected_tim = -1;
|
254 |
|
|
|
255 |
|
|
/* Is it a loop? */
|
256 |
|
|
if (saved->bb[b].next[0] != b && saved->bb[b].next[1] != b) continue;
|
257 |
|
|
log ("Found loop at BB%x. Trying to unroll.\n", b);
|
258 |
|
|
t[0] = timings;
|
259 |
|
|
t[0].b = b;
|
260 |
|
|
t[0].preroll = 1;
|
261 |
|
|
t[0].unroll = 1;
|
262 |
|
|
t[0].nshared = 0;
|
263 |
|
|
|
264 |
|
|
sprintf (tmp1, "%s.bin.bb", module_name);
|
265 |
|
|
i = 1;
|
266 |
|
|
do {
|
267 |
|
|
cuc_timings *pt;
|
268 |
|
|
cuc_timings *cpt = cut;
|
269 |
|
|
j = 1;
|
270 |
|
|
|
271 |
|
|
do {
|
272 |
|
|
pt = cpt;
|
273 |
|
|
cpt = preunroll_bb (tmp1, saved, &t[nt++], b, ++j, i);
|
274 |
|
|
} while (j <= MAX_PREROLL && pt->new_time > cpt->new_time);
|
275 |
|
|
i++;
|
276 |
|
|
ut = cut;
|
277 |
|
|
cut = preunroll_bb (tmp1, saved, &t[nt++], b, 1, i);
|
278 |
|
|
} while (i <= MAX_UNROLL && ut->new_time > cut->new_time);
|
279 |
|
|
|
280 |
|
|
/* Sort the timings */
|
281 |
|
|
#if 0
|
282 |
|
|
if (cuc_debug >= 3)
|
283 |
|
|
for (i = 0; i < nt; i++) PRINTF ("%i:%i,%i: %icyc\n",
|
284 |
|
|
t[i].b, t[i].preroll, t[i].unroll, t[i].new_time);
|
285 |
|
|
#endif
|
286 |
|
|
|
287 |
|
|
qsort (t, nt, sizeof (cuc_timings), (int (*)(const void *, const void *))tim_comp);
|
288 |
|
|
|
289 |
|
|
/* Delete timings, that have worst time and bigger size than other */
|
290 |
|
|
j = 1;
|
291 |
|
|
csize = t[0].size;
|
292 |
|
|
for (i = 1; i < nt; i++)
|
293 |
|
|
if (t[i].size < csize) t[j++] = t[i];
|
294 |
|
|
nt = j;
|
295 |
|
|
|
296 |
|
|
cucdebug (1, "Available options\n");
|
297 |
|
|
for (i = 0; i < nt; i++) cucdebug (1, "%i:%i,%i: %icyc %.1f\n",
|
298 |
|
|
t[i].b, t[i].preroll, t[i].unroll, t[i].new_time, t[i].size);
|
299 |
|
|
/* Add results from CSM */
|
300 |
|
|
j = nt;
|
301 |
|
|
for (i = 0; i < saved->bb[b].ntim; i++) {
|
302 |
|
|
int i1;
|
303 |
|
|
for (i1 = 0; i1 < nt; i1++) {
|
304 |
|
|
t[j] = t[i1];
|
305 |
|
|
t[j].size += saved->bb[b].tim[i].size - timings.size;
|
306 |
|
|
t[j].new_time += saved->bb[b].tim[i].new_time - timings.new_time;
|
307 |
|
|
t[j].nshared = saved->bb[b].tim[i].nshared;
|
308 |
|
|
t[j].shared = saved->bb[b].tim[i].shared;
|
309 |
|
|
if (++j >= MAX_UNROLL * MAX_PREROLL) goto full;
|
310 |
|
|
}
|
311 |
|
|
}
|
312 |
|
|
|
313 |
|
|
full:
|
314 |
|
|
nt = j;
|
315 |
|
|
|
316 |
|
|
cucdebug (1, "Available options:\n");
|
317 |
|
|
for (i = 0; i < nt; i++) cucdebug (1, "%i:%i,%i: %icyc %.1f\n",
|
318 |
|
|
t[i].b, t[i].preroll, t[i].unroll, t[i].new_time, t[i].size);
|
319 |
|
|
|
320 |
|
|
/* Sort again with new timings added */
|
321 |
|
|
qsort (t, nt, sizeof (cuc_timings), (int (*)(const void *, const void *))tim_comp);
|
322 |
|
|
|
323 |
|
|
/* Delete timings, that have worst time and bigger size than other */
|
324 |
|
|
j = 1;
|
325 |
|
|
csize = t[0].size;
|
326 |
|
|
for (i = 1; i < nt; i++)
|
327 |
|
|
if (t[i].size < csize) t[j++] = t[i];
|
328 |
|
|
nt = j;
|
329 |
|
|
|
330 |
|
|
cucdebug (1, "Available options:\n");
|
331 |
|
|
for (i = 0; i < nt; i++) cucdebug (1, "%i:%i,%i: %icyc %.1f\n",
|
332 |
|
|
t[i].b, t[i].preroll, t[i].unroll, t[i].new_time, t[i].size);
|
333 |
|
|
|
334 |
|
|
if (saved->bb[b].ntim) free (saved->bb[b].tim);
|
335 |
|
|
saved->bb[b].ntim = nt;
|
336 |
|
|
assert (saved->bb[b].tim = (cuc_timings *) malloc (sizeof (cuc_timings) * nt));
|
337 |
|
|
|
338 |
|
|
/* Copy options in reverse order -- smallest first */
|
339 |
|
|
for (i = 0; i < nt; i++) saved->bb[b].tim[i] = t[nt - 1 - i];
|
340 |
|
|
|
341 |
|
|
log ("Available options:\n");
|
342 |
|
|
for (i = 0; i < saved->bb[b].ntim; i++) {
|
343 |
|
|
log ("%i:pre%i,un%i,sha%i: %icyc %.1f\n",
|
344 |
|
|
saved->bb[b].tim[i].b, saved->bb[b].tim[i].preroll, saved->bb[b].tim[i].unroll,
|
345 |
|
|
saved->bb[b].tim[i].nshared, saved->bb[b].tim[i].new_time, saved->bb[b].tim[i].size);
|
346 |
|
|
}
|
347 |
|
|
}
|
348 |
|
|
#endif
|
349 |
|
|
return saved;
|
350 |
|
|
}
|
351 |
|
|
|
352 |
|
|
/* Utility option formatting functions */
|
353 |
|
|
static const char *option_char = "?abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ";
|
354 |
|
|
|
355 |
|
|
/*static */char *gen_option (char *s, int bb_no, int f_opt)
|
356 |
|
|
{
|
357 |
|
|
if (bb_no >= 0) sprintf (s, "%i", bb_no);
|
358 |
|
|
assert (f_opt <= strlen (option_char));
|
359 |
|
|
sprintf (s, "%s%c", s, option_char[f_opt]);
|
360 |
|
|
return s;
|
361 |
|
|
}
|
362 |
|
|
|
363 |
|
|
/*static */void print_option (int bb_no, int f_opt)
|
364 |
|
|
{
|
365 |
|
|
char tmp1[10];
|
366 |
|
|
char tmp2[10];
|
367 |
|
|
sprintf (tmp2, "%s", gen_option (tmp1, bb_no, f_opt));
|
368 |
|
|
PRINTF ("%3s", tmp2);
|
369 |
|
|
}
|
370 |
|
|
|
371 |
|
|
static char *format_func_options (char *s, cuc_func *f)
|
372 |
|
|
{
|
373 |
|
|
int b, first = 1;
|
374 |
|
|
*s = '\0';
|
375 |
|
|
for (b = 0; b < f->num_bb; b++)
|
376 |
|
|
if (f->bb[b].selected_tim >= 0) {
|
377 |
|
|
char tmp[10];
|
378 |
|
|
sprintf (s, "%s%s%s", s, first ? "" : ",", gen_option (tmp, b, f->bb[b].selected_tim));
|
379 |
|
|
first = 0;
|
380 |
|
|
}
|
381 |
|
|
return s;
|
382 |
|
|
}
|
383 |
|
|
|
384 |
|
|
static void options_cmd (int func_no, cuc_func *f)
|
385 |
|
|
{
|
386 |
|
|
int b, i;
|
387 |
|
|
char tmp[30];
|
388 |
|
|
char *name = prof_func[func_no].name;
|
389 |
|
|
PRINTF ("-----------------------------------------------------------------------------\n");
|
390 |
|
|
PRINTF ("|%-28s|pre/unrolled|shared| time | gates |old_time|\n",
|
391 |
|
|
strstrip (tmp, name, 28));
|
392 |
|
|
PRINTF ("| BASE |%4i / %4i | %4i |%8i|%8.f|%8i|\n", 1, 1, 0,
|
393 |
|
|
f->timings.new_time, f->timings.size, f->orig_time);
|
394 |
|
|
for (b = 0; b < f->num_bb; b++) {
|
395 |
|
|
/* Print out results */
|
396 |
|
|
for (i = 1; i < f->bb[b].ntim; i++) { /* First one is base option */
|
397 |
|
|
int time = f->bb[b].tim[i].new_time - f->timings.new_time;
|
398 |
|
|
double size = f->bb[b].tim[i].size - f->timings.size;
|
399 |
|
|
PRINTF ("| ");
|
400 |
|
|
print_option (b, i);
|
401 |
|
|
PRINTF (" |%4i / %4i | %4i |%+8i|%+8.f| |\n",
|
402 |
|
|
f->bb[b].tim[i].preroll, f->bb[b].tim[i].unroll, f->bb[b].tim[i].nshared,
|
403 |
|
|
time, size);
|
404 |
|
|
}
|
405 |
|
|
}
|
406 |
|
|
}
|
407 |
|
|
|
408 |
|
|
/* Generates a function, based on specified parameters */
|
409 |
|
|
cuc_func *generate_function (cuc_func *rf, char *name, char *cut_filename)
|
410 |
|
|
{
|
411 |
1308 |
phoenix |
int b;
|
412 |
1244 |
hpanther |
char tmp[256];
|
413 |
|
|
cuc_timings tt;
|
414 |
|
|
cuc_func *f;
|
415 |
|
|
assert (f = dup_func (rf));
|
416 |
|
|
|
417 |
|
|
if (cuc_debug >= 2) print_cuc_bb (f, "BEFORE_GENERATE");
|
418 |
|
|
log ("Generating function %s.\n", name);
|
419 |
|
|
PRINTF ("Generating function %s.\n", name);
|
420 |
|
|
|
421 |
|
|
format_func_options (tmp, rf);
|
422 |
|
|
if (strlen (tmp)) PRINTF ("Applying options: %s\n", tmp);
|
423 |
|
|
else PRINTF ("Using basic options.\n");
|
424 |
|
|
|
425 |
|
|
/* Generate function as specified by options */
|
426 |
|
|
for (b = 0; b < f->num_bb; b++) {
|
427 |
|
|
cuc_timings *st;
|
428 |
|
|
if (rf->bb[b].selected_tim < 0) continue;
|
429 |
|
|
st = &rf->bb[b].tim[rf->bb[b].selected_tim];
|
430 |
|
|
sprintf (tmp, "%s.bin.bb", name);
|
431 |
|
|
preunroll_bb (&tmp[0], f, &tt, b, st->preroll, st->unroll);
|
432 |
|
|
if (cuc_debug >= 1) print_cuc_bb (f, "AFTER_PREUNROLL");
|
433 |
|
|
}
|
434 |
|
|
for (b = 0; b < f->num_bb; b++) {
|
435 |
|
|
cuc_timings *st;
|
436 |
|
|
if (rf->bb[b].selected_tim < 0) continue;
|
437 |
|
|
st = &rf->bb[b].tim[rf->bb[b].selected_tim];
|
438 |
|
|
if (!st->nshared) continue;
|
439 |
|
|
assert (0);
|
440 |
|
|
//csm_gen (f, rf, st->nshared, st->shared);
|
441 |
|
|
}
|
442 |
|
|
add_latches (f);
|
443 |
|
|
if (cuc_debug >= 1) print_cuc_bb (f, "AFTER_LATCHES");
|
444 |
|
|
analyse_timings (f, &tt);
|
445 |
|
|
|
446 |
|
|
sprintf (tmp, "%s%s", cut_filename, name);
|
447 |
|
|
output_verilog (f, tmp, name);
|
448 |
|
|
return f;
|
449 |
|
|
}
|
450 |
|
|
|
451 |
|
|
/* Calculates required time, based on selected options */
|
452 |
|
|
int calc_cycles (cuc_func *f)
|
453 |
|
|
{
|
454 |
1308 |
phoenix |
int b, ntime = f->timings.new_time;
|
455 |
1244 |
hpanther |
for (b = 0; b < f->num_bb; b++)
|
456 |
|
|
if (f->bb[b].selected_tim >= 0) {
|
457 |
|
|
assert (f->bb[b].selected_tim < f->bb[b].ntim);
|
458 |
|
|
ntime += f->bb[b].tim[f->bb[b].selected_tim].new_time - f->timings.new_time;
|
459 |
|
|
}
|
460 |
|
|
return ntime;
|
461 |
|
|
}
|
462 |
|
|
|
463 |
|
|
/* Calculates required size, based on selected options */
|
464 |
|
|
double calc_size (cuc_func *f)
|
465 |
|
|
{
|
466 |
1308 |
phoenix |
int b;
|
467 |
1244 |
hpanther |
double size = f->timings.size;
|
468 |
|
|
for (b = 0; b < f->num_bb; b++)
|
469 |
|
|
if (f->bb[b].selected_tim >= 0) {
|
470 |
|
|
assert (f->bb[b].selected_tim < f->bb[b].ntim);
|
471 |
|
|
size += f->bb[b].tim[f->bb[b].selected_tim].size - f->timings.size;
|
472 |
|
|
}
|
473 |
|
|
return size;
|
474 |
|
|
}
|
475 |
|
|
|
476 |
|
|
/* Dumps specified function to file (hex) */
|
477 |
|
|
unsigned long extract_function (char *out_fn, unsigned long start_addr)
|
478 |
|
|
{
|
479 |
|
|
FILE *fo;
|
480 |
|
|
unsigned long a = start_addr;
|
481 |
|
|
int x = 0;
|
482 |
|
|
assert (fo = fopen (out_fn, "wt+"));
|
483 |
|
|
|
484 |
|
|
do {
|
485 |
1487 |
nogj |
unsigned long d = eval_direct32 (a, 0, 0);
|
486 |
1244 |
hpanther |
int index = insn_decode (d);
|
487 |
|
|
assert (index >= 0);
|
488 |
|
|
if (x) x++;
|
489 |
|
|
if (strcmp (insn_name (index), "l.jr") == 0) x = 1;
|
490 |
|
|
a += 4;
|
491 |
1308 |
phoenix |
fprintf (fo, "%08lx\n", d);
|
492 |
1244 |
hpanther |
} while (x < 2);
|
493 |
|
|
|
494 |
|
|
fclose (fo);
|
495 |
|
|
return a - 4;
|
496 |
|
|
}
|
497 |
|
|
|
498 |
|
|
static cuc_func *func[MAX_FUNCS];
|
499 |
|
|
static int func_v[MAX_FUNCS];
|
500 |
|
|
|
501 |
|
|
/* Detects function dependencies and removes */
|
502 |
|
|
static void set_func_deps ()
|
503 |
|
|
{
|
504 |
|
|
int f, b, i, j;
|
505 |
|
|
restart:
|
506 |
|
|
for (f = 0; f < prof_nfuncs - 1; f++) if (func[f]) {
|
507 |
|
|
int fused[MAX_FUNCS] = {0};
|
508 |
|
|
int c;
|
509 |
|
|
for (b = 0; b < func[f]->num_bb; b++)
|
510 |
|
|
for (i = 0; i < func[f]->bb[b].ninsn; i++) {
|
511 |
|
|
cuc_insn *ii = &func[f]->bb[b].insn[i];
|
512 |
|
|
if (ii->index == II_CALL) {
|
513 |
|
|
assert (ii->opt[0] == OPT_CONST);
|
514 |
|
|
for (j = 0; j < prof_nfuncs - 1; j++)
|
515 |
|
|
if (func[j] && func[j]->start_addr == ii->op[0]) break;
|
516 |
|
|
if (j >= prof_nfuncs - 1) {
|
517 |
1308 |
phoenix |
log ("%s is calling unknown function, address %08lx\n",
|
518 |
1244 |
hpanther |
prof_func[f].name, ii->op[0]);
|
519 |
1350 |
nogj |
debug (1, "%s is calling unknown function, address %08lx\n",
|
520 |
1244 |
hpanther |
prof_func[f].name, ii->op[0]);
|
521 |
|
|
free_func (func[f]);
|
522 |
|
|
func[f] = NULL;
|
523 |
|
|
goto restart;
|
524 |
|
|
} else if (f == j) {
|
525 |
|
|
log ("%s is recursive, ignoring\n", prof_func[f].name);
|
526 |
|
|
debug (1, "%s is recursive, ignoring\n", prof_func[f].name);
|
527 |
|
|
free_func (func[f]);
|
528 |
|
|
func[f] = NULL;
|
529 |
|
|
goto restart;
|
530 |
|
|
} else fused[j]++;
|
531 |
|
|
}
|
532 |
|
|
}
|
533 |
|
|
for (i = 0; i < MAX_FUNCS; i++) if (fused[i]) c++;
|
534 |
|
|
if (func[f]->nfdeps) free (func[f]->fdeps);
|
535 |
|
|
func[f]->nfdeps = c;
|
536 |
|
|
func[f]->fdeps = (cuc_func **) malloc (sizeof (cuc_func *) * c);
|
537 |
|
|
for (i = 0, j = 0; i < MAX_FUNCS; i++)
|
538 |
|
|
if (fused[i]) func[f]->fdeps[j++] = func[i];
|
539 |
|
|
}
|
540 |
|
|
|
541 |
|
|
/* Detect loops */
|
542 |
|
|
{
|
543 |
|
|
int change;
|
544 |
|
|
for (f = 0; f < MAX_FUNCS; f++) if (func[f]) func[f]->tmp = 0;
|
545 |
|
|
do {
|
546 |
|
|
change = 0;
|
547 |
|
|
for (f = 0; f < MAX_FUNCS; f++) if (func[f] && !func[f]->tmp) {
|
548 |
|
|
int o = 1;
|
549 |
|
|
for (i = 0; i < func[f]->nfdeps; i++)
|
550 |
|
|
if (!func[f]->fdeps[i]->tmp) {o = 0; break;}
|
551 |
|
|
if (o) {
|
552 |
|
|
func[f]->tmp = 1;
|
553 |
|
|
change = 1;
|
554 |
|
|
}
|
555 |
|
|
}
|
556 |
|
|
} while (change);
|
557 |
|
|
|
558 |
|
|
change = 0;
|
559 |
|
|
for (f = 0; f < MAX_FUNCS; f++) if (func[f] && !func[f]->tmp) {
|
560 |
|
|
free_func (func[f]);
|
561 |
|
|
func[f] = NULL;
|
562 |
|
|
change = 1;
|
563 |
|
|
}
|
564 |
|
|
if (change) goto restart;
|
565 |
|
|
}
|
566 |
|
|
}
|
567 |
|
|
|
568 |
|
|
void main_cuc (char *filename)
|
569 |
|
|
{
|
570 |
|
|
int i, j;
|
571 |
|
|
char tmp1[256];
|
572 |
|
|
char filename_cut[256];
|
573 |
|
|
#if 0 /* Select prefix, based on binary program name */
|
574 |
|
|
for (i = 0; i < sizeof (filename_cut); i++) {
|
575 |
|
|
if (isalpha(filename[i])) filename_cut[i] = filename[i];
|
576 |
|
|
else {
|
577 |
|
|
filename_cut[i] = '\0';
|
578 |
|
|
break;
|
579 |
|
|
}
|
580 |
|
|
}
|
581 |
|
|
#else
|
582 |
|
|
strcpy (filename_cut, "cu");
|
583 |
|
|
#endif
|
584 |
|
|
|
585 |
|
|
PRINTF ("Entering OpenRISC Custom Unit Compiler command prompt\n");
|
586 |
|
|
PRINTF ("Using profile file \"%s\" and memory profile file \"%s\".\n", config.sim.prof_fn, config.sim.mprof_fn);
|
587 |
|
|
sprintf (tmp1, "%s.log", filename_cut);
|
588 |
|
|
PRINTF ("Analyzing. (log file \"%s\").\n", tmp1);
|
589 |
|
|
assert (flog = fopen (tmp1, "wt+"));
|
590 |
|
|
|
591 |
|
|
/* Loads in the specified timings table */
|
592 |
|
|
PRINTF ("Using timings from \"%s\" at %s\n",config.cuc.timings_fn,
|
593 |
|
|
generate_time_pretty (tmp1, config.sim.clkcycle_ps));
|
594 |
|
|
load_timing_table (config.cuc.timings_fn);
|
595 |
|
|
runtime.cuc.cycle_duration = 1000. * config.sim.clkcycle_ps;
|
596 |
|
|
PRINTF ("Multicycle logic %s, bursts %s, %s memory order.\n",
|
597 |
|
|
config.cuc.no_multicycle ? "OFF" : "ON", config.cuc.enable_bursts ? "ON" : "OFF",
|
598 |
|
|
config.cuc.memory_order == MO_NONE ? "no" : config.cuc.memory_order == MO_WEAK ? "weak" :
|
599 |
|
|
config.cuc.memory_order == MO_STRONG ? "strong" : "exact");
|
600 |
|
|
|
601 |
|
|
prof_set (1, 0);
|
602 |
|
|
assert (prof_acquire (config.sim.prof_fn) == 0);
|
603 |
|
|
|
604 |
|
|
if (config.cuc.calling_convention)
|
605 |
|
|
PRINTF ("Assuming OpenRISC standard calling convention.\n");
|
606 |
|
|
|
607 |
|
|
/* Try all functions except "total" */
|
608 |
|
|
for (i = 0; i < prof_nfuncs - 1; i++) {
|
609 |
|
|
long orig_time;
|
610 |
|
|
unsigned long start_addr, end_addr;
|
611 |
|
|
orig_time = prof_func[i].cum_cycles;
|
612 |
|
|
start_addr = prof_func[i].addr;
|
613 |
|
|
|
614 |
|
|
/* Extract the function from the binary */
|
615 |
|
|
sprintf (tmp1, "%s.bin", prof_func[i].name);
|
616 |
|
|
end_addr = extract_function (tmp1, start_addr);
|
617 |
|
|
|
618 |
1308 |
phoenix |
log ("Testing function %s (%08lx - %08lx)\n", prof_func[i].name, start_addr,
|
619 |
|
|
end_addr);
|
620 |
|
|
PRINTF ("Testing function %s (%08lx - %08lx)\n", prof_func[i].name,
|
621 |
|
|
start_addr, end_addr);
|
622 |
1244 |
hpanther |
func[i] = analyse_function (prof_func[i].name, orig_time, start_addr,
|
623 |
|
|
end_addr, config.cuc.memory_order, prof_func[i].calls);
|
624 |
|
|
func_v[i] = 0;
|
625 |
|
|
}
|
626 |
|
|
set_func_deps ();
|
627 |
|
|
|
628 |
|
|
while (1) {
|
629 |
|
|
char *s;
|
630 |
|
|
wait_command:
|
631 |
|
|
PRINTF ("(cuc) ");
|
632 |
|
|
fflush (stdout);
|
633 |
|
|
wait_command_empty:
|
634 |
|
|
s = fgets(tmp1, sizeof tmp1, stdin);
|
635 |
|
|
usleep (100);
|
636 |
|
|
if (!s) goto wait_command_empty;
|
637 |
|
|
for (s = tmp1; *s != '\0' && *s != '\n' && *s != '\r'; s++);
|
638 |
|
|
*s = '\0';
|
639 |
|
|
|
640 |
|
|
/* quit command */
|
641 |
|
|
if (strcmp (tmp1, "q") == 0 || strcmp (tmp1, "quit") == 0) {
|
642 |
|
|
/* Delete temporary files */
|
643 |
|
|
for (i = 0; i < prof_nfuncs - 1; i++) {
|
644 |
|
|
sprintf (tmp1, "%s.bin", prof_func[i].name);
|
645 |
|
|
log ("Deleting temporary file %s %s\n", tmp1, remove (tmp1) ? "FAILED" : "OK");
|
646 |
|
|
sprintf (tmp1, "%s.bin.bb", prof_func[i].name);
|
647 |
|
|
log ("Deleting temporary file %s %s\n", tmp1, remove (tmp1) ? "FAILED" : "OK");
|
648 |
|
|
}
|
649 |
|
|
break;
|
650 |
|
|
|
651 |
|
|
/* profile command */
|
652 |
|
|
} else if (strcmp (tmp1, "p") == 0 || strcmp (tmp1, "profile") == 0) {
|
653 |
|
|
int ntime = 0;
|
654 |
|
|
int size = 0;
|
655 |
|
|
PRINTF ("-----------------------------------------------------------------------------\n");
|
656 |
1308 |
phoenix |
PRINTF ("|function name |calls|avg cycles |old%%| max. f. | impr. f.| options |\n");
|
657 |
1244 |
hpanther |
PRINTF ("|--------------------+-----+------------+----+----------|---------+---------|\n");
|
658 |
|
|
for (j = 0; j < prof_nfuncs; j++) {
|
659 |
|
|
int bestcyc = 0, besti = 0;
|
660 |
|
|
char tmp[100];
|
661 |
|
|
for (i = 0; i < prof_nfuncs; i++)
|
662 |
|
|
if (prof_func[i].cum_cycles > bestcyc) {
|
663 |
|
|
bestcyc = prof_func[i].cum_cycles;
|
664 |
|
|
besti = i;
|
665 |
|
|
}
|
666 |
|
|
i = besti;
|
667 |
1308 |
phoenix |
PRINTF ("|%-20s|%5li|%12.1f|%3.0f%%| ",
|
668 |
1244 |
hpanther |
strstrip (tmp, prof_func[i].name, 20), prof_func[i].calls,
|
669 |
|
|
((double)prof_func[i].cum_cycles / prof_func[i].calls),
|
670 |
|
|
(100. * prof_func[i].cum_cycles / prof_cycles));
|
671 |
|
|
if (func[i]) {
|
672 |
|
|
double f = 1.0;
|
673 |
|
|
if (func_v[i]) {
|
674 |
|
|
int nt = calc_cycles (func[i]);
|
675 |
|
|
int s = calc_size (func[i]);
|
676 |
|
|
f = 1. * func[i]->orig_time / nt;
|
677 |
|
|
ntime += nt;
|
678 |
|
|
size += s;
|
679 |
|
|
} else ntime += prof_func[i].cum_cycles;
|
680 |
|
|
PRINTF ("%8.1f |%8.1f | %-8s|\n", 1.f * prof_func[i].cum_cycles
|
681 |
|
|
/ func[i]->timings.new_time, f, format_func_options (tmp, func[i]));
|
682 |
|
|
} else {
|
683 |
|
|
PRINTF (" N/A | N/A | N/A |\n");
|
684 |
|
|
ntime += prof_func[i].cum_cycles;
|
685 |
|
|
}
|
686 |
|
|
prof_func[i].cum_cycles = -prof_func[i].cum_cycles;
|
687 |
|
|
}
|
688 |
|
|
for (i = 0; i < prof_nfuncs; i++)
|
689 |
|
|
prof_func[i].cum_cycles = -prof_func[i].cum_cycles;
|
690 |
|
|
PRINTF ("-----------------------------------------------------------------------------\n");
|
691 |
|
|
PRINTF ("Total %i cycles (was %i), total added gates = %i. Speed factor %.1f\n",
|
692 |
|
|
ntime, prof_cycles, size, 1. * prof_cycles / ntime);
|
693 |
|
|
|
694 |
|
|
/* debug command */
|
695 |
|
|
} else if (strncmp (tmp1, "d", 1) == 0 || strncmp (tmp1, "debug", 5) == 0) {
|
696 |
|
|
sscanf (tmp1, "%*s %i", &cuc_debug);
|
697 |
|
|
if (cuc_debug < 0) cuc_debug = 0;
|
698 |
|
|
if (cuc_debug > 9) cuc_debug = 9;
|
699 |
|
|
|
700 |
|
|
/* generate command */
|
701 |
|
|
} else if (strcmp (tmp1, "g") == 0 || strcmp (tmp1, "generate") == 0) {
|
702 |
|
|
/* check for function dependencies */
|
703 |
|
|
for (i = 0; i < prof_nfuncs; i++)
|
704 |
|
|
if (func[i]) func[i]->tmp = func_v[i];
|
705 |
|
|
for (i = 0; i < prof_nfuncs; i++) if (func[i])
|
706 |
|
|
for (j = 0; j < func[i]->nfdeps; j++)
|
707 |
|
|
if (!func[i]->fdeps[j] || !func[i]->fdeps[j]->tmp) {
|
708 |
|
|
PRINTF ("Function %s must be selected for translation (required by %s)\n",
|
709 |
|
|
prof_func[j].name, prof_func[i].name);
|
710 |
|
|
goto wait_command;
|
711 |
|
|
}
|
712 |
|
|
for (i = 0; i < prof_nfuncs; i++)
|
713 |
|
|
if (func[i] && func_v[i]) generate_function (func[i], prof_func[i].name, filename_cut);
|
714 |
|
|
generate_main (prof_nfuncs, func, filename_cut);
|
715 |
|
|
|
716 |
|
|
/* list command */
|
717 |
|
|
} else if (strcmp (tmp1, "l") == 0 || strcmp (tmp1, "list") == 0) {
|
718 |
|
|
/* check for function dependencies */
|
719 |
|
|
for (i = 0; i < prof_nfuncs; i++)
|
720 |
|
|
if (func_v[i]) {
|
721 |
|
|
PRINTF ("%s\n", prof_func[j].name);
|
722 |
|
|
}
|
723 |
|
|
|
724 |
|
|
/* selectall command */
|
725 |
|
|
} else if (strcmp (tmp1, "sa") == 0 || strcmp (tmp1, "selectall") == 0) {
|
726 |
1308 |
phoenix |
int f;
|
727 |
1244 |
hpanther |
for (f = 0; f < prof_nfuncs; f++) if (func[f]) {
|
728 |
|
|
func_v[f] = 1;
|
729 |
|
|
PRINTF ("Function %s selected for translation.\n", prof_func[f].name);
|
730 |
|
|
}
|
731 |
|
|
|
732 |
|
|
/* select command */
|
733 |
|
|
} else if (strncmp (tmp1, "s", 1) == 0 || strncmp (tmp1, "select", 6) == 0) {
|
734 |
|
|
char tmp[50], ch;
|
735 |
|
|
int p, o, b, f;
|
736 |
|
|
p = sscanf (tmp1, "%*s %s %i%c", tmp, &b, &ch);
|
737 |
|
|
if (p < 1) PRINTF ("Invalid parameters.\n");
|
738 |
|
|
else {
|
739 |
|
|
/* Check if we have valid option */
|
740 |
|
|
for (f = 0; f < prof_nfuncs; f++)
|
741 |
|
|
if (strcmp (prof_func[f].name, tmp) == 0 && func[f]) break;
|
742 |
|
|
if (f < prof_nfuncs) {
|
743 |
|
|
if (p == 1) {
|
744 |
|
|
if (func[f]) {
|
745 |
|
|
func_v[f] = 1;
|
746 |
|
|
PRINTF ("Function %s selected for translation.\n", prof_func[f].name);
|
747 |
|
|
} else PRINTF ("Function %s not suitable for translation.\n", prof_func[f].name);
|
748 |
|
|
} else {
|
749 |
|
|
if (!func_v[f])
|
750 |
|
|
PRINTF ("Function %s not yet selected for translation.\n", prof_func[f].name);
|
751 |
|
|
if (p < 3) goto invalid_option;
|
752 |
|
|
for (o = 0; option_char[o] != '\0' && option_char[o] != ch; o++);
|
753 |
|
|
if (!option_char[o]) goto invalid_option;
|
754 |
|
|
if (b < 0 || b >= func[f]->num_bb) goto invalid_option;
|
755 |
|
|
if (o < 0 || o >= func[f]->bb[b].ntim) goto invalid_option;
|
756 |
|
|
|
757 |
|
|
/* select an option */
|
758 |
|
|
func[f]->bb[b].selected_tim = o;
|
759 |
|
|
if (func[f]->bb[b].tim[o].nshared) {
|
760 |
|
|
PRINTF ("Option has shared instructions: ");
|
761 |
|
|
print_shared (func[f], func[f]->bb[b].tim[o].shared, func[f]->bb[b].tim[o].nshared);
|
762 |
|
|
PRINTF ("\n");
|
763 |
|
|
}
|
764 |
|
|
goto wait_command;
|
765 |
|
|
invalid_option:
|
766 |
|
|
PRINTF ("Invalid option.\n");
|
767 |
|
|
}
|
768 |
|
|
} else PRINTF ("Invalid function.\n");
|
769 |
|
|
}
|
770 |
|
|
|
771 |
|
|
/* unselect command */
|
772 |
|
|
} else if (strncmp (tmp1, "u", 1) == 0 || strncmp (tmp1, "unselect", 8) == 0) {
|
773 |
|
|
char tmp[50], ch;
|
774 |
|
|
int p, o, b, f;
|
775 |
|
|
p = sscanf (tmp1, "%*s %s %i%c", tmp, &b, &ch);
|
776 |
|
|
if (p < 1) PRINTF ("Invalid parameters.\n");
|
777 |
|
|
else {
|
778 |
|
|
/* Check if we have valid option */
|
779 |
|
|
for (f = 0; f < prof_nfuncs; f++)
|
780 |
|
|
if (strcmp (prof_func[f].name, tmp) == 0 && func[f]) break;
|
781 |
|
|
if (f < prof_nfuncs) {
|
782 |
|
|
if (p == 1) {
|
783 |
|
|
if (func[f]) {
|
784 |
|
|
func_v[f] = 0;
|
785 |
|
|
PRINTF ("Function %s unselected for translation.\n", prof_func[f].name);
|
786 |
|
|
} else PRINTF ("Function %s not suitable for translation.\n", prof_func[f].name);
|
787 |
|
|
} else {
|
788 |
|
|
if (p < 3) goto invalid_option;
|
789 |
|
|
for (o = 0; option_char[o] != '\0' && option_char[o] != ch; o++);
|
790 |
|
|
if (!option_char[o]) goto invalid_option;
|
791 |
|
|
if (b < 0 || b >= func[f]->num_bb) goto invalid_option;
|
792 |
|
|
if (o < 0 || o >= func[f]->bb[b].ntim) goto invalid_option;
|
793 |
|
|
|
794 |
|
|
/* select an option */
|
795 |
|
|
func[f]->bb[b].selected_tim = -1;
|
796 |
|
|
}
|
797 |
|
|
} else PRINTF ("Invalid function.\n");
|
798 |
|
|
}
|
799 |
|
|
|
800 |
|
|
/* options command */
|
801 |
|
|
} else if (strcmp (tmp1, "o") == 0 || strcmp (tmp1, "options") == 0) {
|
802 |
|
|
int any = 0;
|
803 |
|
|
PRINTF ("Available options:\n");
|
804 |
|
|
for (i = 0; i < prof_nfuncs; i++)
|
805 |
|
|
if (func[i]) {
|
806 |
|
|
options_cmd (i, func[i]);
|
807 |
|
|
any = 1;
|
808 |
|
|
}
|
809 |
|
|
if (any) PRINTF ("-----------------------------------------------------------------------------\n");
|
810 |
|
|
else PRINTF ("Sorry. No available options.\n");
|
811 |
|
|
|
812 |
|
|
/* Ignore empty string */
|
813 |
|
|
} else if (strcmp (tmp1, "") == 0) {
|
814 |
|
|
|
815 |
|
|
/* help command */
|
816 |
|
|
} else {
|
817 |
|
|
if (strcmp (tmp1, "h") != 0 && strcmp (tmp1, "help") != 0)
|
818 |
|
|
PRINTF ("Unknown command.\n");
|
819 |
|
|
PRINTF ("OpenRISC Custom Unit Compiler command prompt\n");
|
820 |
|
|
PRINTF ("Available commands:\n");
|
821 |
|
|
PRINTF (" h | help displays this help\n");
|
822 |
|
|
PRINTF (" q | quit returns to or1ksim prompt\n");
|
823 |
|
|
PRINTF (" p | profile displays function profiling\n");
|
824 |
|
|
PRINTF (" d | debug # sets debug level (0-9)\n");
|
825 |
|
|
PRINTF (" o | options displays available options\n");
|
826 |
|
|
PRINTF (" s | select func [option] selects an option/function\n");
|
827 |
|
|
PRINTF (" u | unselect func [option] unselects an option/function\n");
|
828 |
|
|
PRINTF (" g | generate generates verilog file\n");
|
829 |
|
|
PRINTF (" l | list displays selected functions\n");
|
830 |
|
|
}
|
831 |
|
|
}
|
832 |
|
|
|
833 |
|
|
/* Dispose memory */
|
834 |
|
|
for (i = 0; i < prof_nfuncs -1; i++)
|
835 |
|
|
if (func[i]) free_func (func[i]);
|
836 |
|
|
|
837 |
|
|
fclose (flog);
|
838 |
|
|
}
|
839 |
|
|
|
840 |
1358 |
nogj |
/*----------------------------------------------------[ CUC Configuration ]---*/
|
841 |
|
|
void cuc_calling_convention(union param_val val, void *dat)
|
842 |
|
|
{
|
843 |
|
|
config.cuc.calling_convention = val.int_val;
|
844 |
|
|
}
|
845 |
|
|
|
846 |
|
|
void cuc_enable_bursts(union param_val val, void *dat)
|
847 |
|
|
{
|
848 |
|
|
config.cuc.enable_bursts = val.int_val;
|
849 |
|
|
}
|
850 |
|
|
|
851 |
|
|
void cuc_no_multicycle(union param_val val, void *dat)
|
852 |
|
|
{
|
853 |
|
|
config.cuc.no_multicycle = val.int_val;
|
854 |
|
|
}
|
855 |
|
|
|
856 |
|
|
void cuc_memory_order(union param_val val, void *dat)
|
857 |
|
|
{
|
858 |
|
|
if (strcmp (val.str_val, "none") == 0)
|
859 |
|
|
config.cuc.memory_order = MO_NONE;
|
860 |
|
|
else if (strcmp (val.str_val, "weak") == 0)
|
861 |
|
|
config.cuc.memory_order = MO_WEAK;
|
862 |
|
|
else if (strcmp (val.str_val, "strong") == 0)
|
863 |
|
|
config.cuc.memory_order = MO_STRONG;
|
864 |
|
|
else if (strcmp (val.str_val, "exact") == 0) {
|
865 |
|
|
config.cuc.memory_order = MO_EXACT;
|
866 |
|
|
} else {
|
867 |
|
|
char tmp[200];
|
868 |
|
|
sprintf (tmp, "invalid memory order '%s'.\n", val.str_val);
|
869 |
|
|
CONFIG_ERROR(tmp);
|
870 |
|
|
}
|
871 |
|
|
}
|
872 |
|
|
|
873 |
|
|
void cuc_timings_fn(union param_val val, void *dat)
|
874 |
|
|
{
|
875 |
|
|
strcpy(config.cuc.timings_fn, val.str_val);
|
876 |
|
|
}
|
877 |
|
|
|
878 |
|
|
void reg_cuc_sec(void)
|
879 |
|
|
{
|
880 |
|
|
struct config_section *sec = reg_config_sec("cuc", NULL, NULL);
|
881 |
|
|
|
882 |
|
|
reg_config_param(sec, "calling_convention", paramt_int, cuc_calling_convention);
|
883 |
|
|
reg_config_param(sec, "enable_bursts", paramt_int, cuc_enable_bursts);
|
884 |
|
|
reg_config_param(sec, "no_multicycle", paramt_int, cuc_no_multicycle);
|
885 |
|
|
reg_config_param(sec, "memory_order", paramt_word, cuc_memory_order);
|
886 |
|
|
reg_config_param(sec, "timings_fn", paramt_str, cuc_timings_fn);
|
887 |
|
|
}
|