Mercurial > octave-nkf
annotate src/jit-typeinfo.cc @ 15068:f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
* src/jit-typeinfo.cc (make_indices, octave_jit_paren_scalar_subsasgn,
jit_typeinfo::gen_subsasgn): New function.
(octave_jit_paren_scalar): Use make_indices.
(jit_typeinfo::jit_typeinfo): Call gen_subsasgn.
* src/pt-jit.h (jit_typeinfo::gen_subsasgn): New declaration.
* src/pt-jit.cc (jit_convert::resolve): Add extra_arg argument.
(jit_convert::do_assign): Pass rhs to resolve.
* src/pt-jit.h (jit_convert::resolve): Change function signature.
author | Max Brister <max@2bass.com> |
---|---|
date | Tue, 31 Jul 2012 15:40:52 -0500 |
parents | df4538e3b50b |
children | fe4752f772e2 |
rev | line source |
---|---|
15016 | 1 /* |
2 | |
3 Copyright (C) 2012 Max Brister <max@2bass.com> | |
4 | |
5 This file is part of Octave. | |
6 | |
7 Octave is free software; you can redistribute it and/or modify it | |
8 under the terms of the GNU General Public License as published by the | |
9 Free Software Foundation; either version 3 of the License, or (at your | |
10 option) any later version. | |
11 | |
12 Octave is distributed in the hope that it will be useful, but WITHOUT | |
13 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or | |
14 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License | |
15 for more details. | |
16 | |
17 You should have received a copy of the GNU General Public License | |
18 along with Octave; see the file COPYING. If not, see | |
19 <http://www.gnu.org/licenses/>. | |
20 | |
21 */ | |
22 | |
23 // defines required by llvm | |
24 #define __STDC_LIMIT_MACROS | |
25 #define __STDC_CONSTANT_MACROS | |
26 | |
27 #ifdef HAVE_CONFIG_H | |
28 #include <config.h> | |
29 #endif | |
30 | |
31 #ifdef HAVE_LLVM | |
32 | |
33 #include "jit-typeinfo.h" | |
34 | |
35 #include <llvm/Analysis/Verifier.h> | |
36 #include <llvm/GlobalVariable.h> | |
37 #include <llvm/ExecutionEngine/ExecutionEngine.h> | |
38 #include <llvm/LLVMContext.h> | |
39 #include <llvm/Function.h> | |
40 #include <llvm/Instructions.h> | |
41 #include <llvm/Intrinsics.h> | |
42 #include <llvm/Support/IRBuilder.h> | |
43 #include <llvm/Support/raw_os_ostream.h> | |
44 | |
45 #include "jit-ir.h" | |
46 #include "ov.h" | |
47 #include "ov-builtin.h" | |
48 #include "ov-complex.h" | |
49 #include "ov-scalar.h" | |
50 #include "pager.h" | |
51 | |
52 static llvm::LLVMContext& context = llvm::getGlobalContext (); | |
53 | |
54 jit_typeinfo *jit_typeinfo::instance = 0; | |
55 | |
56 std::ostream& jit_print (std::ostream& os, jit_type *atype) | |
57 { | |
58 if (! atype) | |
59 return os << "null"; | |
60 return os << atype->name (); | |
61 } | |
62 | |
63 // function that jit code calls | |
64 extern "C" void | |
65 octave_jit_print_any (const char *name, octave_base_value *obv) | |
66 { | |
67 obv->print_with_name (octave_stdout, name, true); | |
68 } | |
69 | |
70 extern "C" void | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
71 octave_jit_print_scalar (const char *name, double value) |
15016 | 72 { |
73 // FIXME: We should avoid allocating a new octave_scalar each time | |
74 octave_value ov (value); | |
75 ov.print_with_name (octave_stdout, name); | |
76 } | |
77 | |
78 extern "C" octave_base_value* | |
79 octave_jit_binary_any_any (octave_value::binary_op op, octave_base_value *lhs, | |
80 octave_base_value *rhs) | |
81 { | |
82 octave_value olhs (lhs, true); | |
83 octave_value orhs (rhs, true); | |
84 octave_value result = do_binary_op (op, olhs, orhs); | |
85 octave_base_value *rep = result.internal_rep (); | |
86 rep->grab (); | |
87 return rep; | |
88 } | |
89 | |
90 extern "C" octave_idx_type | |
91 octave_jit_compute_nelem (double base, double limit, double inc) | |
92 { | |
93 Range rng = Range (base, limit, inc); | |
94 return rng.nelem (); | |
95 } | |
96 | |
97 extern "C" void | |
98 octave_jit_release_any (octave_base_value *obv) | |
99 { | |
100 obv->release (); | |
101 } | |
102 | |
103 extern "C" void | |
104 octave_jit_release_matrix (jit_matrix *m) | |
105 { | |
106 delete m->array; | |
107 } | |
108 | |
109 extern "C" octave_base_value * | |
110 octave_jit_grab_any (octave_base_value *obv) | |
111 { | |
112 obv->grab (); | |
113 return obv; | |
114 } | |
115 | |
116 extern "C" void | |
117 octave_jit_grab_matrix (jit_matrix *result, jit_matrix *m) | |
118 { | |
119 *result = *m->array; | |
120 } | |
121 | |
122 extern "C" octave_base_value * | |
123 octave_jit_cast_any_matrix (jit_matrix *m) | |
124 { | |
125 octave_value ret (*m->array); | |
126 octave_base_value *rep = ret.internal_rep (); | |
127 rep->grab (); | |
128 delete m->array; | |
129 | |
130 return rep; | |
131 } | |
132 | |
133 extern "C" void | |
134 octave_jit_cast_matrix_any (jit_matrix *ret, octave_base_value *obv) | |
135 { | |
136 NDArray m = obv->array_value (); | |
137 *ret = m; | |
138 obv->release (); | |
139 } | |
140 | |
15027
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
141 extern "C" octave_base_value * |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
142 octave_jit_cast_any_range (jit_range *rng) |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
143 { |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
144 Range temp (*rng); |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
145 octave_value ret (temp); |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
146 octave_base_value *rep = ret.internal_rep (); |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
147 rep->grab (); |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
148 |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
149 return rep; |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
150 } |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
151 extern "C" void |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
152 octave_jit_cast_range_any (jit_range *ret, octave_base_value *obv) |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
153 { |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
154 |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
155 jit_range r (obv->range_value ()); |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
156 *ret = r; |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
157 obv->release (); |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
158 } |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
159 |
15016 | 160 extern "C" double |
161 octave_jit_cast_scalar_any (octave_base_value *obv) | |
162 { | |
163 double ret = obv->double_value (); | |
164 obv->release (); | |
165 return ret; | |
166 } | |
167 | |
168 extern "C" octave_base_value * | |
169 octave_jit_cast_any_scalar (double value) | |
170 { | |
171 return new octave_scalar (value); | |
172 } | |
173 | |
174 extern "C" Complex | |
175 octave_jit_cast_complex_any (octave_base_value *obv) | |
176 { | |
177 Complex ret = obv->complex_value (); | |
178 obv->release (); | |
179 return ret; | |
180 } | |
181 | |
182 extern "C" octave_base_value * | |
183 octave_jit_cast_any_complex (Complex c) | |
184 { | |
185 if (c.imag () == 0) | |
186 return new octave_scalar (c.real ()); | |
187 else | |
188 return new octave_complex (c); | |
189 } | |
190 | |
191 extern "C" void | |
192 octave_jit_gripe_nan_to_logical_conversion (void) | |
193 { | |
194 try | |
195 { | |
196 gripe_nan_to_logical_conversion (); | |
197 } | |
198 catch (const octave_execution_exception&) | |
199 { | |
200 gripe_library_execution_error (); | |
201 } | |
202 } | |
203 | |
204 extern "C" void | |
205 octave_jit_ginvalid_index (void) | |
206 { | |
207 try | |
208 { | |
209 gripe_invalid_index (); | |
210 } | |
211 catch (const octave_execution_exception&) | |
212 { | |
213 gripe_library_execution_error (); | |
214 } | |
215 } | |
216 | |
217 extern "C" void | |
218 octave_jit_gindex_range (int nd, int dim, octave_idx_type iext, | |
219 octave_idx_type ext) | |
220 { | |
221 try | |
222 { | |
223 gripe_index_out_of_range (nd, dim, iext, ext); | |
224 } | |
225 catch (const octave_execution_exception&) | |
226 { | |
227 gripe_library_execution_error (); | |
228 } | |
229 } | |
230 | |
231 extern "C" void | |
15027
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
232 octave_jit_paren_subsasgn_impl (jit_matrix *ret, jit_matrix *mat, |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
233 octave_idx_type index, double value) |
15016 | 234 { |
235 NDArray *array = mat->array; | |
236 if (array->nelem () < index) | |
237 array->resize1 (index); | |
238 | |
239 double *data = array->fortran_vec (); | |
240 data[index - 1] = value; | |
241 | |
242 mat->update (); | |
15027
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
243 *ret = *mat; |
15016 | 244 } |
245 | |
15068
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
246 static void |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
247 make_indices (double *indices, octave_idx_type idx_count, |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
248 Array<idx_vector>& result) |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
249 { |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
250 result.resize (dim_vector (1, idx_count)); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
251 for (octave_idx_type i = 0; i < idx_count; ++i) |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
252 result(i) = idx_vector (indices[i]); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
253 } |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
254 |
15067 | 255 extern "C" double |
256 octave_jit_paren_scalar (jit_matrix *mat, double *indicies, | |
257 octave_idx_type idx_count) | |
258 { | |
259 // FIXME: Replace this with a more optimal version | |
260 try | |
261 { | |
15068
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
262 Array<idx_vector> idx; |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
263 make_indices (indicies, idx_count, idx); |
15067 | 264 |
265 Array<double> ret = mat->array->index (idx); | |
266 return ret.xelem (0); | |
267 } | |
268 catch (const octave_execution_exception&) | |
269 { | |
270 gripe_library_execution_error (); | |
271 return 0; | |
272 } | |
273 } | |
274 | |
15016 | 275 extern "C" void |
15068
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
276 octave_jit_paren_scalar_subsasgn (jit_matrix *ret, jit_matrix *mat, |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
277 double *indices, octave_idx_type idx_count, |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
278 double value) |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
279 { |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
280 // FIXME: Replace this with a more optimal version |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
281 try |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
282 { |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
283 Array<idx_vector> idx; |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
284 make_indices (indices, idx_count, idx); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
285 |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
286 Matrix temp (1, 1); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
287 temp.xelem(0) = value; |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
288 mat->array->assign (idx, temp); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
289 ret->update (mat->array); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
290 } |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
291 catch (const octave_execution_exception&) |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
292 { |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
293 gripe_library_execution_error (); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
294 } |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
295 } |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
296 |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
297 extern "C" void |
15016 | 298 octave_jit_paren_subsasgn_matrix_range (jit_matrix *result, jit_matrix *mat, |
299 jit_range *index, double value) | |
300 { | |
301 NDArray *array = mat->array; | |
302 bool done = false; | |
303 | |
304 // optimize for the simple case (no resizing and no errors) | |
305 if (*array->jit_ref_count () == 1 | |
306 && index->all_elements_are_ints ()) | |
307 { | |
308 // this code is similar to idx_vector::fill, but we avoid allocating an | |
309 // idx_vector and its associated rep | |
310 octave_idx_type start = static_cast<octave_idx_type> (index->base) - 1; | |
311 octave_idx_type step = static_cast<octave_idx_type> (index->inc); | |
312 octave_idx_type nelem = index->nelem; | |
313 octave_idx_type final = start + nelem * step; | |
314 if (step < 0) | |
315 { | |
316 step = -step; | |
317 std::swap (final, start); | |
318 } | |
319 | |
320 if (start >= 0 && final < mat->slice_len) | |
321 { | |
322 done = true; | |
323 | |
324 double *data = array->jit_slice_data (); | |
325 if (step == 1) | |
326 std::fill (data + start, data + start + nelem, value); | |
327 else | |
328 { | |
329 for (octave_idx_type i = start; i < final; i += step) | |
330 data[i] = value; | |
331 } | |
332 } | |
333 } | |
334 | |
335 if (! done) | |
336 { | |
337 idx_vector idx (*index); | |
338 NDArray avalue (dim_vector (1, 1)); | |
339 avalue.xelem (0) = value; | |
340 array->assign (idx, avalue); | |
341 } | |
342 | |
343 result->update (array); | |
344 } | |
345 | |
346 extern "C" Complex | |
347 octave_jit_complex_div (Complex lhs, Complex rhs) | |
348 { | |
349 // see src/OPERATORS/op-cs-cs.cc | |
350 if (rhs == 0.0) | |
351 gripe_divide_by_zero (); | |
352 | |
353 return lhs / rhs; | |
354 } | |
355 | |
356 // FIXME: CP from src/xpow.cc | |
357 static inline int | |
358 xisint (double x) | |
359 { | |
360 return (D_NINT (x) == x | |
361 && ((x >= 0 && x < INT_MAX) | |
362 || (x <= 0 && x > INT_MIN))); | |
363 } | |
364 | |
365 extern "C" Complex | |
366 octave_jit_pow_scalar_scalar (double lhs, double rhs) | |
367 { | |
368 // FIXME: almost CP from src/xpow.cc | |
369 if (lhs < 0.0 && ! xisint (rhs)) | |
370 return std::pow (Complex (lhs), rhs); | |
371 return std::pow (lhs, rhs); | |
372 } | |
373 | |
374 extern "C" Complex | |
375 octave_jit_pow_complex_complex (Complex lhs, Complex rhs) | |
376 { | |
377 if (lhs.imag () == 0 && rhs.imag () == 0) | |
378 return octave_jit_pow_scalar_scalar (lhs.real (), rhs.real ()); | |
379 return std::pow (lhs, rhs); | |
380 } | |
381 | |
382 extern "C" Complex | |
383 octave_jit_pow_complex_scalar (Complex lhs, double rhs) | |
384 { | |
385 if (lhs.imag () == 0) | |
386 return octave_jit_pow_scalar_scalar (lhs.real (), rhs); | |
387 return std::pow (lhs, rhs); | |
388 } | |
389 | |
390 extern "C" Complex | |
391 octave_jit_pow_scalar_complex (double lhs, Complex rhs) | |
392 { | |
393 if (rhs.imag () == 0) | |
394 return octave_jit_pow_scalar_scalar (lhs, rhs.real ()); | |
395 return std::pow (lhs, rhs); | |
396 } | |
397 | |
398 extern "C" void | |
399 octave_jit_print_matrix (jit_matrix *m) | |
400 { | |
401 std::cout << *m << std::endl; | |
402 } | |
403 | |
404 static void | |
405 gripe_bad_result (void) | |
406 { | |
407 error ("incorrect type information given to the JIT compiler"); | |
408 } | |
409 | |
410 // FIXME: Add support for multiple outputs | |
411 extern "C" octave_base_value * | |
412 octave_jit_call (octave_builtin::fcn fn, size_t nargin, | |
413 octave_base_value **argin, jit_type *result_type) | |
414 { | |
415 octave_value_list ovl (nargin); | |
416 for (size_t i = 0; i < nargin; ++i) | |
417 ovl.xelem (i) = octave_value (argin[i]); | |
418 | |
419 ovl = fn (ovl, 1); | |
420 | |
421 // These type checks are not strictly required, but I'm guessing that | |
422 // incorrect types will be entered on occasion. This will be very difficult to | |
423 // debug unless we do the sanity check here. | |
424 if (result_type) | |
425 { | |
426 if (ovl.length () != 1) | |
427 { | |
428 gripe_bad_result (); | |
429 return 0; | |
430 } | |
431 | |
432 octave_value& result = ovl.xelem (0); | |
433 jit_type *jtype = jit_typeinfo::join (jit_typeinfo::type_of (result), | |
434 result_type); | |
435 if (jtype != result_type) | |
436 { | |
437 gripe_bad_result (); | |
438 return 0; | |
439 } | |
440 | |
441 octave_base_value *ret = result.internal_rep (); | |
442 ret->grab (); | |
443 return ret; | |
444 } | |
445 | |
446 if (! (ovl.length () == 0 | |
447 || (ovl.length () == 1 && ovl.xelem (0).is_undefined ()))) | |
448 gripe_bad_result (); | |
449 | |
450 return 0; | |
451 } | |
452 | |
453 // -------------------- jit_range -------------------- | |
454 bool | |
455 jit_range::all_elements_are_ints () const | |
456 { | |
457 Range r (*this); | |
458 return r.all_elements_are_ints (); | |
459 } | |
460 | |
461 std::ostream& | |
462 operator<< (std::ostream& os, const jit_range& rng) | |
463 { | |
464 return os << "Range[" << rng.base << ", " << rng.limit << ", " << rng.inc | |
465 << ", " << rng.nelem << "]"; | |
466 } | |
467 | |
468 // -------------------- jit_matrix -------------------- | |
469 | |
470 std::ostream& | |
471 operator<< (std::ostream& os, const jit_matrix& mat) | |
472 { | |
473 return os << "Matrix[" << mat.ref_count << ", " << mat.slice_data << ", " | |
474 << mat.slice_len << ", " << mat.dimensions << ", " | |
475 << mat.array << "]"; | |
476 } | |
477 | |
478 // -------------------- jit_type -------------------- | |
479 jit_type::jit_type (const std::string& aname, jit_type *aparent, | |
480 llvm::Type *allvm_type, int aid) : | |
481 mname (aname), mparent (aparent), llvm_type (allvm_type), mid (aid), | |
482 mdepth (aparent ? aparent->mdepth + 1 : 0) | |
483 { | |
484 std::memset (msret, 0, sizeof (msret)); | |
485 std::memset (mpointer_arg, 0, sizeof (mpointer_arg)); | |
486 std::memset (mpack, 0, sizeof (mpack)); | |
487 std::memset (munpack, 0, sizeof (munpack)); | |
488 | |
489 for (size_t i = 0; i < jit_convention::length; ++i) | |
490 mpacked_type[i] = llvm_type; | |
491 } | |
492 | |
493 llvm::Type * | |
494 jit_type::to_llvm_arg (void) const | |
495 { | |
496 return llvm_type ? llvm_type->getPointerTo () : 0; | |
497 } | |
498 | |
499 // -------------------- jit_function -------------------- | |
500 jit_function::jit_function () : module (0), llvm_function (0), mresult (0), | |
501 call_conv (jit_convention::length), | |
502 mcan_error (false) | |
503 {} | |
504 | |
505 jit_function::jit_function (llvm::Module *amodule, | |
506 jit_convention::type acall_conv, | |
507 const llvm::Twine& aname, jit_type *aresult, | |
508 const std::vector<jit_type *>& aargs) | |
509 : module (amodule), mresult (aresult), args (aargs), call_conv (acall_conv), | |
510 mcan_error (false) | |
511 { | |
512 llvm::SmallVector<llvm::Type *, 15> llvm_args; | |
513 | |
514 llvm::Type *rtype = llvm::Type::getVoidTy (context); | |
515 if (mresult) | |
516 { | |
517 rtype = mresult->packed_type (call_conv); | |
518 if (sret ()) | |
519 { | |
520 llvm_args.push_back (rtype->getPointerTo ()); | |
521 rtype = llvm::Type::getVoidTy (context); | |
522 } | |
523 } | |
524 | |
525 for (std::vector<jit_type *>::const_iterator iter = args.begin (); | |
526 iter != args.end (); ++iter) | |
527 { | |
528 jit_type *ty = *iter; | |
529 assert (ty); | |
530 llvm::Type *argty = ty->packed_type (call_conv); | |
531 if (ty->pointer_arg (call_conv)) | |
532 argty = argty->getPointerTo (); | |
533 | |
534 llvm_args.push_back (argty); | |
535 } | |
536 | |
537 // we mark all functinos as external linkage because this prevents llvm | |
538 // from getting rid of always inline functions | |
539 llvm::FunctionType *ft = llvm::FunctionType::get (rtype, llvm_args, false); | |
540 llvm_function = llvm::Function::Create (ft, llvm::Function::ExternalLinkage, | |
541 aname, module); | |
542 if (call_conv == jit_convention::internal) | |
543 llvm_function->addFnAttr (llvm::Attribute::AlwaysInline); | |
544 } | |
545 | |
546 jit_function::jit_function (const jit_function& fn, jit_type *aresult, | |
547 const std::vector<jit_type *>& aargs) | |
548 : module (fn.module), llvm_function (fn.llvm_function), mresult (aresult), | |
549 args (aargs), call_conv (fn.call_conv), mcan_error (fn.mcan_error) | |
550 { | |
551 } | |
552 | |
553 jit_function::jit_function (const jit_function& fn) | |
554 : module (fn.module), llvm_function (fn.llvm_function), mresult (fn.mresult), | |
555 args (fn.args), call_conv (fn.call_conv), mcan_error (fn.mcan_error) | |
556 {} | |
557 | |
558 std::string | |
559 jit_function::name (void) const | |
560 { | |
561 return llvm_function->getName (); | |
562 } | |
563 | |
564 llvm::BasicBlock * | |
565 jit_function::new_block (const std::string& aname, | |
566 llvm::BasicBlock *insert_before) | |
567 { | |
568 return llvm::BasicBlock::Create (context, aname, llvm_function, | |
569 insert_before); | |
570 } | |
571 | |
572 llvm::Value * | |
573 jit_function::call (llvm::IRBuilderD& builder, | |
574 const std::vector<jit_value *>& in_args) const | |
575 { | |
15056
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
576 if (! valid ()) |
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
577 throw jit_fail_exception ("Call not implemented"); |
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
578 |
15016 | 579 assert (in_args.size () == args.size ()); |
580 std::vector<llvm::Value *> llvm_args (args.size ()); | |
581 for (size_t i = 0; i < in_args.size (); ++i) | |
582 llvm_args[i] = in_args[i]->to_llvm (); | |
583 | |
584 return call (builder, llvm_args); | |
585 } | |
586 | |
587 llvm::Value * | |
588 jit_function::call (llvm::IRBuilderD& builder, | |
589 const std::vector<llvm::Value *>& in_args) const | |
590 { | |
15056
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
591 if (! valid ()) |
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
592 throw jit_fail_exception ("Call not implemented"); |
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
593 |
15016 | 594 assert (in_args.size () == args.size ()); |
595 llvm::Function *stacksave | |
596 = llvm::Intrinsic::getDeclaration (module, llvm::Intrinsic::stacksave); | |
597 llvm::SmallVector<llvm::Value *, 10> llvm_args; | |
598 llvm_args.reserve (in_args.size () + sret ()); | |
599 | |
600 llvm::Value *sret_mem = 0; | |
601 llvm::Value *saved_stack = 0; | |
602 if (sret ()) | |
603 { | |
604 saved_stack = builder.CreateCall (stacksave); | |
605 sret_mem = builder.CreateAlloca (mresult->packed_type (call_conv)); | |
606 llvm_args.push_back (sret_mem); | |
607 } | |
608 | |
609 for (size_t i = 0; i < in_args.size (); ++i) | |
610 { | |
611 llvm::Value *arg = in_args[i]; | |
612 jit_type::convert_fn convert = args[i]->pack (call_conv); | |
613 if (convert) | |
614 arg = convert (builder, arg); | |
615 | |
616 if (args[i]->pointer_arg (call_conv)) | |
617 { | |
618 if (! saved_stack) | |
619 saved_stack = builder.CreateCall (stacksave); | |
620 | |
621 arg = builder.CreateAlloca (args[i]->to_llvm ()); | |
622 builder.CreateStore (in_args[i], arg); | |
623 } | |
624 | |
625 llvm_args.push_back (arg); | |
626 } | |
627 | |
628 llvm::Value *ret = builder.CreateCall (llvm_function, llvm_args); | |
629 if (sret_mem) | |
630 ret = builder.CreateLoad (sret_mem); | |
631 | |
632 if (mresult) | |
633 { | |
634 jit_type::convert_fn unpack = mresult->unpack (call_conv); | |
635 if (unpack) | |
636 ret = unpack (builder, ret); | |
637 } | |
638 | |
639 if (saved_stack) | |
640 { | |
641 llvm::Function *stackrestore | |
642 = llvm::Intrinsic::getDeclaration (module, | |
643 llvm::Intrinsic::stackrestore); | |
644 builder.CreateCall (stackrestore, saved_stack); | |
645 } | |
646 | |
647 return ret; | |
648 } | |
649 | |
650 llvm::Value * | |
651 jit_function::argument (llvm::IRBuilderD& builder, size_t idx) const | |
652 { | |
653 assert (idx < args.size ()); | |
654 | |
655 // FIXME: We should be treating arguments like a list, not a vector. Shouldn't | |
656 // matter much for now, as the number of arguments shouldn't be much bigger | |
657 // than 4 | |
658 llvm::Function::arg_iterator iter = llvm_function->arg_begin (); | |
659 if (sret ()) | |
660 ++iter; | |
661 | |
662 for (size_t i = 0; i < idx; ++i, ++iter); | |
663 | |
664 if (args[idx]->pointer_arg (call_conv)) | |
665 return builder.CreateLoad (iter); | |
666 | |
667 return iter; | |
668 } | |
669 | |
670 void | |
671 jit_function::do_return (llvm::IRBuilderD& builder, llvm::Value *rval) | |
672 { | |
673 assert (! rval == ! mresult); | |
674 | |
675 if (rval) | |
676 { | |
677 jit_type::convert_fn convert = mresult->pack (call_conv); | |
678 if (convert) | |
679 rval = convert (builder, rval); | |
680 | |
681 if (sret ()) | |
682 builder.CreateStore (rval, llvm_function->arg_begin ()); | |
683 else | |
684 builder.CreateRet (rval); | |
685 } | |
686 else | |
687 builder.CreateRetVoid (); | |
688 | |
689 llvm::verifyFunction (*llvm_function); | |
690 } | |
691 | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
692 void |
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
693 jit_function::do_add_mapping (llvm::ExecutionEngine *engine, void *fn) |
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
694 { |
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
695 assert (valid ()); |
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
696 engine->addGlobalMapping (llvm_function, fn); |
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
697 } |
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
698 |
15016 | 699 std::ostream& |
700 operator<< (std::ostream& os, const jit_function& fn) | |
701 { | |
702 llvm::Function *lfn = fn.to_llvm (); | |
703 os << "jit_function: cc=" << fn.call_conv; | |
704 llvm::raw_os_ostream llvm_out (os); | |
705 lfn->print (llvm_out); | |
706 llvm_out.flush (); | |
707 return os; | |
708 } | |
709 | |
710 // -------------------- jit_operation -------------------- | |
711 void | |
712 jit_operation::add_overload (const jit_function& func, | |
713 const std::vector<jit_type*>& args) | |
714 { | |
715 if (args.size () >= overloads.size ()) | |
716 overloads.resize (args.size () + 1); | |
717 | |
718 Array<jit_function>& over = overloads[args.size ()]; | |
719 dim_vector dv (over.dims ()); | |
720 Array<octave_idx_type> idx = to_idx (args); | |
721 bool must_resize = false; | |
722 | |
723 if (dv.length () != idx.numel ()) | |
724 { | |
725 dv.resize (idx.numel ()); | |
726 must_resize = true; | |
727 } | |
728 | |
729 for (octave_idx_type i = 0; i < dv.length (); ++i) | |
730 if (dv(i) <= idx(i)) | |
731 { | |
732 must_resize = true; | |
733 dv(i) = idx(i) + 1; | |
734 } | |
735 | |
736 if (must_resize) | |
737 over.resize (dv); | |
738 | |
739 over(idx) = func; | |
740 } | |
741 | |
742 const jit_function& | |
743 jit_operation::overload (const std::vector<jit_type*>& types) const | |
744 { | |
745 // FIXME: We should search for the next best overload on failure | |
746 static jit_function null_overload; | |
747 if (types.size () >= overloads.size ()) | |
748 return null_overload; | |
749 | |
750 for (size_t i =0; i < types.size (); ++i) | |
751 if (! types[i]) | |
752 return null_overload; | |
753 | |
754 const Array<jit_function>& over = overloads[types.size ()]; | |
755 dim_vector dv (over.dims ()); | |
756 Array<octave_idx_type> idx = to_idx (types); | |
757 for (octave_idx_type i = 0; i < dv.length (); ++i) | |
758 if (idx(i) >= dv(i)) | |
759 return null_overload; | |
760 | |
761 return over(idx); | |
762 } | |
763 | |
764 Array<octave_idx_type> | |
765 jit_operation::to_idx (const std::vector<jit_type*>& types) const | |
766 { | |
767 octave_idx_type numel = types.size (); | |
768 if (numel == 1) | |
769 numel = 2; | |
770 | |
771 Array<octave_idx_type> idx (dim_vector (1, numel)); | |
772 for (octave_idx_type i = 0; i < static_cast<octave_idx_type> (types.size ()); | |
773 ++i) | |
774 idx(i) = types[i]->type_id (); | |
775 | |
776 if (types.size () == 1) | |
777 { | |
778 idx(1) = idx(0); | |
779 idx(0) = 0; | |
780 } | |
781 | |
782 return idx; | |
783 } | |
784 | |
785 // -------------------- jit_typeinfo -------------------- | |
786 void | |
787 jit_typeinfo::initialize (llvm::Module *m, llvm::ExecutionEngine *e) | |
788 { | |
789 new jit_typeinfo (m, e); | |
790 } | |
791 | |
792 jit_typeinfo::jit_typeinfo (llvm::Module *m, llvm::ExecutionEngine *e) | |
793 : module (m), engine (e), next_id (0), | |
794 builder (*new llvm::IRBuilderD (context)) | |
795 { | |
796 instance = this; | |
797 | |
798 // FIXME: We should be registering types like in octave_value_typeinfo | |
799 llvm::Type *any_t = llvm::StructType::create (context, "octave_base_value"); | |
800 any_t = any_t->getPointerTo (); | |
801 | |
802 llvm::Type *scalar_t = llvm::Type::getDoubleTy (context); | |
803 llvm::Type *bool_t = llvm::Type::getInt1Ty (context); | |
804 llvm::Type *string_t = llvm::Type::getInt8Ty (context); | |
805 string_t = string_t->getPointerTo (); | |
806 llvm::Type *index_t = llvm::Type::getIntNTy (context, | |
807 sizeof(octave_idx_type) * 8); | |
808 | |
809 llvm::StructType *range_t = llvm::StructType::create (context, "range"); | |
810 std::vector<llvm::Type *> range_contents (4, scalar_t); | |
811 range_contents[3] = index_t; | |
812 range_t->setBody (range_contents); | |
813 | |
814 llvm::Type *refcount_t = llvm::Type::getIntNTy (context, sizeof(int) * 8); | |
815 | |
816 llvm::StructType *matrix_t = llvm::StructType::create (context, "matrix"); | |
817 llvm::Type *matrix_contents[5]; | |
818 matrix_contents[0] = refcount_t->getPointerTo (); | |
819 matrix_contents[1] = scalar_t->getPointerTo (); | |
820 matrix_contents[2] = index_t; | |
821 matrix_contents[3] = index_t->getPointerTo (); | |
822 matrix_contents[4] = string_t; | |
823 matrix_t->setBody (llvm::makeArrayRef (matrix_contents, 5)); | |
824 | |
825 llvm::Type *complex_t = llvm::VectorType::get (scalar_t, 2); | |
826 | |
827 // complex_ret is what is passed to C functions in order to get calling | |
828 // convention right | |
829 complex_ret = llvm::StructType::create (context, "complex_ret"); | |
830 llvm::Type *complex_ret_contents[] = {scalar_t, scalar_t}; | |
831 complex_ret->setBody (complex_ret_contents); | |
832 | |
833 // create types | |
834 any = new_type ("any", 0, any_t); | |
835 matrix = new_type ("matrix", any, matrix_t); | |
836 complex = new_type ("complex", any, complex_t); | |
837 scalar = new_type ("scalar", complex, scalar_t); | |
838 range = new_type ("range", any, range_t); | |
839 string = new_type ("string", any, string_t); | |
840 boolean = new_type ("bool", any, bool_t); | |
841 index = new_type ("index", any, index_t); | |
842 | |
15067 | 843 // a fake type for interfacing with C++ |
844 jit_type *scalar_ptr = new_type ("scalar_ptr", 0, scalar_t->getPointerTo ()); | |
845 | |
15016 | 846 create_int (8); |
847 create_int (16); | |
848 create_int (32); | |
849 create_int (64); | |
850 | |
851 casts.resize (next_id + 1); | |
852 identities.resize (next_id + 1); | |
853 | |
854 // specify calling conventions | |
855 // FIXME: We should detect architecture and do something sane based on that | |
856 // here we assume x86 or x86_64 | |
857 matrix->mark_sret (); | |
858 matrix->mark_pointer_arg (); | |
859 | |
860 range->mark_sret (); | |
861 range->mark_pointer_arg (); | |
862 | |
863 complex->set_pack (jit_convention::external, &jit_typeinfo::pack_complex); | |
864 complex->set_unpack (jit_convention::external, &jit_typeinfo::unpack_complex); | |
865 complex->set_packed_type (jit_convention::external, complex_ret); | |
866 | |
867 if (sizeof (void *) == 4) | |
868 complex->mark_sret (); | |
869 | |
870 // bind global variables | |
871 lerror_state = new llvm::GlobalVariable (*module, bool_t, false, | |
872 llvm::GlobalValue::ExternalLinkage, | |
873 0, "error_state"); | |
874 engine->addGlobalMapping (lerror_state, | |
875 reinterpret_cast<void *> (&error_state)); | |
876 | |
877 // any with anything is an any op | |
878 jit_function fn; | |
879 jit_type *binary_op_type = intN (sizeof (octave_value::binary_op) * 8); | |
880 llvm::Type *llvm_bo_type = binary_op_type->to_llvm (); | |
881 jit_function any_binary = create_function (jit_convention::external, | |
882 "octave_jit_binary_any_any", | |
883 any, binary_op_type, any, any); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
884 any_binary.add_mapping (engine, &octave_jit_binary_any_any); |
15016 | 885 any_binary.mark_can_error (); |
886 binary_ops.resize (octave_value::num_binary_ops); | |
887 for (size_t i = 0; i < octave_value::num_binary_ops; ++i) | |
888 { | |
889 octave_value::binary_op op = static_cast<octave_value::binary_op> (i); | |
890 std::string op_name = octave_value::binary_op_as_string (op); | |
891 binary_ops[i].stash_name ("binary" + op_name); | |
892 } | |
893 | |
894 for (int op = 0; op < octave_value::num_binary_ops; ++op) | |
895 { | |
896 llvm::Twine fn_name ("octave_jit_binary_any_any_"); | |
897 fn_name = fn_name + llvm::Twine (op); | |
898 | |
899 fn = create_function (jit_convention::internal, fn_name, any, any, any); | |
900 fn.mark_can_error (); | |
901 llvm::BasicBlock *block = fn.new_block (); | |
902 builder.SetInsertPoint (block); | |
903 llvm::APInt op_int(sizeof (octave_value::binary_op) * 8, op, | |
904 std::numeric_limits<octave_value::binary_op>::is_signed); | |
905 llvm::Value *op_as_llvm = llvm::ConstantInt::get (llvm_bo_type, op_int); | |
906 llvm::Value *ret = any_binary.call (builder, op_as_llvm, | |
907 fn.argument (builder, 0), | |
908 fn.argument (builder, 1)); | |
909 fn.do_return (builder, ret); | |
910 binary_ops[op].add_overload (fn); | |
911 } | |
912 | |
913 // grab any | |
914 fn = create_function (jit_convention::external, "octave_jit_grab_any", any, | |
915 any); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
916 fn.add_mapping (engine, &octave_jit_grab_any); |
15016 | 917 grab_fn.add_overload (fn); |
918 grab_fn.stash_name ("grab"); | |
919 | |
920 // grab matrix | |
921 fn = create_function (jit_convention::external, "octave_jit_grab_matrix", | |
922 matrix, matrix); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
923 fn.add_mapping (engine, &octave_jit_grab_matrix); |
15016 | 924 grab_fn.add_overload (fn); |
925 | |
926 // release any | |
927 fn = create_function (jit_convention::external, "octave_jit_release_any", 0, | |
928 any); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
929 fn.add_mapping (engine, &octave_jit_release_any); |
15016 | 930 release_fn.add_overload (fn); |
931 release_fn.stash_name ("release"); | |
932 | |
933 // release matrix | |
934 fn = create_function (jit_convention::external, "octave_jit_release_matrix", | |
935 0, matrix); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
936 fn.add_mapping (engine, &octave_jit_release_matrix); |
15016 | 937 release_fn.add_overload (fn); |
938 | |
939 // release scalar | |
940 fn = create_identity (scalar); | |
941 release_fn.add_overload (fn); | |
942 | |
943 // release complex | |
944 fn = create_identity (complex); | |
945 release_fn.add_overload (fn); | |
946 | |
947 // release index | |
948 fn = create_identity (index); | |
949 release_fn.add_overload (fn); | |
950 | |
951 // now for binary scalar operations | |
952 // FIXME: Finish all operations | |
953 add_binary_op (scalar, octave_value::op_add, llvm::Instruction::FAdd); | |
954 add_binary_op (scalar, octave_value::op_sub, llvm::Instruction::FSub); | |
955 add_binary_op (scalar, octave_value::op_mul, llvm::Instruction::FMul); | |
956 add_binary_op (scalar, octave_value::op_el_mul, llvm::Instruction::FMul); | |
957 | |
958 add_binary_fcmp (scalar, octave_value::op_lt, llvm::CmpInst::FCMP_ULT); | |
959 add_binary_fcmp (scalar, octave_value::op_le, llvm::CmpInst::FCMP_ULE); | |
960 add_binary_fcmp (scalar, octave_value::op_eq, llvm::CmpInst::FCMP_UEQ); | |
961 add_binary_fcmp (scalar, octave_value::op_ge, llvm::CmpInst::FCMP_UGE); | |
962 add_binary_fcmp (scalar, octave_value::op_gt, llvm::CmpInst::FCMP_UGT); | |
963 add_binary_fcmp (scalar, octave_value::op_ne, llvm::CmpInst::FCMP_UNE); | |
964 | |
965 jit_function gripe_div0 = create_function (jit_convention::external, | |
966 "gripe_divide_by_zero", 0); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
967 gripe_div0.add_mapping (engine, &gripe_divide_by_zero); |
15016 | 968 gripe_div0.mark_can_error (); |
969 | |
970 // divide is annoying because it might error | |
971 fn = create_function (jit_convention::internal, | |
972 "octave_jit_div_scalar_scalar", scalar, scalar, scalar); | |
973 fn.mark_can_error (); | |
974 | |
975 llvm::BasicBlock *body = fn.new_block (); | |
976 builder.SetInsertPoint (body); | |
977 { | |
978 llvm::BasicBlock *warn_block = fn.new_block ("warn"); | |
979 llvm::BasicBlock *normal_block = fn.new_block ("normal"); | |
980 | |
981 llvm::Value *zero = llvm::ConstantFP::get (scalar_t, 0); | |
982 llvm::Value *check = builder.CreateFCmpUEQ (zero, fn.argument (builder, 0)); | |
983 builder.CreateCondBr (check, warn_block, normal_block); | |
984 | |
985 builder.SetInsertPoint (warn_block); | |
986 gripe_div0.call (builder); | |
987 builder.CreateBr (normal_block); | |
988 | |
989 builder.SetInsertPoint (normal_block); | |
990 llvm::Value *ret = builder.CreateFDiv (fn.argument (builder, 0), | |
991 fn.argument (builder, 1)); | |
992 fn.do_return (builder, ret); | |
993 } | |
994 binary_ops[octave_value::op_div].add_overload (fn); | |
995 binary_ops[octave_value::op_el_div].add_overload (fn); | |
996 | |
997 // ldiv is the same as div with the operators reversed | |
998 fn = mirror_binary (fn); | |
999 binary_ops[octave_value::op_ldiv].add_overload (fn); | |
1000 binary_ops[octave_value::op_el_ldiv].add_overload (fn); | |
1001 | |
1002 // In general, the result of scalar ^ scalar is a complex number. We might be | |
1003 // able to improve on this if we keep track of the range of values variables | |
1004 // can take on. | |
1005 fn = create_function (jit_convention::external, | |
1006 "octave_jit_pow_scalar_scalar", complex, scalar, | |
1007 scalar); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1008 fn.add_mapping (engine, &octave_jit_pow_scalar_scalar); |
15016 | 1009 binary_ops[octave_value::op_pow].add_overload (fn); |
1010 binary_ops[octave_value::op_el_pow].add_overload (fn); | |
1011 | |
1012 // now for binary complex operations | |
1013 add_binary_op (complex, octave_value::op_add, llvm::Instruction::FAdd); | |
1014 add_binary_op (complex, octave_value::op_sub, llvm::Instruction::FSub); | |
1015 | |
1016 fn = create_function (jit_convention::internal, | |
1017 "octave_jit_*_complex_complex", complex, complex, | |
1018 complex); | |
1019 body = fn.new_block (); | |
1020 builder.SetInsertPoint (body); | |
1021 { | |
1022 // (x0*x1 - y0*y1, x0*y1 + y0*x1) = (x0,y0) * (x1,y1) | |
1023 // We compute this in one vectorized multiplication, a subtraction, and an | |
1024 // addition. | |
1025 llvm::Value *lhs = fn.argument (builder, 0); | |
1026 llvm::Value *rhs = fn.argument (builder, 1); | |
1027 | |
1028 // FIXME: We need a better way of doing this, working with llvm's IR | |
1029 // directly is sort of a pain. | |
1030 llvm::Value *zero = builder.getInt32 (0); | |
1031 llvm::Value *one = builder.getInt32 (1); | |
1032 llvm::Value *two = builder.getInt32 (2); | |
1033 llvm::Value *three = builder.getInt32 (3); | |
1034 | |
1035 llvm::Type *vec4 = llvm::VectorType::get (scalar_t, 4); | |
1036 llvm::Value *mlhs = llvm::UndefValue::get (vec4); | |
1037 llvm::Value *mrhs = mlhs; | |
1038 | |
1039 llvm::Value *temp = complex_real (lhs); | |
1040 mlhs = builder.CreateInsertElement (mlhs, temp, zero); | |
1041 mlhs = builder.CreateInsertElement (mlhs, temp, two); | |
1042 temp = complex_imag (lhs); | |
1043 mlhs = builder.CreateInsertElement (mlhs, temp, one); | |
1044 mlhs = builder.CreateInsertElement (mlhs, temp, three); | |
1045 | |
1046 temp = complex_real (rhs); | |
1047 mrhs = builder.CreateInsertElement (mrhs, temp, zero); | |
1048 mrhs = builder.CreateInsertElement (mrhs, temp, three); | |
1049 temp = complex_imag (rhs); | |
1050 mrhs = builder.CreateInsertElement (mrhs, temp, one); | |
1051 mrhs = builder.CreateInsertElement (mrhs, temp, two); | |
1052 | |
1053 llvm::Value *mres = builder.CreateFMul (mlhs, mrhs); | |
1054 llvm::Value *tlhs = builder.CreateExtractElement (mres, zero); | |
1055 llvm::Value *trhs = builder.CreateExtractElement (mres, one); | |
1056 llvm::Value *ret_real = builder.CreateFSub (tlhs, trhs); | |
1057 | |
1058 tlhs = builder.CreateExtractElement (mres, two); | |
1059 trhs = builder.CreateExtractElement (mres, three); | |
1060 llvm::Value *ret_imag = builder.CreateFAdd (tlhs, trhs); | |
1061 fn.do_return (builder, complex_new (ret_real, ret_imag)); | |
1062 } | |
1063 | |
1064 binary_ops[octave_value::op_mul].add_overload (fn); | |
1065 binary_ops[octave_value::op_el_mul].add_overload (fn); | |
1066 | |
1067 jit_function complex_div = create_function (jit_convention::external, | |
1068 "octave_jit_complex_div", | |
1069 complex, complex, complex); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1070 complex_div.add_mapping (engine, &octave_jit_complex_div); |
15016 | 1071 complex_div.mark_can_error (); |
1072 binary_ops[octave_value::op_div].add_overload (fn); | |
1073 binary_ops[octave_value::op_ldiv].add_overload (fn); | |
1074 | |
1075 fn = mirror_binary (complex_div); | |
1076 binary_ops[octave_value::op_ldiv].add_overload (fn); | |
1077 binary_ops[octave_value::op_el_ldiv].add_overload (fn); | |
1078 | |
1079 fn = create_function (jit_convention::external, | |
1080 "octave_jit_pow_complex_complex", complex, complex, | |
1081 complex); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1082 fn.add_mapping (engine, &octave_jit_pow_complex_complex); |
15016 | 1083 binary_ops[octave_value::op_pow].add_overload (fn); |
1084 binary_ops[octave_value::op_el_pow].add_overload (fn); | |
1085 | |
1086 fn = create_function (jit_convention::internal, | |
1087 "octave_jit_*_scalar_complex", complex, scalar, | |
1088 complex); | |
1089 jit_function mul_scalar_complex = fn; | |
1090 body = fn.new_block (); | |
1091 builder.SetInsertPoint (body); | |
1092 { | |
1093 llvm::Value *lhs = fn.argument (builder, 0); | |
1094 llvm::Value *tlhs = complex_new (lhs, lhs); | |
1095 llvm::Value *rhs = fn.argument (builder, 1); | |
1096 fn.do_return (builder, builder.CreateFMul (tlhs, rhs)); | |
1097 } | |
1098 binary_ops[octave_value::op_mul].add_overload (fn); | |
1099 binary_ops[octave_value::op_el_mul].add_overload (fn); | |
1100 | |
1101 | |
1102 fn = mirror_binary (mul_scalar_complex); | |
1103 binary_ops[octave_value::op_mul].add_overload (fn); | |
1104 binary_ops[octave_value::op_el_mul].add_overload (fn); | |
1105 | |
1106 fn = create_function (jit_convention::internal, "octave_jit_+_scalar_complex", | |
1107 complex, scalar, complex); | |
1108 body = fn.new_block (); | |
1109 builder.SetInsertPoint (body); | |
1110 { | |
1111 llvm::Value *lhs = fn.argument (builder, 0); | |
1112 llvm::Value *rhs = fn.argument (builder, 1); | |
1113 llvm::Value *real = builder.CreateFAdd (lhs, complex_real (rhs)); | |
1114 fn.do_return (builder, complex_real (rhs, real)); | |
1115 } | |
1116 binary_ops[octave_value::op_add].add_overload (fn); | |
1117 | |
1118 fn = mirror_binary (fn); | |
1119 binary_ops[octave_value::op_add].add_overload (fn); | |
1120 | |
1121 fn = create_function (jit_convention::internal, "octave_jit_-_complex_scalar", | |
1122 complex, complex, scalar); | |
1123 body = fn.new_block (); | |
1124 builder.SetInsertPoint (body); | |
1125 { | |
1126 llvm::Value *lhs = fn.argument (builder, 0); | |
1127 llvm::Value *rhs = fn.argument (builder, 1); | |
1128 llvm::Value *real = builder.CreateFSub (complex_real (lhs), rhs); | |
1129 fn.do_return (builder, complex_real (lhs, real)); | |
1130 } | |
1131 binary_ops[octave_value::op_sub].add_overload (fn); | |
1132 | |
1133 fn = create_function (jit_convention::internal, "octave_jit_-_scalar_complex", | |
1134 complex, scalar, complex); | |
1135 body = fn.new_block (); | |
1136 builder.SetInsertPoint (body); | |
1137 { | |
1138 llvm::Value *lhs = fn.argument (builder, 0); | |
1139 llvm::Value *rhs = fn.argument (builder, 1); | |
1140 llvm::Value *real = builder.CreateFSub (lhs, complex_real (rhs)); | |
1141 fn.do_return (builder, complex_real (rhs, real)); | |
1142 } | |
1143 binary_ops[octave_value::op_sub].add_overload (fn); | |
1144 | |
1145 fn = create_function (jit_convention::external, | |
1146 "octave_jit_pow_scalar_complex", complex, scalar, | |
1147 complex); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1148 fn.add_mapping (engine, &octave_jit_pow_scalar_complex); |
15016 | 1149 binary_ops[octave_value::op_pow].add_overload (fn); |
1150 binary_ops[octave_value::op_el_pow].add_overload (fn); | |
1151 | |
1152 fn = create_function (jit_convention::external, | |
1153 "octave_jit_pow_complex_scalar", complex, complex, | |
1154 scalar); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1155 fn.add_mapping (engine, &octave_jit_pow_complex_scalar); |
15016 | 1156 binary_ops[octave_value::op_pow].add_overload (fn); |
1157 binary_ops[octave_value::op_el_pow].add_overload (fn); | |
1158 | |
1159 // now for binary index operators | |
1160 add_binary_op (index, octave_value::op_add, llvm::Instruction::Add); | |
1161 | |
1162 // and binary bool operators | |
1163 add_binary_op (boolean, octave_value::op_el_or, llvm::Instruction::Or); | |
1164 add_binary_op (boolean, octave_value::op_el_and, llvm::Instruction::And); | |
1165 | |
1166 // now for printing functions | |
1167 print_fn.stash_name ("print"); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1168 add_print (any, reinterpret_cast<void *> (&octave_jit_print_any)); |
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1169 add_print (scalar, reinterpret_cast<void *> (&octave_jit_print_scalar)); |
15016 | 1170 |
1171 // initialize for loop | |
1172 for_init_fn.stash_name ("for_init"); | |
1173 | |
1174 fn = create_function (jit_convention::internal, "octave_jit_for_range_init", | |
1175 index, range); | |
1176 body = fn.new_block (); | |
1177 builder.SetInsertPoint (body); | |
1178 { | |
1179 llvm::Value *zero = llvm::ConstantInt::get (index_t, 0); | |
1180 fn.do_return (builder, zero); | |
1181 } | |
1182 for_init_fn.add_overload (fn); | |
1183 | |
1184 // bounds check for for loop | |
1185 for_check_fn.stash_name ("for_check"); | |
1186 | |
1187 fn = create_function (jit_convention::internal, "octave_jit_for_range_check", | |
1188 boolean, range, index); | |
1189 body = fn.new_block (); | |
1190 builder.SetInsertPoint (body); | |
1191 { | |
1192 llvm::Value *nelem | |
1193 = builder.CreateExtractValue (fn.argument (builder, 0), 3); | |
1194 llvm::Value *idx = fn.argument (builder, 1); | |
1195 llvm::Value *ret = builder.CreateICmpULT (idx, nelem); | |
1196 fn.do_return (builder, ret); | |
1197 } | |
1198 for_check_fn.add_overload (fn); | |
1199 | |
1200 // index variable for for loop | |
1201 for_index_fn.stash_name ("for_index"); | |
1202 | |
1203 fn = create_function (jit_convention::internal, "octave_jit_for_range_idx", | |
1204 scalar, range, index); | |
1205 body = fn.new_block (); | |
1206 builder.SetInsertPoint (body); | |
1207 { | |
1208 llvm::Value *idx = fn.argument (builder, 1); | |
1209 llvm::Value *didx = builder.CreateSIToFP (idx, scalar_t); | |
1210 llvm::Value *rng = fn.argument (builder, 0); | |
1211 llvm::Value *base = builder.CreateExtractValue (rng, 0); | |
1212 llvm::Value *inc = builder.CreateExtractValue (rng, 2); | |
1213 | |
1214 llvm::Value *ret = builder.CreateFMul (didx, inc); | |
1215 ret = builder.CreateFAdd (base, ret); | |
1216 fn.do_return (builder, ret); | |
1217 } | |
1218 for_index_fn.add_overload (fn); | |
1219 | |
1220 // logically true | |
1221 logically_true_fn.stash_name ("logically_true"); | |
1222 | |
1223 jit_function gripe_nantl | |
1224 = create_function (jit_convention::external, | |
1225 "octave_jit_gripe_nan_to_logical_conversion", 0); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1226 gripe_nantl.add_mapping (engine, &octave_jit_gripe_nan_to_logical_conversion); |
15016 | 1227 gripe_nantl.mark_can_error (); |
1228 | |
1229 fn = create_function (jit_convention::internal, | |
1230 "octave_jit_logically_true_scalar", boolean, scalar); | |
1231 fn.mark_can_error (); | |
1232 | |
1233 body = fn.new_block (); | |
1234 builder.SetInsertPoint (body); | |
1235 { | |
1236 llvm::BasicBlock *error_block = fn.new_block ("error"); | |
1237 llvm::BasicBlock *normal_block = fn.new_block ("normal"); | |
1238 | |
1239 llvm::Value *check = builder.CreateFCmpUNE (fn.argument (builder, 0), | |
1240 fn.argument (builder, 0)); | |
1241 builder.CreateCondBr (check, error_block, normal_block); | |
1242 | |
1243 builder.SetInsertPoint (error_block); | |
1244 gripe_nantl.call (builder); | |
1245 builder.CreateBr (normal_block); | |
1246 builder.SetInsertPoint (normal_block); | |
1247 | |
1248 llvm::Value *zero = llvm::ConstantFP::get (scalar_t, 0); | |
1249 llvm::Value *ret = builder.CreateFCmpONE (fn.argument (builder, 0), zero); | |
1250 fn.do_return (builder, ret); | |
1251 } | |
1252 logically_true_fn.add_overload (fn); | |
1253 | |
1254 // logically_true boolean | |
1255 fn = create_identity (boolean); | |
1256 logically_true_fn.add_overload (fn); | |
1257 | |
1258 // make_range | |
1259 // FIXME: May be beneficial to implement all in LLVM | |
1260 make_range_fn.stash_name ("make_range"); | |
1261 jit_function compute_nelem | |
1262 = create_function (jit_convention::external, "octave_jit_compute_nelem", | |
1263 index, scalar, scalar, scalar); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1264 compute_nelem.add_mapping (engine, &octave_jit_compute_nelem); |
15016 | 1265 |
1266 fn = create_function (jit_convention::internal, "octave_jit_make_range", | |
1267 range, scalar, scalar, scalar); | |
1268 body = fn.new_block (); | |
1269 builder.SetInsertPoint (body); | |
1270 { | |
1271 llvm::Value *base = fn.argument (builder, 0); | |
1272 llvm::Value *limit = fn.argument (builder, 1); | |
1273 llvm::Value *inc = fn.argument (builder, 2); | |
1274 llvm::Value *nelem = compute_nelem.call (builder, base, limit, inc); | |
1275 | |
1276 llvm::Value *dzero = llvm::ConstantFP::get (scalar_t, 0); | |
1277 llvm::Value *izero = llvm::ConstantInt::get (index_t, 0); | |
1278 llvm::Value *rng = llvm::ConstantStruct::get (range_t, dzero, dzero, dzero, | |
1279 izero, NULL); | |
1280 rng = builder.CreateInsertValue (rng, base, 0); | |
1281 rng = builder.CreateInsertValue (rng, limit, 1); | |
1282 rng = builder.CreateInsertValue (rng, inc, 2); | |
1283 rng = builder.CreateInsertValue (rng, nelem, 3); | |
1284 fn.do_return (builder, rng); | |
1285 } | |
1286 make_range_fn.add_overload (fn); | |
1287 | |
1288 // paren_subsref | |
1289 jit_type *jit_int = intN (sizeof (int) * 8); | |
1290 llvm::Type *int_t = jit_int->to_llvm (); | |
1291 jit_function ginvalid_index | |
1292 = create_function (jit_convention::external, "octave_jit_ginvalid_index", | |
1293 0); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1294 ginvalid_index.add_mapping (engine, &octave_jit_ginvalid_index); |
15016 | 1295 jit_function gindex_range = create_function (jit_convention::external, |
1296 "octave_jit_gindex_range", | |
1297 0, jit_int, jit_int, index, | |
1298 index); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1299 gindex_range.add_mapping (engine, &octave_jit_gindex_range); |
15016 | 1300 |
1301 fn = create_function (jit_convention::internal, "()subsref", scalar, matrix, | |
1302 scalar); | |
1303 fn.mark_can_error (); | |
1304 | |
1305 body = fn.new_block (); | |
1306 builder.SetInsertPoint (body); | |
1307 { | |
1308 llvm::Value *one = llvm::ConstantInt::get (index_t, 1); | |
1309 llvm::Value *ione; | |
1310 if (index_t == int_t) | |
1311 ione = one; | |
1312 else | |
1313 ione = llvm::ConstantInt::get (int_t, 1); | |
1314 | |
1315 llvm::Value *undef = llvm::UndefValue::get (scalar_t); | |
1316 llvm::Value *mat = fn.argument (builder, 0); | |
1317 llvm::Value *idx = fn.argument (builder, 1); | |
1318 | |
1319 // convert index to scalar to integer, and check index >= 1 | |
1320 llvm::Value *int_idx = builder.CreateFPToSI (idx, index_t); | |
1321 llvm::Value *check_idx = builder.CreateSIToFP (int_idx, scalar_t); | |
1322 llvm::Value *cond0 = builder.CreateFCmpUNE (idx, check_idx); | |
1323 llvm::Value *cond1 = builder.CreateICmpSLT (int_idx, one); | |
1324 llvm::Value *cond = builder.CreateOr (cond0, cond1); | |
1325 | |
1326 llvm::BasicBlock *done = fn.new_block ("done"); | |
1327 llvm::BasicBlock *conv_error = fn.new_block ("conv_error", done); | |
1328 llvm::BasicBlock *normal = fn.new_block ("normal", done); | |
1329 builder.CreateCondBr (cond, conv_error, normal); | |
1330 | |
1331 builder.SetInsertPoint (conv_error); | |
1332 ginvalid_index.call (builder); | |
1333 builder.CreateBr (done); | |
1334 | |
1335 builder.SetInsertPoint (normal); | |
1336 llvm::Value *len = builder.CreateExtractValue (mat, | |
1337 llvm::ArrayRef<unsigned> (2)); | |
1338 cond = builder.CreateICmpSGT (int_idx, len); | |
1339 | |
1340 | |
1341 llvm::BasicBlock *bounds_error = fn.new_block ("bounds_error", done); | |
1342 llvm::BasicBlock *success = fn.new_block ("success", done); | |
1343 builder.CreateCondBr (cond, bounds_error, success); | |
1344 | |
1345 builder.SetInsertPoint (bounds_error); | |
1346 gindex_range.call (builder, ione, ione, int_idx, len); | |
1347 builder.CreateBr (done); | |
1348 | |
1349 builder.SetInsertPoint (success); | |
1350 llvm::Value *data = builder.CreateExtractValue (mat, | |
1351 llvm::ArrayRef<unsigned> (1)); | |
1352 llvm::Value *gep = builder.CreateInBoundsGEP (data, int_idx); | |
1353 llvm::Value *ret = builder.CreateLoad (gep); | |
1354 builder.CreateBr (done); | |
1355 | |
1356 builder.SetInsertPoint (done); | |
1357 | |
1358 llvm::PHINode *merge = llvm::PHINode::Create (scalar_t, 3); | |
1359 builder.Insert (merge); | |
1360 merge->addIncoming (undef, conv_error); | |
1361 merge->addIncoming (undef, bounds_error); | |
1362 merge->addIncoming (ret, success); | |
1363 fn.do_return (builder, merge); | |
1364 } | |
1365 paren_subsref_fn.add_overload (fn); | |
1366 | |
15067 | 1367 // generate () subsref for ND indexing of matrices with scalars |
1368 jit_function paren_scalar = create_function (jit_convention::external, | |
1369 "octave_jit_paren_scalar", | |
1370 scalar, matrix, scalar_ptr, | |
1371 index); | |
1372 paren_scalar.add_mapping (engine, &octave_jit_paren_scalar); | |
1373 paren_scalar.mark_can_error (); | |
1374 | |
15068
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1375 jit_function paren_scalar_subsasgn |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1376 = create_function (jit_convention::external, |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1377 "octave_jit_paren_scalar_subsasgn", matrix, matrix, |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1378 scalar_ptr, index, scalar); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1379 paren_scalar_subsasgn.add_mapping (engine, &octave_jit_paren_scalar_subsasgn); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1380 paren_scalar_subsasgn.mark_can_error (); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1381 |
15067 | 1382 // FIXME: Generate this on the fly |
1383 for (size_t i = 2; i < 10; ++i) | |
15068
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1384 { |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1385 gen_subsref (paren_scalar, i); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1386 gen_subsasgn (paren_scalar_subsasgn, i); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1387 } |
15067 | 1388 |
15016 | 1389 // paren subsasgn |
1390 paren_subsasgn_fn.stash_name ("()subsasgn"); | |
1391 | |
1392 jit_function resize_paren_subsasgn | |
1393 = create_function (jit_convention::external, | |
15027
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1394 "octave_jit_paren_subsasgn_impl", matrix, matrix, index, |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1395 scalar); |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1396 resize_paren_subsasgn.add_mapping (engine, &octave_jit_paren_subsasgn_impl); |
15016 | 1397 fn = create_function (jit_convention::internal, "octave_jit_paren_subsasgn", |
1398 matrix, matrix, scalar, scalar); | |
1399 fn.mark_can_error (); | |
1400 body = fn.new_block (); | |
1401 builder.SetInsertPoint (body); | |
1402 { | |
1403 llvm::Value *one = llvm::ConstantInt::get (index_t, 1); | |
1404 | |
1405 llvm::Value *mat = fn.argument (builder, 0); | |
1406 llvm::Value *idx = fn.argument (builder, 1); | |
1407 llvm::Value *value = fn.argument (builder, 2); | |
1408 | |
1409 llvm::Value *int_idx = builder.CreateFPToSI (idx, index_t); | |
1410 llvm::Value *check_idx = builder.CreateSIToFP (int_idx, scalar_t); | |
1411 llvm::Value *cond0 = builder.CreateFCmpUNE (idx, check_idx); | |
1412 llvm::Value *cond1 = builder.CreateICmpSLT (int_idx, one); | |
1413 llvm::Value *cond = builder.CreateOr (cond0, cond1); | |
1414 | |
1415 llvm::BasicBlock *done = fn.new_block ("done"); | |
1416 | |
1417 llvm::BasicBlock *conv_error = fn.new_block ("conv_error", done); | |
1418 llvm::BasicBlock *normal = fn.new_block ("normal", done); | |
1419 builder.CreateCondBr (cond, conv_error, normal); | |
1420 builder.SetInsertPoint (conv_error); | |
1421 ginvalid_index.call (builder); | |
1422 builder.CreateBr (done); | |
1423 | |
1424 builder.SetInsertPoint (normal); | |
15056
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
1425 llvm::Value *len = builder.CreateExtractValue (mat, 2); |
15016 | 1426 cond0 = builder.CreateICmpSGT (int_idx, len); |
1427 | |
1428 llvm::Value *rcount = builder.CreateExtractValue (mat, 0); | |
1429 rcount = builder.CreateLoad (rcount); | |
1430 cond1 = builder.CreateICmpSGT (rcount, one); | |
1431 cond = builder.CreateOr (cond0, cond1); | |
1432 | |
1433 llvm::BasicBlock *bounds_error = fn.new_block ("bounds_error", done); | |
1434 llvm::BasicBlock *success = fn.new_block ("success", done); | |
1435 builder.CreateCondBr (cond, bounds_error, success); | |
1436 | |
1437 // resize on out of bounds access | |
1438 builder.SetInsertPoint (bounds_error); | |
15027
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1439 llvm::Value *resize_result = resize_paren_subsasgn.call (builder, mat, |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1440 int_idx, value); |
15016 | 1441 builder.CreateBr (done); |
1442 | |
1443 builder.SetInsertPoint (success); | |
1444 llvm::Value *data = builder.CreateExtractValue (mat, | |
1445 llvm::ArrayRef<unsigned> (1)); | |
1446 llvm::Value *gep = builder.CreateInBoundsGEP (data, int_idx); | |
1447 builder.CreateStore (value, gep); | |
1448 builder.CreateBr (done); | |
1449 | |
1450 builder.SetInsertPoint (done); | |
1451 | |
1452 llvm::PHINode *merge = llvm::PHINode::Create (matrix_t, 3); | |
1453 builder.Insert (merge); | |
1454 merge->addIncoming (mat, conv_error); | |
1455 merge->addIncoming (resize_result, bounds_error); | |
1456 merge->addIncoming (mat, success); | |
1457 fn.do_return (builder, merge); | |
1458 } | |
1459 paren_subsasgn_fn.add_overload (fn); | |
1460 | |
1461 fn = create_function (jit_convention::external, | |
1462 "octave_jit_paren_subsasgn_matrix_range", matrix, | |
1463 matrix, range, scalar); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1464 fn.add_mapping (engine, &octave_jit_paren_subsasgn_matrix_range); |
15016 | 1465 fn.mark_can_error (); |
1466 paren_subsasgn_fn.add_overload (fn); | |
1467 | |
15056
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
1468 end_fn.stash_name ("end"); |
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
1469 fn = create_function (jit_convention::internal, "octave_jit_end_matrix", |
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
1470 scalar, matrix); |
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
1471 body = fn.new_block (); |
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
1472 builder.SetInsertPoint (body); |
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
1473 { |
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
1474 llvm::Value *mat = fn.argument (builder, 0); |
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
1475 llvm::Value *ret = builder.CreateExtractValue (mat, 2); |
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
1476 fn.do_return (builder, builder.CreateSIToFP (ret, scalar_t)); |
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
1477 } |
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
1478 end_fn.add_overload (fn); |
bc32288f4a42
Support the end keyword for one dimentional indexing in JIT.
Max Brister <max@2bass.com>
parents:
15027
diff
changeset
|
1479 |
15016 | 1480 casts[any->type_id ()].stash_name ("(any)"); |
1481 casts[scalar->type_id ()].stash_name ("(scalar)"); | |
1482 casts[complex->type_id ()].stash_name ("(complex)"); | |
1483 casts[matrix->type_id ()].stash_name ("(matrix)"); | |
15027
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1484 casts[any->type_id ()].stash_name ("(range)"); |
15016 | 1485 |
1486 // cast any <- matrix | |
1487 fn = create_function (jit_convention::external, "octave_jit_cast_any_matrix", | |
1488 any, matrix); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1489 fn.add_mapping (engine, &octave_jit_cast_any_matrix); |
15016 | 1490 casts[any->type_id ()].add_overload (fn); |
1491 | |
1492 // cast matrix <- any | |
1493 fn = create_function (jit_convention::external, "octave_jit_cast_matrix_any", | |
1494 matrix, any); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1495 fn.add_mapping (engine, &octave_jit_cast_matrix_any); |
15016 | 1496 casts[matrix->type_id ()].add_overload (fn); |
1497 | |
15027
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1498 // cast any <- range |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1499 fn = create_function (jit_convention::external, "octave_jit_cast_any_range", |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1500 any, range); |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1501 fn.add_mapping (engine, &octave_jit_cast_any_range); |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1502 casts[any->type_id ()].add_overload (fn); |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1503 |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1504 // cast range <- any |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1505 fn = create_function (jit_convention::external, "octave_jit_cast_range_any", |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1506 range, any); |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1507 fn.add_mapping (engine, &octave_jit_cast_range_any); |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1508 casts[range->type_id ()].add_overload (fn); |
741d2dbcc117
Check trip count before compiling for loops.
Max Brister <max@2bass.com>
parents:
15019
diff
changeset
|
1509 |
15016 | 1510 // cast any <- scalar |
1511 fn = create_function (jit_convention::external, "octave_jit_cast_any_scalar", | |
1512 any, scalar); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1513 fn.add_mapping (engine, &octave_jit_cast_any_scalar); |
15016 | 1514 casts[any->type_id ()].add_overload (fn); |
1515 | |
1516 // cast scalar <- any | |
1517 fn = create_function (jit_convention::external, "octave_jit_cast_scalar_any", | |
1518 scalar, any); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1519 fn.add_mapping (engine, &octave_jit_cast_scalar_any); |
15016 | 1520 casts[scalar->type_id ()].add_overload (fn); |
1521 | |
1522 // cast any <- complex | |
1523 fn = create_function (jit_convention::external, "octave_jit_cast_any_complex", | |
1524 any, complex); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1525 fn.add_mapping (engine, &octave_jit_cast_any_complex); |
15016 | 1526 casts[any->type_id ()].add_overload (fn); |
1527 | |
1528 // cast complex <- any | |
1529 fn = create_function (jit_convention::external, "octave_jit_cast_complex_any", | |
1530 complex, any); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1531 fn.add_mapping (engine, &octave_jit_cast_complex_any); |
15016 | 1532 casts[complex->type_id ()].add_overload (fn); |
1533 | |
1534 // cast complex <- scalar | |
1535 fn = create_function (jit_convention::internal, | |
1536 "octave_jit_cast_complex_scalar", complex, scalar); | |
1537 body = fn.new_block (); | |
1538 builder.SetInsertPoint (body); | |
1539 { | |
1540 llvm::Value *zero = llvm::ConstantFP::get (scalar_t, 0); | |
1541 fn.do_return (builder, complex_new (fn.argument (builder, 0), zero)); | |
1542 } | |
1543 casts[complex->type_id ()].add_overload (fn); | |
1544 | |
1545 // cast scalar <- complex | |
1546 fn = create_function (jit_convention::internal, | |
1547 "octave_jit_cast_scalar_complex", scalar, complex); | |
1548 body = fn.new_block (); | |
1549 builder.SetInsertPoint (body); | |
1550 fn.do_return (builder, complex_real (fn.argument (builder, 0))); | |
1551 casts[scalar->type_id ()].add_overload (fn); | |
1552 | |
1553 // cast any <- any | |
1554 fn = create_identity (any); | |
1555 casts[any->type_id ()].add_overload (fn); | |
1556 | |
1557 // cast scalar <- scalar | |
1558 fn = create_identity (scalar); | |
1559 casts[scalar->type_id ()].add_overload (fn); | |
1560 | |
1561 // cast complex <- complex | |
1562 fn = create_identity (complex); | |
1563 casts[complex->type_id ()].add_overload (fn); | |
1564 | |
1565 // -------------------- builtin functions -------------------- | |
1566 add_builtin ("#unknown_function"); | |
1567 unknown_function = builtins["#unknown_function"]; | |
1568 | |
1569 add_builtin ("sin"); | |
1570 register_intrinsic ("sin", llvm::Intrinsic::sin, scalar, scalar); | |
1571 register_generic ("sin", matrix, matrix); | |
1572 | |
1573 add_builtin ("cos"); | |
1574 register_intrinsic ("cos", llvm::Intrinsic::cos, scalar, scalar); | |
1575 register_generic ("cos", matrix, matrix); | |
1576 | |
1577 add_builtin ("exp"); | |
1578 register_intrinsic ("exp", llvm::Intrinsic::cos, scalar, scalar); | |
1579 register_generic ("exp", matrix, matrix); | |
1580 | |
1581 casts.resize (next_id + 1); | |
1582 jit_function any_id = create_identity (any); | |
1583 jit_function release_any = get_release (any); | |
1584 std::vector<jit_type *> args; | |
1585 args.resize (1); | |
1586 | |
1587 for (std::map<std::string, jit_type *>::iterator iter = builtins.begin (); | |
1588 iter != builtins.end (); ++iter) | |
1589 { | |
1590 jit_type *btype = iter->second; | |
1591 args[0] = btype; | |
1592 | |
1593 release_fn.add_overload (jit_function (release_any, 0, args)); | |
1594 casts[any->type_id ()].add_overload (jit_function (any_id, any, args)); | |
1595 | |
1596 args[0] = any; | |
1597 casts[btype->type_id ()].add_overload (jit_function (any_id, btype, | |
1598 args)); | |
1599 } | |
1600 } | |
1601 | |
1602 void | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1603 jit_typeinfo::add_print (jit_type *ty, void *fptr) |
15016 | 1604 { |
1605 std::stringstream name; | |
1606 name << "octave_jit_print_" << ty->name (); | |
1607 jit_function fn = create_function (jit_convention::external, name.str (), 0, | |
1608 intN (8), ty); | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1609 fn.add_mapping (engine, fptr); |
15016 | 1610 print_fn.add_overload (fn); |
1611 } | |
1612 | |
1613 // FIXME: cp between add_binary_op, add_binary_icmp, and add_binary_fcmp | |
1614 void | |
1615 jit_typeinfo::add_binary_op (jit_type *ty, int op, int llvm_op) | |
1616 { | |
1617 std::stringstream fname; | |
1618 octave_value::binary_op ov_op = static_cast<octave_value::binary_op>(op); | |
1619 fname << "octave_jit_" << octave_value::binary_op_as_string (ov_op) | |
1620 << "_" << ty->name (); | |
1621 | |
1622 jit_function fn = create_function (jit_convention::internal, fname.str (), | |
1623 ty, ty, ty); | |
1624 llvm::BasicBlock *block = fn.new_block (); | |
1625 builder.SetInsertPoint (block); | |
1626 llvm::Instruction::BinaryOps temp | |
1627 = static_cast<llvm::Instruction::BinaryOps>(llvm_op); | |
1628 | |
1629 llvm::Value *ret = builder.CreateBinOp (temp, fn.argument (builder, 0), | |
1630 fn.argument (builder, 1)); | |
1631 fn.do_return (builder, ret); | |
1632 binary_ops[op].add_overload (fn); | |
1633 } | |
1634 | |
1635 void | |
1636 jit_typeinfo::add_binary_icmp (jit_type *ty, int op, int llvm_op) | |
1637 { | |
1638 std::stringstream fname; | |
1639 octave_value::binary_op ov_op = static_cast<octave_value::binary_op>(op); | |
1640 fname << "octave_jit" << octave_value::binary_op_as_string (ov_op) | |
1641 << "_" << ty->name (); | |
1642 | |
1643 jit_function fn = create_function (jit_convention::internal, fname.str (), | |
1644 boolean, ty, ty); | |
1645 llvm::BasicBlock *block = fn.new_block (); | |
1646 builder.SetInsertPoint (block); | |
1647 llvm::CmpInst::Predicate temp | |
1648 = static_cast<llvm::CmpInst::Predicate>(llvm_op); | |
1649 llvm::Value *ret = builder.CreateICmp (temp, fn.argument (builder, 0), | |
1650 fn.argument (builder, 1)); | |
1651 fn.do_return (builder, ret); | |
1652 binary_ops[op].add_overload (fn); | |
1653 } | |
1654 | |
1655 void | |
1656 jit_typeinfo::add_binary_fcmp (jit_type *ty, int op, int llvm_op) | |
1657 { | |
1658 std::stringstream fname; | |
1659 octave_value::binary_op ov_op = static_cast<octave_value::binary_op>(op); | |
1660 fname << "octave_jit" << octave_value::binary_op_as_string (ov_op) | |
1661 << "_" << ty->name (); | |
1662 | |
1663 jit_function fn = create_function (jit_convention::internal, fname.str (), | |
1664 boolean, ty, ty); | |
1665 llvm::BasicBlock *block = fn.new_block (); | |
1666 builder.SetInsertPoint (block); | |
1667 llvm::CmpInst::Predicate temp | |
1668 = static_cast<llvm::CmpInst::Predicate>(llvm_op); | |
1669 llvm::Value *ret = builder.CreateFCmp (temp, fn.argument (builder, 0), | |
1670 fn.argument (builder, 1)); | |
1671 fn.do_return (builder, ret); | |
1672 binary_ops[op].add_overload (fn); | |
1673 } | |
1674 | |
1675 jit_function | |
1676 jit_typeinfo::create_function (jit_convention::type cc, const llvm::Twine& name, | |
1677 jit_type *ret, | |
1678 const std::vector<jit_type *>& args) | |
1679 { | |
1680 jit_function result (module, cc, name, ret, args); | |
1681 return result; | |
1682 } | |
1683 | |
1684 jit_function | |
1685 jit_typeinfo::create_identity (jit_type *type) | |
1686 { | |
1687 size_t id = type->type_id (); | |
1688 if (id >= identities.size ()) | |
1689 identities.resize (id + 1); | |
1690 | |
1691 if (! identities[id].valid ()) | |
1692 { | |
1693 jit_function fn = create_function (jit_convention::internal, "id", type, | |
1694 type); | |
1695 llvm::BasicBlock *body = fn.new_block (); | |
1696 builder.SetInsertPoint (body); | |
1697 fn.do_return (builder, fn.argument (builder, 0)); | |
1698 return identities[id] = fn; | |
1699 } | |
1700 | |
1701 return identities[id]; | |
1702 } | |
1703 | |
1704 llvm::Value * | |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1705 jit_typeinfo::do_insert_error_check (llvm::IRBuilderD& abuilder) |
15016 | 1706 { |
15019
ae3670d4df29
Update the execution engine's global mapping for external functions
Max Brister <max@2bass.com>
parents:
15016
diff
changeset
|
1707 return abuilder.CreateLoad (lerror_state); |
15016 | 1708 } |
1709 | |
1710 void | |
1711 jit_typeinfo::add_builtin (const std::string& name) | |
1712 { | |
1713 jit_type *btype = new_type (name, any, any->to_llvm ()); | |
1714 builtins[name] = btype; | |
1715 | |
1716 octave_builtin *ov_builtin = find_builtin (name); | |
1717 if (ov_builtin) | |
1718 ov_builtin->stash_jit (*btype); | |
1719 } | |
1720 | |
1721 void | |
1722 jit_typeinfo::register_intrinsic (const std::string& name, size_t iid, | |
1723 jit_type *result, | |
1724 const std::vector<jit_type *>& args) | |
1725 { | |
1726 jit_type *builtin_type = builtins[name]; | |
1727 size_t nargs = args.size (); | |
1728 llvm::SmallVector<llvm::Type *, 5> llvm_args (nargs); | |
1729 for (size_t i = 0; i < nargs; ++i) | |
1730 llvm_args[i] = args[i]->to_llvm (); | |
1731 | |
1732 llvm::Intrinsic::ID id = static_cast<llvm::Intrinsic::ID> (iid); | |
1733 llvm::Function *ifun = llvm::Intrinsic::getDeclaration (module, id, | |
1734 llvm_args); | |
1735 std::stringstream fn_name; | |
1736 fn_name << "octave_jit_" << name; | |
1737 | |
1738 std::vector<jit_type *> args1 (nargs + 1); | |
1739 args1[0] = builtin_type; | |
1740 std::copy (args.begin (), args.end (), args1.begin () + 1); | |
1741 | |
1742 // The first argument will be the Octave function, but we already know that | |
1743 // the function call is the equivalent of the intrinsic, so we ignore it and | |
1744 // call the intrinsic with the remaining arguments. | |
1745 jit_function fn = create_function (jit_convention::internal, fn_name.str (), | |
1746 result, args1); | |
1747 llvm::BasicBlock *body = fn.new_block (); | |
1748 builder.SetInsertPoint (body); | |
1749 | |
1750 llvm::SmallVector<llvm::Value *, 5> fargs (nargs); | |
1751 for (size_t i = 0; i < nargs; ++i) | |
1752 fargs[i] = fn.argument (builder, i + 1); | |
1753 | |
1754 llvm::Value *ret = builder.CreateCall (ifun, fargs); | |
1755 fn.do_return (builder, ret); | |
1756 paren_subsref_fn.add_overload (fn); | |
1757 } | |
1758 | |
1759 octave_builtin * | |
1760 jit_typeinfo::find_builtin (const std::string& name) | |
1761 { | |
1762 // FIXME: Finalize what we want to store in octave_builtin, then add functions | |
1763 // to access these values in octave_value | |
1764 octave_value ov_builtin = symbol_table::find (name); | |
1765 return dynamic_cast<octave_builtin *> (ov_builtin.internal_rep ()); | |
1766 } | |
1767 | |
1768 void | |
1769 jit_typeinfo::register_generic (const std::string&, jit_type *, | |
1770 const std::vector<jit_type *>&) | |
1771 { | |
1772 // FIXME: Implement | |
1773 } | |
1774 | |
1775 jit_function | |
1776 jit_typeinfo::mirror_binary (const jit_function& fn) | |
1777 { | |
1778 jit_function ret = create_function (jit_convention::internal, | |
1779 fn.name () + "_reverse", | |
1780 fn.result (), fn.argument_type (1), | |
1781 fn.argument_type (0)); | |
1782 if (fn.can_error ()) | |
1783 ret.mark_can_error (); | |
1784 | |
1785 llvm::BasicBlock *body = ret.new_block (); | |
1786 builder.SetInsertPoint (body); | |
1787 llvm::Value *result = fn.call (builder, ret.argument (builder, 1), | |
1788 ret.argument (builder, 0)); | |
1789 if (ret.result ()) | |
1790 ret.do_return (builder, result); | |
1791 else | |
1792 ret.do_return (builder); | |
1793 | |
1794 return ret; | |
1795 } | |
1796 | |
1797 llvm::Value * | |
1798 jit_typeinfo::pack_complex (llvm::IRBuilderD& bld, llvm::Value *cplx) | |
1799 { | |
1800 llvm::Type *complex_ret = instance->complex_ret; | |
1801 llvm::Value *real = bld.CreateExtractElement (cplx, bld.getInt32 (0)); | |
1802 llvm::Value *imag = bld.CreateExtractElement (cplx, bld.getInt32 (1)); | |
1803 llvm::Value *ret = llvm::UndefValue::get (complex_ret); | |
1804 ret = bld.CreateInsertValue (ret, real, 0); | |
1805 return bld.CreateInsertValue (ret, imag, 1); | |
1806 } | |
1807 | |
1808 llvm::Value * | |
1809 jit_typeinfo::unpack_complex (llvm::IRBuilderD& bld, llvm::Value *result) | |
1810 { | |
1811 llvm::Type *complex_t = get_complex ()->to_llvm (); | |
1812 llvm::Value *real = bld.CreateExtractValue (result, 0); | |
1813 llvm::Value *imag = bld.CreateExtractValue (result, 1); | |
1814 llvm::Value *ret = llvm::UndefValue::get (complex_t); | |
1815 ret = bld.CreateInsertElement (ret, real, bld.getInt32 (0)); | |
1816 return bld.CreateInsertElement (ret, imag, bld.getInt32 (1)); | |
1817 } | |
1818 | |
1819 llvm::Value * | |
1820 jit_typeinfo::complex_real (llvm::Value *cx) | |
1821 { | |
1822 return builder.CreateExtractElement (cx, builder.getInt32 (0)); | |
1823 } | |
1824 | |
1825 llvm::Value * | |
1826 jit_typeinfo::complex_real (llvm::Value *cx, llvm::Value *real) | |
1827 { | |
1828 return builder.CreateInsertElement (cx, real, builder.getInt32 (0)); | |
1829 } | |
1830 | |
1831 llvm::Value * | |
1832 jit_typeinfo::complex_imag (llvm::Value *cx) | |
1833 { | |
1834 return builder.CreateExtractElement (cx, builder.getInt32 (1)); | |
1835 } | |
1836 | |
1837 llvm::Value * | |
1838 jit_typeinfo::complex_imag (llvm::Value *cx, llvm::Value *imag) | |
1839 { | |
1840 return builder.CreateInsertElement (cx, imag, builder.getInt32 (1)); | |
1841 } | |
1842 | |
1843 llvm::Value * | |
1844 jit_typeinfo::complex_new (llvm::Value *real, llvm::Value *imag) | |
1845 { | |
1846 llvm::Value *ret = llvm::UndefValue::get (complex->to_llvm ()); | |
1847 ret = complex_real (ret, real); | |
1848 return complex_imag (ret, imag); | |
1849 } | |
1850 | |
1851 void | |
1852 jit_typeinfo::create_int (size_t nbits) | |
1853 { | |
1854 std::stringstream tname; | |
1855 tname << "int" << nbits; | |
1856 ints[nbits] = new_type (tname.str (), any, llvm::Type::getIntNTy (context, | |
1857 nbits)); | |
1858 } | |
1859 | |
1860 jit_type * | |
1861 jit_typeinfo::intN (size_t nbits) const | |
1862 { | |
1863 std::map<size_t, jit_type *>::const_iterator iter = ints.find (nbits); | |
1864 if (iter != ints.end ()) | |
1865 return iter->second; | |
1866 | |
1867 throw jit_fail_exception ("No such integer type"); | |
1868 } | |
1869 | |
1870 jit_type * | |
1871 jit_typeinfo::do_type_of (const octave_value &ov) const | |
1872 { | |
1873 if (ov.is_function ()) | |
1874 { | |
1875 // FIXME: This is ugly, we need to finalize how we want to to this, then | |
1876 // have octave_value fully support the needed functionality | |
1877 octave_builtin *builtin | |
1878 = dynamic_cast<octave_builtin *> (ov.internal_rep ()); | |
1879 return builtin && builtin->to_jit () ? builtin->to_jit () | |
1880 : unknown_function; | |
1881 } | |
1882 | |
1883 if (ov.is_range ()) | |
1884 return get_range (); | |
1885 | |
1886 if (ov.is_double_type ()) | |
1887 { | |
1888 if (ov.is_real_scalar ()) | |
1889 return get_scalar (); | |
1890 | |
1891 if (ov.is_matrix_type ()) | |
1892 return get_matrix (); | |
1893 } | |
1894 | |
1895 if (ov.is_complex_scalar ()) | |
1896 return get_complex (); | |
1897 | |
1898 return get_any (); | |
1899 } | |
1900 | |
1901 jit_type* | |
1902 jit_typeinfo::new_type (const std::string& name, jit_type *parent, | |
1903 llvm::Type *llvm_type) | |
1904 { | |
1905 jit_type *ret = new jit_type (name, parent, llvm_type, next_id++); | |
1906 id_to_type.push_back (ret); | |
1907 return ret; | |
1908 } | |
1909 | |
15067 | 1910 void |
1911 jit_typeinfo::gen_subsref (const jit_function& paren_scalar, size_t n) | |
1912 { | |
1913 std::stringstream name; | |
1914 name << "jit_paren_subsref_matrix_scalar" << n; | |
1915 std::vector<jit_type *> args (n + 1, scalar); | |
1916 args[0] = matrix; | |
1917 jit_function fn = create_function (jit_convention::internal, name.str (), | |
1918 scalar, args); | |
1919 fn.mark_can_error (); | |
1920 llvm::BasicBlock *body = fn.new_block (); | |
1921 builder.SetInsertPoint (body); | |
1922 | |
1923 llvm::Type *scalar_t = scalar->to_llvm (); | |
1924 llvm::ArrayType *array_t = llvm::ArrayType::get (scalar_t, n); | |
1925 llvm::Value *array = llvm::UndefValue::get (array_t); | |
1926 for (size_t i = 0; i < n; ++i) | |
1927 { | |
1928 llvm::Value *idx = fn.argument (builder, i + 1); | |
1929 array = builder.CreateInsertValue (array, idx, i); | |
1930 } | |
1931 | |
1932 llvm::Value *array_mem = builder.CreateAlloca (array_t); | |
1933 builder.CreateStore (array, array_mem); | |
1934 array = builder.CreateBitCast (array_mem, scalar_t->getPointerTo ()); | |
1935 | |
1936 llvm::Value *nelem = llvm::ConstantInt::get (index->to_llvm (), n); | |
1937 llvm::Value *mat = fn.argument (builder, 0); | |
1938 llvm::Value *ret = paren_scalar.call (builder, mat, array, nelem); | |
1939 fn.do_return (builder, ret); | |
1940 paren_subsref_fn.add_overload (fn); | |
1941 } | |
1942 | |
15068
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1943 void |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1944 jit_typeinfo::gen_subsasgn (const jit_function& paren_scalar, size_t n) |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1945 { |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1946 std::stringstream name; |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1947 name << "jit_paren_subsasgn_matrix_scalar" << n; |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1948 std::vector<jit_type *> args (n + 2, scalar); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1949 args[0] = matrix; |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1950 jit_function fn = create_function (jit_convention::internal, name.str (), |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1951 matrix, args); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1952 fn.mark_can_error (); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1953 llvm::BasicBlock *body = fn.new_block (); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1954 builder.SetInsertPoint (body); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1955 |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1956 llvm::Type *scalar_t = scalar->to_llvm (); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1957 llvm::ArrayType *array_t = llvm::ArrayType::get (scalar_t, n); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1958 llvm::Value *array = llvm::UndefValue::get (array_t); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1959 for (size_t i = 0; i < n; ++i) |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1960 { |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1961 llvm::Value *idx = fn.argument (builder, i + 1); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1962 array = builder.CreateInsertValue (array, idx, i); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1963 } |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1964 |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1965 llvm::Value *array_mem = builder.CreateAlloca (array_t); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1966 builder.CreateStore (array, array_mem); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1967 array = builder.CreateBitCast (array_mem, scalar_t->getPointerTo ()); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1968 |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1969 llvm::Value *nelem = llvm::ConstantInt::get (index->to_llvm (), n); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1970 llvm::Value *mat = fn.argument (builder, 0); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1971 llvm::Value *value = fn.argument (builder, n + 1); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1972 llvm::Value *ret = paren_scalar.call (builder, mat, array, nelem, value); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1973 fn.do_return (builder, ret); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1974 paren_subsasgn_fn.add_overload (fn); |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1975 } |
f57d7578c1a6
Support ND matrix indexing with scalar assignment in JIT.
Max Brister <max@2bass.com>
parents:
15067
diff
changeset
|
1976 |
15016 | 1977 #endif |