Mercurial > octave
diff src/corefcn/lookup.cc @ 15039:e753177cde93
maint: Move non-dynamically linked functions from DLD-FUNCTIONS/ to corefcn/ directory
* __contourc__.cc, __dispatch__.cc, __lin_interpn__.cc, __pchip_deriv__.cc,
__qp__.cc, balance.cc, besselj.cc, betainc.cc, bsxfun.cc, cellfun.cc,
colloc.cc, conv2.cc, daspk.cc, dasrt.cc, dassl.cc, det.cc, dlmread.cc, dot.cc,
eig.cc, fft.cc, fft2.cc, fftn.cc, filter.cc, find.cc, gammainc.cc, gcd.cc,
getgrent.cc, getpwent.cc, getrusage.cc, givens.cc, hess.cc, hex2num.cc, inv.cc,
kron.cc, lookup.cc, lsode.cc, lu.cc, luinc.cc, matrix_type.cc, max.cc,
md5sum.cc, mgorth.cc, nproc.cc, pinv.cc, quad.cc, quadcc.cc, qz.cc,
rand.cc, rcond.cc, regexp.cc, schur.cc, spparms.cc, sqrtm.cc, str2double.cc,
strfind.cc, sub2ind.cc, svd.cc, syl.cc, time.cc, tril.cc, typecast.cc:
Move functions from DLD-FUNCTIONS/ to corefcn/ directory. Include "defun.h",
not "defun-dld.h". Change docstring to refer to these as "Built-in Functions".
* build-aux/mk-opts.pl: Generate options code with '#include "defun.h"'. Change
option docstrings to refer to these as "Built-in Functions".
* corefcn/module.mk: List of functions to build in corefcn/ dir.
* DLD-FUNCTIONS/config-module.awk: Update to new build system.
* DLD-FUNCTIONS/module-files: Remove functions which are now in corefcn/ directory.
* src/Makefile.am: Update to build "convenience library" in corefcn/. Octave
program now links against all other libraries + corefcn libary.
* src/find-defun-files.sh: Strip $srcdir from filename.
* src/link-deps.mk: Add REGEX and FFTW link dependencies for liboctinterp.
* type.m, which.m: Change failing tests to use 'amd', still a dynamic function,
rather than 'dot', which isn't.
author | Rik <rik@octave.org> |
---|---|
date | Fri, 27 Jul 2012 15:35:00 -0700 |
parents | src/DLD-FUNCTIONS/lookup.cc@460a3c6d8bf1 |
children |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/src/corefcn/lookup.cc Fri Jul 27 15:35:00 2012 -0700 @@ -0,0 +1,397 @@ +/* + +Copyright (C) 2008-2012 VZLU Prague a.s., Czech Republic + +This file is part of Octave. + +Octave is free software; you can redistribute it and/or modify it +under the terms of the GNU General Public License as published by +the Free Software Foundation; either version 3 of the License, or (at +your option) any later version. + +Octave is distributed in the hope that it will be useful, but +WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +General Public License for more details. + +You should have received a copy of the GNU General Public License +along with Octave; see the file COPYING. If not, see +<http://www.gnu.org/licenses/>. + +*/ + +// Author: Jaroslav Hajek <highegg@gmail.com> + +#ifdef HAVE_CONFIG_H +#include <config.h> +#endif + +#include <cctype> +#include <functional> +#include <algorithm> + +#include "dNDArray.h" +#include "CNDArray.h" + +#include "Cell.h" +#include "defun.h" +#include "error.h" +#include "gripes.h" +#include "oct-obj.h" +#include "ov.h" + +static +bool +contains_char (const std::string& str, char c) +{ + return (str.find (c) != std::string::npos + || str.find (std::toupper (c)) != std::string::npos); +} + +// case-insensitive character comparison functors +struct icmp_char_lt : public std::binary_function<char, char, bool> +{ + bool operator () (char x, char y) const + { return std::toupper (x) < std::toupper (y); } +}; + +struct icmp_char_gt : public std::binary_function<char, char, bool> +{ + bool operator () (char x, char y) const + { return std::toupper (x) > std::toupper (y); } +}; + +// FIXME -- maybe these should go elsewhere? +// FIXME -- are they even needed now? +// case-insensitive ascending comparator +#if 0 +static bool +stri_comp_lt (const std::string& a, const std::string& b) +{ + return std::lexicographical_compare (a.begin (), a.end (), + b.begin (), b.end (), + icmp_char_lt ()); +} + +// case-insensitive descending comparator +static bool +stri_comp_gt (const std::string& a, const std::string& b) +{ + return std::lexicographical_compare (a.begin (), a.end (), + b.begin (), b.end (), + icmp_char_gt ()); +} +#endif + +template <class T> +inline sortmode +get_sort_mode (const Array<T>& array, + typename octave_sort<T>::compare_fcn_type desc_comp + = octave_sort<T>::descending_compare) +{ + octave_idx_type n = array.numel (); + if (n > 1 && desc_comp (array (0), array (n-1))) + return DESCENDING; + else + return ASCENDING; +} + +// FIXME: perhaps there should be octave_value::lookup? +// The question is, how should it behave w.r.t. the second argument's type. +// We'd need a dispatch on two arguments. Hmmm... + +#define INT_ARRAY_LOOKUP(TYPE) \ + (table.is_ ## TYPE ## _type () && y.is_ ## TYPE ## _type ()) \ + retval = do_numeric_lookup (table.TYPE ## _array_value (), \ + y.TYPE ## _array_value (), \ + left_inf, right_inf, \ + match_idx, match_bool); +template <class ArrayT> +static octave_value +do_numeric_lookup (const ArrayT& array, const ArrayT& values, + bool left_inf, bool right_inf, + bool match_idx, bool match_bool) +{ + octave_value retval; + + Array<octave_idx_type> idx = array.lookup (values); + octave_idx_type n = array.numel (), nval = values.numel (); + + // Post-process. + if (match_bool) + { + boolNDArray match (idx.dims ()); + for (octave_idx_type i = 0; i < nval; i++) + { + octave_idx_type j = idx.xelem (i); + match.xelem (i) = j != 0 && values(i) == array(j-1); + } + + retval = match; + } + else if (match_idx || left_inf || right_inf) + { + if (match_idx) + { + NDArray ridx (idx.dims ()); + + for (octave_idx_type i = 0; i < nval; i++) + { + octave_idx_type j = idx.xelem (i); + ridx.xelem (i) = (j != 0 && values(i) == array(j-1)) ? j : 0; + } + + retval = ridx; + } + else if (left_inf && right_inf) + { + // Results in valid indices. Optimize using lazy index. + octave_idx_type zero = 0; + for (octave_idx_type i = 0; i < nval; i++) + { + octave_idx_type j = idx.xelem (i) - 1; + idx.xelem (i) = std::max (zero, std::min (j, n-2)); + } + + retval = idx_vector (idx); + } + else if (left_inf) + { + // Results in valid indices. Optimize using lazy index. + octave_idx_type zero = 0; + for (octave_idx_type i = 0; i < nval; i++) + { + octave_idx_type j = idx.xelem (i) - 1; + idx.xelem (i) = std::max (zero, j); + } + + retval = idx_vector (idx); + } + else if (right_inf) + { + NDArray ridx (idx.dims ()); + + for (octave_idx_type i = 0; i < nval; i++) + { + octave_idx_type j = idx.xelem (i); + ridx.xelem (i) = std::min (j, n-1); + } + + retval = ridx; + } + } + else + retval = idx; + + return retval; +} + +DEFUN (lookup, args, , + "-*- texinfo -*-\n\ +@deftypefn {Built-in Function} {@var{idx} =} lookup (@var{table}, @var{y})\n\ +@deftypefnx {Built-in Function} {@var{idx} =} lookup (@var{table}, @var{y}, @var{opt})\n\ +Lookup values in a sorted table. Usually used as a prelude to\n\ +interpolation.\n\ +\n\ +If table is increasing and @code{idx = lookup (table, y)}, then\n\ +@code{table(idx(i)) <= y(i) < table(idx(i+1))} for all @code{y(i)}\n\ +within the table. If @code{y(i) < table(1)} then\n\ +@code{idx(i)} is 0. If @code{y(i) >= table(end)} or @code{isnan (y(i))} then\n\ +@code{idx(i)} is @code{n}.\n\ +\n\ +If the table is decreasing, then the tests are reversed.\n\ +For non-strictly monotonic tables, empty intervals are always skipped.\n\ +The result is undefined if @var{table} is not monotonic, or if\n\ +@var{table} contains a NaN.\n\ +\n\ +The complexity of the lookup is O(M*log(N)) where N is the size of\n\ +@var{table} and M is the size of @var{y}. In the special case when @var{y}\n\ +is also sorted, the complexity is O(min(M*log(N),M+N)).\n\ +\n\ +@var{table} and @var{y} can also be cell arrays of strings\n\ +(or @var{y} can be a single string). In this case, string lookup\n\ +is performed using lexicographical comparison.\n\ +\n\ +If @var{opts} is specified, it must be a string with letters indicating\n\ +additional options.\n\ +\n\ +@table @code\n\ +@item m\n\ +@code{table(idx(i)) == val(i)} if @code{val(i)}\n\ +occurs in table; otherwise, @code{idx(i)} is zero.\n\ +\n\ +@item b\n\ +@code{idx(i)} is a logical 1 or 0, indicating whether\n\ +@code{val(i)} is contained in table or not.\n\ +\n\ +@item l\n\ +For numeric lookups\n\ +the leftmost subinterval shall be extended to infinity (i.e., all indices\n\ +at least 1)\n\ +\n\ +@item r\n\ +For numeric lookups\n\ +the rightmost subinterval shall be extended to infinity (i.e., all indices\n\ +at most n-1).\n\ +@end table\n\ +@end deftypefn") +{ + octave_value retval; + + int nargin = args.length (); + + if (nargin < 2 || nargin > 3 || (nargin == 3 && ! args(2).is_string ())) + { + print_usage (); + return retval; + } + + octave_value table = args(0), y = args(1); + if (table.ndims () > 2 || (table.columns () > 1 && table.rows () > 1)) + warning ("lookup: table is not a vector"); + + bool num_case = ((table.is_numeric_type () && y.is_numeric_type ()) + || (table.is_char_matrix () && y.is_char_matrix ())); + bool str_case = table.is_cellstr () && (y.is_string () || y.is_cellstr ()); + bool left_inf = false; + bool right_inf = false; + bool match_idx = false; + bool match_bool = false; + + if (nargin == 3) + { + std::string opt = args(2).string_value (); + left_inf = contains_char (opt, 'l'); + right_inf = contains_char (opt, 'r'); + match_idx = contains_char (opt, 'm'); + match_bool = contains_char (opt, 'b'); + if (opt.find_first_not_of ("lrmb") != std::string::npos) + { + error ("lookup: unrecognized option: %c", + opt[opt.find_first_not_of ("lrmb")]); + return retval; + } + } + + if ((match_idx || match_bool) && (left_inf || right_inf)) + error ("lookup: m, b cannot be specified with l or r"); + else if (match_idx && match_bool) + error ("lookup: only one of m or b can be specified"); + else if (str_case && (left_inf || right_inf)) + error ("lookup: l, r are not recognized for string lookups"); + + if (error_state) + return retval; + + if (num_case) + { + + // In the case of a complex array, absolute values will be used for compatibility + // (though it's not too meaningful). + + if (table.is_complex_type ()) + table = table.abs (); + + if (y.is_complex_type ()) + y = y.abs (); + + Array<octave_idx_type> idx; + + // PS: I learned this from data.cc + if INT_ARRAY_LOOKUP (int8) + else if INT_ARRAY_LOOKUP (int16) + else if INT_ARRAY_LOOKUP (int32) + else if INT_ARRAY_LOOKUP (int64) + else if INT_ARRAY_LOOKUP (uint8) + else if INT_ARRAY_LOOKUP (uint16) + else if INT_ARRAY_LOOKUP (uint32) + else if INT_ARRAY_LOOKUP (uint64) + else if (table.is_char_matrix () && y.is_char_matrix ()) + retval = do_numeric_lookup (table.char_array_value (), + y.char_array_value (), + left_inf, right_inf, + match_idx, match_bool); + else if (table.is_single_type () || y.is_single_type ()) + retval = do_numeric_lookup (table.float_array_value (), + y.float_array_value (), + left_inf, right_inf, + match_idx, match_bool); + else + retval = do_numeric_lookup (table.array_value (), + y.array_value (), + left_inf, right_inf, + match_idx, match_bool); + + } + else if (str_case) + { + Array<std::string> str_table = table.cellstr_value (); + Array<std::string> str_y (dim_vector (1, 1)); + + if (y.is_cellstr ()) + str_y = y.cellstr_value (); + else + str_y(0) = y.string_value (); + + Array<octave_idx_type> idx = str_table.lookup (str_y); + octave_idx_type nval = str_y.numel (); + + // Post-process. + if (match_bool) + { + boolNDArray match (idx.dims ()); + for (octave_idx_type i = 0; i < nval; i++) + { + octave_idx_type j = idx.xelem (i); + match.xelem (i) = j != 0 && str_y(i) == str_table(j-1); + } + + retval = match; + } + else if (match_idx) + { + NDArray ridx (idx.dims ()); + if (match_idx) + { + for (octave_idx_type i = 0; i < nval; i++) + { + octave_idx_type j = idx.xelem (i); + ridx.xelem (i) = (j != 0 && str_y(i) == str_table(j-1)) ? j : 0; + } + } + + retval = ridx; + } + else + retval = idx; + } + else + print_usage (); + + return retval; + +} + +/* +%!assert (lookup (1:3, 0.5), 0) # value before table +%!assert (lookup (1:3, 3.5), 3) # value after table error +%!assert (lookup (1:3, 1.5), 1) # value within table error +%!assert (lookup (1:3, [3,2,1]), [3,2,1]) +%!assert (lookup ([1:4]', [1.2, 3.5]'), [1, 3]') +%!assert (lookup ([1:4], [1.2, 3.5]'), [1, 3]') +%!assert (lookup ([1:4]', [1.2, 3.5]), [1, 3]) +%!assert (lookup ([1:4], [1.2, 3.5]), [1, 3]) +%!assert (lookup (1:3, [3, 2, 1]), [3, 2, 1]) +%!assert (lookup ([3:-1:1], [3.5, 3, 1.2, 2.5, 2.5]), [0, 1, 2, 1, 1]) +%!assert (isempty (lookup ([1:3], []))) +%!assert (isempty (lookup ([1:3]', []))) +%!assert (lookup (1:3, [1, 2; 3, 0.5]), [1, 2; 3, 0]) +%!assert (lookup (1:4, [1, 1.2; 3, 2.5], "m"), [1, 0; 3, 0]) +%!assert (lookup (4:-1:1, [1, 1.2; 3, 2.5], "m"), [4, 0; 2, 0]) +%!assert (lookup (1:4, [1, 1.2; 3, 2.5], "b"), logical ([1, 0; 3, 0])) +%!assert (lookup (4:-1:1, [1, 1.2; 3, 2.5], "b"), logical ([4, 0; 2, 0])) +%! +%!assert (lookup ({"apple","lemon","orange"}, {"banana","kiwi"; "ananas","mango"}), [1,1;0,2]) +%!assert (lookup ({"apple","lemon","orange"}, "potato"), 3) +%!assert (lookup ({"orange","lemon","apple"}, "potato"), 0) +*/