Mercurial > octave
view libinterp/corefcn/dlmread.cc @ 23457:21baad6b35c4
maint: Use C++11 nullptr rather than 0 or NULL when possible.
* FigureWindow.h, Logger.cc, Menu.cc, MouseModeActionGroup.h, Object.h,
ObjectFactory.cc, ObjectProxy.h, color-picker.h, documentation-dock-widget.h,
files-dock-widget.h, find-files-dialog.h, history-dock-widget.h,
file-editor-tab.cc, file-editor.cc, file-editor.h, find-dialog.h,
main-window.cc, main-window.h, octave-dock-widget.h, parser.cc, parser.h,
webinfo.h, resource-manager.cc, shortcut-manager.cc, shortcut-manager.h,
terminal-dock-widget.h, welcome-wizard.cc, welcome-wizard.h, workspace-model.h,
workspace-view.h, __magick_read__.cc, call-stack.cc, call-stack.h, cdisplay.c,
display.cc, dlmread.cc, dynamic-ld.cc, ft-text-renderer.cc, gl2ps-print.cc,
graphics.cc, graphics.in.h, input.h, interpreter.cc, interpreter.h, ls-hdf5.cc,
mex.cc, mxarray.in.h, oct-errno.in.cc, oct-fstrm.cc, oct-iostrm.h,
oct-procbuf.cc, oct-stdstrm.h, oct-stream.cc, oct-stream.h, octave-link.cc,
pager.cc, pr-output.cc, profiler.h, qz.cc, sighandlers.cc, strfns.cc,
symtab.cc, symtab.h, typecast.cc, urlwrite.cc, variables.cc, __eigs__.cc,
__init_fltk__.cc, __ode15__.cc, colamd.cc, ov-base-int.cc, ov-base.cc,
ov-bool-mat.cc, ov-bool-sparse.cc, ov-builtin.cc, ov-class.cc, ov-classdef.cc,
ov-complex.cc, ov-cx-diag.cc, ov-cx-mat.cc, ov-cx-sparse.cc, ov-fcn-handle.cc,
ov-fcn-inline.cc, ov-flt-complex.cc, ov-flt-cx-diag.cc, ov-flt-cx-mat.cc,
ov-flt-re-diag.cc, ov-flt-re-mat.cc, ov-java.cc, ov-java.h, ov-lazy-idx.cc,
ov-perm.cc, ov-range.cc, ov-re-diag.cc, ov-re-mat.cc, ov-re-sparse.cc,
ov-str-mat.cc, ov-struct.cc, ov-usr-fcn.h, octave.cc, octave.h, bp-table.cc,
jit-ir.cc, jit-ir.h, jit-typeinfo.cc, jit-typeinfo.h, lex.h, pt-arg-list.cc,
pt-arg-list.h, pt-array-list.h, pt-cell.h, pt-classdef.h, pt-colon.cc,
pt-decl.h, pt-eval.cc, pt-eval.h, pt-except.h, pt-idx.h, pt-jit.cc, pt-jit.h,
pt-loop.h, pt-mat.h, pt-select.h, pt.h, CSparse.cc, dSparse.cc, DASPK.cc,
DASRT.cc, DASSL.cc, oct-fftw.cc, oct-rand.cc, oct-spparms.cc, child-list.cc,
file-ops.cc, mach-info.cc, oct-env.cc, oct-time.cc, cmd-edit.cc, cmd-hist.cc,
oct-locbuf.cc, oct-shlib.cc, pathsearch.cc, singleton-cleanup.cc,
unwind-prot.h, url-transfer.cc:
Use C++11 nullptr rather than 0 or NULL when possible.
author | Rik <rik@octave.org> |
---|---|
date | Fri, 28 Apr 2017 13:19:12 -0700 |
parents | c14cf947142f |
children | b6144e6dda9e |
line wrap: on
line source
/* Copyright (C) 2008-2017 Jonathan Stickel Copyright (C) 2010 Jaroslav Hajek This file is part of Octave. Octave is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 3 of the License, or (at your option) any later version. Octave is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with Octave; see the file COPYING. If not, see <http://www.gnu.org/licenses/>. */ // Adapted from previous version of dlmread.occ as authored by Kai // Habel, but core code has been completely re-written. #if defined (HAVE_CONFIG_H) # include "config.h" #endif #include <cctype> #include <fstream> #include <limits> #include "file-ops.h" #include "lo-ieee.h" #include "defun.h" #include "oct-stream.h" #include "error.h" #include "ovl.h" #include "utils.h" static const octave_idx_type idx_max = std::numeric_limits<octave_idx_type>::max () - 1; static const double idx_max_dbl = double (idx_max); static bool read_cell_spec (std::istream& is, octave_idx_type& row, octave_idx_type& col) { bool stat = false; if (is.peek () == std::istream::traits_type::eof ()) stat = true; else { if (::isalpha (is.peek ())) { col = 0; while (is && ::isalpha (is.peek ())) { char ch = is.get (); col *= 26; if (ch >= 'a') col += ch - 'a' + 1; else col += ch - 'A' + 1; } col--; if (is) { is >> row; row--; if (is) stat = true; } } } return stat; } static bool parse_range_spec (const octave_value& range_spec, octave_idx_type& rlo, octave_idx_type& clo, octave_idx_type& rup, octave_idx_type& cup) { bool stat = true; if (range_spec.is_string ()) { std::istringstream is (range_spec.string_value ()); char ch = is.peek (); if (ch == '.' || ch == ':') { rlo = 0; clo = 0; ch = is.get (); if (ch == '.') { ch = is.get (); if (ch != '.') stat = false; } } else { stat = read_cell_spec (is, rlo, clo); if (stat) { ch = is.peek (); if (ch == '.' || ch == ':') { ch = is.get (); if (ch == '.') { ch = is.get (); if (! is || ch != '.') stat = false; } rup = idx_max; cup = idx_max; } else { rup = rlo; cup = clo; if (! is || ! is.eof ()) stat = false; } } } if (stat && is && ! is.eof ()) stat = read_cell_spec (is, rup, cup); if (! is || ! is.eof ()) stat = false; } else if (range_spec.is_real_matrix () && range_spec.numel () == 4) { ColumnVector range (range_spec.vector_value ()); // double --> unsigned int avoiding any overflow rlo = static_cast<octave_idx_type> (std::min (range(0), idx_max_dbl)); clo = static_cast<octave_idx_type> (std::min (range(1), idx_max_dbl)); rup = static_cast<octave_idx_type> (std::min (range(2), idx_max_dbl)); cup = static_cast<octave_idx_type> (std::min (range(3), idx_max_dbl)); } else stat = false; return stat; } DEFUN (dlmread, args, , doc: /* -*- texinfo -*- @deftypefn {} {@var{data} =} dlmread (@var{file}) @deftypefnx {} {@var{data} =} dlmread (@var{file}, @var{sep}) @deftypefnx {} {@var{data} =} dlmread (@var{file}, @var{sep}, @var{r0}, @var{c0}) @deftypefnx {} {@var{data} =} dlmread (@var{file}, @var{sep}, @var{range}) @deftypefnx {} {@var{data} =} dlmread (@dots{}, "emptyvalue", @var{EMPTYVAL}) Read numeric data from the text file @var{file} which uses the delimiter @var{sep} between data values. If @var{sep} is not defined the separator between fields is determined from the file itself. The optional scalar arguments @var{r0} and @var{c0} define the starting row and column of the data to be read. These values are indexed from zero, i.e., the first data row corresponds to an index of zero. The @var{range} parameter specifies exactly which data elements are read. The first form of the parameter is a 4-element vector containing the upper left and lower right corners @code{[@var{R0},@var{C0},@var{R1},@var{C1}]} where the indices are zero-based. Alternatively, a spreadsheet style form such as @qcode{"A2..Q15"} or @qcode{"T1:AA5"} can be used. The lowest alphabetical index @qcode{'A'} refers to the first column. The lowest row index is 1. @var{file} should be a filename or a file id given by @code{fopen}. In the latter case, the file is read until end of file is reached. The @qcode{"emptyvalue"} option may be used to specify the value used to fill empty fields. The default is zero. Note that any non-numeric values, such as text, are also replaced by the @qcode{"emptyvalue"}. @seealso{csvread, textscan, textread, dlmwrite} @end deftypefn */) { int nargin = args.length (); double empty_value = 0.0; if (nargin > 2 && args(nargin-2).is_string () && args(nargin-2).string_value () == "emptyvalue") { empty_value = args(nargin-1).double_value (); nargin -= 2; } if (nargin < 1 || nargin > 4) print_usage (); std::istream *input = nullptr; std::ifstream input_file; if (args(0).is_string ()) { // Filename. std::string fname (args(0).string_value ()); std::string tname = octave::sys::file_ops::tilde_expand (fname); tname = find_data_file_in_load_path ("dlmread", tname); input_file.open (tname.c_str (), std::ios::in); if (! input_file) error ("dlmread: unable to open file '%s'", fname.c_str ()); input = &input_file; } else if (args(0).is_scalar_type ()) { octave::stream is = octave::stream_list::lookup (args(0), "dlmread"); input = is.input_stream (); if (! input) error ("dlmread: stream FILE not open for input"); } else error ("dlmread: FILE argument must be a string or file id"); // Set default separator. std::string sep; if (nargin > 1) { if (args(1).is_sq_string ()) sep = do_string_escapes (args(1).string_value ()); else sep = args(1).string_value (); } // Take a subset if a range was given. octave_idx_type r0 = 0; octave_idx_type c0 = 0; octave_idx_type r1 = idx_max; octave_idx_type c1 = idx_max; if (nargin > 2) { if (nargin == 3) { if (! parse_range_spec (args(2), r0, c0, r1, c1)) error ("dlmread: error parsing RANGE"); } else if (nargin == 4) { r0 = args(2).idx_type_value (); c0 = args(3).idx_type_value (); } if (r0 < 0 || c0 < 0) error ("dlmread: left & top must be positive"); // Short-circuit and return if range is empty if (r1 < r0 || c1 < c0) return ovl (Matrix (0,0)); } octave_idx_type i = 0; octave_idx_type j = 0; octave_idx_type r = 1; octave_idx_type c = 1; // Start with a reasonable size to avoid constant resizing of matrix. octave_idx_type rmax = 32; octave_idx_type cmax = 0; Matrix rdata (rmax, cmax, empty_value); ComplexMatrix cdata; bool iscmplx = false; bool sep_is_wspace = (sep.find_first_of (" \t") != std::string::npos); bool auto_sep_is_wspace = false; std::string line; // Skip the r0 leading lines octave_idx_type rcnt = r0; while (rcnt > 0 && getline (*input, line)) rcnt--; if (rcnt > 0) return ovl (Matrix (0,0)); // Not enough lines in file to satisfy RANGE else r1 -= r0; std::istringstream tmp_stream; // Read the data one field at a time, growing the data matrix as needed. while (getline (*input, line)) { // Skip blank lines for compatibility. if ((! sep_is_wspace || auto_sep_is_wspace) && line.find_first_not_of (" \t") == std::string::npos) continue; // Infer separator from file if delimiter is blank. if (sep.empty ()) { // Skip leading whitespace. size_t pos1 = line.find_first_not_of (" \t"); // For Matlab compatibility, blank delimiter should // correspond to whitespace (space and tab). size_t n = line.find_first_of (",:; \t", pos1); if (n == std::string::npos) { sep = " \t"; auto_sep_is_wspace = true; } else { char ch = line.at (n); switch (line.at (n)) { case ' ': case '\t': sep = " \t"; auto_sep_is_wspace = true; break; default: sep = ch; break; } } } // Estimate the number of columns from first line of data. if (cmax == 0) { size_t pos1, pos2; if (auto_sep_is_wspace) pos1 = line.find_first_not_of (" \t"); else pos1 = 0; do { pos2 = line.find_first_of (sep, pos1); if (auto_sep_is_wspace && pos2 != std::string::npos) { // Treat consecutive separators as one. pos2 = line.find_first_not_of (sep, pos2); if (pos2 != std::string::npos) pos2 -= 1; } // Separator followed by EOL doesn't generate extra column if (pos2 != std::string::npos) cmax++; pos1 = pos2 + 1; } while (pos2 != std::string::npos); // FIXME: Should always be the case that iscmplx == false. // Flag is initialized that way and no data has been read. if (iscmplx) cdata.resize (rmax, cmax, empty_value); else rdata.resize (rmax, cmax, empty_value); } r = (r > i + 1 ? r : i + 1); j = 0; size_t pos1, pos2; if (auto_sep_is_wspace) pos1 = line.find_first_not_of (" \t"); // Skip leading whitespace. else pos1 = 0; do { octave_quit (); pos2 = line.find_first_of (sep, pos1); std::string str = line.substr (pos1, pos2 - pos1); if (auto_sep_is_wspace && pos2 != std::string::npos) { // Treat consecutive separators as one. pos2 = line.find_first_not_of (sep, pos2); if (pos2 != std::string::npos) pos2 -= 1; else pos2 = line.length () - 1; } // Separator followed by EOL doesn't generate extra column if (pos2 == std::string::npos && str.empty ()) break; c = (c > j + 1 ? c : j + 1); if (r > rmax || c > cmax) { // Use resize_and_fill for the case of unequal length rows. // Keep rmax a power of 2. rmax = std::max (2*(r-1), rmax); cmax = std::max (c, cmax); if (iscmplx) cdata.resize (rmax, cmax, empty_value); else rdata.resize (rmax, cmax, empty_value); } tmp_stream.str (str); tmp_stream.clear (); double x = octave_read_double (tmp_stream); if (tmp_stream) { if (tmp_stream.eof ()) { if (iscmplx) cdata(i,j++) = x; else rdata(i,j++) = x; } else { int next_char = std::tolower (tmp_stream.peek ()); if (next_char == 'i' || next_char == 'j') { // Process pure imaginary numbers. if (! iscmplx) { iscmplx = true; cdata = ComplexMatrix (rdata); } cdata(i,j++) = Complex (0, x); } else { double y = octave_read_double (tmp_stream); if (! iscmplx && y != 0.) { iscmplx = true; cdata = ComplexMatrix (rdata); } if (iscmplx) cdata(i,j++) = Complex (x, y); else rdata(i,j++) = x; } } } else if (iscmplx) cdata(i,j++) = empty_value; else rdata(i,j++) = empty_value; pos1 = pos2 + 1; } while (pos2 != std::string::npos); if (i == r1) break; // Stop early if the desired range has been read. i++; } // Clip selection indices to actual size of data if (r1 >= r) r1 = r - 1; if (c1 >= c) c1 = c - 1; if (iscmplx) { if ((i == 0 && j == 0) || (c0 > c1)) return ovl (ComplexMatrix (0,0)); cdata = cdata.extract (0, c0, r1, c1); return ovl (cdata); } else { if ((i == 0 && j == 0) || (c0 > c1)) return ovl (Matrix (0,0)); rdata = rdata.extract (0, c0, r1, c1); return ovl (rdata); } } /* %!test %! file = tempname (); %! unwind_protect %! fid = fopen (file, "wt"); %! fwrite (fid, "1, 2, 3\n4, 5, 6\n7, 8, 9\n10, 11, 12"); %! fclose (fid); %! %! assert (dlmread (file), [1, 2, 3; 4, 5, 6; 7, 8, 9;10, 11, 12]); %! assert (dlmread (file, ","), [1, 2, 3; 4, 5, 6; 7, 8, 9; 10, 11, 12]); %! assert (dlmread (file, ",", [1, 0, 2, 1]), [4, 5; 7, 8]); %! assert (dlmread (file, ",", "B1..C2"), [2, 3; 5, 6]); %! assert (dlmread (file, ",", "B1:C2"), [2, 3; 5, 6]); %! assert (dlmread (file, ",", "..C2"), [1, 2, 3; 4, 5, 6]); %! assert (dlmread (file, ",", 0, 1), [2, 3; 5, 6; 8, 9; 11, 12]); %! assert (dlmread (file, ",", "B1.."), [2, 3; 5, 6; 8, 9; 11, 12]); %! assert (dlmread (file, ",", 10, 0), []); %! assert (dlmread (file, ",", 0, 10), []); %! fail ('dlmread (file, ",", [0 1])', "error parsing RANGE"); %! unwind_protect_cleanup %! unlink (file); %! end_unwind_protect %!test %! file = tempname (); %! unwind_protect %! fid = fopen (file, "wt"); %! fwrite (fid, "1, 2, 3\n4+4i, 5, 6\n7, 8, 9\n10, 11, 12"); %! fclose (fid); %! %! assert (dlmread (file), [1, 2, 3; 4 + 4i, 5, 6; 7, 8, 9; 10, 11, 12]); %! assert (dlmread (file, ","), [1,2,3; 4 + 4i, 5, 6; 7, 8, 9; 10, 11, 12]); %! assert (dlmread (file, ",", [1, 0, 2, 1]), [4 + 4i, 5; 7, 8]); %! assert (dlmread (file, ",", "A2..B3"), [4 + 4i, 5; 7, 8]); %! assert (dlmread (file, ",", "A2:B3"), [4 + 4i, 5; 7, 8]); %! assert (dlmread (file, ",", "..B3"), [1, 2; 4 + 4i, 5; 7, 8]); %! assert (dlmread (file, ",", 1, 0), [4 + 4i, 5, 6; 7, 8, 9; 10, 11, 12]); %! assert (dlmread (file, ",", "A2.."), [4 + 4i, 5, 6; 7, 8, 9; 10, 11, 12]); %! assert (dlmread (file, ",", 10, 0), []); %! assert (dlmread (file, ",", 0, 10), []); %! unwind_protect_cleanup %! unlink (file); %! end_unwind_protect %!test <42025> %! file = tempname (); %! unwind_protect %! fid = fopen (file, "wt"); %! fwrite (fid, " \n 1 2\n11 22\n "); %! fclose (fid); %! %! assert (dlmread (file), [1, 2; 11, 22]); %! assert (dlmread (file, " "), [ 0, 0, 0, 0 %! 0, 1, 2, 0 %! 11, 22, 0, 0 %! 0, 0, 0, 0]); %! unwind_protect_cleanup %! unlink (file); %! end_unwind_protect %!test <50589> %! file = tempname (); %! unwind_protect %! fid = fopen (file, "wt"); %! fwrite (fid, "1;2;3\n"); %! fwrite (fid, "1i;2I;3j;4J\n"); %! fwrite (fid, "4;5;6\n"); %! fwrite (fid, "-4i;+5I;-6j;+7J\n"); %! fclose (fid); %! %! assert (dlmread (file), [1, 2, 3, 0; 1i, 2i, 3i, 4i; %! 4, 5, 6, 0; -4i, 5i, -6i, 7i]); %! assert (dlmread (file, "", [0 0 0 3]), [1, 2, 3]); %! assert (dlmread (file, "", [1 0 1 3]), [1i, 2i, 3i, 4i]); %! unwind_protect_cleanup %! unlink (file); %! end_unwind_protect */