/* Copyright (C) 1995,1996,1997,1998,1999,2000,2001, 2006 Free Software Foundation, Inc. * * This library is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public License * as published by the Free Software Foundation; either version 3 of * the License, or (at your option) any later version. * * This library is distributed in the hope that it will be useful, but * WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public * License along with this library; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA * 02110-1301 USA */ #ifdef HAVE_CONFIG_H # include #endif #include "libguile/_scm.h" #include #ifdef HAVE_STRING_H #include #endif #include "libguile/chars.h" #include "libguile/modules.h" #include "libguile/ports.h" #include "libguile/rdelim.h" #include "libguile/root.h" #include "libguile/strings.h" #include "libguile/strports.h" #include "libguile/validate.h" SCM_DEFINE (scm_read_delimited_x, "%read-delimited!", 3, 3, 0, (SCM delims, SCM str, SCM gobble, SCM port, SCM start, SCM end), "Read characters from @var{port} into @var{str} until one of the\n" "characters in the @var{delims} string is encountered. If\n" "@var{gobble} is true, discard the delimiter character;\n" "otherwise, leave it in the input stream for the next read. If\n" "@var{port} is not specified, use the value of\n" "@code{(current-input-port)}. If @var{start} or @var{end} are\n" "specified, store data only into the substring of @var{str}\n" "bounded by @var{start} and @var{end} (which default to the\n" "beginning and end of the string, respectively).\n" "\n" " Return a pair consisting of the delimiter that terminated the\n" "string and the number of characters read. If reading stopped\n" "at the end of file, the delimiter returned is the\n" "@var{eof-object}; if the string was filled without encountering\n" "a delimiter, this value is @code{#f}.") #define FUNC_NAME s_scm_read_delimited_x { size_t j; size_t cstart; size_t cend; int c; const char *cdelims; size_t num_delims; SCM_VALIDATE_STRING (1, delims); cdelims = scm_i_string_chars (delims); num_delims = scm_i_string_length (delims); SCM_VALIDATE_STRING (2, str); scm_i_get_substring_spec (scm_i_string_length (str), start, &cstart, end, &cend); if (SCM_UNBNDP (port)) port = scm_current_input_port (); else SCM_VALIDATE_OPINPORT (4, port); for (j = cstart; j < cend; j++) { size_t k; c = scm_getc (port); for (k = 0; k < num_delims; k++) { if (cdelims[k] == c) { if (scm_is_false (gobble)) scm_ungetc (c, port); return scm_cons (SCM_MAKE_CHAR (c), scm_from_size_t (j - cstart)); } } if (c == EOF) return scm_cons (SCM_EOF_VAL, scm_from_size_t (j - cstart)); scm_c_string_set_x (str, j, SCM_MAKE_CHAR (c)); } return scm_cons (SCM_BOOL_F, scm_from_size_t (j - cstart)); } #undef FUNC_NAME static unsigned char * scm_do_read_line (SCM port, size_t *len_p) { scm_t_port *pt = SCM_PTAB_ENTRY (port); unsigned char *end; /* I thought reading lines was simple. Mercy me. */ /* The common case: the buffer contains a complete line. This needs to be fast. */ if ((end = memchr (pt->read_pos, '\n', (pt->read_end - pt->read_pos))) != 0) { size_t buf_len = (end + 1) - pt->read_pos; /* Allocate a buffer of the perfect size. */ unsigned char *buf = scm_malloc (buf_len + 1); memcpy (buf, pt->read_pos, buf_len); pt->read_pos += buf_len; buf[buf_len] = '\0'; *len_p = buf_len; return buf; } /* The buffer contains no newlines. */ { /* When live, len is always the number of characters in the current buffer that are part of the current line. */ size_t len = (pt->read_end - pt->read_pos); size_t buf_size = (len < 50) ? 60 : len * 2; /* Invariant: buf always has buf_size + 1 characters allocated; the `+ 1' is for the final '\0'. */ unsigned char *buf = scm_malloc (buf_size + 1); size_t buf_len = 0; for (;;) { if (buf_len + len > buf_size) { size_t new_size = (buf_len + len) * 2; buf = scm_realloc (buf, new_size + 1); buf_size = new_size; } /* Copy what we've got out of the port, into our buffer. */ memcpy (buf + buf_len, pt->read_pos, len); buf_len += len; pt->read_pos += len; /* If we had seen a newline, we're done now. */ if (end) break; /* Get more characters. */ if (scm_fill_input (port) == EOF) { /* If we're missing a final newline in the file, return what we did get, sans newline. */ if (buf_len > 0) break; free (buf); return 0; } /* Search the buffer for newlines. */ if ((end = memchr (pt->read_pos, '\n', (len = (pt->read_end - pt->read_pos)))) != 0) len = (end - pt->read_pos) + 1; } /* I wonder how expensive this realloc is. */ buf = scm_realloc (buf, buf_len + 1); buf[buf_len] = '\0'; *len_p = buf_len; return buf; } } /* * %read-line * truncates any terminating newline from its input, and returns * a cons of the string read and its terminating character. Doing * so makes it easy to implement the hairy `read-line' options * efficiently in Scheme. */ SCM_DEFINE (scm_read_line, "%read-line", 0, 1, 0, (SCM port), "Read a newline-terminated line from @var{port}, allocating storage as\n" "necessary. The newline terminator (if any) is removed from the string,\n" "and a pair consisting of the line and its delimiter is returned. The\n" "delimiter may be either a newline or the @var{eof-object}; if\n" "@code{%read-line} is called at the end of file, it returns the pair\n" "@code{(# . #)}.") #define FUNC_NAME s_scm_read_line { scm_t_port *pt; char *s; size_t slen = 0; SCM line, term; if (SCM_UNBNDP (port)) port = scm_current_input_port (); SCM_VALIDATE_OPINPORT (1,port); pt = SCM_PTAB_ENTRY (port); if (pt->rw_active == SCM_PORT_WRITE) scm_ptobs[SCM_PTOBNUM (port)].flush (port); s = (char *) scm_do_read_line (port, &slen); if (s == NULL) term = line = SCM_EOF_VAL; else { if (s[slen-1] == '\n') { term = SCM_MAKE_CHAR ('\n'); s[slen-1] = '\0'; line = scm_take_locale_stringn (s, slen-1); SCM_INCLINE (port); } else { /* Fix: we should check for eof on the port before assuming this. */ term = SCM_EOF_VAL; line = scm_take_locale_stringn (s, slen); SCM_COL (port) += slen; } } if (pt->rw_random) pt->rw_active = SCM_PORT_READ; return scm_cons (line, term); } #undef FUNC_NAME SCM_DEFINE (scm_write_line, "write-line", 1, 1, 0, (SCM obj, SCM port), "Display @var{obj} and a newline character to @var{port}. If\n" "@var{port} is not specified, @code{(current-output-port)} is\n" "used. This function is equivalent to:\n" "@lisp\n" "(display obj [port])\n" "(newline [port])\n" "@end lisp") #define FUNC_NAME s_scm_write_line { scm_display (obj, port); return scm_newline (port); } #undef FUNC_NAME SCM scm_init_rdelim_builtins (void) { #include "libguile/rdelim.x" return SCM_UNSPECIFIED; } void scm_init_rdelim (void) { scm_c_define_gsubr ("%init-rdelim-builtins", 0, 0, 0, scm_init_rdelim_builtins); } /* Local Variables: c-file-style: "gnu" End: */