From 87b5b1afe8237ab9054fc08fde007455ef4d7012 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Sun, 30 Dec 2018 11:14:50 +0000
Subject: [PATCH 01/31] Fixed failing test

---
 unit-tests/integer-allocation.sh | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/unit-tests/integer-allocation.sh b/unit-tests/integer-allocation.sh
index 5d07d90..c2edf14 100644
--- a/unit-tests/integer-allocation.sh
+++ b/unit-tests/integer-allocation.sh
@@ -2,7 +2,7 @@
 
 value=354
 expected="Integer cell: value ${value}"
-echo ${value} | target/psse -d 2>&1 | grep "${expected}" > /dev/null
+echo ${value} | target/psse -v4 2>&1 | grep "${expected}" > /dev/null
 
 if [ $? -eq 0 ]
 then

From a355a28ffa1f8789b13ca43ee4c62fe19a04ee2a Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Thu, 24 Jan 2019 18:59:01 +0000
Subject: [PATCH 02/31] Tactical commit whilst converting to URL_FILE

---
 .gitignore                   |   2 +
 Makefile                     |   2 +-
 src/arith/integer.c          |  10 +-
 src/init.c                   |  15 +-
 src/io/fopen.c               | 543 +++++++++++++++++++++++++++++++++++
 src/io/fopen.h               |  72 +++++
 src/memory/conspage.c        |   2 +-
 src/memory/conspage.h        |   2 +-
 src/memory/consspaceobject.c |   6 +-
 src/memory/consspaceobject.h |   9 +-
 src/memory/dump.c            |   8 +-
 src/memory/dump.h            |   2 +-
 src/memory/stack.c           |   4 +-
 src/memory/stack.h           |   4 +-
 src/ops/io.c                 |   8 +
 src/ops/lispops.c            |   8 +-
 src/ops/print.c              |  12 +-
 src/ops/print.h              |   4 +-
 src/ops/read.c               |  23 +-
 src/ops/read.h               |   2 +-
 unit-tests/bignum-print.sh   |  38 +--
 unit-tests/string-cons.sh    |   0
 unit-tests/wide-character.sh |  12 +
 23 files changed, 700 insertions(+), 88 deletions(-)
 create mode 100644 src/io/fopen.c
 create mode 100644 src/io/fopen.h
 create mode 100644 src/ops/io.c
 mode change 100644 => 100755 unit-tests/string-cons.sh
 create mode 100755 unit-tests/wide-character.sh

diff --git a/.gitignore b/.gitignore
index b428e03..6fa1cd9 100644
--- a/.gitignore
+++ b/.gitignore
@@ -32,3 +32,5 @@ log*
 utils_src/readprintwc/out
 
 *.dump
+
+*.bak
diff --git a/Makefile b/Makefile
index 7179c91..c4c4ef3 100644
--- a/Makefile
+++ b/Makefile
@@ -16,7 +16,7 @@ INDENT_FLAGS := -nbad -bap -nbc -br -brf -brs -c33 -cd33 -ncdb -ce -ci4 -cli4 \
 -npsl -nsc -nsob -nss -nut -prs -l79 -ts2
 
 CPPFLAGS ?= $(INC_FLAGS) -MMD -MP -g -DDEBUG
-LDFLAGS := -lm
+LDFLAGS := -lm -lcurl
 
 all: $(TARGET)
 
diff --git a/src/arith/integer.c b/src/arith/integer.c
index 6a26126..679bf37 100644
--- a/src/arith/integer.c
+++ b/src/arith/integer.c
@@ -314,7 +314,6 @@ struct cons_pointer multiply_integers( struct cons_pointer a,
  */
 struct cons_pointer integer_to_string_add_digit( int digit, int digits,
                                                  struct cons_pointer tail ) {
-    digits++;
     wint_t character = btowc( hex_digits[digit] );
     return ( digits % 3 == 0 ) ?
         make_string( L',', make_string( character,
@@ -352,10 +351,7 @@ struct cons_pointer integer_to_string( struct cons_pointer int_pointer,
         while ( accumulator > 0 || !nilp( integer.payload.integer.more ) ) {
             if ( !nilp( integer.payload.integer.more ) ) {
                 integer = pointer2cell( integer.payload.integer.more );
-                accumulator += integer.payload.integer.value == 0 ?
-                    MAX_INTEGER :
-                    ( llabs( integer.payload.integer.value ) *
-                      ( MAX_INTEGER + 1 ) );
+                accumulator += integer.payload.integer.value;
                 debug_print
                     ( L"integer_to_string: crossing cell boundary, accumulator is: ",
                       DEBUG_IO );
@@ -369,10 +365,12 @@ struct cons_pointer integer_to_string( struct cons_pointer int_pointer,
                               L"integer_to_string: digit is %ld, hexadecimal is %c, accumulator is: ",
                               offset, hex_digits[offset] );
                 debug_print_128bit( accumulator, DEBUG_IO );
+                debug_print( L"; result is: ", DEBUG_IO);
+                debug_print_object( result, DEBUG_IO);
                 debug_println( DEBUG_IO );
 
                 result =
-                    integer_to_string_add_digit( offset, digits++, result );
+                    integer_to_string_add_digit( offset, ++digits, result );
                 accumulator = accumulator / base;
             } while ( accumulator > base );
         }
diff --git a/src/init.c b/src/init.c
index e0d2b01..e8a33a9 100644
--- a/src/init.c
+++ b/src/init.c
@@ -9,6 +9,7 @@
  * Licensed under GPL version 2.0, or, at your option, any later version.
  */
 
+#include <locale.h>
 #include <stdbool.h>
 #include <stdio.h>
 #include <stdlib.h>
@@ -81,6 +82,8 @@ int main( int argc, char *argv[] ) {
     bool dump_at_end = false;
     bool show_prompt = false;
 
+    setlocale(LC_ALL, "");
+
     while ( ( option = getopt( argc, argv, "cpdv:" ) ) != -1 ) {
         switch ( option ) {
             case 'c':
@@ -123,14 +126,14 @@ int main( int argc, char *argv[] ) {
      * standard input, output, error and sink streams
      * attempt to set wide character acceptance on all streams
      */
-    FILE *sink = fopen( "/dev/null", "w" );
+    URL_FILE *sink = url_fopen( "/dev/null", "w" );
     fwide( stdin, 1 );
     fwide( stdout, 1 );
     fwide( stderr, 1 );
     fwide( sink, 1 );
-    bind_value( L"*in*", make_read_stream( stdin ) );
-    bind_value( L"*out*", make_write_stream( stdout ) );
-    bind_value( L"*log*", make_write_stream( stderr ) );
+    bind_value( L"*in*", make_read_stream( file_to_url_file(stdin) ) );
+    bind_value( L"*out*", make_write_stream( file_to_url_file(stdout) ) );
+    bind_value( L"*log*", make_write_stream( file_to_url_file(stderr) ) );
     bind_value( L"*sink*", make_write_stream( sink ) );
 
     /*
@@ -180,9 +183,9 @@ int main( int argc, char *argv[] ) {
      */
     bind_special( L"cond", &lisp_cond );
     bind_special( L"lambda", &lisp_lambda );
-    // bind_special( L"λ", &lisp_lambda );
+    bind_special( L"\u03bb", &lisp_lambda ); // λ
     bind_special( L"nlambda", &lisp_nlambda );
-    // bind_special( L"nλ", &lisp_nlambda );
+    bind_special( L"n\u03bb", &lisp_nlambda );
     bind_special( L"progn", &lisp_progn );
     bind_special( L"quote", &lisp_quote );
     bind_special( L"set!", &lisp_set_shriek );
diff --git a/src/io/fopen.c b/src/io/fopen.c
new file mode 100644
index 0000000..d13250f
--- /dev/null
+++ b/src/io/fopen.c
@@ -0,0 +1,543 @@
+/*
+ * fopen.c
+ *
+ * adapted from https://curl.haxx.se/libcurl/c/fopen.html.
+ *
+ * Copyright (c) 2003, 2017 Simtec Electronics
+ * Some portions (c) 2017 Simon Brooke <simon@journeyman.cc>
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ *    notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ *    notice, this list of conditions and the following disclaimer in the
+ *    documentation and/or other materials provided with the distribution.
+ * 3. The name of the author may not be used to endorse or promote products
+ *    derived from this software without specific prior written permission.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+ * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+ * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
+ * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
+ * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+ * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ *
+ * This example requires libcurl 7.9.7 or later.
+ */
+
+
+#include <stdio.h>
+#include <string.h>
+#ifndef WIN32
+#  include <sys/time.h>
+#endif
+#include <stdlib.h>
+#include <errno.h>
+
+#include <curl/curl.h>
+/*
+ * wide characters
+ */
+#include <wchar.h>
+#include <wctype.h>
+
+#include "fopen.h"
+
+/* we use a global one for convenience */
+static CURLM *multi_handle;
+
+/* curl calls this routine to get more data */
+static size_t write_callback(char *buffer,
+                             size_t size,
+                             size_t nitems,
+                             void *userp)
+{
+  char *newbuff;
+  size_t rembuff;
+
+  URL_FILE *url = (URL_FILE *)userp;
+  size *= nitems;
+
+  rembuff = url->buffer_len - url->buffer_pos; /* remaining space in buffer */
+
+  if(size > rembuff) {
+    /* not enough space in buffer */
+    newbuff = realloc(url->buffer, url->buffer_len + (size - rembuff));
+    if(newbuff == NULL) {
+      fprintf(stderr, "callback buffer grow failed\n");
+      size = rembuff;
+    }
+    else {
+      /* realloc succeeded increase buffer size*/
+      url->buffer_len += size - rembuff;
+      url->buffer = newbuff;
+    }
+  }
+
+  memcpy(&url->buffer[url->buffer_pos], buffer, size);
+  url->buffer_pos += size;
+
+  return size;
+}
+
+/* use to attempt to fill the read buffer up to requested number of bytes */
+static int fill_buffer(URL_FILE *file, size_t want)
+{
+  fd_set fdread;
+  fd_set fdwrite;
+  fd_set fdexcep;
+  struct timeval timeout;
+  int rc;
+  CURLMcode mc; /* curl_multi_fdset() return code */
+
+  /* only attempt to fill buffer if transactions still running and buffer
+   * doesn't exceed required size already
+   */
+  if((!file->still_running) || (file->buffer_pos > want))
+    return 0;
+
+  /* attempt to fill buffer */
+  do {
+    int maxfd = -1;
+    long curl_timeo = -1;
+
+    FD_ZERO(&fdread);
+    FD_ZERO(&fdwrite);
+    FD_ZERO(&fdexcep);
+
+    /* set a suitable timeout to fail on */
+    timeout.tv_sec = 60; /* 1 minute */
+    timeout.tv_usec = 0;
+
+    curl_multi_timeout(multi_handle, &curl_timeo);
+    if(curl_timeo >= 0) {
+      timeout.tv_sec = curl_timeo / 1000;
+      if(timeout.tv_sec > 1)
+        timeout.tv_sec = 1;
+      else
+        timeout.tv_usec = (curl_timeo % 1000) * 1000;
+    }
+
+    /* get file descriptors from the transfers */
+    mc = curl_multi_fdset(multi_handle, &fdread, &fdwrite, &fdexcep, &maxfd);
+
+    if(mc != CURLM_OK) {
+      fprintf(stderr, "curl_multi_fdset() failed, code %d.\n", mc);
+      break;
+    }
+
+    /* On success the value of maxfd is guaranteed to be >= -1. We call
+       select(maxfd + 1, ...); specially in case of (maxfd == -1) there are
+       no fds ready yet so we call select(0, ...) --or Sleep() on Windows--
+       to sleep 100ms, which is the minimum suggested value in the
+       curl_multi_fdset() doc. */
+
+    if(maxfd == -1) {
+#ifdef _WIN32
+      Sleep(100);
+      rc = 0;
+#else
+      /* Portable sleep for platforms other than Windows. */
+      struct timeval wait = { 0, 100 * 1000 }; /* 100ms */
+      rc = select(0, NULL, NULL, NULL, &wait);
+#endif
+    }
+    else {
+      /* Note that on some platforms 'timeout' may be modified by select().
+         If you need access to the original value save a copy beforehand. */
+      rc = select(maxfd + 1, &fdread, &fdwrite, &fdexcep, &timeout);
+    }
+
+    switch(rc) {
+    case -1:
+      /* select error */
+      break;
+
+    case 0:
+    default:
+      /* timeout or readable/writable sockets */
+      curl_multi_perform(multi_handle, &file->still_running);
+      break;
+    }
+  } while(file->still_running && (file->buffer_pos < want));
+  return 1;
+}
+
+/* use to remove want bytes from the front of a files buffer */
+static int use_buffer(URL_FILE *file, size_t want)
+{
+  /* sort out buffer */
+  if((file->buffer_pos - want) <= 0) {
+    /* ditch buffer - write will recreate */
+    free(file->buffer);
+    file->buffer = NULL;
+    file->buffer_pos = 0;
+    file->buffer_len = 0;
+  }
+  else {
+    /* move rest down make it available for later */
+    memmove(file->buffer,
+            &file->buffer[want],
+            (file->buffer_pos - want));
+
+    file->buffer_pos -= want;
+  }
+  return 0;
+}
+
+URL_FILE *url_fopen(const char *url, const char *operation)
+{
+  /* this code could check for URLs or types in the 'url' and
+     basically use the real fopen() for standard files */
+
+  URL_FILE *file;
+  (void)operation;
+
+  file = calloc(1, sizeof(URL_FILE));
+  if(!file)
+    return NULL;
+
+  file->handle.file = fopen(url, operation);
+  if(file->handle.file)
+    file->type = CFTYPE_FILE; /* marked as URL */
+
+  else {
+    file->type = CFTYPE_CURL; /* marked as URL */
+    file->handle.curl = curl_easy_init();
+
+    curl_easy_setopt(file->handle.curl, CURLOPT_URL, url);
+    curl_easy_setopt(file->handle.curl, CURLOPT_WRITEDATA, file);
+    curl_easy_setopt(file->handle.curl, CURLOPT_VERBOSE, 0L);
+    curl_easy_setopt(file->handle.curl, CURLOPT_WRITEFUNCTION, write_callback);
+
+    if(!multi_handle)
+      multi_handle = curl_multi_init();
+
+    curl_multi_add_handle(multi_handle, file->handle.curl);
+
+    /* lets start the fetch */
+    curl_multi_perform(multi_handle, &file->still_running);
+
+    if((file->buffer_pos == 0) && (!file->still_running)) {
+      /* if still_running is 0 now, we should return NULL */
+
+      /* make sure the easy handle is not in the multi handle anymore */
+      curl_multi_remove_handle(multi_handle, file->handle.curl);
+
+      /* cleanup */
+      curl_easy_cleanup(file->handle.curl);
+
+      free(file);
+
+      file = NULL;
+    }
+  }
+  return file;
+}
+
+int url_fclose(URL_FILE *file)
+{
+  int ret = 0;/* default is good return */
+
+  switch(file->type) {
+  case CFTYPE_FILE:
+    ret = fclose(file->handle.file); /* passthrough */
+    break;
+
+  case CFTYPE_CURL:
+    /* make sure the easy handle is not in the multi handle anymore */
+    curl_multi_remove_handle(multi_handle, file->handle.curl);
+
+    /* cleanup */
+    curl_easy_cleanup(file->handle.curl);
+    break;
+
+  default: /* unknown or supported type - oh dear */
+    ret = EOF;
+    errno = EBADF;
+    break;
+  }
+
+  free(file->buffer);/* free any allocated buffer space */
+  free(file);
+
+  return ret;
+}
+
+int url_feof(URL_FILE *file)
+{
+  int ret = 0;
+
+  switch(file->type) {
+  case CFTYPE_FILE:
+    ret = feof(file->handle.file);
+    break;
+
+  case CFTYPE_CURL:
+    if((file->buffer_pos == 0) && (!file->still_running))
+      ret = 1;
+    break;
+
+  default: /* unknown or supported type - oh dear */
+    ret = -1;
+    errno = EBADF;
+    break;
+  }
+  return ret;
+}
+
+size_t url_fread(void *ptr, size_t size, size_t nmemb, URL_FILE *file)
+{
+  size_t want;
+
+  switch(file->type) {
+  case CFTYPE_FILE:
+    want = fread(ptr, size, nmemb, file->handle.file);
+    break;
+
+  case CFTYPE_CURL:
+    want = nmemb * size;
+
+    fill_buffer(file, want);
+
+    /* check if there's data in the buffer - if not fill_buffer()
+     * either errored or EOF */
+    if(!file->buffer_pos)
+      return 0;
+
+    /* ensure only available data is considered */
+    if(file->buffer_pos < want)
+      want = file->buffer_pos;
+
+    /* xfer data to caller */
+    memcpy(ptr, file->buffer, want);
+
+    use_buffer(file, want);
+
+    want = want / size;     /* number of items */
+    break;
+
+  default: /* unknown or supported type - oh dear */
+    want = 0;
+    errno = EBADF;
+    break;
+
+  }
+  return want;
+}
+
+char *url_fgets(char *ptr, size_t size, URL_FILE *file)
+{
+  size_t want = size - 1;/* always need to leave room for zero termination */
+  size_t loop;
+
+  switch(file->type) {
+  case CFTYPE_FILE:
+    ptr = fgets(ptr, (int)size, file->handle.file);
+    break;
+
+  case CFTYPE_CURL:
+    fill_buffer(file, want);
+
+    /* check if there's data in the buffer - if not fill either errored or
+     * EOF */
+    if(!file->buffer_pos)
+      return NULL;
+
+    /* ensure only available data is considered */
+    if(file->buffer_pos < want)
+      want = file->buffer_pos;
+
+    /*buffer contains data */
+    /* look for newline or eof */
+    for(loop = 0; loop < want; loop++) {
+      if(file->buffer[loop] == '\n') {
+        want = loop + 1;/* include newline */
+        break;
+      }
+    }
+
+    /* xfer data to caller */
+    memcpy(ptr, file->buffer, want);
+    ptr[want] = 0;/* always null terminate */
+
+    use_buffer(file, want);
+
+    break;
+
+  default: /* unknown or supported type - oh dear */
+    ptr = NULL;
+    errno = EBADF;
+    break;
+  }
+
+  return ptr;/*success */
+}
+
+void url_rewind(URL_FILE *file)
+{
+  switch(file->type) {
+  case CFTYPE_FILE:
+    rewind(file->handle.file); /* passthrough */
+    break;
+
+  case CFTYPE_CURL:
+    /* halt transaction */
+    curl_multi_remove_handle(multi_handle, file->handle.curl);
+
+    /* restart */
+    curl_multi_add_handle(multi_handle, file->handle.curl);
+
+    /* ditch buffer - write will recreate - resets stream pos*/
+    free(file->buffer);
+    file->buffer = NULL;
+    file->buffer_pos = 0;
+    file->buffer_len = 0;
+
+    break;
+
+  default: /* unknown or supported type - oh dear */
+    break;
+  }
+}
+
+/**
+ * given this file handle f, return a new url_file handle wrapping it.
+ *
+ * @param f the file to be wrapped;
+ * @return the new handle, or null if no such handle could be allocated.
+ */
+URL_FILE * file_to_url_file( FILE* f) {
+  URL_FILE * result = (URL_FILE *)malloc(sizeof(URL_FILE));
+
+  if ( result != NULL) {
+    result->type = CFTYPE_FILE,
+    result->handle.file = f;
+  }
+
+  return result;
+}
+
+
+wint_t url_fgetwc(URL_FILE *file) {
+  wint_t result = 0;
+
+  switch(file->type) {
+  case CFTYPE_FILE:
+    fwide( file->handle.file, 1 ); /* wide characters */
+    result = fgetc(file->handle.file); /* passthrough */
+    break;
+
+  case CFTYPE_CURL:
+    url_fread(&result, sizeof(wint_t), 1, file);
+    break;
+  }
+
+  return result;
+}
+
+/* #define FGETSFILE "fgets.test" */
+/* #define FREADFILE "fread.test" */
+/* #define REWINDFILE "rewind.test" */
+
+/* /\* Small main program to retrieve from a url using fgets and fread saving the */
+/*  * output to two test files (note the fgets method will corrupt binary files if */
+/*  * they contain 0 chars *\/ */
+/* int main(int argc, char *argv[]) */
+/* { */
+/*   URL_FILE *handle; */
+/*   FILE *outf; */
+
+/*   size_t nread; */
+/*   char buffer[256]; */
+/*   const char *url; */
+
+/*   if(argc < 2) */
+/*     url = "http://192.168.7.3/testfile";/\* default to testurl *\/ */
+/*   else */
+/*     url = argv[1];/\* use passed url *\/ */
+
+/*   /\* copy from url line by line with fgets *\/ */
+/*   outf = fopen(FGETSFILE, "wb+"); */
+/*   if(!outf) { */
+/*     perror("couldn't open fgets output file\n"); */
+/*     return 1; */
+/*   } */
+
+/*   handle = url_fopen(url, "r"); */
+/*   if(!handle) { */
+/*     printf("couldn't url_fopen() %s\n", url); */
+/*     fclose(outf); */
+/*     return 2; */
+/*   } */
+
+/*   while(!url_feof(handle)) { */
+/*     url_fgets(buffer, sizeof(buffer), handle); */
+/*     fwrite(buffer, 1, strlen(buffer), outf); */
+/*   } */
+
+/*   url_fclose(handle); */
+
+/*   fclose(outf); */
+
+
+/*   /\* Copy from url with fread *\/ */
+/*   outf = fopen(FREADFILE, "wb+"); */
+/*   if(!outf) { */
+/*     perror("couldn't open fread output file\n"); */
+/*     return 1; */
+/*   } */
+
+/*   handle = url_fopen("testfile", "r"); */
+/*   if(!handle) { */
+/*     printf("couldn't url_fopen() testfile\n"); */
+/*     fclose(outf); */
+/*     return 2; */
+/*   } */
+
+/*   do { */
+/*     nread = url_fread(buffer, 1, sizeof(buffer), handle); */
+/*     fwrite(buffer, 1, nread, outf); */
+/*   } while(nread); */
+
+/*   url_fclose(handle); */
+
+/*   fclose(outf); */
+
+
+/*   /\* Test rewind *\/ */
+/*   outf = fopen(REWINDFILE, "wb+"); */
+/*   if(!outf) { */
+/*     perror("couldn't open fread output file\n"); */
+/*     return 1; */
+/*   } */
+
+/*   handle = url_fopen("testfile", "r"); */
+/*   if(!handle) { */
+/*     printf("couldn't url_fopen() testfile\n"); */
+/*     fclose(outf); */
+/*     return 2; */
+/*   } */
+
+/*   nread = url_fread(buffer, 1, sizeof(buffer), handle); */
+/*   fwrite(buffer, 1, nread, outf); */
+/*   url_rewind(handle); */
+
+/*   buffer[0]='\n'; */
+/*   fwrite(buffer, 1, 1, outf); */
+
+/*   nread = url_fread(buffer, 1, sizeof(buffer), handle); */
+/*   fwrite(buffer, 1, nread, outf); */
+
+/*   url_fclose(handle); */
+
+/*   fclose(outf); */
+
+/*   return 0;/\* all done *\/ */
+/* } */
diff --git a/src/io/fopen.h b/src/io/fopen.h
new file mode 100644
index 0000000..9874ac7
--- /dev/null
+++ b/src/io/fopen.h
@@ -0,0 +1,72 @@
+/*
+ * fopen.h
+ *
+ * adapted from https://curl.haxx.se/libcurl/c/fopen.html.
+ *
+ * Copyright (c) 2003, 2017 Simtec Electronics
+ * Some portions (c) 2017 Simon Brooke <simon@journeyman.cc>
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ *    notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ *    notice, this list of conditions and the following disclaimer in the
+ *    documentation and/or other materials provided with the distribution.
+ * 3. The name of the author may not be used to endorse or promote products
+ *    derived from this software without specific prior written permission.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+ * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+ * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
+ * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
+ * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+ * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ *
+ * This example requires libcurl 7.9.7 or later.
+ */
+
+#ifndef __fopen_h
+#define __fopen_h
+
+enum fcurl_type_e {
+  CFTYPE_NONE = 0,
+  CFTYPE_FILE = 1,
+  CFTYPE_CURL = 2
+};
+
+struct fcurl_data
+{
+  enum fcurl_type_e type;     /* type of handle */
+  union {
+    CURL *curl;
+    FILE *file;
+  } handle;                   /* handle */
+
+  char *buffer;               /* buffer to store cached data*/
+  size_t buffer_len;          /* currently allocated buffers length */
+  size_t buffer_pos;          /* end of data in buffer*/
+  int still_running;          /* Is background url fetch still in progress */
+};
+
+typedef struct fcurl_data URL_FILE;
+
+/* exported functions */
+URL_FILE *url_fopen(const char *url, const char *operation);
+int url_fclose(URL_FILE *file);
+int url_feof(URL_FILE *file);
+size_t url_fread(void *ptr, size_t size, size_t nmemb, URL_FILE *file);
+char *url_fgets(char *ptr, size_t size, URL_FILE *file);
+void url_rewind(URL_FILE *file);
+
+wint_t url_fgetwc(URL_FILE *file);
+URL_FILE * file_to_url_file( FILE* f);
+
+
+
+#endif
diff --git a/src/memory/conspage.c b/src/memory/conspage.c
index f3c1760..03034e4 100644
--- a/src/memory/conspage.c
+++ b/src/memory/conspage.c
@@ -115,7 +115,7 @@ void make_cons_page(  ) {
 /**
  * dump the allocated pages to this `output` stream.
  */
-void dump_pages( FILE * output ) {
+void dump_pages( URL_FILE * output ) {
     for ( int i = 0; i < initialised_cons_pages; i++ ) {
         fwprintf( output, L"\nDUMPING PAGE %d\n", i );
 
diff --git a/src/memory/conspage.h b/src/memory/conspage.h
index ab04d6d..fa11da9 100644
--- a/src/memory/conspage.h
+++ b/src/memory/conspage.h
@@ -47,6 +47,6 @@ struct cons_pointer allocate_cell( char *tag );
 
 void initialise_cons_pages(  );
 
-void dump_pages( FILE * output );
+void dump_pages( URL_FILE * output );
 
 #endif
diff --git a/src/memory/consspaceobject.c b/src/memory/consspaceobject.c
index 6a7e2bd..9edbf66 100644
--- a/src/memory/consspaceobject.c
+++ b/src/memory/consspaceobject.c
@@ -95,8 +95,6 @@ struct cons_pointer make_exception( struct cons_pointer message,
     struct cons_pointer pointer = allocate_cell( EXCEPTIONTAG );
     struct cons_space_object *cell = &pointer2cell( pointer );
 
-//    inc_ref( pointer );         /* this is a hack; I don't know why it's necessary to do this, but if I don't the cell gets freed */
-
     inc_ref( message );
     inc_ref( frame_pointer );
     cell->payload.exception.message = message;
@@ -235,7 +233,7 @@ make_special( struct cons_pointer src, struct cons_pointer ( *executable )
  * Construct a cell which points to a stream open for reading.
  * @param input the C stream to wrap.
  */
-struct cons_pointer make_read_stream( FILE * input ) {
+struct cons_pointer make_read_stream( URL_FILE * input ) {
     struct cons_pointer pointer = allocate_cell( READTAG );
     struct cons_space_object *cell = &pointer2cell( pointer );
 
@@ -248,7 +246,7 @@ struct cons_pointer make_read_stream( FILE * input ) {
  * Construct a cell which points to a stream open for writing.
  * @param output the C stream to wrap.
  */
-struct cons_pointer make_write_stream( FILE * output ) {
+struct cons_pointer make_write_stream( URL_FILE * output ) {
     struct cons_pointer pointer = allocate_cell( WRITETAG );
     struct cons_space_object *cell = &pointer2cell( pointer );
 
diff --git a/src/memory/consspaceobject.h b/src/memory/consspaceobject.h
index acc36df..8db8099 100644
--- a/src/memory/consspaceobject.h
+++ b/src/memory/consspaceobject.h
@@ -16,6 +16,9 @@
  */
 #include <wchar.h>
 #include <wctype.h>
+#include <curl/curl.h>
+
+#include "fopen.h"
 
 #ifndef __consspaceobject_h
 #define __consspaceobject_h
@@ -488,7 +491,7 @@ struct special_payload {
  */
 struct stream_payload {
     /** the stream to read from or write to. */
-    FILE *stream;
+    URL_FILE *stream;
 };
 
 /**
@@ -636,9 +639,9 @@ struct cons_pointer make_string( wint_t c, struct cons_pointer tail );
 
 struct cons_pointer make_symbol( wint_t c, struct cons_pointer tail );
 
-struct cons_pointer make_read_stream( FILE * input );
+struct cons_pointer make_read_stream( URL_FILE * input );
 
-struct cons_pointer make_write_stream( FILE * output );
+struct cons_pointer make_write_stream( URL_FILE * output );
 
 struct cons_pointer c_string_to_lisp_string( wchar_t *string );
 
diff --git a/src/memory/dump.c b/src/memory/dump.c
index 7ec2631..cec0dfd 100644
--- a/src/memory/dump.c
+++ b/src/memory/dump.c
@@ -26,7 +26,7 @@
 #include "vectorspace.h"
 
 
-void dump_string_cell( FILE * output, wchar_t *prefix,
+void dump_string_cell( URL_FILE * output, wchar_t *prefix,
                        struct cons_pointer pointer ) {
     struct cons_space_object cell = pointer2cell( pointer );
     if ( cell.payload.string.character == 0 ) {
@@ -52,7 +52,7 @@ void dump_string_cell( FILE * output, wchar_t *prefix,
 /**
  * dump the object at this cons_pointer to this output stream.
  */
-void dump_object( FILE * output, struct cons_pointer pointer ) {
+void dump_object( URL_FILE * output, struct cons_pointer pointer ) {
     struct cons_space_object cell = pointer2cell( pointer );
     fwprintf( output,
               L"\t%4.4s (%d) at page %d, offset %d count %u\n",
@@ -89,7 +89,7 @@ void dump_object( FILE * output, struct cons_pointer pointer ) {
             }
             break;
         case LAMBDATV:
-            fwprintf( output, L"\t\tLambda cell;\n\t\t args: " );
+            fwprintf( output, L"\t\t\u03bb cell;\n\t\t args: " );
             print( output, cell.payload.lambda.args );
             fwprintf( output, L";\n\t\t\tbody: " );
             print( output, cell.payload.lambda.body );
@@ -98,7 +98,7 @@ void dump_object( FILE * output, struct cons_pointer pointer ) {
         case NILTV:
             break;
         case NLAMBDATV:
-            fwprintf( output, L"\t\tNlambda cell; \n\t\targs: " );
+            fwprintf( output, L"\t\tn\u03bb cell; \n\t\targs: " );
             print( output, cell.payload.lambda.args );
             fwprintf( output, L";\n\t\t\tbody: " );
             print( output, cell.payload.lambda.body );
diff --git a/src/memory/dump.h b/src/memory/dump.h
index ec8928e..f8ef75f 100644
--- a/src/memory/dump.h
+++ b/src/memory/dump.h
@@ -20,6 +20,6 @@
 #define __dump_h
 
 
-void dump_object( FILE * output, struct cons_pointer pointer );
+void dump_object( URL_FILE * output, struct cons_pointer pointer );
 
 #endif
diff --git a/src/memory/stack.c b/src/memory/stack.c
index cf68701..b2585c7 100644
--- a/src/memory/stack.c
+++ b/src/memory/stack.c
@@ -241,7 +241,7 @@ void free_stack_frame( struct stack_frame *frame ) {
  * @param output the stream
  * @param frame_pointer the pointer to the frame
  */
-void dump_frame( FILE * output, struct cons_pointer frame_pointer ) {
+void dump_frame( URL_FILE * output, struct cons_pointer frame_pointer ) {
     struct stack_frame *frame = get_stack_frame( frame_pointer );
 
     if ( frame != NULL ) {
@@ -265,7 +265,7 @@ void dump_frame( FILE * output, struct cons_pointer frame_pointer ) {
     }
 }
 
-void dump_stack_trace( FILE * output, struct cons_pointer pointer ) {
+void dump_stack_trace( URL_FILE * output, struct cons_pointer pointer ) {
     if ( exceptionp( pointer ) ) {
         print( output, pointer2cell( pointer ).payload.exception.message );
         fputws( L"\n", output );
diff --git a/src/memory/stack.h b/src/memory/stack.h
index 11763b2..0ea903c 100644
--- a/src/memory/stack.h
+++ b/src/memory/stack.h
@@ -47,9 +47,9 @@ struct cons_pointer make_stack_frame( struct cons_pointer previous,
 
 void free_stack_frame( struct stack_frame *frame );
 
-void dump_frame( FILE * output, struct cons_pointer pointer );
+void dump_frame( URL_FILE * output, struct cons_pointer pointer );
 
-void dump_stack_trace( FILE * output, struct cons_pointer frame_pointer );
+void dump_stack_trace( URL_FILE * output, struct cons_pointer frame_pointer );
 
 struct cons_pointer fetch_arg( struct stack_frame *frame, unsigned int n );
 
diff --git a/src/ops/io.c b/src/ops/io.c
new file mode 100644
index 0000000..ccd0af5
--- /dev/null
+++ b/src/ops/io.c
@@ -0,0 +1,8 @@
+/*
+ * io.c
+ *
+ * Communication between PSSE and the outside world, via libcurl.
+ *
+ * (c) 2017 Simon Brooke <simon@journeyman.cc>
+ * Licensed under GPL version 2.0, or, at your option, any later version.
+ */
diff --git a/src/ops/lispops.c b/src/ops/lispops.c
index c80d965..9448c55 100644
--- a/src/ops/lispops.c
+++ b/src/ops/lispops.c
@@ -839,7 +839,7 @@ lisp_read( struct stack_frame *frame, struct cons_pointer frame_pointer,
 #ifdef DEBUG
     debug_print( L"entering lisp_read\n", DEBUG_IO );
 #endif
-    FILE *input = stdin;
+    URL_FILE *input = stdin;
     struct cons_pointer in_stream = readp( frame->arg[0] ) ?
         frame->arg[0] : get_default_stream( true, env );
 
@@ -922,7 +922,7 @@ lisp_print( struct stack_frame *frame, struct cons_pointer frame_pointer,
             struct cons_pointer env ) {
     debug_print( L"Entering print\n", DEBUG_IO );
     struct cons_pointer result = NIL;
-    FILE *output = stdout;
+    URL_FILE *output = stdout;
     struct cons_pointer out_stream = writep( frame->arg[1] ) ?
         frame->arg[1] : get_default_stream( false, env );
 
@@ -1148,7 +1148,7 @@ struct cons_pointer lisp_repl( struct stack_frame *frame,
 
     struct cons_pointer input = get_default_stream( true, env );
     struct cons_pointer output = get_default_stream( false, env );
-    FILE *os = pointer2cell( output ).payload.stream.stream;
+    URL_FILE *os = pointer2cell( output ).payload.stream.stream;
     struct cons_pointer prompt_name = c_string_to_lisp_symbol( L"*prompt*" );
     struct cons_pointer old_oblist = oblist;
     struct cons_pointer new_env = env;
@@ -1282,7 +1282,7 @@ struct cons_pointer lisp_inspect( struct stack_frame *frame,
                                   struct cons_pointer frame_pointer,
                                   struct cons_pointer env ) {
     debug_print( L"Entering print\n", DEBUG_IO );
-    FILE *output = stdout;
+    URL_FILE *output = stdout;
     struct cons_pointer out_stream = writep( frame->arg[1] ) ?
         frame->arg[1] : get_default_stream( false, env );
 
diff --git a/src/ops/print.c b/src/ops/print.c
index 604c07c..d313960 100644
--- a/src/ops/print.c
+++ b/src/ops/print.c
@@ -34,7 +34,7 @@ int print_use_colours = 0;
  * onto this `output`; if `pointer` does not indicate a string or symbol,
  * don't print anything but just return.
  */
-void print_string_contents( FILE * output, struct cons_pointer pointer ) {
+void print_string_contents( URL_FILE * output, struct cons_pointer pointer ) {
     while ( stringp( pointer ) || symbolp( pointer ) ) {
         struct cons_space_object *cell = &pointer2cell( pointer );
         wchar_t c = cell->payload.string.character;
@@ -51,7 +51,7 @@ void print_string_contents( FILE * output, struct cons_pointer pointer ) {
  * the stream at this `output`, prepending and appending double quote
  * characters.
  */
-void print_string( FILE * output, struct cons_pointer pointer ) {
+void print_string( URL_FILE * output, struct cons_pointer pointer ) {
     fputwc( btowc( '"' ), output );
     print_string_contents( output, pointer );
     fputwc( btowc( '"' ), output );
@@ -63,7 +63,7 @@ void print_string( FILE * output, struct cons_pointer pointer ) {
  * a space character.
  */
 void
-print_list_contents( FILE * output, struct cons_pointer pointer,
+print_list_contents( URL_FILE * output, struct cons_pointer pointer,
                      bool initial_space ) {
     struct cons_space_object *cell = &pointer2cell( pointer );
 
@@ -84,7 +84,7 @@ print_list_contents( FILE * output, struct cons_pointer pointer,
     }
 }
 
-void print_list( FILE * output, struct cons_pointer pointer ) {
+void print_list( URL_FILE * output, struct cons_pointer pointer ) {
     if ( print_use_colours ) {
         fwprintf( output, L"%s(%s", "\x1B[31m", "\x1B[39m" );
     } else {
@@ -104,7 +104,7 @@ void print_list( FILE * output, struct cons_pointer pointer ) {
  * Print the cons-space object indicated by `pointer` to the stream indicated
  * by `output`.
  */
-struct cons_pointer print( FILE * output, struct cons_pointer pointer ) {
+struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
     struct cons_space_object cell = pointer2cell( pointer );
     char *buffer;
 
@@ -225,6 +225,6 @@ struct cons_pointer print( FILE * output, struct cons_pointer pointer ) {
     return pointer;
 }
 
-void println( FILE * output ) {
+void println( URL_FILE * output ) {
     fputws( L"\n", output );
 }
diff --git a/src/ops/print.h b/src/ops/print.h
index 2751032..f59f090 100644
--- a/src/ops/print.h
+++ b/src/ops/print.h
@@ -14,8 +14,8 @@
 #ifndef __print_h
 #define __print_h
 
-struct cons_pointer print( FILE * output, struct cons_pointer pointer );
-void println( FILE * output );
+struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer );
+void println( URL_FILE * output );
 extern int print_use_colours;
 
 #endif
diff --git a/src/ops/read.c b/src/ops/read.c
index 4006c99..d2f79c4 100644
--- a/src/ops/read.c
+++ b/src/ops/read.c
@@ -38,13 +38,13 @@
 
 struct cons_pointer read_number( struct stack_frame *frame,
                                  struct cons_pointer frame_pointer,
-                                 FILE * input, wint_t initial,
+                                 URL_FILE * input, wint_t initial,
                                  bool seen_period );
 struct cons_pointer read_list( struct stack_frame *frame,
-                               struct cons_pointer frame_pointer, FILE * input,
+                               struct cons_pointer frame_pointer, URL_FILE * input,
                                wint_t initial );
-struct cons_pointer read_string( FILE * input, wint_t initial );
-struct cons_pointer read_symbol( FILE * input, wint_t initial );
+struct cons_pointer read_string( URL_FILE * input, wint_t initial );
+struct cons_pointer read_symbol( URL_FILE * input, wint_t initial );
 
 /**
  * quote reader macro in C (!)
@@ -61,7 +61,7 @@ struct cons_pointer c_quote( struct cons_pointer arg ) {
  */
 struct cons_pointer read_continuation( struct stack_frame *frame,
                                        struct cons_pointer frame_pointer,
-                                       FILE * input, wint_t initial ) {
+                                       URL_FILE * input, wint_t initial ) {
     debug_print( L"entering read_continuation\n", DEBUG_IO );
     struct cons_pointer result = NIL;
 
@@ -129,6 +129,7 @@ struct cons_pointer read_continuation( struct stack_frame *frame,
                     }
                 }
                 break;
+          //case ':': reserved for keywords and paths
             default:
                 if ( iswdigit( c ) ) {
                     result =
@@ -158,7 +159,7 @@ struct cons_pointer read_continuation( struct stack_frame *frame,
  */
 struct cons_pointer read_number( struct stack_frame *frame,
                                  struct cons_pointer frame_pointer,
-                                 FILE * input,
+                                 URL_FILE * input,
                                  wint_t initial, bool seen_period ) {
     debug_print( L"entering read_number\n", DEBUG_IO );
 
@@ -267,7 +268,7 @@ struct cons_pointer read_number( struct stack_frame *frame,
  */
 struct cons_pointer read_list( struct stack_frame *frame,
                                struct cons_pointer frame_pointer,
-                               FILE * input, wint_t initial ) {
+                               URL_FILE * input, wint_t initial ) {
     struct cons_pointer result = NIL;
     if ( initial != ')' ) {
         debug_printf( DEBUG_IO,
@@ -293,7 +294,7 @@ struct cons_pointer read_list( struct stack_frame *frame,
  * so delimited in which case it may not contain whitespace (unless escaped)
  * but may contain a double quote character (probably not a good idea!)
  */
-struct cons_pointer read_string( FILE * input, wint_t initial ) {
+struct cons_pointer read_string( URL_FILE * input, wint_t initial ) {
     struct cons_pointer cdr = NIL;
     struct cons_pointer result;
     switch ( initial ) {
@@ -315,7 +316,7 @@ struct cons_pointer read_string( FILE * input, wint_t initial ) {
     return result;
 }
 
-struct cons_pointer read_symbol( FILE * input, wint_t initial ) {
+struct cons_pointer read_symbol( URL_FILE * input, wint_t initial ) {
     struct cons_pointer cdr = NIL;
     struct cons_pointer result;
     switch ( initial ) {
@@ -331,7 +332,7 @@ struct cons_pointer read_symbol( FILE * input, wint_t initial ) {
             break;
         case ')':
             /*
-             * symbols may not include right-parenthesis
+             * symbols may not include right-parenthesis;
              */
             result = NIL;
             /*
@@ -367,6 +368,6 @@ struct cons_pointer read_symbol( FILE * input, wint_t initial ) {
 struct cons_pointer read( struct
                           stack_frame
                           *frame, struct cons_pointer frame_pointer,
-                          FILE * input ) {
+                          URL_FILE * input ) {
     return read_continuation( frame, frame_pointer, input, fgetwc( input ) );
 }
diff --git a/src/ops/read.h b/src/ops/read.h
index c6dbba3..a1674d6 100644
--- a/src/ops/read.h
+++ b/src/ops/read.h
@@ -15,6 +15,6 @@
  * read the next object on this input stream and return a cons_pointer to it.
  */
 struct cons_pointer read( struct stack_frame *frame,
-                          struct cons_pointer frame_pointer, FILE * input );
+                          struct cons_pointer frame_pointer, URL_FILE * input );
 
 #endif
diff --git a/unit-tests/bignum-print.sh b/unit-tests/bignum-print.sh
index 5615871..d556e71 100755
--- a/unit-tests/bignum-print.sh
+++ b/unit-tests/bignum-print.sh
@@ -18,17 +18,6 @@ else
     exit 1
 fi
 
-echo -n "checking no bignum was created: "
-grep -v 'BIGNUM!' psse.log > /dev/null
-if [ $? -eq "0" ]
-then
-    echo "OK"
-else
-    echo "Fail"
-    exit 1
-fi
-
-
 
 #####################################################################
 # right on the boundary
@@ -48,17 +37,6 @@ else
     exit 1
 fi
 
-echo -n "checking no bignum was created: "
-grep -v 'BIGNUM!' psse.log > /dev/null
-if [ $? -eq "0" ]
-then
-    echo "OK"
-else
-    echo "Fail"
-    exit 1
-fi
-
-
 
 #####################################################################
 # definitely a bignum
@@ -79,16 +57,10 @@ else
 fi
 
 
-echo -n "checking a bignum was created: "
-grep 'BIGNUM!' psse.log > /dev/null
-if [ $? -eq "0" ]
-then
-    echo "OK"
-else
-    echo "Fail"
-    exit 1
-fi
-
+# Currently failing from here on, but it's failing in read because of
+# the multiply bug. We know printing blows up at the 3 cell boundary
+# because `lisp/scratchpad2.lisp` constructs a 3 cell bignum by
+# repeated addition.
 #####################################################################
 # Just on the three cell boundary
 expected='1329227995784915872903807060280344576'
@@ -103,7 +75,7 @@ if [ "${expected}" = "${actual}" ]
 then
     echo "OK"
 else
-    echo "Fail: expected '${expected}', got '${actual}'"
+    echo "Fail: expected '${expected}', \n           got '${actual}'"
     exit 1
 fi
 
diff --git a/unit-tests/string-cons.sh b/unit-tests/string-cons.sh
old mode 100644
new mode 100755
diff --git a/unit-tests/wide-character.sh b/unit-tests/wide-character.sh
new file mode 100755
index 0000000..d56544e
--- /dev/null
+++ b/unit-tests/wide-character.sh
@@ -0,0 +1,12 @@
+#!/bin/bash
+
+expected='"λάμ(β)δα"'
+actual=`echo $expected | target/psse | tail -1`
+
+if [ "${expected}" = "${actual}" ]
+then
+    echo "OK"
+else
+    echo "Fail: expected '${expected}', got '${actual}'"
+    exit 1
+fi

From b8f241c2c51ca00f981e42a3539da3a65dbcbd7d Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Sun, 27 Jan 2019 12:23:51 +0000
Subject: [PATCH 03/31] Progress, not working

---
 src/init.c                   |  4 +--
 src/io/fopen.c               | 48 +++++++++++++++++++++++++++---------
 src/io/fopen.h               | 16 ++++++++++--
 src/memory/consspaceobject.h |  1 -
 4 files changed, 52 insertions(+), 17 deletions(-)

diff --git a/src/init.c b/src/init.c
index e8a33a9..8f278bf 100644
--- a/src/init.c
+++ b/src/init.c
@@ -130,7 +130,7 @@ int main( int argc, char *argv[] ) {
     fwide( stdin, 1 );
     fwide( stdout, 1 );
     fwide( stderr, 1 );
-    fwide( sink, 1 );
+    fwide( sink->handle.file, 1 );
     bind_value( L"*in*", make_read_stream( file_to_url_file(stdin) ) );
     bind_value( L"*out*", make_write_stream( file_to_url_file(stdout) ) );
     bind_value( L"*log*", make_write_stream( file_to_url_file(stderr) ) );
@@ -200,7 +200,7 @@ int main( int argc, char *argv[] ) {
     debug_dump_object( oblist, DEBUG_BOOTSTRAP );
 
     if ( dump_at_end ) {
-        dump_pages( stdout );
+        dump_pages( file_to_url_file(stdout) );
     }
 
     return ( 0 );
diff --git a/src/io/fopen.c b/src/io/fopen.c
index d13250f..14c95e8 100644
--- a/src/io/fopen.c
+++ b/src/io/fopen.c
@@ -3,8 +3,11 @@
  *
  * adapted from https://curl.haxx.se/libcurl/c/fopen.html.
  *
+ * Modifications to read/write wide character streams by
+ * Simon Brooke.
+ *
  * Copyright (c) 2003, 2017 Simtec Electronics
- * Some portions (c) 2017 Simon Brooke <simon@journeyman.cc>
+ * Some portions (c) 2019 Simon Brooke <simon@journeyman.cc>
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
@@ -41,11 +44,6 @@
 #include <errno.h>
 
 #include <curl/curl.h>
-/*
- * wide characters
- */
-#include <wchar.h>
-#include <wctype.h>
 
 #include "fopen.h"
 
@@ -177,8 +175,11 @@ static int use_buffer(URL_FILE *file, size_t want)
     /* ditch buffer - write will recreate */
     free(file->buffer);
     file->buffer = NULL;
+    free(file->wide_buffer);
+    file->wide_buffer = NULL;
     file->buffer_pos = 0;
     file->buffer_len = 0;
+    file->wide_cursor = 0;
   }
   else {
     /* move rest down make it available for later */
@@ -187,6 +188,7 @@ static int use_buffer(URL_FILE *file, size_t want)
             (file->buffer_pos - want));
 
     file->buffer_pos -= want;
+    // TODO: something to adjust the wide_cursor
   }
   return 0;
 }
@@ -424,18 +426,40 @@ URL_FILE * file_to_url_file( FILE* f) {
   return result;
 }
 
-
-wint_t url_fgetwc(URL_FILE *file) {
+/**
+ * get one wide character from the buffer.
+ *
+ * @param file the stream to read from;
+ * @return the next wide character on the stream, or zero if no more.
+ */
+wint_t url_fgetwc(URL_FILE *input) {
   wint_t result = 0;
 
-  switch(file->type) {
+  switch(input->type) {
   case CFTYPE_FILE:
-    fwide( file->handle.file, 1 ); /* wide characters */
-    result = fgetc(file->handle.file); /* passthrough */
+    fwide( input->handle.file, 1 ); /* wide characters */
+    result = fgetc(input->handle.file); /* passthrough */
     break;
 
   case CFTYPE_CURL:
-    url_fread(&result, sizeof(wint_t), 1, file);
+    if (input.buffer_len != 0) {
+      if ( input.wide_buffer == NULL) {
+        /* not initialised */
+        input.wide_buffer = calloc( input.buffer_len, sizeof(wint_t));
+      }
+
+      size_t len = wcslen(input.wide_buffer);
+      if (input.still_running ||
+          len == 0 ||
+          len >= input.wide_cursor) {
+        /* refresh the wide buffer */
+        mbstowcs(input.wide_buffer, input.buffer, input.buffer_pos);
+      }
+
+      result = input.wide_buffer[input.wide_cursor] ++;
+
+      /* do something to fread (advance) one utf character */
+    }
     break;
   }
 
diff --git a/src/io/fopen.h b/src/io/fopen.h
index 9874ac7..83ea5a8 100644
--- a/src/io/fopen.h
+++ b/src/io/fopen.h
@@ -3,8 +3,12 @@
  *
  * adapted from https://curl.haxx.se/libcurl/c/fopen.html.
  *
+ *
+ * Modifications to read/write wide character streams by
+ * Simon Brooke.
+ *
  * Copyright (c) 2003, 2017 Simtec Electronics
- * Some portions (c) 2017 Simon Brooke <simon@journeyman.cc>
+ * Some portions (c) 2019 Simon Brooke <simon@journeyman.cc>
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
@@ -33,6 +37,12 @@
 
 #ifndef __fopen_h
 #define __fopen_h
+#include <curl/curl.h>
+/*
+ * wide characters
+ */
+#include <wchar.h>
+#include <wctype.h>
 
 enum fcurl_type_e {
   CFTYPE_NONE = 0,
@@ -49,8 +59,10 @@ struct fcurl_data
   } handle;                   /* handle */
 
   char *buffer;               /* buffer to store cached data*/
-  size_t buffer_len;          /* currently allocated buffers length */
+  wchar_t *wide_buffer;       /* wide character buffer */
+  size_t buffer_len;          /* currently allocated buffer's length */
   size_t buffer_pos;          /* end of data in buffer*/
+  size_t wide_cursor;         /* cursor into the wide buffer */
   int still_running;          /* Is background url fetch still in progress */
 };
 
diff --git a/src/memory/consspaceobject.h b/src/memory/consspaceobject.h
index 8db8099..b3f587c 100644
--- a/src/memory/consspaceobject.h
+++ b/src/memory/consspaceobject.h
@@ -16,7 +16,6 @@
  */
 #include <wchar.h>
 #include <wctype.h>
-#include <curl/curl.h>
 
 #include "fopen.h"
 

From 0e11adea1cfdafe97f4b0ebe5e8ce74e956132a5 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Sun, 27 Jan 2019 17:22:13 +0000
Subject: [PATCH 04/31] Compiles, most tests break

---
 src/arith/peano.c            | 129 +++---
 src/arith/peano.h            |  14 +-
 src/arith/ratio.c            |  16 +-
 src/debug.c                  |   9 +-
 src/init.c                   |  19 +-
 src/io/fopen.c               | 832 ++++++++++++++++-------------------
 src/io/fopen.h               |  55 +--
 src/io/io.c                  | 177 ++++++++
 src/io/io.h                  |  28 ++
 src/memory/conspage.c        |   2 +-
 src/memory/consspaceobject.h |   4 +
 src/memory/dump.c            | 113 ++---
 src/memory/stack.c           |  24 +-
 src/memory/vectorspace.c     |   5 +-
 src/ops/equal.c              |   4 +-
 src/ops/intern.c             |   8 +-
 src/ops/intern.h             |   6 +-
 src/ops/io.c                 |   8 -
 src/ops/lispops.c            |  56 ++-
 src/ops/print.c              |  50 +--
 src/ops/read.c               |  54 ++-
 src/ops/read.h               |   3 +-
 22 files changed, 902 insertions(+), 714 deletions(-)
 create mode 100644 src/io/io.c
 create mode 100644 src/io/io.h
 delete mode 100644 src/ops/io.c

diff --git a/src/arith/peano.c b/src/arith/peano.c
index 7db638a..8e4cb43 100644
--- a/src/arith/peano.c
+++ b/src/arith/peano.c
@@ -43,13 +43,14 @@ bool zerop( struct cons_pointer arg ) {
     struct cons_space_object cell = pointer2cell( arg );
 
     switch ( cell.tag.value ) {
-        case INTEGERTV: {
+        case INTEGERTV:{
                 do {
-                    debug_print(L"zerop: ", DEBUG_ARITH);
-                    debug_dump_object(arg, DEBUG_ARITH);
-                    result = (pointer2cell( arg ).payload.integer.value == 0);
-                    arg = pointer2cell(arg).payload.integer.more;
-                } while (result && integerp(arg));
+                    debug_print( L"zerop: ", DEBUG_ARITH );
+                    debug_dump_object( arg, DEBUG_ARITH );
+                    result =
+                        ( pointer2cell( arg ).payload.integer.value == 0 );
+                    arg = pointer2cell( arg ).payload.integer.more;
+                } while ( result && integerp( arg ) );
             }
             break;
         case RATIOTV:
@@ -66,7 +67,7 @@ bool zerop( struct cons_pointer arg ) {
 /**
  * does this `arg` point to a negative number?
  */
-bool is_negative( struct cons_pointer arg) {
+bool is_negative( struct cons_pointer arg ) {
     bool result = false;
     struct cons_space_object cell = pointer2cell( arg );
 
@@ -85,27 +86,31 @@ bool is_negative( struct cons_pointer arg) {
     return result;
 }
 
-struct cons_pointer absolute( struct cons_pointer frame_pointer, struct cons_pointer arg) {
-  struct cons_pointer result = NIL;
+struct cons_pointer absolute( struct cons_pointer frame_pointer,
+                              struct cons_pointer arg ) {
+    struct cons_pointer result = NIL;
     struct cons_space_object cell = pointer2cell( arg );
 
-  if ( is_negative( arg)) {
-    switch ( cell.tag.value ) {
-        case INTEGERTV:
-            result = make_integer(llabs(cell.payload.integer.value), cell.payload.integer.more);
-            break;
-        case RATIOTV:
-            result = make_ratio(frame_pointer,
-                                absolute(frame_pointer, cell.payload.ratio.dividend),
-                                cell.payload.ratio.divisor);
-            break;
-        case REALTV:
-            result = make_real( 0 - cell.payload.real.value );
-            break;
+    if ( is_negative( arg ) ) {
+        switch ( cell.tag.value ) {
+            case INTEGERTV:
+                result =
+                    make_integer( llabs( cell.payload.integer.value ),
+                                  cell.payload.integer.more );
+                break;
+            case RATIOTV:
+                result = make_ratio( frame_pointer,
+                                     absolute( frame_pointer,
+                                               cell.payload.ratio.dividend ),
+                                     cell.payload.ratio.divisor );
+                break;
+            case REALTV:
+                result = make_real( 0 - cell.payload.real.value );
+                break;
+        }
     }
-  }
 
-  return result;
+    return result;
 }
 
 /**
@@ -126,7 +131,7 @@ long double to_long_double( struct cons_pointer arg ) {
     switch ( cell.tag.value ) {
         case INTEGERTV:
             // obviously, this doesn't work for bignums
-            result = (long double)cell.payload.integer.value;
+            result = ( long double ) cell.payload.integer.value;
             // sadly, this doesn't work at all.
 //            result += 1.0;
 //            for (bool is_first = false; integerp(arg); is_first = true) {
@@ -141,8 +146,8 @@ long double to_long_double( struct cons_pointer arg ) {
 //            }
             break;
         case RATIOTV:
-            result = to_long_double(cell.payload.ratio.dividend) /
-              to_long_double(cell.payload.ratio.divisor);
+            result = to_long_double( cell.payload.ratio.dividend ) /
+                to_long_double( cell.payload.ratio.divisor );
             break;
         case REALTV:
             result = cell.payload.real.value;
@@ -203,9 +208,9 @@ int64_t to_long_int( struct cons_pointer arg ) {
  * argument, or NIL if it was not a number.
  */
 struct cons_pointer lisp_absolute( struct stack_frame
-                              *frame, struct cons_pointer frame_pointer, struct
-                              cons_pointer env ) {
-  return absolute( frame_pointer, frame->arg[0]);
+                                   *frame, struct cons_pointer frame_pointer, struct
+                                   cons_pointer env ) {
+    return absolute( frame_pointer, frame->arg[0] );
 }
 
 /**
@@ -388,10 +393,12 @@ struct cons_pointer multiply_2( struct stack_frame *frame,
                                        to_long_double( arg2 ) );
                         break;
                     default:
-                        result = throw_exception( make_cons(
-                          c_string_to_lisp_string( L"Cannot multiply: argument 2 is not a number: " ),
-                          c_type(arg2)),
-                          frame_pointer );
+                        result =
+                            throw_exception( make_cons
+                                             ( c_string_to_lisp_string
+                                               ( L"Cannot multiply: argument 2 is not a number: " ),
+                                               c_type( arg2 ) ),
+                                             frame_pointer );
                         break;
                 }
                 break;
@@ -415,11 +422,12 @@ struct cons_pointer multiply_2( struct stack_frame *frame,
                                        to_long_double( arg2 ) );
                         break;
                     default:
-                        result = throw_exception(
-                          make_cons(c_string_to_lisp_string
-                                                  ( L"Cannot multiply: argument 2 is not a number" ),
-                                    c_type(arg2)),
-                                                  frame_pointer );
+                        result =
+                            throw_exception( make_cons
+                                             ( c_string_to_lisp_string
+                                               ( L"Cannot multiply: argument 2 is not a number" ),
+                                               c_type( arg2 ) ),
+                                             frame_pointer );
                 }
                 break;
             case REALTV:
@@ -428,11 +436,10 @@ struct cons_pointer multiply_2( struct stack_frame *frame,
                                to_long_double( arg2 ) );
                 break;
             default:
-                        result = throw_exception(
-                          make_cons(c_string_to_lisp_string
-                                                  ( L"Cannot multiply: argument 1 is not a number" ),
-                                    c_type(arg1)),
-                                                  frame_pointer );
+                result = throw_exception( make_cons( c_string_to_lisp_string
+                                                     ( L"Cannot multiply: argument 1 is not a number" ),
+                                                     c_type( arg1 ) ),
+                                          frame_pointer );
                 break;
         }
     }
@@ -460,30 +467,27 @@ struct cons_pointer lisp_multiply( struct
     struct cons_pointer result = make_integer( 1, NIL );
     struct cons_pointer tmp;
 
-    for ( int i = 0;
-         i < args_in_frame
-           && !nilp( frame->arg[i] )
-           && !exceptionp( result );
-         i++ ) {
-      debug_print( L"lisp_multiply: accumulator = ",DEBUG_ARITH);
-      debug_print_object(result, DEBUG_ARITH);
-      debug_print( L"; arg = ", DEBUG_ARITH);
-      debug_print_object(frame->arg[i], DEBUG_ARITH);
-      debug_println( DEBUG_ARITH);
+    for ( int i = 0; i < args_in_frame && !nilp( frame->arg[i] )
+          && !exceptionp( result ); i++ ) {
+        debug_print( L"lisp_multiply: accumulator = ", DEBUG_ARITH );
+        debug_print_object( result, DEBUG_ARITH );
+        debug_print( L"; arg = ", DEBUG_ARITH );
+        debug_print_object( frame->arg[i], DEBUG_ARITH );
+        debug_println( DEBUG_ARITH );
 
-      multiply_one_arg(frame->arg[i]);
+        multiply_one_arg( frame->arg[i] );
     }
 
     struct cons_pointer more = frame->more;
     while ( consp( more )
             && !exceptionp( result ) ) {
-      multiply_one_arg(c_car( more ));
+        multiply_one_arg( c_car( more ) );
         more = c_cdr( more );
     }
 
-  debug_print( L"lisp_multiply returning: ",DEBUG_ARITH);
-      debug_print_object(result, DEBUG_ARITH);
-  debug_println(DEBUG_ARITH);
+    debug_print( L"lisp_multiply returning: ", DEBUG_ARITH );
+    debug_print_object( result, DEBUG_ARITH );
+    debug_println( DEBUG_ARITH );
 
     return result;
 }
@@ -538,9 +542,10 @@ struct cons_pointer negative( struct cons_pointer frame,
  * was not.
  */
 struct cons_pointer lisp_is_negative( struct stack_frame
-                              *frame, struct cons_pointer frame_pointer, struct
-                              cons_pointer env ) {
-  return is_negative(frame->arg[0]) ? TRUE : NIL;
+                                      *frame,
+                                      struct cons_pointer frame_pointer, struct
+                                      cons_pointer env ) {
+    return is_negative( frame->arg[0] ) ? TRUE : NIL;
 }
 
 
diff --git a/src/arith/peano.h b/src/arith/peano.h
index 7164a24..7ad7662 100644
--- a/src/arith/peano.h
+++ b/src/arith/peano.h
@@ -22,23 +22,25 @@ bool zerop( struct cons_pointer arg );
 struct cons_pointer negative( struct cons_pointer frame,
                               struct cons_pointer arg );
 
-bool is_negative( struct cons_pointer arg);
+bool is_negative( struct cons_pointer arg );
 
-struct cons_pointer absolute( struct cons_pointer frame_pointer, struct cons_pointer arg);
+struct cons_pointer absolute( struct cons_pointer frame_pointer,
+                              struct cons_pointer arg );
 
 long double to_long_double( struct cons_pointer arg );
 
 struct cons_pointer lisp_absolute( struct stack_frame
-                              *frame, struct cons_pointer frame_pointer, struct
-                              cons_pointer env );
+                                   *frame, struct cons_pointer frame_pointer, struct
+                                   cons_pointer env );
 
 struct cons_pointer
 lisp_add( struct stack_frame *frame, struct cons_pointer frame_pointer,
           struct cons_pointer env );
 
 struct cons_pointer lisp_is_negative( struct stack_frame
-                              *frame, struct cons_pointer frame_pointer, struct
-                              cons_pointer env );
+                                      *frame,
+                                      struct cons_pointer frame_pointer, struct
+                                      cons_pointer env );
 
 struct cons_pointer
 lisp_multiply( struct stack_frame *frame,
diff --git a/src/arith/ratio.c b/src/arith/ratio.c
index 784e71e..65b09da 100644
--- a/src/arith/ratio.c
+++ b/src/arith/ratio.c
@@ -55,10 +55,10 @@ struct cons_pointer simplify_ratio( struct cons_pointer frame_pointer,
 
     if ( ratiop( arg ) ) {
         int64_t ddrv =
-            pointer2cell( pointer2cell( arg ).payload.ratio.dividend ).payload.
-            integer.value, drrv =
-            pointer2cell( pointer2cell( arg ).payload.ratio.divisor ).payload.
-            integer.value, gcd = greatest_common_divisor( ddrv, drrv );
+            pointer2cell( pointer2cell( arg ).payload.ratio.dividend ).
+            payload.integer.value, drrv =
+            pointer2cell( pointer2cell( arg ).payload.ratio.divisor ).
+            payload.integer.value, gcd = greatest_common_divisor( ddrv, drrv );
 
         if ( gcd > 1 ) {
             if ( drrv / gcd == 1 ) {
@@ -199,10 +199,10 @@ struct cons_pointer divide_ratio_ratio( struct cons_pointer frame_pointer,
                                         struct cons_pointer arg1,
                                         struct cons_pointer arg2 ) {
     struct cons_pointer i = make_ratio( frame_pointer,
-                                        pointer2cell( arg2 ).payload.ratio.
-                                        divisor,
-                                        pointer2cell( arg2 ).payload.ratio.
-                                        dividend ), result =
+                                        pointer2cell( arg2 ).payload.
+                                        ratio.divisor,
+                                        pointer2cell( arg2 ).payload.
+                                        ratio.dividend ), result =
         multiply_ratio_ratio( frame_pointer, arg1, i );
 
     dec_ref( i );
diff --git a/src/debug.c b/src/debug.c
index d694827..14881f9 100644
--- a/src/debug.c
+++ b/src/debug.c
@@ -19,6 +19,7 @@
 #include <wctype.h>
 
 #include "consspaceobject.h"
+#include "fopen.h"
 #include "debug.h"
 #include "dump.h"
 #include "print.h"
@@ -104,8 +105,10 @@ void debug_printf( int level, wchar_t *format, ... ) {
 void debug_print_object( struct cons_pointer pointer, int level ) {
 #ifdef DEBUG
     if ( level & verbosity ) {
+        URL_FILE *ustderr = file_to_url_file( stderr );
         fwide( stderr, 1 );
-        print( stderr, pointer );
+        print( ustderr, pointer );
+        free( ustderr );
     }
 #endif
 }
@@ -116,8 +119,10 @@ void debug_print_object( struct cons_pointer pointer, int level ) {
 void debug_dump_object( struct cons_pointer pointer, int level ) {
 #ifdef DEBUG
     if ( level & verbosity ) {
+        URL_FILE *ustderr = file_to_url_file( stderr );
         fwide( stderr, 1 );
-        dump_object( stderr, pointer );
+        dump_object( ustderr, pointer );
+        free( ustderr );
     }
 #endif
 }
diff --git a/src/init.c b/src/init.c
index 8f278bf..a45e685 100644
--- a/src/init.c
+++ b/src/init.c
@@ -21,6 +21,7 @@
 #include "consspaceobject.h"
 #include "debug.h"
 #include "intern.h"
+#include "io.h"
 #include "lispops.h"
 #include "peano.h"
 #include "print.h"
@@ -82,7 +83,7 @@ int main( int argc, char *argv[] ) {
     bool dump_at_end = false;
     bool show_prompt = false;
 
-    setlocale(LC_ALL, "");
+    setlocale( LC_ALL, "" );
 
     while ( ( option = getopt( argc, argv, "cpdv:" ) ) != -1 ) {
         switch ( option ) {
@@ -131,9 +132,9 @@ int main( int argc, char *argv[] ) {
     fwide( stdout, 1 );
     fwide( stderr, 1 );
     fwide( sink->handle.file, 1 );
-    bind_value( L"*in*", make_read_stream( file_to_url_file(stdin) ) );
-    bind_value( L"*out*", make_write_stream( file_to_url_file(stdout) ) );
-    bind_value( L"*log*", make_write_stream( file_to_url_file(stderr) ) );
+    bind_value( L"*in*", make_read_stream( file_to_url_file( stdin ) ) );
+    bind_value( L"*out*", make_write_stream( file_to_url_file( stdout ) ) );
+    bind_value( L"*log*", make_write_stream( file_to_url_file( stderr ) ) );
     bind_value( L"*sink*", make_write_stream( sink ) );
 
     /*
@@ -151,6 +152,7 @@ int main( int argc, char *argv[] ) {
     bind_function( L"assoc", &lisp_assoc );
     bind_function( L"car", &lisp_car );
     bind_function( L"cdr", &lisp_cdr );
+    bind_function( L"close", &lisp_close );
     bind_function( L"cons", &lisp_cons );
     bind_function( L"divide", &lisp_divide );
     bind_function( L"eq", &lisp_eq );
@@ -159,12 +161,15 @@ int main( int argc, char *argv[] ) {
     bind_function( L"exception", &lisp_exception );
     bind_function( L"inspect", &lisp_inspect );
     bind_function( L"multiply", &lisp_multiply );
-    bind_function( L"negative?", &lisp_is_negative);
+    bind_function( L"negative?", &lisp_is_negative );
     bind_function( L"read", &lisp_read );
     bind_function( L"repl", &lisp_repl );
     bind_function( L"oblist", &lisp_oblist );
+    bind_function( L"open", &lisp_open );
     bind_function( L"print", &lisp_print );
     bind_function( L"progn", &lisp_progn );
+    bind_function( L"read", &lisp_read );
+    bind_function( L"read_char", &lisp_read_char );
     bind_function( L"reverse", &lisp_reverse );
     bind_function( L"set", &lisp_set );
     bind_function( L"source", &lisp_source );
@@ -183,7 +188,7 @@ int main( int argc, char *argv[] ) {
      */
     bind_special( L"cond", &lisp_cond );
     bind_special( L"lambda", &lisp_lambda );
-    bind_special( L"\u03bb", &lisp_lambda ); // λ
+    bind_special( L"\u03bb", &lisp_lambda );  // λ
     bind_special( L"nlambda", &lisp_nlambda );
     bind_special( L"n\u03bb", &lisp_nlambda );
     bind_special( L"progn", &lisp_progn );
@@ -200,7 +205,7 @@ int main( int argc, char *argv[] ) {
     debug_dump_object( oblist, DEBUG_BOOTSTRAP );
 
     if ( dump_at_end ) {
-        dump_pages( file_to_url_file(stdout) );
+        dump_pages( file_to_url_file( stdout ) );
     }
 
     return ( 0 );
diff --git a/src/io/fopen.c b/src/io/fopen.c
index 14c95e8..499fada 100644
--- a/src/io/fopen.c
+++ b/src/io/fopen.c
@@ -6,6 +6,9 @@
  * Modifications to read/write wide character streams by
  * Simon Brooke.
  *
+ * NOTE THAT: for my purposes, I'm only interested in wide characters,
+ * and I always read them one character at a time.
+ *
  * Copyright (c) 2003, 2017 Simtec Electronics
  * Some portions (c) 2019 Simon Brooke <simon@journeyman.cc>
  *
@@ -34,14 +37,13 @@
  * This example requires libcurl 7.9.7 or later.
  */
 
-
+#include <errno.h>
 #include <stdio.h>
+#include <stdlib.h>
 #include <string.h>
 #ifndef WIN32
-#  include <sys/time.h>
+#include <sys/time.h>
 #endif
-#include <stdlib.h>
-#include <errno.h>
 
 #include <curl/curl.h>
 
@@ -51,362 +53,376 @@
 static CURLM *multi_handle;
 
 /* curl calls this routine to get more data */
-static size_t write_callback(char *buffer,
-                             size_t size,
-                             size_t nitems,
-                             void *userp)
-{
-  char *newbuff;
-  size_t rembuff;
+static size_t write_callback( char *buffer,
+                              size_t size, size_t nitems, void *userp ) {
+    char *newbuff;
+    size_t rembuff;
 
-  URL_FILE *url = (URL_FILE *)userp;
-  size *= nitems;
+    URL_FILE *url = ( URL_FILE * ) userp;
+    size *= nitems;
 
-  rembuff = url->buffer_len - url->buffer_pos; /* remaining space in buffer */
+    rembuff = url->buffer_len - url->buffer_pos;  /* remaining space in buffer */
 
-  if(size > rembuff) {
-    /* not enough space in buffer */
-    newbuff = realloc(url->buffer, url->buffer_len + (size - rembuff));
-    if(newbuff == NULL) {
-      fprintf(stderr, "callback buffer grow failed\n");
-      size = rembuff;
+    if ( size > rembuff ) {
+        /* not enough space in buffer */
+        newbuff = realloc( url->buffer, url->buffer_len + ( size - rembuff ) );
+        if ( newbuff == NULL ) {
+            fprintf( stderr, "callback buffer grow failed\n" );
+            size = rembuff;
+        } else {
+            /* realloc succeeded increase buffer size */
+            url->buffer_len += size - rembuff;
+            url->buffer = newbuff;
+        }
     }
-    else {
-      /* realloc succeeded increase buffer size*/
-      url->buffer_len += size - rembuff;
-      url->buffer = newbuff;
-    }
-  }
 
-  memcpy(&url->buffer[url->buffer_pos], buffer, size);
-  url->buffer_pos += size;
+    memcpy( &url->buffer[url->buffer_pos], buffer, size );
+    url->buffer_pos += size;
 
-  return size;
+    return size;
 }
 
 /* use to attempt to fill the read buffer up to requested number of bytes */
-static int fill_buffer(URL_FILE *file, size_t want)
-{
-  fd_set fdread;
-  fd_set fdwrite;
-  fd_set fdexcep;
-  struct timeval timeout;
-  int rc;
-  CURLMcode mc; /* curl_multi_fdset() return code */
+static int fill_buffer( URL_FILE * file, size_t want ) {
+    fd_set fdread;
+    fd_set fdwrite;
+    fd_set fdexcep;
+    struct timeval timeout;
+    int rc;
+    CURLMcode mc;               /* curl_multi_fdset() return code */
 
-  /* only attempt to fill buffer if transactions still running and buffer
-   * doesn't exceed required size already
-   */
-  if((!file->still_running) || (file->buffer_pos > want))
-    return 0;
+    /* only attempt to fill buffer if transactions still running and buffer
+     * doesn't exceed required size already
+     */
+    if ( ( !file->still_running ) || ( file->buffer_pos > want ) )
+        return 0;
 
-  /* attempt to fill buffer */
-  do {
-    int maxfd = -1;
-    long curl_timeo = -1;
+    /* attempt to fill buffer */
+    do {
+        int maxfd = -1;
+        long curl_timeo = -1;
 
-    FD_ZERO(&fdread);
-    FD_ZERO(&fdwrite);
-    FD_ZERO(&fdexcep);
+        FD_ZERO( &fdread );
+        FD_ZERO( &fdwrite );
+        FD_ZERO( &fdexcep );
 
-    /* set a suitable timeout to fail on */
-    timeout.tv_sec = 60; /* 1 minute */
-    timeout.tv_usec = 0;
+        /* set a suitable timeout to fail on */
+        timeout.tv_sec = 60;    /* 1 minute */
+        timeout.tv_usec = 0;
 
-    curl_multi_timeout(multi_handle, &curl_timeo);
-    if(curl_timeo >= 0) {
-      timeout.tv_sec = curl_timeo / 1000;
-      if(timeout.tv_sec > 1)
-        timeout.tv_sec = 1;
-      else
-        timeout.tv_usec = (curl_timeo % 1000) * 1000;
-    }
+        curl_multi_timeout( multi_handle, &curl_timeo );
+        if ( curl_timeo >= 0 ) {
+            timeout.tv_sec = curl_timeo / 1000;
+            if ( timeout.tv_sec > 1 )
+                timeout.tv_sec = 1;
+            else
+                timeout.tv_usec = ( curl_timeo % 1000 ) * 1000;
+        }
 
-    /* get file descriptors from the transfers */
-    mc = curl_multi_fdset(multi_handle, &fdread, &fdwrite, &fdexcep, &maxfd);
+        /* get file descriptors from the transfers */
+        mc = curl_multi_fdset( multi_handle, &fdread, &fdwrite, &fdexcep,
+                               &maxfd );
 
-    if(mc != CURLM_OK) {
-      fprintf(stderr, "curl_multi_fdset() failed, code %d.\n", mc);
-      break;
-    }
+        if ( mc != CURLM_OK ) {
+            fprintf( stderr, "curl_multi_fdset() failed, code %d.\n", mc );
+            break;
+        }
 
-    /* On success the value of maxfd is guaranteed to be >= -1. We call
-       select(maxfd + 1, ...); specially in case of (maxfd == -1) there are
-       no fds ready yet so we call select(0, ...) --or Sleep() on Windows--
-       to sleep 100ms, which is the minimum suggested value in the
-       curl_multi_fdset() doc. */
+        /* On success the value of maxfd is guaranteed to be >= -1. We call
+           select(maxfd + 1, ...); specially in case of (maxfd == -1) there are
+           no fds ready yet so we call select(0, ...) --or Sleep() on Windows--
+           to sleep 100ms, which is the minimum suggested value in the
+           curl_multi_fdset() doc. */
 
-    if(maxfd == -1) {
+        if ( maxfd == -1 ) {
 #ifdef _WIN32
-      Sleep(100);
-      rc = 0;
+            Sleep( 100 );
+            rc = 0;
 #else
-      /* Portable sleep for platforms other than Windows. */
-      struct timeval wait = { 0, 100 * 1000 }; /* 100ms */
-      rc = select(0, NULL, NULL, NULL, &wait);
+            /* Portable sleep for platforms other than Windows. */
+            struct timeval wait = { 0, 100 * 1000 };  /* 100ms */
+            rc = select( 0, NULL, NULL, NULL, &wait );
 #endif
-    }
-    else {
-      /* Note that on some platforms 'timeout' may be modified by select().
-         If you need access to the original value save a copy beforehand. */
-      rc = select(maxfd + 1, &fdread, &fdwrite, &fdexcep, &timeout);
-    }
+        } else {
+            /* Note that on some platforms 'timeout' may be modified by select().
+               If you need access to the original value save a copy beforehand. */
+            rc = select( maxfd + 1, &fdread, &fdwrite, &fdexcep, &timeout );
+        }
 
-    switch(rc) {
-    case -1:
-      /* select error */
-      break;
+        switch ( rc ) {
+            case -1:
+                /* select error */
+                break;
 
-    case 0:
-    default:
-      /* timeout or readable/writable sockets */
-      curl_multi_perform(multi_handle, &file->still_running);
-      break;
-    }
-  } while(file->still_running && (file->buffer_pos < want));
-  return 1;
+            case 0:
+            default:
+                /* timeout or readable/writable sockets */
+                curl_multi_perform( multi_handle, &file->still_running );
+                break;
+        }
+    } while ( file->still_running && ( file->buffer_pos < want ) );
+
+    return 1;
 }
 
 /* use to remove want bytes from the front of a files buffer */
-static int use_buffer(URL_FILE *file, size_t want)
-{
-  /* sort out buffer */
-  if((file->buffer_pos - want) <= 0) {
-    /* ditch buffer - write will recreate */
-    free(file->buffer);
-    file->buffer = NULL;
-    free(file->wide_buffer);
-    file->wide_buffer = NULL;
-    file->buffer_pos = 0;
-    file->buffer_len = 0;
-    file->wide_cursor = 0;
-  }
-  else {
-    /* move rest down make it available for later */
-    memmove(file->buffer,
-            &file->buffer[want],
-            (file->buffer_pos - want));
+static int use_buffer( URL_FILE * file, size_t want ) {
+    /* sort out buffer */
+    if ( ( file->buffer_pos - want ) <= 0 ) {
+        /* ditch buffer - write will recreate */
+        free( file->buffer );
+        file->buffer = NULL;
+        file->buffer_pos = 0;
+        file->buffer_len = 0;
+    } else {
+        /* move rest down make it available for later */
+        memmove( file->buffer,
+                 &file->buffer[want], ( file->buffer_pos - want ) );
 
-    file->buffer_pos -= want;
-    // TODO: something to adjust the wide_cursor
-  }
-  return 0;
-}
-
-URL_FILE *url_fopen(const char *url, const char *operation)
-{
-  /* this code could check for URLs or types in the 'url' and
-     basically use the real fopen() for standard files */
-
-  URL_FILE *file;
-  (void)operation;
-
-  file = calloc(1, sizeof(URL_FILE));
-  if(!file)
-    return NULL;
-
-  file->handle.file = fopen(url, operation);
-  if(file->handle.file)
-    file->type = CFTYPE_FILE; /* marked as URL */
-
-  else {
-    file->type = CFTYPE_CURL; /* marked as URL */
-    file->handle.curl = curl_easy_init();
-
-    curl_easy_setopt(file->handle.curl, CURLOPT_URL, url);
-    curl_easy_setopt(file->handle.curl, CURLOPT_WRITEDATA, file);
-    curl_easy_setopt(file->handle.curl, CURLOPT_VERBOSE, 0L);
-    curl_easy_setopt(file->handle.curl, CURLOPT_WRITEFUNCTION, write_callback);
-
-    if(!multi_handle)
-      multi_handle = curl_multi_init();
-
-    curl_multi_add_handle(multi_handle, file->handle.curl);
-
-    /* lets start the fetch */
-    curl_multi_perform(multi_handle, &file->still_running);
-
-    if((file->buffer_pos == 0) && (!file->still_running)) {
-      /* if still_running is 0 now, we should return NULL */
-
-      /* make sure the easy handle is not in the multi handle anymore */
-      curl_multi_remove_handle(multi_handle, file->handle.curl);
-
-      /* cleanup */
-      curl_easy_cleanup(file->handle.curl);
-
-      free(file);
-
-      file = NULL;
+        file->buffer_pos -= want;
     }
-  }
-  return file;
+    return 0;
 }
 
-int url_fclose(URL_FILE *file)
-{
-  int ret = 0;/* default is good return */
+/**
+ * consume one wide character on the buffer of this file.
+ *
+ * @param file the url or file from which the character is consumed.
+ */
+static int use_one_wide( URL_FILE * file ) {
+    int c = ( int ) file->buffer[file->buffer_pos];
+    size_t count = 0;
 
-  switch(file->type) {
-  case CFTYPE_FILE:
-    ret = fclose(file->handle.file); /* passthrough */
-    break;
-
-  case CFTYPE_CURL:
-    /* make sure the easy handle is not in the multi handle anymore */
-    curl_multi_remove_handle(multi_handle, file->handle.curl);
-
-    /* cleanup */
-    curl_easy_cleanup(file->handle.curl);
-    break;
-
-  default: /* unknown or supported type - oh dear */
-    ret = EOF;
-    errno = EBADF;
-    break;
-  }
-
-  free(file->buffer);/* free any allocated buffer space */
-  free(file);
-
-  return ret;
-}
-
-int url_feof(URL_FILE *file)
-{
-  int ret = 0;
-
-  switch(file->type) {
-  case CFTYPE_FILE:
-    ret = feof(file->handle.file);
-    break;
-
-  case CFTYPE_CURL:
-    if((file->buffer_pos == 0) && (!file->still_running))
-      ret = 1;
-    break;
-
-  default: /* unknown or supported type - oh dear */
-    ret = -1;
-    errno = EBADF;
-    break;
-  }
-  return ret;
-}
-
-size_t url_fread(void *ptr, size_t size, size_t nmemb, URL_FILE *file)
-{
-  size_t want;
-
-  switch(file->type) {
-  case CFTYPE_FILE:
-    want = fread(ptr, size, nmemb, file->handle.file);
-    break;
-
-  case CFTYPE_CURL:
-    want = nmemb * size;
-
-    fill_buffer(file, want);
-
-    /* check if there's data in the buffer - if not fill_buffer()
-     * either errored or EOF */
-    if(!file->buffer_pos)
-      return 0;
-
-    /* ensure only available data is considered */
-    if(file->buffer_pos < want)
-      want = file->buffer_pos;
-
-    /* xfer data to caller */
-    memcpy(ptr, file->buffer, want);
-
-    use_buffer(file, want);
-
-    want = want / size;     /* number of items */
-    break;
-
-  default: /* unknown or supported type - oh dear */
-    want = 0;
-    errno = EBADF;
-    break;
-
-  }
-  return want;
-}
-
-char *url_fgets(char *ptr, size_t size, URL_FILE *file)
-{
-  size_t want = size - 1;/* always need to leave room for zero termination */
-  size_t loop;
-
-  switch(file->type) {
-  case CFTYPE_FILE:
-    ptr = fgets(ptr, (int)size, file->handle.file);
-    break;
-
-  case CFTYPE_CURL:
-    fill_buffer(file, want);
-
-    /* check if there's data in the buffer - if not fill either errored or
-     * EOF */
-    if(!file->buffer_pos)
-      return NULL;
-
-    /* ensure only available data is considered */
-    if(file->buffer_pos < want)
-      want = file->buffer_pos;
-
-    /*buffer contains data */
-    /* look for newline or eof */
-    for(loop = 0; loop < want; loop++) {
-      if(file->buffer[loop] == '\n') {
-        want = loop + 1;/* include newline */
-        break;
-      }
+    /* The value of each individual byte indicates its UTF-8 function, as follows:
+     *
+     * 00 to 7F hex (0 to 127): first and only byte of a sequence.
+     * 80 to BF hex (128 to 191): continuing byte in a multi-byte sequence.
+     * C2 to DF hex (194 to 223): first byte of a two-byte sequence.
+     * E0 to EF hex (224 to 239): first byte of a three-byte sequence.
+     * F0 to FF hex (240 to 255): first byte of a four-byte sequence.
+     */
+    if ( c <= '0x07' ) {
+        count = 1;
+    } else if ( c >= '0xc2' && c <= '0xdf' ) {
+        count = 2;
+    } else if ( c >= '0xe0' && c <= '0xef' ) {
+        count = 3;
+    } else if ( c >= '0xf0' && c <= '0xff' ) {
+        count = 4;
     }
 
-    /* xfer data to caller */
-    memcpy(ptr, file->buffer, want);
-    ptr[want] = 0;/* always null terminate */
-
-    use_buffer(file, want);
-
-    break;
-
-  default: /* unknown or supported type - oh dear */
-    ptr = NULL;
-    errno = EBADF;
-    break;
-  }
-
-  return ptr;/*success */
+    return use_buffer( file, c );
 }
 
-void url_rewind(URL_FILE *file)
-{
-  switch(file->type) {
-  case CFTYPE_FILE:
-    rewind(file->handle.file); /* passthrough */
-    break;
+URL_FILE *url_fopen( const char *url, const char *operation ) {
+    /* this code could check for URLs or types in the 'url' and
+       basically use the real fopen() for standard files */
 
-  case CFTYPE_CURL:
-    /* halt transaction */
-    curl_multi_remove_handle(multi_handle, file->handle.curl);
+    URL_FILE *file;
+    ( void ) operation;
 
-    /* restart */
-    curl_multi_add_handle(multi_handle, file->handle.curl);
+    file = calloc( 1, sizeof( URL_FILE ) );
+    if ( !file )
+        return NULL;
 
-    /* ditch buffer - write will recreate - resets stream pos*/
-    free(file->buffer);
-    file->buffer = NULL;
-    file->buffer_pos = 0;
-    file->buffer_len = 0;
+    file->handle.file = fopen( url, operation );
+    if ( file->handle.file )
+        file->type = CFTYPE_FILE; /* marked as URL */
 
-    break;
+    else {
+        file->type = CFTYPE_CURL; /* marked as URL */
+        file->handle.curl = curl_easy_init(  );
 
-  default: /* unknown or supported type - oh dear */
-    break;
-  }
+        curl_easy_setopt( file->handle.curl, CURLOPT_URL, url );
+        curl_easy_setopt( file->handle.curl, CURLOPT_WRITEDATA, file );
+        curl_easy_setopt( file->handle.curl, CURLOPT_VERBOSE, 0L );
+        curl_easy_setopt( file->handle.curl, CURLOPT_WRITEFUNCTION,
+                          write_callback );
+
+        if ( !multi_handle )
+            multi_handle = curl_multi_init(  );
+
+        curl_multi_add_handle( multi_handle, file->handle.curl );
+
+        /* lets start the fetch */
+        curl_multi_perform( multi_handle, &file->still_running );
+
+        if ( ( file->buffer_pos == 0 ) && ( !file->still_running ) ) {
+            /* if still_running is 0 now, we should return NULL */
+
+            /* make sure the easy handle is not in the multi handle anymore */
+            curl_multi_remove_handle( multi_handle, file->handle.curl );
+
+            /* cleanup */
+            curl_easy_cleanup( file->handle.curl );
+
+            free( file );
+
+            file = NULL;
+        }
+    }
+    return file;
+}
+
+int url_fclose( URL_FILE * file ) {
+    int ret = 0;                /* default is good return */
+
+    switch ( file->type ) {
+        case CFTYPE_FILE:
+            ret = fclose( file->handle.file );  /* passthrough */
+            break;
+
+        case CFTYPE_CURL:
+            /* make sure the easy handle is not in the multi handle anymore */
+            curl_multi_remove_handle( multi_handle, file->handle.curl );
+
+            /* cleanup */
+            curl_easy_cleanup( file->handle.curl );
+            break;
+
+        default:               /* unknown or supported type - oh dear */
+            ret = EOF;
+            errno = EBADF;
+            break;
+    }
+
+    free( file->buffer );       /* free any allocated buffer space */
+    free( file );
+
+    return ret;
+}
+
+int url_feof( URL_FILE * file ) {
+    int ret = 0;
+
+    switch ( file->type ) {
+        case CFTYPE_FILE:
+            ret = feof( file->handle.file );
+            break;
+
+        case CFTYPE_CURL:
+            if ( ( file->buffer_pos == 0 ) && ( !file->still_running ) )
+                ret = 1;
+            break;
+
+        default:               /* unknown or supported type - oh dear */
+            ret = -1;
+            errno = EBADF;
+            break;
+    }
+    return ret;
+}
+
+size_t url_fread( void *ptr, size_t size, size_t nmemb, URL_FILE * file ) {
+    size_t want;
+
+    switch ( file->type ) {
+        case CFTYPE_FILE:
+            want = fread( ptr, size, nmemb, file->handle.file );
+            break;
+
+        case CFTYPE_CURL:
+            want = nmemb * size;
+
+            fill_buffer( file, want );
+
+            /* check if there's data in the buffer - if not fill_buffer()
+             * either errored or EOF */
+            if ( !file->buffer_pos )
+                return 0;
+
+            /* ensure only available data is considered */
+            if ( file->buffer_pos < want )
+                want = file->buffer_pos;
+
+            /* xfer data to caller */
+            memcpy( ptr, file->buffer, want );
+
+            use_buffer( file, want );
+
+            want = want / size; /* number of items */
+            break;
+
+        default:               /* unknown or supported type - oh dear */
+            want = 0;
+            errno = EBADF;
+            break;
+
+    }
+    return want;
+}
+
+char *url_fgets( char *ptr, size_t size, URL_FILE * file ) {
+    size_t want = size - 1;     /* always need to leave room for zero termination */
+    size_t loop;
+
+    switch ( file->type ) {
+        case CFTYPE_FILE:
+            ptr = fgets( ptr, ( int ) size, file->handle.file );
+            break;
+
+        case CFTYPE_CURL:
+            fill_buffer( file, want );
+
+            /* check if there's data in the buffer - if not fill either errored or
+             * EOF */
+            if ( !file->buffer_pos )
+                return NULL;
+
+            /* ensure only available data is considered */
+            if ( file->buffer_pos < want )
+                want = file->buffer_pos;
+
+            /*buffer contains data */
+            /* look for newline or eof */
+            for ( loop = 0; loop < want; loop++ ) {
+                if ( file->buffer[loop] == '\n' ) {
+                    want = loop + 1;  /* include newline */
+                    break;
+                }
+            }
+
+            /* xfer data to caller */
+            memcpy( ptr, file->buffer, want );
+            ptr[want] = 0;      /* always null terminate */
+
+            use_buffer( file, want );
+
+            break;
+
+        default:               /* unknown or supported type - oh dear */
+            ptr = NULL;
+            errno = EBADF;
+            break;
+    }
+
+    return ptr;                 /*success */
+}
+
+void url_rewind( URL_FILE * file ) {
+    switch ( file->type ) {
+        case CFTYPE_FILE:
+            rewind( file->handle.file );  /* passthrough */
+            break;
+
+        case CFTYPE_CURL:
+            /* halt transaction */
+            curl_multi_remove_handle( multi_handle, file->handle.curl );
+
+            /* restart */
+            curl_multi_add_handle( multi_handle, file->handle.curl );
+
+            /* ditch buffer - write will recreate - resets stream pos */
+            free( file->buffer );
+            file->buffer = NULL;
+            file->buffer_pos = 0;
+            file->buffer_len = 0;
+
+            break;
+
+        default:               /* unknown or supported type - oh dear */
+            break;
+    }
 }
 
 /**
@@ -415,153 +431,79 @@ void url_rewind(URL_FILE *file)
  * @param f the file to be wrapped;
  * @return the new handle, or null if no such handle could be allocated.
  */
-URL_FILE * file_to_url_file( FILE* f) {
-  URL_FILE * result = (URL_FILE *)malloc(sizeof(URL_FILE));
+URL_FILE *file_to_url_file( FILE * f ) {
+    URL_FILE *result = ( URL_FILE * ) malloc( sizeof( URL_FILE ) );
 
-  if ( result != NULL) {
-    result->type = CFTYPE_FILE,
-    result->handle.file = f;
-  }
+    if ( result != NULL ) {
+        result->type = CFTYPE_FILE, result->handle.file = f;
+    }
 
-  return result;
+    return result;
 }
 
+
 /**
  * get one wide character from the buffer.
  *
  * @param file the stream to read from;
  * @return the next wide character on the stream, or zero if no more.
  */
-wint_t url_fgetwc(URL_FILE *input) {
-  wint_t result = 0;
+wint_t url_fgetwc( URL_FILE * input ) {
+    wint_t result = -1;
 
-  switch(input->type) {
-  case CFTYPE_FILE:
-    fwide( input->handle.file, 1 ); /* wide characters */
-    result = fgetc(input->handle.file); /* passthrough */
-    break;
+    switch ( input->type ) {
+        case CFTYPE_FILE:
+            fwide( input->handle.file, 1 ); /* wide characters */
+            result = fgetwc( input->handle.file );  /* passthrough */
+            break;
 
-  case CFTYPE_CURL:
-    if (input.buffer_len != 0) {
-      if ( input.wide_buffer == NULL) {
-        /* not initialised */
-        input.wide_buffer = calloc( input.buffer_len, sizeof(wint_t));
-      }
+        case CFTYPE_CURL:{
+                wchar_t *wbuff = calloc( 2, sizeof( wchar_t ) );
+                char *cbuff = calloc( 5, sizeof( char ) );
 
-      size_t len = wcslen(input.wide_buffer);
-      if (input.still_running ||
-          len == 0 ||
-          len >= input.wide_cursor) {
-        /* refresh the wide buffer */
-        mbstowcs(input.wide_buffer, input.buffer, input.buffer_pos);
-      }
+                url_fread( cbuff, sizeof( char ), 4, input );
+                mbstowcs( wbuff, cbuff, 1 );
+                result = wbuff[0];
+                use_one_wide( input );
 
-      result = input.wide_buffer[input.wide_cursor] ++;
-
-      /* do something to fread (advance) one utf character */
+                free( cbuff );
+                free( wbuff );
+            }
+            break;
+        case CFTYPE_NONE:
+            break;
     }
-    break;
-  }
 
-  return result;
+    return result;
 }
 
-/* #define FGETSFILE "fgets.test" */
-/* #define FREADFILE "fread.test" */
-/* #define REWINDFILE "rewind.test" */
+wint_t url_ungetwc( wint_t wc, URL_FILE * input ) {
+    wint_t result = -1;
 
-/* /\* Small main program to retrieve from a url using fgets and fread saving the */
-/*  * output to two test files (note the fgets method will corrupt binary files if */
-/*  * they contain 0 chars *\/ */
-/* int main(int argc, char *argv[]) */
-/* { */
-/*   URL_FILE *handle; */
-/*   FILE *outf; */
+    switch ( input->type ) {
+        case CFTYPE_FILE:
+            fwide( input->handle.file, 1 ); /* wide characters */
+            result = fgetwc( input->handle.file );  /* passthrough */
+            break;
 
-/*   size_t nread; */
-/*   char buffer[256]; */
-/*   const char *url; */
+        case CFTYPE_CURL:{
+                wchar_t *wbuff = calloc( 2, sizeof( wchar_t ) );
+                char *cbuff = calloc( 5, sizeof( char ) );
 
-/*   if(argc < 2) */
-/*     url = "http://192.168.7.3/testfile";/\* default to testurl *\/ */
-/*   else */
-/*     url = argv[1];/\* use passed url *\/ */
+                wbuff[0] = wc;
+                result = wcstombs( cbuff, wbuff, 1 );
 
-/*   /\* copy from url line by line with fgets *\/ */
-/*   outf = fopen(FGETSFILE, "wb+"); */
-/*   if(!outf) { */
-/*     perror("couldn't open fgets output file\n"); */
-/*     return 1; */
-/*   } */
+                input->buffer_pos -= strlen( cbuff );
 
-/*   handle = url_fopen(url, "r"); */
-/*   if(!handle) { */
-/*     printf("couldn't url_fopen() %s\n", url); */
-/*     fclose(outf); */
-/*     return 2; */
-/*   } */
+                free( cbuff );
+                free( wbuff );
 
-/*   while(!url_feof(handle)) { */
-/*     url_fgets(buffer, sizeof(buffer), handle); */
-/*     fwrite(buffer, 1, strlen(buffer), outf); */
-/*   } */
+                result = result > 0 ? wc : result;
+                break;
+        case CFTYPE_NONE:
+                break;
+            }
+    }
 
-/*   url_fclose(handle); */
-
-/*   fclose(outf); */
-
-
-/*   /\* Copy from url with fread *\/ */
-/*   outf = fopen(FREADFILE, "wb+"); */
-/*   if(!outf) { */
-/*     perror("couldn't open fread output file\n"); */
-/*     return 1; */
-/*   } */
-
-/*   handle = url_fopen("testfile", "r"); */
-/*   if(!handle) { */
-/*     printf("couldn't url_fopen() testfile\n"); */
-/*     fclose(outf); */
-/*     return 2; */
-/*   } */
-
-/*   do { */
-/*     nread = url_fread(buffer, 1, sizeof(buffer), handle); */
-/*     fwrite(buffer, 1, nread, outf); */
-/*   } while(nread); */
-
-/*   url_fclose(handle); */
-
-/*   fclose(outf); */
-
-
-/*   /\* Test rewind *\/ */
-/*   outf = fopen(REWINDFILE, "wb+"); */
-/*   if(!outf) { */
-/*     perror("couldn't open fread output file\n"); */
-/*     return 1; */
-/*   } */
-
-/*   handle = url_fopen("testfile", "r"); */
-/*   if(!handle) { */
-/*     printf("couldn't url_fopen() testfile\n"); */
-/*     fclose(outf); */
-/*     return 2; */
-/*   } */
-
-/*   nread = url_fread(buffer, 1, sizeof(buffer), handle); */
-/*   fwrite(buffer, 1, nread, outf); */
-/*   url_rewind(handle); */
-
-/*   buffer[0]='\n'; */
-/*   fwrite(buffer, 1, 1, outf); */
-
-/*   nread = url_fread(buffer, 1, sizeof(buffer), handle); */
-/*   fwrite(buffer, 1, nread, outf); */
-
-/*   url_fclose(handle); */
-
-/*   fclose(outf); */
-
-/*   return 0;/\* all done *\/ */
-/* } */
+    return result;
+}
diff --git a/src/io/fopen.h b/src/io/fopen.h
index 83ea5a8..f952a65 100644
--- a/src/io/fopen.h
+++ b/src/io/fopen.h
@@ -7,6 +7,9 @@
  * Modifications to read/write wide character streams by
  * Simon Brooke.
  *
+ * NOTE THAT: for my purposes, I'm only interested in wide characters,
+ * and I always read them one character at a time.
+ *
  * Copyright (c) 2003, 2017 Simtec Electronics
  * Some portions (c) 2019 Simon Brooke <simon@journeyman.cc>
  *
@@ -44,41 +47,41 @@
 #include <wchar.h>
 #include <wctype.h>
 
+#define url_fwprintf(f, ...) ((f->type = CFTYPE_FILE) ? fwprintf( f->handle.file, __VA_ARGS__) : -1)
+#define url_fputws(ws, f) ((f->type = CFTYPE_FILE) ?  fputws(ws, f->handle.file) : 0)
+#define url_fputwc(wc, f) ((f->type = CFTYPE_FILE) ?  fputwc(wc, f->handle.file) : 0)
+
 enum fcurl_type_e {
-  CFTYPE_NONE = 0,
-  CFTYPE_FILE = 1,
-  CFTYPE_CURL = 2
+    CFTYPE_NONE = 0,
+    CFTYPE_FILE = 1,
+    CFTYPE_CURL = 2
 };
 
-struct fcurl_data
-{
-  enum fcurl_type_e type;     /* type of handle */
-  union {
-    CURL *curl;
-    FILE *file;
-  } handle;                   /* handle */
+struct fcurl_data {
+    enum fcurl_type_e type;     /* type of handle */
+    union {
+        CURL *curl;
+        FILE *file;
+    } handle;                   /* handle */
 
-  char *buffer;               /* buffer to store cached data*/
-  wchar_t *wide_buffer;       /* wide character buffer */
-  size_t buffer_len;          /* currently allocated buffer's length */
-  size_t buffer_pos;          /* end of data in buffer*/
-  size_t wide_cursor;         /* cursor into the wide buffer */
-  int still_running;          /* Is background url fetch still in progress */
+    char *buffer;               /* buffer to store cached data */
+    size_t buffer_len;          /* currently allocated buffer's length */
+    size_t buffer_pos;          /* cursor into in buffer */
+    int still_running;          /* Is background url fetch still in progress */
 };
 
 typedef struct fcurl_data URL_FILE;
 
 /* exported functions */
-URL_FILE *url_fopen(const char *url, const char *operation);
-int url_fclose(URL_FILE *file);
-int url_feof(URL_FILE *file);
-size_t url_fread(void *ptr, size_t size, size_t nmemb, URL_FILE *file);
-char *url_fgets(char *ptr, size_t size, URL_FILE *file);
-void url_rewind(URL_FILE *file);
-
-wint_t url_fgetwc(URL_FILE *file);
-URL_FILE * file_to_url_file( FILE* f);
-
+URL_FILE *url_fopen( const char *url, const char *operation );
+int url_fclose( URL_FILE * file );
+int url_feof( URL_FILE * file );
+size_t url_fread( void *ptr, size_t size, size_t nmemb, URL_FILE * file );
+char *url_fgets( char *ptr, size_t size, URL_FILE * file );
+void url_rewind( URL_FILE * file );
 
+wint_t url_fgetwc( URL_FILE * file );
+wint_t url_ungetwc( wint_t wc, URL_FILE * input );
+URL_FILE *file_to_url_file( FILE * f );
 
 #endif
diff --git a/src/io/io.c b/src/io/io.c
new file mode 100644
index 0000000..5d2c652
--- /dev/null
+++ b/src/io/io.c
@@ -0,0 +1,177 @@
+/*
+ * io.c
+ *
+ * Communication between PSSE and the outside world, via libcurl.
+ *
+ * (c) 2019 Simon Brooke <simon@journeyman.cc>
+ * Licensed under GPL version 2.0, or, at your option, any later version.
+ */
+
+#include <stdlib.h>
+
+#include "conspage.h"
+#include "consspaceobject.h"
+#include "debug.h"
+#include "fopen.h"
+#include "lispops.h"
+
+/**
+ * Convert this lisp string-like-thing (also works for symbols, and, later
+ * keywords) into a UTF-8 string. NOTE that the returned value has been
+ * malloced and must be freed. TODO: candidate to moving into a utilities
+ * file.
+ *
+ * @param s the lisp string or symbol;
+ * @return the c string.
+ */
+char *lisp_string_to_c_string( struct cons_pointer s ) {
+    char *result = NULL;
+
+    if ( stringp( s ) || symbolp( s ) ) {
+        int len = 0;
+
+        for ( struct cons_pointer c = s; !nilp( c );
+              c = pointer2cell( c ).payload.string.cdr ) {
+            len++;
+        }
+
+        wchar_t *buffer = calloc( len + 1, sizeof( wchar_t ) );
+        /* worst case, one wide char = four utf bytes */
+        result = calloc( ( len * 4 ) + 1, sizeof( char ) );
+
+        int i = 0;
+        for ( struct cons_pointer c = s; !nilp( c );
+              c = pointer2cell( c ).payload.string.cdr ) {
+            buffer[i++] = pointer2cell( c ).payload.string.character;
+        }
+
+        wcstombs( result, buffer, len );
+        free( buffer );
+    }
+
+    return result;
+}
+
+/**
+ * Function, sort-of: close the file indicated by my first arg, and return
+ * nil. If the first arg is not a stream, does nothing. All other args are
+ * ignored.
+ *
+ * * (close stream)
+ *
+ * @param frame my stack_frame.
+ * @param frame_pointer a pointer to my stack_frame.
+ * @param env my environment.
+ * @return T if the stream was successfully closed, else NIL.
+ */
+struct cons_pointer
+lisp_close( struct stack_frame *frame, struct cons_pointer frame_pointer,
+            struct cons_pointer env ) {
+    struct cons_pointer result = NIL;
+
+    if ( readp( frame->arg[0] ) || writep( frame->arg[0] ) ) {
+        if ( url_fclose( pointer2cell( frame->arg[0] ).payload.stream.stream )
+             == 0 ) {
+            result = TRUE;
+        }
+    }
+
+    return result;
+}
+
+/**
+ * Function: return a stream open on the URL indicated by the first argument;
+ * if a second argument is present and is non-nil, open it for reading. At
+ * present, further arguments are ignored and there is no mechanism to open
+ * to append, or error if the URL is faulty or indicates an unavailable
+ * resource.
+ *
+ * * (read-char stream)
+ *
+ * @param frame my stack_frame.
+ * @param frame_pointer a pointer to my stack_frame.
+ * @param env my environment.
+ * @return a string of one character, namely the next available character
+ * on my stream, if any, else NIL.
+ */
+struct cons_pointer
+lisp_open( struct stack_frame *frame, struct cons_pointer frame_pointer,
+           struct cons_pointer env ) {
+    struct cons_pointer result = NIL;
+
+    if ( stringp( frame->arg[0] ) ) {
+        char *url = lisp_string_to_c_string( frame->arg[0] );
+
+        if ( nilp( frame->arg[1] ) ) {
+            result = make_read_stream( url_fopen( url, "r" ) );
+        } else {
+            // TODO: anything more complex is a problem for another day.
+            result = make_write_stream( url_fopen( url, "w" ) );
+        }
+
+        free( url );
+    }
+
+    return result;
+}
+
+/**
+ * Function: return the next character from the stream indicated by arg 0;
+ * further arguments are ignored.
+ *
+ * * (read-char stream)
+ *
+ * @param frame my stack_frame.
+ * @param frame_pointer a pointer to my stack_frame.
+ * @param env my environment.
+ * @return a string of one character, namely the next available character
+ * on my stream, if any, else NIL.
+ */
+struct cons_pointer
+lisp_read_char( struct stack_frame *frame, struct cons_pointer frame_pointer,
+                struct cons_pointer env ) {
+    struct cons_pointer result = NIL;
+
+    if ( readp( frame->arg[0] ) ) {
+        result =
+            make_string( url_fgetwc
+                         ( pointer2cell( frame->arg[0] ).payload.stream.
+                           stream ), NIL );
+    }
+
+    return result;
+}
+
+/**
+ * Function: return a string representing all characters from the stream
+ * indicated by arg 0; further arguments are ignored.
+ *
+ * * (slurp stream)
+ *
+ * @param frame my stack_frame.
+ * @param frame_pointer a pointer to my stack_frame.
+ * @param env my environment.
+ * @return a string of one character, namely the next available character
+ * on my stream, if any, else NIL.
+ */
+struct cons_pointer
+lisp_slurp( struct stack_frame *frame, struct cons_pointer frame_pointer,
+            struct cons_pointer env ) {
+    struct cons_pointer result = NIL;
+    struct cons_pointer cdr = NIL;
+
+    if ( readp( frame->arg[0] ) ) {
+        URL_FILE *stream = pointer2cell( frame->arg[0] ).payload.stream.stream;
+
+        for ( wint_t c = url_fgetwc( stream ); c != -1;
+              c = url_fgetwc( stream ) ) {
+            cdr = make_string( ( ( wchar_t ) c ), cdr );
+
+            if ( nilp( result ) ) {
+                result = cdr;
+            }
+        }
+    }
+
+    return result;
+}
diff --git a/src/io/io.h b/src/io/io.h
new file mode 100644
index 0000000..06dcaed
--- /dev/null
+++ b/src/io/io.h
@@ -0,0 +1,28 @@
+
+/*
+ * io.h
+ *
+ * Communication between PSSE and the outside world, via libcurl.
+ *
+ * (c) 2019 Simon Brooke <simon@journeyman.cc>
+ * Licensed under GPL version 2.0, or, at your option, any later version.
+ */
+
+#ifndef __psse_io_h
+#define __psse_io_h
+
+struct cons_pointer
+lisp_close( struct stack_frame *frame, struct cons_pointer frame_pointer,
+            struct cons_pointer env );
+struct cons_pointer
+lisp_open( struct stack_frame *frame, struct cons_pointer frame_pointer,
+           struct cons_pointer env );
+struct cons_pointer
+lisp_read_char( struct stack_frame *frame, struct cons_pointer frame_pointer,
+                struct cons_pointer env );
+struct cons_pointer
+lisp_slurp( struct stack_frame *frame, struct cons_pointer frame_pointer,
+            struct cons_pointer env );
+
+
+#endif
diff --git a/src/memory/conspage.c b/src/memory/conspage.c
index 03034e4..7a1a0d8 100644
--- a/src/memory/conspage.c
+++ b/src/memory/conspage.c
@@ -117,7 +117,7 @@ void make_cons_page(  ) {
  */
 void dump_pages( URL_FILE * output ) {
     for ( int i = 0; i < initialised_cons_pages; i++ ) {
-        fwprintf( output, L"\nDUMPING PAGE %d\n", i );
+        url_fwprintf( output, L"\nDUMPING PAGE %d\n", i );
 
         for ( int j = 0; j < CONSPAGESIZE; j++ ) {
             dump_object( output, ( struct cons_pointer ) {
diff --git a/src/memory/consspaceobject.h b/src/memory/consspaceobject.h
index b3f587c..6230e64 100644
--- a/src/memory/consspaceobject.h
+++ b/src/memory/consspaceobject.h
@@ -491,6 +491,10 @@ struct special_payload {
 struct stream_payload {
     /** the stream to read from or write to. */
     URL_FILE *stream;
+    /** metadata on the stream (e.g. its file attributes if a file, its HTTP
+     * headers if a URL, etc). Expected to be an association, or nil. Not yet
+     * implemented. */
+    struct cons_pointer meta;
 };
 
 /**
diff --git a/src/memory/dump.c b/src/memory/dump.c
index cec0dfd..e99d306 100644
--- a/src/memory/dump.c
+++ b/src/memory/dump.c
@@ -30,22 +30,22 @@ void dump_string_cell( URL_FILE * output, wchar_t *prefix,
                        struct cons_pointer pointer ) {
     struct cons_space_object cell = pointer2cell( pointer );
     if ( cell.payload.string.character == 0 ) {
-        fwprintf( output,
-                  L"\t\t%ls cell: termination; next at page %d offset %d, count %u\n",
-                  prefix,
-                  cell.payload.string.cdr.page, cell.payload.string.cdr.offset,
-                  cell.count );
+        url_fwprintf( output,
+                      L"\t\t%ls cell: termination; next at page %d offset %d, count %u\n",
+                      prefix,
+                      cell.payload.string.cdr.page,
+                      cell.payload.string.cdr.offset, cell.count );
     } else {
-        fwprintf( output,
-                  L"\t\t%ls cell: character '%lc' (%d) next at page %d offset %d, count %u\n",
-                  prefix,
-                  ( wint_t ) cell.payload.string.character,
-                  cell.payload.string.character,
-                  cell.payload.string.cdr.page,
-                  cell.payload.string.cdr.offset, cell.count );
-        fwprintf( output, L"\t\t value: " );
+        url_fwprintf( output,
+                      L"\t\t%ls cell: character '%lc' (%d) next at page %d offset %d, count %u\n",
+                      prefix,
+                      ( wint_t ) cell.payload.string.character,
+                      cell.payload.string.character,
+                      cell.payload.string.cdr.page,
+                      cell.payload.string.cdr.offset, cell.count );
+        url_fwprintf( output, L"\t\t value: " );
         print( output, pointer );
-        fwprintf( output, L"\n" );
+        url_fwprintf( output, L"\n" );
     }
 }
 
@@ -54,70 +54,71 @@ void dump_string_cell( URL_FILE * output, wchar_t *prefix,
  */
 void dump_object( URL_FILE * output, struct cons_pointer pointer ) {
     struct cons_space_object cell = pointer2cell( pointer );
-    fwprintf( output,
-              L"\t%4.4s (%d) at page %d, offset %d count %u\n",
-              cell.tag.bytes,
-              cell.tag.value, pointer.page, pointer.offset, cell.count );
+    url_fwprintf( output,
+                  L"\t%4.4s (%d) at page %d, offset %d count %u\n",
+                  cell.tag.bytes,
+                  cell.tag.value, pointer.page, pointer.offset, cell.count );
 
     switch ( cell.tag.value ) {
         case CONSTV:
-            fwprintf( output,
-                      L"\t\tCons cell: car at page %d offset %d, cdr at page %d offset %d, count %u :",
-                      cell.payload.cons.car.page,
-                      cell.payload.cons.car.offset,
-                      cell.payload.cons.cdr.page,
-                      cell.payload.cons.cdr.offset, cell.count );
+            url_fwprintf( output,
+                          L"\t\tCons cell: car at page %d offset %d, cdr at page %d offset %d, count %u :",
+                          cell.payload.cons.car.page,
+                          cell.payload.cons.car.offset,
+                          cell.payload.cons.cdr.page,
+                          cell.payload.cons.cdr.offset, cell.count );
             print( output, pointer );
-            fputws( L"\n", output );
+            url_fputws( L"\n", output );
             break;
         case EXCEPTIONTV:
-            fwprintf( output, L"\t\tException cell: " );
+            url_fwprintf( output, L"\t\tException cell: " );
             dump_stack_trace( output, pointer );
             break;
         case FREETV:
-            fwprintf( output, L"\t\tFree cell: next at page %d offset %d\n",
-                      cell.payload.cons.cdr.page,
-                      cell.payload.cons.cdr.offset );
+            url_fwprintf( output,
+                          L"\t\tFree cell: next at page %d offset %d\n",
+                          cell.payload.cons.cdr.page,
+                          cell.payload.cons.cdr.offset );
             break;
         case INTEGERTV:
-            fwprintf( output,
-                      L"\t\tInteger cell: value %ld, count %u\n",
-                      cell.payload.integer.value, cell.count );
+            url_fwprintf( output,
+                          L"\t\tInteger cell: value %ld, count %u\n",
+                          cell.payload.integer.value, cell.count );
             if ( !nilp( cell.payload.integer.more ) ) {
-                fputws( L"\t\tBIGNUM! More at:\n", output );
+                url_fputws( L"\t\tBIGNUM! More at:\n", output );
                 dump_object( output, cell.payload.integer.more );
             }
             break;
         case LAMBDATV:
-            fwprintf( output, L"\t\t\u03bb cell;\n\t\t args: " );
+            url_fwprintf( output, L"\t\t\u03bb cell;\n\t\t args: " );
             print( output, cell.payload.lambda.args );
-            fwprintf( output, L";\n\t\t\tbody: " );
+            url_fwprintf( output, L";\n\t\t\tbody: " );
             print( output, cell.payload.lambda.body );
-            fputws( L"\n", output );
+            url_fputws( L"\n", output );
             break;
         case NILTV:
             break;
         case NLAMBDATV:
-            fwprintf( output, L"\t\tn\u03bb cell; \n\t\targs: " );
+            url_fwprintf( output, L"\t\tn\u03bb cell; \n\t\targs: " );
             print( output, cell.payload.lambda.args );
-            fwprintf( output, L";\n\t\t\tbody: " );
+            url_fwprintf( output, L";\n\t\t\tbody: " );
             print( output, cell.payload.lambda.body );
-            fputws( L"\n", output );
+            url_fputws( L"\n", output );
             break;
         case RATIOTV:
-            fwprintf( output,
-                      L"\t\tRational cell: value %ld/%ld, count %u\n",
-                      pointer2cell( cell.payload.ratio.dividend ).payload.
-                      integer.value,
-                      pointer2cell( cell.payload.ratio.divisor ).payload.
-                      integer.value, cell.count );
+            url_fwprintf( output,
+                          L"\t\tRational cell: value %ld/%ld, count %u\n",
+                          pointer2cell( cell.payload.ratio.dividend ).
+                          payload.integer.value,
+                          pointer2cell( cell.payload.ratio.divisor ).
+                          payload.integer.value, cell.count );
             break;
         case READTV:
-            fwprintf( output, L"\t\tInput stream\n" );
+            url_fwprintf( output, L"\t\tInput stream\n" );
             break;
         case REALTV:
-            fwprintf( output, L"\t\tReal cell: value %Lf, count %u\n",
-                      cell.payload.real.value, cell.count );
+            url_fwprintf( output, L"\t\tReal cell: value %Lf, count %u\n",
+                          cell.payload.real.value, cell.count );
             break;
         case STRINGTV:
             dump_string_cell( output, L"String", pointer );
@@ -128,14 +129,14 @@ void dump_object( URL_FILE * output, struct cons_pointer pointer ) {
         case TRUETV:
             break;
         case VECTORPOINTTV:{
-                fwprintf( output,
-                          L"\t\tPointer to vector-space object at %p\n",
-                          cell.payload.vectorp.address );
+                url_fwprintf( output,
+                              L"\t\tPointer to vector-space object at %p\n",
+                              cell.payload.vectorp.address );
                 struct vector_space_object *vso = cell.payload.vectorp.address;
-                fwprintf( output,
-                          L"\t\tVector space object of type %4.4s (%d), payload size %d bytes\n",
-                          &vso->header.tag.bytes, vso->header.tag.value,
-                          vso->header.size );
+                url_fwprintf( output,
+                              L"\t\tVector space object of type %4.4s (%d), payload size %d bytes\n",
+                              &vso->header.tag.bytes, vso->header.tag.value,
+                              vso->header.size );
                 if ( stackframep( vso ) ) {
                     dump_frame( output, pointer );
                 }
@@ -147,7 +148,7 @@ void dump_object( URL_FILE * output, struct cons_pointer pointer ) {
             }
             break;
         case WRITETV:
-            fwprintf( output, L"\t\tOutput stream\n" );
+            url_fwprintf( output, L"\t\tOutput stream\n" );
             break;
     }
 }
diff --git a/src/memory/stack.c b/src/memory/stack.c
index b2585c7..3f4a271 100644
--- a/src/memory/stack.c
+++ b/src/memory/stack.c
@@ -34,9 +34,9 @@ void set_reg( struct stack_frame *frame, int reg, struct cons_pointer value ) {
     debug_printf( DEBUG_STACK, L"Setting register %d to ", reg );
     debug_print_object( value, DEBUG_STACK );
     debug_println( DEBUG_STACK );
-    dec_ref(frame->arg[reg]); /* if there was anything in that slot
-                               * previously other than NIL, we need to decrement it;
-                               * NIL won't be decremented as it is locked. */
+    dec_ref( frame->arg[reg] ); /* if there was anything in that slot
+                                 * previously other than NIL, we need to decrement it;
+                                 * NIL won't be decremented as it is locked. */
     frame->arg[reg] = value;
     inc_ref( value );
 
@@ -245,22 +245,22 @@ void dump_frame( URL_FILE * output, struct cons_pointer frame_pointer ) {
     struct stack_frame *frame = get_stack_frame( frame_pointer );
 
     if ( frame != NULL ) {
-        fwprintf( output, L"Stack frame with %d arguments:\n", frame->args );
+        url_fwprintf( output, L"Stack frame with %d arguments:\n",
+                      frame->args );
         for ( int arg = 0; arg < frame->args; arg++ ) {
             struct cons_space_object cell = pointer2cell( frame->arg[arg] );
 
-            fwprintf( output, L"Arg %d:\t%c%c%c%c\tcount: %10u\tvalue: ", arg,
-                      cell.tag.bytes[0],
-                      cell.tag.bytes[1], cell.tag.bytes[2], cell.tag.bytes[3],
-                      cell.count );
+            url_fwprintf( output, L"Arg %d:\t%c%c%c%c\tcount: %10u\tvalue: ",
+                          arg, cell.tag.bytes[0], cell.tag.bytes[1],
+                          cell.tag.bytes[2], cell.tag.bytes[3], cell.count );
 
             print( output, frame->arg[arg] );
-            fputws( L"\n", output );
+            url_fputws( L"\n", output );
         }
         if ( !nilp( frame->more ) ) {
-            fputws( L"More: \t", output );
+            url_fputws( L"More: \t", output );
             print( output, frame->more );
-            fputws( L"\n", output );
+            url_fputws( L"\n", output );
         }
     }
 }
@@ -268,7 +268,7 @@ void dump_frame( URL_FILE * output, struct cons_pointer frame_pointer ) {
 void dump_stack_trace( URL_FILE * output, struct cons_pointer pointer ) {
     if ( exceptionp( pointer ) ) {
         print( output, pointer2cell( pointer ).payload.exception.message );
-        fputws( L"\n", output );
+        url_fputws( L"\n", output );
         dump_stack_trace( output,
                           pointer2cell( pointer ).payload.exception.frame );
     } else {
diff --git a/src/memory/vectorspace.c b/src/memory/vectorspace.c
index 9d98a77..480effb 100644
--- a/src/memory/vectorspace.c
+++ b/src/memory/vectorspace.c
@@ -36,7 +36,8 @@
  * @return a cons_pointer to the object, or NIL if the object could not be
  * allocated due to memory exhaustion.
  */
-struct cons_pointer make_vec_pointer( struct vector_space_object *address, char *tag ) {
+struct cons_pointer make_vec_pointer( struct vector_space_object *address,
+                                      char *tag ) {
     debug_print( L"Entered make_vec_pointer\n", DEBUG_ALLOC );
     struct cons_pointer pointer = allocate_cell( VECTORPOINTTAG );
     struct cons_space_object *cell = &pointer2cell( pointer );
@@ -46,7 +47,7 @@ struct cons_pointer make_vec_pointer( struct vector_space_object *address, char
                   address );
 
     cell->payload.vectorp.address = address;
-    strncpy(&cell->payload.vectorp.tag.bytes[0], tag, TAGLENGTH);
+    strncpy( &cell->payload.vectorp.tag.bytes[0], tag, TAGLENGTH );
 
     debug_printf( DEBUG_ALLOC,
                   L"make_vec_pointer: all good, returning pointer to %p\n",
diff --git a/src/ops/equal.c b/src/ops/equal.c
index 0c01a81..2775218 100644
--- a/src/ops/equal.c
+++ b/src/ops/equal.c
@@ -80,8 +80,8 @@ bool equal( struct cons_pointer a, struct cons_pointer b ) {
                     && ( equal( cell_a->payload.string.cdr,
                                 cell_b->payload.string.cdr )
                          || ( end_of_string( cell_a->payload.string.cdr )
-                              && end_of_string( cell_b->payload.string.
-                                                cdr ) ) );
+                              && end_of_string( cell_b->payload.
+                                                string.cdr ) ) );
                 break;
             case INTEGERTV:
                 result =
diff --git a/src/ops/intern.c b/src/ops/intern.c
index 1e32a36..87d116e 100644
--- a/src/ops/intern.c
+++ b/src/ops/intern.c
@@ -110,8 +110,8 @@ struct cons_pointer c_assoc( struct cons_pointer key,
  * with this key/value pair added to the front.
  */
 struct cons_pointer
-bind( struct cons_pointer key, struct cons_pointer value,
-      struct cons_pointer store ) {
+set( struct cons_pointer key, struct cons_pointer value,
+     struct cons_pointer store ) {
     debug_print( L"Binding ", DEBUG_BIND );
     debug_print_object( key, DEBUG_BIND );
     debug_print( L" to ", DEBUG_BIND );
@@ -131,7 +131,7 @@ deep_bind( struct cons_pointer key, struct cons_pointer value ) {
     debug_print( L"Entering deep_bind\n", DEBUG_BIND );
     struct cons_pointer old = oblist;
 
-    oblist = bind( key, value, oblist );
+    oblist = set( key, value, oblist );
     inc_ref( oblist );
     dec_ref( old );
 
@@ -153,7 +153,7 @@ intern( struct cons_pointer key, struct cons_pointer environment ) {
         /*
          * not currently bound
          */
-        result = bind( key, NIL, environment );
+        result = set( key, NIL, environment );
     }
 
     return result;
diff --git a/src/ops/intern.h b/src/ops/intern.h
index b261242..fa17563 100644
--- a/src/ops/intern.h
+++ b/src/ops/intern.h
@@ -28,9 +28,9 @@ struct cons_pointer c_assoc( struct cons_pointer key,
 struct cons_pointer internedp( struct cons_pointer key,
                                struct cons_pointer environment );
 
-struct cons_pointer bind( struct cons_pointer key,
-                          struct cons_pointer value,
-                          struct cons_pointer store );
+struct cons_pointer set( struct cons_pointer key,
+                         struct cons_pointer value,
+                         struct cons_pointer store );
 
 struct cons_pointer deep_bind( struct cons_pointer key,
                                struct cons_pointer value );
diff --git a/src/ops/io.c b/src/ops/io.c
deleted file mode 100644
index ccd0af5..0000000
--- a/src/ops/io.c
+++ /dev/null
@@ -1,8 +0,0 @@
-/*
- * io.c
- *
- * Communication between PSSE and the outside world, via libcurl.
- *
- * (c) 2017 Simon Brooke <simon@journeyman.cc>
- * Licensed under GPL version 2.0, or, at your option, any later version.
- */
diff --git a/src/ops/lispops.c b/src/ops/lispops.c
index 9448c55..4bfe6f0 100644
--- a/src/ops/lispops.c
+++ b/src/ops/lispops.c
@@ -29,6 +29,7 @@
 #include "debug.h"
 #include "dump.h"
 #include "equal.h"
+#include "fopen.h"
 #include "integer.h"
 #include "intern.h"
 #include "lispops.h"
@@ -231,7 +232,7 @@ eval_lambda( struct cons_space_object cell, struct stack_frame *frame,
             struct cons_pointer name = c_car( names );
             struct cons_pointer val = frame->arg[i];
 
-            new_env = bind( name, val, new_env );
+            new_env = set( name, val, new_env );
             log_binding( name, val );
 
             names = c_cdr( names );
@@ -256,7 +257,7 @@ eval_lambda( struct cons_space_object cell, struct stack_frame *frame,
             }
         }
 
-        new_env = bind( names, vals, new_env );
+        new_env = set( names, vals, new_env );
         inc_ref( new_env );
     }
 
@@ -377,10 +378,9 @@ c_apply( struct stack_frame *frame, struct cons_pointer frame_pointer,
                         result = next_pointer;
                     } else {
                         result =
-                            ( *fn_cell.payload.
-                              special.executable ) ( get_stack_frame
-                                                     ( next_pointer ),
-                                                     next_pointer, env );
+                            ( *fn_cell.payload.special.
+                              executable ) ( get_stack_frame( next_pointer ),
+                                             next_pointer, env );
                         debug_print( L"Special form returning: ", DEBUG_EVAL );
                         debug_print_object( result, DEBUG_EVAL );
                         debug_println( DEBUG_EVAL );
@@ -627,10 +627,10 @@ lisp_set_shriek( struct stack_frame *frame, struct cons_pointer frame_pointer,
  * @return true if `arg` represents an end of string, else false.
  * \todo candidate for moving to a memory/string.c file
  */
-bool end_of_stringp(struct cons_pointer arg) {
-  return nilp(arg) ||
-    ( stringp( arg ) &&
-     pointer2cell(arg).payload.string.character == (wint_t)'\0');
+bool end_of_stringp( struct cons_pointer arg ) {
+    return nilp( arg ) ||
+        ( stringp( arg ) &&
+          pointer2cell( arg ).payload.string.character == ( wint_t ) '\0' );
 }
 
 /**
@@ -656,8 +656,8 @@ lisp_cons( struct stack_frame *frame, struct cons_pointer frame_pointer,
     if ( nilp( car ) && nilp( cdr ) ) {
         return NIL;
     } else if ( stringp( car ) && stringp( cdr ) &&
-                end_of_stringp( c_cdr( car)) ) {
-      // \todo check that car is of length 1
+                end_of_stringp( c_cdr( car ) ) ) {
+        // \todo check that car is of length 1
         result =
             make_string( pointer2cell( car ).payload.string.character, cdr );
     } else {
@@ -691,7 +691,8 @@ lisp_car( struct stack_frame *frame, struct cons_pointer frame_pointer,
             result = cell.payload.cons.car;
             break;
         case READTV:
-            result = make_string( fgetwc( cell.payload.stream.stream ), NIL );
+            result =
+                make_string( url_fgetwc( cell.payload.stream.stream ), NIL );
             break;
         case NILTV:
             break;
@@ -734,7 +735,7 @@ lisp_cdr( struct stack_frame *frame, struct cons_pointer frame_pointer,
             result = cell.payload.cons.cdr;
             break;
         case READTV:
-            fgetwc( cell.payload.stream.stream );
+            url_fgetwc( cell.payload.stream.stream );
             result = frame->arg[0];
             break;
         case STRINGTV:
@@ -839,7 +840,8 @@ lisp_read( struct stack_frame *frame, struct cons_pointer frame_pointer,
 #ifdef DEBUG
     debug_print( L"entering lisp_read\n", DEBUG_IO );
 #endif
-    URL_FILE *input = stdin;
+    URL_FILE *input;
+
     struct cons_pointer in_stream = readp( frame->arg[0] ) ?
         frame->arg[0] : get_default_stream( true, env );
 
@@ -848,6 +850,8 @@ lisp_read( struct stack_frame *frame, struct cons_pointer frame_pointer,
         debug_dump_object( in_stream, DEBUG_IO );
         input = pointer2cell( in_stream ).payload.stream.stream;
         inc_ref( in_stream );
+    } else {
+        input = file_to_url_file( stdin );
     }
 
     struct cons_pointer result = read( frame, frame_pointer, input );
@@ -856,8 +860,11 @@ lisp_read( struct stack_frame *frame, struct cons_pointer frame_pointer,
 
     if ( readp( in_stream ) ) {
         dec_ref( in_stream );
+    } else {
+        free( input );
     }
 
+
     return result;
 }
 
@@ -922,7 +929,7 @@ lisp_print( struct stack_frame *frame, struct cons_pointer frame_pointer,
             struct cons_pointer env ) {
     debug_print( L"Entering print\n", DEBUG_IO );
     struct cons_pointer result = NIL;
-    URL_FILE *output = stdout;
+    URL_FILE *output;
     struct cons_pointer out_stream = writep( frame->arg[1] ) ?
         frame->arg[1] : get_default_stream( false, env );
 
@@ -931,6 +938,8 @@ lisp_print( struct stack_frame *frame, struct cons_pointer frame_pointer,
         debug_dump_object( out_stream, DEBUG_IO );
         output = pointer2cell( out_stream ).payload.stream.stream;
         inc_ref( out_stream );
+    } else {
+        output = file_to_url_file( stderr );
     }
 
     debug_print( L"lisp_print: about to print\n", DEBUG_IO );
@@ -943,6 +952,8 @@ lisp_print( struct stack_frame *frame, struct cons_pointer frame_pointer,
 
     if ( writep( out_stream ) ) {
         dec_ref( out_stream );
+    } else {
+        free( output );
     }
 
     return result;
@@ -1035,7 +1046,7 @@ lisp_progn( struct stack_frame *frame, struct cons_pointer frame_pointer,
  * @return the value of the last expression of the first successful `clause`.
  */
 struct cons_pointer
- lisp_cond( struct stack_frame *frame, struct cons_pointer frame_pointer,
+lisp_cond( struct stack_frame *frame, struct cons_pointer frame_pointer,
            struct cons_pointer env ) {
     struct cons_pointer result = NIL;
     bool done = false;
@@ -1165,7 +1176,7 @@ struct cons_pointer lisp_repl( struct stack_frame *frame,
      * print as parent.
      */
     while ( readp( input ) && writep( output )
-            && !feof( pointer2cell( input ).payload.stream.stream ) ) {
+            && !url_feof( pointer2cell( input ).payload.stream.stream ) ) {
         /* OK, here's a really subtle problem: because lists are immutable, anything
          * bound in the oblist subsequent to this function being invoked isn't in the
          * environment. So, for example, changes to *prompt* or *log* made in the oblist
@@ -1203,7 +1214,7 @@ struct cons_pointer lisp_repl( struct stack_frame *frame,
         inc_ref( expr );
 
         if ( exceptionp( expr )
-             && feof( pointer2cell( input ).payload.stream.stream ) ) {
+             && url_feof( pointer2cell( input ).payload.stream.stream ) ) {
             /* suppress printing end of stream exception */
             break;
         }
@@ -1282,7 +1293,7 @@ struct cons_pointer lisp_inspect( struct stack_frame *frame,
                                   struct cons_pointer frame_pointer,
                                   struct cons_pointer env ) {
     debug_print( L"Entering print\n", DEBUG_IO );
-    URL_FILE *output = stdout;
+    URL_FILE *output;
     struct cons_pointer out_stream = writep( frame->arg[1] ) ?
         frame->arg[1] : get_default_stream( false, env );
 
@@ -1291,11 +1302,16 @@ struct cons_pointer lisp_inspect( struct stack_frame *frame,
         debug_dump_object( out_stream, DEBUG_IO );
         output = pointer2cell( out_stream ).payload.stream.stream;
         inc_ref( out_stream );
+    } else {
+        output = file_to_url_file( stdout );
     }
+
     dump_object( output, frame->arg[0] );
 
     if ( writep( out_stream ) ) {
         dec_ref( out_stream );
+    } else {
+        free( output );
     }
 
     return frame->arg[0];
diff --git a/src/ops/print.c b/src/ops/print.c
index d313960..8cb137e 100644
--- a/src/ops/print.c
+++ b/src/ops/print.c
@@ -40,7 +40,7 @@ void print_string_contents( URL_FILE * output, struct cons_pointer pointer ) {
         wchar_t c = cell->payload.string.character;
 
         if ( c != '\0' ) {
-            fputwc( c, output );
+            url_fputwc( c, output );
         }
         pointer = cell->payload.string.cdr;
     }
@@ -52,9 +52,9 @@ void print_string_contents( URL_FILE * output, struct cons_pointer pointer ) {
  * characters.
  */
 void print_string( URL_FILE * output, struct cons_pointer pointer ) {
-    fputwc( btowc( '"' ), output );
+    url_fputwc( btowc( '"' ), output );
     print_string_contents( output, pointer );
-    fputwc( btowc( '"' ), output );
+    url_fputwc( btowc( '"' ), output );
 }
 
 /**
@@ -70,7 +70,7 @@ print_list_contents( URL_FILE * output, struct cons_pointer pointer,
     switch ( cell->tag.value ) {
         case CONSTV:
             if ( initial_space ) {
-                fputwc( btowc( ' ' ), output );
+                url_fputwc( btowc( ' ' ), output );
             }
             print( output, cell->payload.cons.car );
 
@@ -79,23 +79,23 @@ print_list_contents( URL_FILE * output, struct cons_pointer pointer,
         case NILTV:
             break;
         default:
-            fwprintf( output, L" . " );
+            url_fwprintf( output, L" . " );
             print( output, pointer );
     }
 }
 
 void print_list( URL_FILE * output, struct cons_pointer pointer ) {
     if ( print_use_colours ) {
-        fwprintf( output, L"%s(%s", "\x1B[31m", "\x1B[39m" );
+        url_fwprintf( output, L"%s(%s", "\x1B[31m", "\x1B[39m" );
     } else {
-        fputws( L"(", output );
+        url_fputws( L"(", output );
     };
 
     print_list_contents( output, pointer, false );
     if ( print_use_colours ) {
-        fwprintf( output, L"%s)%s", "\x1B[31m", "\x1B[39m" );
+        url_fwprintf( output, L"%s)%s", "\x1B[31m", "\x1B[39m" );
     } else {
-        fputws( L")", output );
+        url_fputws( L")", output );
     }
 
 }
@@ -117,18 +117,18 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
             print_list( output, pointer );
             break;
         case EXCEPTIONTV:
-            fwprintf( output, L"\n%sException: ",
-                      print_use_colours ? "\x1B[31m" : "" );
+            url_fwprintf( output, L"\n%sException: ",
+                          print_use_colours ? "\x1B[31m" : "" );
             dump_stack_trace( output, pointer );
             break;
         case FUNCTIONTV:
-            fwprintf( output, L"<Function>" );
+            url_fwprintf( output, L"<Function>" );
             break;
         case INTEGERTV:{
                 struct cons_pointer s = integer_to_string( pointer, 10 );
                 inc_ref( s );
                 if ( print_use_colours ) {
-                    fputws( L"\x1B[34m", output );
+                    url_fputws( L"\x1B[34m", output );
                 }
                 print_string_contents( output, s );
                 dec_ref( s );
@@ -147,7 +147,7 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
             }
             break;
         case NILTV:
-            fwprintf( output, L"nil" );
+            url_fwprintf( output, L"nil" );
             break;
         case NLAMBDATV:{
                 struct cons_pointer to_print =
@@ -163,11 +163,11 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
             break;
         case RATIOTV:
             print( output, cell.payload.ratio.dividend );
-            fputws( L"/", output );
+            url_fputws( L"/", output );
             print( output, cell.payload.ratio.divisor );
             break;
         case READTV:
-            fwprintf( output, L"<Input stream>" );
+            url_fwprintf( output, L"<Input stream>" );
             break;
         case REALTV:
             /* \todo using the C heap is a bad plan because it will fragment.
@@ -183,31 +183,31 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
                 }
             }
             if ( print_use_colours ) {
-                fputws( L"\x1B[34m", output );
+                url_fputws( L"\x1B[34m", output );
             }
-            fwprintf( output, L"%s", buffer );
+            url_fwprintf( output, L"%s", buffer );
             free( buffer );
             break;
         case STRINGTV:
             if ( print_use_colours ) {
-                fputws( L"\x1B[36m", output );
+                url_fputws( L"\x1B[36m", output );
             }
             print_string( output, pointer );
             break;
         case SYMBOLTV:
             if ( print_use_colours ) {
-                fputws( L"\x1B[1;33m", output );
+                url_fputws( L"\x1B[1;33m", output );
             }
             print_string_contents( output, pointer );
             break;
         case SPECIALTV:
-            fwprintf( output, L"<Special form>" );
+            url_fwprintf( output, L"<Special form>" );
             break;
         case TRUETV:
-            fwprintf( output, L"t" );
+            url_fwprintf( output, L"t" );
             break;
         case WRITETV:
-            fwprintf( output, L"<Output stream>" );
+            url_fwprintf( output, L"<Output stream>" );
             break;
         default:
             fwprintf( stderr,
@@ -219,12 +219,12 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
     }
 
     if ( print_use_colours ) {
-        fputws( L"\x1B[39m", output );
+        url_fputws( L"\x1B[39m", output );
     }
 
     return pointer;
 }
 
 void println( URL_FILE * output ) {
-    fputws( L"\n", output );
+    url_fputws( L"\n", output );
 }
diff --git a/src/ops/read.c b/src/ops/read.c
index d2f79c4..989aa67 100644
--- a/src/ops/read.c
+++ b/src/ops/read.c
@@ -41,8 +41,8 @@ struct cons_pointer read_number( struct stack_frame *frame,
                                  URL_FILE * input, wint_t initial,
                                  bool seen_period );
 struct cons_pointer read_list( struct stack_frame *frame,
-                               struct cons_pointer frame_pointer, URL_FILE * input,
-                               wint_t initial );
+                               struct cons_pointer frame_pointer,
+                               URL_FILE * input, wint_t initial );
 struct cons_pointer read_string( URL_FILE * input, wint_t initial );
 struct cons_pointer read_symbol( URL_FILE * input, wint_t initial );
 
@@ -68,16 +68,18 @@ struct cons_pointer read_continuation( struct stack_frame *frame,
     wint_t c;
 
     for ( c = initial;
-          c == '\0' || iswblank( c ) || iswcntrl( c ); c = fgetwc( input ) );
+          c == '\0' || iswblank( c ) || iswcntrl( c );
+          c = url_fgetwc( input ) );
 
-    if ( feof( input ) ) {
+    if ( url_feof( input ) ) {
         result =
             throw_exception( c_string_to_lisp_string
                              ( L"End of file while reading" ), frame_pointer );
     } else {
         switch ( c ) {
             case ';':
-                for ( c = fgetwc( input ); c != '\n'; c = fgetwc( input ) );
+                for ( c = url_fgetwc( input ); c != '\n';
+                      c = url_fgetwc( input ) );
                 /* skip all characters from semi-colon to the end of the line */
                 break;
             case EOF:
@@ -89,18 +91,19 @@ struct cons_pointer read_continuation( struct stack_frame *frame,
                 result =
                     c_quote( read_continuation
                              ( frame, frame_pointer, input,
-                               fgetwc( input ) ) );
+                               url_fgetwc( input ) ) );
                 break;
             case '(':
                 result =
-                    read_list( frame, frame_pointer, input, fgetwc( input ) );
+                    read_list( frame, frame_pointer, input,
+                               url_fgetwc( input ) );
                 break;
             case '"':
-                result = read_string( input, fgetwc( input ) );
+                result = read_string( input, url_fgetwc( input ) );
                 break;
             case '-':{
-                    wint_t next = fgetwc( input );
-                    ungetwc( next, input );
+                    wint_t next = url_fgetwc( input );
+                    url_ungetwc( next, input );
                     if ( iswdigit( next ) ) {
                         result =
                             read_number( frame, frame_pointer, input, c,
@@ -112,9 +115,9 @@ struct cons_pointer read_continuation( struct stack_frame *frame,
                 break;
             case '.':
                 {
-                    wint_t next = fgetwc( input );
+                    wint_t next = url_fgetwc( input );
                     if ( iswdigit( next ) ) {
-                        ungetwc( next, input );
+                        url_ungetwc( next, input );
                         result =
                             read_number( frame, frame_pointer, input, c,
                                          true );
@@ -123,13 +126,13 @@ struct cons_pointer read_continuation( struct stack_frame *frame,
                          * really need to backtrack up a level. */
                         result =
                             read_continuation( frame, frame_pointer, input,
-                                               fgetwc( input ) );
+                                               url_fgetwc( input ) );
                     } else {
                         read_symbol( input, c );
                     }
                 }
                 break;
-          //case ':': reserved for keywords and paths
+                //case ':': reserved for keywords and paths
             default:
                 if ( iswdigit( c ) ) {
                     result =
@@ -173,14 +176,14 @@ struct cons_pointer read_number( struct stack_frame *frame,
     bool neg = initial == btowc( '-' );
 
     if ( neg ) {
-        initial = fgetwc( input );
+        initial = url_fgetwc( input );
     }
 
     debug_printf( DEBUG_IO, L"read_number starting '%c' (%d)\n", initial,
                   initial );
 
     for ( c = initial; iswdigit( c )
-          || c == L'.' || c == L'/' || c == L','; c = fgetwc( input ) ) {
+          || c == L'.' || c == L'/' || c == L','; c = url_fgetwc( input ) ) {
         switch ( c ) {
             case L'.':
                 if ( seen_period || !nilp( dividend ) ) {
@@ -229,7 +232,7 @@ struct cons_pointer read_number( struct stack_frame *frame,
     /*
      * push back the character read which was not a digit
      */
-    ungetwc( c, input );
+    url_ungetwc( c, input );
 
     if ( seen_period ) {
         debug_print( L"read_number: converting result to real\n", DEBUG_IO );
@@ -279,7 +282,7 @@ struct cons_pointer read_list( struct stack_frame *frame,
         result =
             make_cons( car,
                        read_list( frame, frame_pointer, input,
-                                  fgetwc( input ) ) );
+                                  url_fgetwc( input ) ) );
     } else {
         debug_print( L"End of list detected\n", DEBUG_IO );
     }
@@ -309,7 +312,8 @@ struct cons_pointer read_string( URL_FILE * input, wint_t initial ) {
             break;
         default:
             result =
-                make_string( initial, read_string( input, fgetwc( input ) ) );
+                make_string( initial,
+                             read_string( input, url_fgetwc( input ) ) );
             break;
     }
 
@@ -328,7 +332,8 @@ struct cons_pointer read_symbol( URL_FILE * input, wint_t initial ) {
              * THIS IS NOT A GOOD IDEA, but is legal
              */
             result =
-                make_symbol( initial, read_symbol( input, fgetwc( input ) ) );
+                make_symbol( initial,
+                             read_symbol( input, url_fgetwc( input ) ) );
             break;
         case ')':
             /*
@@ -338,20 +343,20 @@ struct cons_pointer read_symbol( URL_FILE * input, wint_t initial ) {
             /*
              * push back the character read
              */
-            ungetwc( initial, input );
+            url_ungetwc( initial, input );
             break;
         default:
             if ( iswprint( initial )
                  && !iswblank( initial ) ) {
                 result =
                     make_symbol( initial,
-                                 read_symbol( input, fgetwc( input ) ) );
+                                 read_symbol( input, url_fgetwc( input ) ) );
             } else {
                 result = NIL;
                 /*
                  * push back the character read
                  */
-                ungetwc( initial, input );
+                url_ungetwc( initial, input );
             }
             break;
     }
@@ -369,5 +374,6 @@ struct cons_pointer read( struct
                           stack_frame
                           *frame, struct cons_pointer frame_pointer,
                           URL_FILE * input ) {
-    return read_continuation( frame, frame_pointer, input, fgetwc( input ) );
+    return read_continuation( frame, frame_pointer, input,
+                              url_fgetwc( input ) );
 }
diff --git a/src/ops/read.h b/src/ops/read.h
index a1674d6..64f36b0 100644
--- a/src/ops/read.h
+++ b/src/ops/read.h
@@ -15,6 +15,7 @@
  * read the next object on this input stream and return a cons_pointer to it.
  */
 struct cons_pointer read( struct stack_frame *frame,
-                          struct cons_pointer frame_pointer, URL_FILE * input );
+                          struct cons_pointer frame_pointer,
+                          URL_FILE * input );
 
 #endif

From d9acb277bf463ef959744f66d60fb74bbf9cde48 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Sun, 27 Jan 2019 17:51:28 +0000
Subject: [PATCH 05/31] Tests now pass

at least, all the ones that did before!
---
 src/init.c     | 6 +++---
 src/io/fopen.c | 4 +++-
 2 files changed, 6 insertions(+), 4 deletions(-)

diff --git a/src/init.c b/src/init.c
index a45e685..2814f1d 100644
--- a/src/init.c
+++ b/src/init.c
@@ -162,16 +162,16 @@ int main( int argc, char *argv[] ) {
     bind_function( L"inspect", &lisp_inspect );
     bind_function( L"multiply", &lisp_multiply );
     bind_function( L"negative?", &lisp_is_negative );
-    bind_function( L"read", &lisp_read );
-    bind_function( L"repl", &lisp_repl );
     bind_function( L"oblist", &lisp_oblist );
     bind_function( L"open", &lisp_open );
     bind_function( L"print", &lisp_print );
     bind_function( L"progn", &lisp_progn );
     bind_function( L"read", &lisp_read );
-    bind_function( L"read_char", &lisp_read_char );
+    bind_function( L"read-char", &lisp_read_char );
+    bind_function( L"repl", &lisp_repl );
     bind_function( L"reverse", &lisp_reverse );
     bind_function( L"set", &lisp_set );
+    bind_function( L"slurp", &lisp_slurp );
     bind_function( L"source", &lisp_source );
     bind_function( L"subtract", &lisp_subtract );
     bind_function( L"throw", &lisp_exception );
diff --git a/src/io/fopen.c b/src/io/fopen.c
index 499fada..3b09957 100644
--- a/src/io/fopen.c
+++ b/src/io/fopen.c
@@ -47,6 +47,7 @@
 
 #include <curl/curl.h>
 
+#include "debug.h"
 #include "fopen.h"
 
 /* we use a global one for convenience */
@@ -474,6 +475,7 @@ wint_t url_fgetwc( URL_FILE * input ) {
             break;
     }
 
+    debug_printf( DEBUG_IO, L"url_fgetwc returning %d (%C)\n", result, result);
     return result;
 }
 
@@ -483,7 +485,7 @@ wint_t url_ungetwc( wint_t wc, URL_FILE * input ) {
     switch ( input->type ) {
         case CFTYPE_FILE:
             fwide( input->handle.file, 1 ); /* wide characters */
-            result = fgetwc( input->handle.file );  /* passthrough */
+            result = ungetwc( wc, input->handle.file );  /* passthrough */
             break;
 
         case CFTYPE_CURL:{

From 3470f27585f20db741cf498b616d08c34dd5a1c4 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Sun, 27 Jan 2019 18:54:23 +0000
Subject: [PATCH 06/31] Can now read files from the filesystem.

---
 hi                  |  1 +
 src/io/io.c         | 27 ++++++++++++++++++++-------
 unit-tests/slurp.sh | 13 +++++++++++++
 3 files changed, 34 insertions(+), 7 deletions(-)
 create mode 100644 hi
 create mode 100755 unit-tests/slurp.sh

diff --git a/hi b/hi
new file mode 100644
index 0000000..cf57f2a
--- /dev/null
+++ b/hi
@@ -0,0 +1 @@
+Hello, this is used by `slurp.sh` test, please do not remove.
diff --git a/src/io/io.c b/src/io/io.c
index 5d2c652..e510580 100644
--- a/src/io/io.c
+++ b/src/io/io.c
@@ -31,7 +31,7 @@ char *lisp_string_to_c_string( struct cons_pointer s ) {
         int len = 0;
 
         for ( struct cons_pointer c = s; !nilp( c );
-              c = pointer2cell( c ).payload.string.cdr ) {
+            c = pointer2cell( c ).payload.string.cdr ) {
             len++;
         }
 
@@ -49,6 +49,10 @@ char *lisp_string_to_c_string( struct cons_pointer s ) {
         free( buffer );
     }
 
+    debug_print(L"lisp_string_to_c_string( ", DEBUG_IO);
+    debug_print_object( s, DEBUG_IO);
+    debug_printf( DEBUG_IO, L") => '%s'\n", result);
+
     return result;
 }
 
@@ -110,6 +114,10 @@ lisp_open( struct stack_frame *frame, struct cons_pointer frame_pointer,
         }
 
         free( url );
+
+        if ( pointer2cell(result).payload.stream.stream == NULL) {
+            result = NIL;
+        }
     }
 
     return result;
@@ -158,18 +166,23 @@ struct cons_pointer
 lisp_slurp( struct stack_frame *frame, struct cons_pointer frame_pointer,
             struct cons_pointer env ) {
     struct cons_pointer result = NIL;
-    struct cons_pointer cdr = NIL;
 
     if ( readp( frame->arg[0] ) ) {
         URL_FILE *stream = pointer2cell( frame->arg[0] ).payload.stream.stream;
+        struct cons_pointer cursor = make_string( url_fgetwc( stream ), NIL);
+        result = cursor;
 
-        for ( wint_t c = url_fgetwc( stream ); c != -1;
+        for ( wint_t c = url_fgetwc( stream ); !url_feof(stream);
               c = url_fgetwc( stream ) ) {
-            cdr = make_string( ( ( wchar_t ) c ), cdr );
+            debug_print(L"slurp: cursor is: ", DEBUG_IO);
+            debug_dump_object( cursor, DEBUG_IO);
+            debug_print(L"; result is: ", DEBUG_IO);
+            debug_dump_object( result, DEBUG_IO);
+            debug_println( DEBUG_IO);
 
-            if ( nilp( result ) ) {
-                result = cdr;
-            }
+            struct cons_space_object * cell = &pointer2cell(cursor);
+            cursor = make_string( ( wchar_t ) c , NIL);
+            cell->payload.string.cdr = cursor;
         }
     }
 
diff --git a/unit-tests/slurp.sh b/unit-tests/slurp.sh
new file mode 100755
index 0000000..e285988
--- /dev/null
+++ b/unit-tests/slurp.sh
@@ -0,0 +1,13 @@
+#!/bin/bash
+
+expected='"Hello, this is used by `slurp.sh` test, please do not remove.'
+actual=`echo '(slurp (open "hi"))' | target/psse | tail -2 | head -1`
+
+if [ "${expected}" = "${actual}" ]
+then
+    echo "OK"
+    exit 0
+else
+    echo "Fail: expected '$expected', got '$actual'"
+    exit 1
+fi

From 8334e2bf1f3a92ff7af37adfb15fc977a361f772 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Mon, 28 Jan 2019 10:32:34 +0000
Subject: [PATCH 07/31] Still segfaults on read from URL.

---
 src/init.c     | 4 ++++
 src/io/fopen.c | 5 +----
 2 files changed, 5 insertions(+), 4 deletions(-)

diff --git a/src/init.c b/src/init.c
index 2814f1d..1fba3f2 100644
--- a/src/init.c
+++ b/src/init.c
@@ -16,6 +16,9 @@
 #include <unistd.h>
 #include <wchar.h>
 
+/* libcurl, used for io */
+#include <curl/curl.h>
+
 #include "version.h"
 #include "conspage.h"
 #include "consspaceobject.h"
@@ -84,6 +87,7 @@ int main( int argc, char *argv[] ) {
     bool show_prompt = false;
 
     setlocale( LC_ALL, "" );
+    curl_global_init(CURL_GLOBAL_DEFAULT);
 
     while ( ( option = getopt( argc, argv, "cpdv:" ) ) != -1 ) {
         switch ( option ) {
diff --git a/src/io/fopen.c b/src/io/fopen.c
index 3b09957..a2eddab 100644
--- a/src/io/fopen.c
+++ b/src/io/fopen.c
@@ -460,14 +460,11 @@ wint_t url_fgetwc( URL_FILE * input ) {
 
         case CFTYPE_CURL:{
                 wchar_t *wbuff = calloc( 2, sizeof( wchar_t ) );
-                char *cbuff = calloc( 5, sizeof( char ) );
 
-                url_fread( cbuff, sizeof( char ), 4, input );
-                mbstowcs( wbuff, cbuff, 1 );
+                mbstowcs( wbuff, (char *)&input->buffer[input->buffer_pos], 1 );
                 result = wbuff[0];
                 use_one_wide( input );
 
-                free( cbuff );
                 free( wbuff );
             }
             break;

From b15c0e8f892283802f668d13ff9ec43f61f387d8 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Mon, 28 Jan 2019 15:02:46 +0000
Subject: [PATCH 08/31] Tactical commit

---
 src/arith/integer.c | 158 ++++++++++++++++++++++----------------------
 src/init.c          |   2 +-
 src/io/fopen.c      | 103 +++++++++++++++++++++--------
 src/io/io.c         |  28 ++++----
 4 files changed, 167 insertions(+), 124 deletions(-)

diff --git a/src/arith/integer.c b/src/arith/integer.c
index 679bf37..1195c53 100644
--- a/src/arith/integer.c
+++ b/src/arith/integer.c
@@ -76,20 +76,16 @@ struct cons_pointer make_integer( int64_t value, struct cons_pointer more ) {
  * \see add_integers
  */
 __int128_t cell_value( struct cons_pointer c, char op, bool is_first_cell ) {
-    long int val = nilp( c ) ?
-      0 :
-      pointer2cell( c ).payload.integer.value;
+    long int val = nilp( c ) ? 0 : pointer2cell( c ).payload.integer.value;
 
     long int carry = is_first_cell ? 0 : ( MAX_INTEGER + 1 );
 
     __int128_t result = ( __int128_t ) integerp( c ) ?
-        ( val == 0 ) ?
-          carry :
-          val :
-         op == '*' ? 1 : 0;
+        ( val == 0 ) ? carry : val : op == '*' ? 1 : 0;
     debug_printf( DEBUG_ARITH,
                   L"cell_value: raw value is %ld, is_first_cell = %s; %4.4s; returning ",
-                  val, is_first_cell ? "true" : "false", pointer2cell(c).tag.bytes);
+                  val, is_first_cell ? "true" : "false",
+                  pointer2cell( c ).tag.bytes );
     debug_print_128bit( result, DEBUG_ARITH );
     debug_println( DEBUG_ARITH );
 
@@ -109,9 +105,8 @@ __int128_t cell_value( struct cons_pointer c, char op, bool is_first_cell ) {
  * @return carry, if any, else 0.
  */
 __int128_t int128_to_integer( __int128_t val,
-                                      struct cons_pointer less_significant,
-                                      struct cons_pointer new)
-{
+                              struct cons_pointer less_significant,
+                              struct cons_pointer new ) {
     struct cons_pointer cursor = NIL;
     __int128_t carry = 0;
 
@@ -120,12 +115,12 @@ __int128_t int128_to_integer( __int128_t val,
     } else {
         carry = val >> 60;
         debug_printf( DEBUG_ARITH,
-                     L"int128_to_integer: 64 bit overflow; setting carry to %ld\n",
-                     ( int64_t ) carry );
+                      L"int128_to_integer: 64 bit overflow; setting carry to %ld\n",
+                      ( int64_t ) carry );
         val &= MAX_INTEGER;
     }
 
-    struct cons_space_object * newc = &pointer2cell( new);
+    struct cons_space_object *newc = &pointer2cell( new );
     newc->payload.integer.value = val;
 
     if ( integerp( less_significant ) ) {
@@ -137,19 +132,21 @@ __int128_t int128_to_integer( __int128_t val,
     return carry;
 }
 
-struct cons_pointer make_integer_128(__int128_t val,
-                                     struct cons_pointer less_significant) {
+struct cons_pointer make_integer_128( __int128_t val,
+                                      struct cons_pointer less_significant ) {
     struct cons_pointer result = NIL;
 
     do {
         if ( MAX_INTEGER >= val ) {
-            result = make_integer( (long int) val, less_significant);
+            result = make_integer( ( long int ) val, less_significant );
         } else {
-            less_significant = make_integer( (long int)val & MAX_INTEGER, less_significant);
+            less_significant =
+                make_integer( ( long int ) val & MAX_INTEGER,
+                              less_significant );
             val = val >> 60;
         }
 
-    } while (nilp(result));
+    } while ( nilp( result ) );
 
     return result;
 }
@@ -164,10 +161,10 @@ struct cons_pointer add_integers( struct cons_pointer a,
     struct cons_pointer cursor = NIL;
 
     debug_print( L"add_integers: a = ", DEBUG_ARITH );
-    debug_print_object(a, DEBUG_ARITH);
+    debug_print_object( a, DEBUG_ARITH );
     debug_print( L"; b = ", DEBUG_ARITH );
-    debug_print_object(b, DEBUG_ARITH);
-    debug_println(DEBUG_ARITH);
+    debug_print_object( b, DEBUG_ARITH );
+    debug_println( DEBUG_ARITH );
 
     __int128_t carry = 0;
     bool is_first_cell = true;
@@ -194,8 +191,8 @@ struct cons_pointer add_integers( struct cons_pointer a,
             debug_print_128bit( rv, DEBUG_ARITH );
             debug_print( L"\n", DEBUG_ARITH );
 
-            struct cons_pointer new = make_integer( 0, NIL);
-            carry = int128_to_integer(rv, cursor, new);
+            struct cons_pointer new = make_integer( 0, NIL );
+            carry = int128_to_integer( rv, cursor, new );
             cursor = new;
 
             if ( nilp( result ) ) {
@@ -215,14 +212,14 @@ struct cons_pointer add_integers( struct cons_pointer a,
     return result;
 }
 
-struct cons_pointer base_partial(int depth) {
-  struct cons_pointer result = NIL;
+struct cons_pointer base_partial( int depth ) {
+    struct cons_pointer result = NIL;
 
-  for (int i = 0; i < depth; i++) {
-    result = make_integer(0, result);
-  }
+    for ( int i = 0; i < depth; i++ ) {
+        result = make_integer( 0, result );
+    }
 
-  return result;
+    return result;
 }
 
 /**
@@ -236,69 +233,70 @@ struct cons_pointer base_partial(int depth) {
 struct cons_pointer multiply_integers( struct cons_pointer a,
                                        struct cons_pointer b ) {
     struct cons_pointer result = NIL;
-    bool neg = is_negative(a) != is_negative(b);
+    bool neg = is_negative( a ) != is_negative( b );
     bool is_first_b = true;
     int oom = -1;
 
     debug_print( L"multiply_integers: a = ", DEBUG_ARITH );
-    debug_print_object(a, DEBUG_ARITH);
+    debug_print_object( a, DEBUG_ARITH );
     debug_print( L"; b = ", DEBUG_ARITH );
-    debug_print_object(b, DEBUG_ARITH);
-    debug_println(DEBUG_ARITH);
+    debug_print_object( b, DEBUG_ARITH );
+    debug_println( DEBUG_ARITH );
 
     if ( integerp( a ) && integerp( b ) ) {
         while ( !nilp( b ) ) {
-          bool is_first_d = true;
-          struct cons_pointer d = a;
-          struct cons_pointer partial = base_partial(++oom);
-          __int128_t carry = 0;
+            bool is_first_d = true;
+            struct cons_pointer d = a;
+            struct cons_pointer partial = base_partial( ++oom );
+            __int128_t carry = 0;
 
-          while ( !nilp(d) || carry != 0) {
-            partial = make_integer(0, partial);
-            struct cons_pointer new = NIL;
-            __int128_t dv = cell_value( d, '+', is_first_d );
-            __int128_t bv = cell_value( b, '+', is_first_b );
+            while ( !nilp( d ) || carry != 0 ) {
+                partial = make_integer( 0, partial );
+                struct cons_pointer new = NIL;
+                __int128_t dv = cell_value( d, '+', is_first_d );
+                __int128_t bv = cell_value( b, '+', is_first_b );
 
-            __int128_t rv = (dv * bv) + carry;
+                __int128_t rv = ( dv * bv ) + carry;
 
-            debug_print( L"multiply_integers: d = ", DEBUG_ARITH);
-            debug_print_object( d, DEBUG_ARITH);
-            debug_print( L"; dv = ", DEBUG_ARITH );
-            debug_print_128bit( dv, DEBUG_ARITH );
-            debug_print( L"; bv = ", DEBUG_ARITH );
-            debug_print_128bit( bv, DEBUG_ARITH );
-            debug_print( L"; carry = ", DEBUG_ARITH );
-            debug_print_128bit( carry, DEBUG_ARITH );
-            debug_print( L"; rv = ", DEBUG_ARITH );
-            debug_print_128bit( rv, DEBUG_ARITH );
-            debug_print( L"; acc = ", DEBUG_ARITH );
-            debug_print_object( result, DEBUG_ARITH);
-            debug_print( L"; partial = ", DEBUG_ARITH );
-            debug_print_object( partial, DEBUG_ARITH);
-            debug_print( L"\n", DEBUG_ARITH );
+                debug_print( L"multiply_integers: d = ", DEBUG_ARITH );
+                debug_print_object( d, DEBUG_ARITH );
+                debug_print( L"; dv = ", DEBUG_ARITH );
+                debug_print_128bit( dv, DEBUG_ARITH );
+                debug_print( L"; bv = ", DEBUG_ARITH );
+                debug_print_128bit( bv, DEBUG_ARITH );
+                debug_print( L"; carry = ", DEBUG_ARITH );
+                debug_print_128bit( carry, DEBUG_ARITH );
+                debug_print( L"; rv = ", DEBUG_ARITH );
+                debug_print_128bit( rv, DEBUG_ARITH );
+                debug_print( L"; acc = ", DEBUG_ARITH );
+                debug_print_object( result, DEBUG_ARITH );
+                debug_print( L"; partial = ", DEBUG_ARITH );
+                debug_print_object( partial, DEBUG_ARITH );
+                debug_print( L"\n", DEBUG_ARITH );
 
-            new = make_integer_128(rv, base_partial(oom));
+                new = make_integer_128( rv, base_partial( oom ) );
 
-            if ( zerop(partial)) {
-              partial = new;
-            } else {
-              partial = add_integers(partial, new);
+                if ( zerop( partial ) ) {
+                    partial = new;
+                } else {
+                    partial = add_integers( partial, new );
+                }
+
+                d = integerp( d ) ? pointer2cell( d ).payload.integer.
+                    more : NIL;
+                is_first_d = false;
             }
 
-            d = integerp(d) ? pointer2cell( d ).payload.integer.more : NIL;
-            is_first_d = false;
-          }
-
-          if (nilp(result) || zerop(result)) {
-            result = partial;
-          } else {
-            struct cons_pointer old = result;
-            result = add_integers(partial, result);
-            //if (!eq(result, old)) dec_ref(old);
-            //if (!eq(result, partial)) dec_ref(partial);
-          }
-          b = pointer2cell( b ).payload.integer.more;
-          is_first_b = false;
+            if ( nilp( result ) || zerop( result ) ) {
+                result = partial;
+            } else {
+                struct cons_pointer old = result;
+                result = add_integers( partial, result );
+                //if (!eq(result, old)) dec_ref(old);
+                //if (!eq(result, partial)) dec_ref(partial);
+            }
+            b = pointer2cell( b ).payload.integer.more;
+            is_first_b = false;
         }
     }
 
@@ -365,8 +363,8 @@ struct cons_pointer integer_to_string( struct cons_pointer int_pointer,
                               L"integer_to_string: digit is %ld, hexadecimal is %c, accumulator is: ",
                               offset, hex_digits[offset] );
                 debug_print_128bit( accumulator, DEBUG_IO );
-                debug_print( L"; result is: ", DEBUG_IO);
-                debug_print_object( result, DEBUG_IO);
+                debug_print( L"; result is: ", DEBUG_IO );
+                debug_print_object( result, DEBUG_IO );
                 debug_println( DEBUG_IO );
 
                 result =
diff --git a/src/init.c b/src/init.c
index 1fba3f2..c180b10 100644
--- a/src/init.c
+++ b/src/init.c
@@ -87,7 +87,7 @@ int main( int argc, char *argv[] ) {
     bool show_prompt = false;
 
     setlocale( LC_ALL, "" );
-    curl_global_init(CURL_GLOBAL_DEFAULT);
+    curl_global_init( CURL_GLOBAL_DEFAULT );
 
     while ( ( option = getopt( argc, argv, "cpdv:" ) ) != -1 ) {
         switch ( option ) {
diff --git a/src/io/fopen.c b/src/io/fopen.c
index a2eddab..3c26cd9 100644
--- a/src/io/fopen.c
+++ b/src/io/fopen.c
@@ -53,6 +53,8 @@
 /* we use a global one for convenience */
 static CURLM *multi_handle;
 
+wint_t ungotten = 0;
+
 /* curl calls this routine to get more data */
 static size_t write_callback( char *buffer,
                               size_t size, size_t nitems, void *userp ) {
@@ -452,27 +454,69 @@ URL_FILE *file_to_url_file( FILE * f ) {
 wint_t url_fgetwc( URL_FILE * input ) {
     wint_t result = -1;
 
-    switch ( input->type ) {
-        case CFTYPE_FILE:
-            fwide( input->handle.file, 1 ); /* wide characters */
-            result = fgetwc( input->handle.file );  /* passthrough */
-            break;
+    debug_printf( DEBUG_IO, L"url_fgetwc: ungotten = %d\n", ungotten );
 
-        case CFTYPE_CURL:{
-                wchar_t *wbuff = calloc( 2, sizeof( wchar_t ) );
+    if ( ungotten != 0 ) {
+        /* TODO: not thread safe */
+        result = ungotten;
+        ungotten = 0;
+    } else {
+        switch ( input->type ) {
+            case CFTYPE_FILE:
+                fwide( input->handle.file, 1 ); /* wide characters */
+                result = fgetwc( input->handle.file );  /* passthrough */
+                break;
 
-                mbstowcs( wbuff, (char *)&input->buffer[input->buffer_pos], 1 );
-                result = wbuff[0];
-                use_one_wide( input );
+            case CFTYPE_CURL:{
+                    debug_print( L"url_fgetwc: stream is URL\n", DEBUG_IO );
 
-                free( wbuff );
-            }
-            break;
-        case CFTYPE_NONE:
-            break;
+                    char *cbuff =
+                        calloc( sizeof( wchar_t ) + 1, sizeof( char ) );
+                    wchar_t *wbuff = calloc( 2, sizeof( wchar_t ) );
+
+                    size_t count = 0;
+
+                    debug_print( L"url_fgetwc: about to call url_fgets\n", DEBUG_IO );
+                    url_fgets( cbuff, 1, input );
+                    debug_print( L"url_fgetwc: back from url_fgets\n", DEBUG_IO );
+                    int c = ( int ) cbuff[0];
+    debug_printf( DEBUG_IO, L"url_fgetwc: (first) character = %d (%c)\n", c, c & 0xf7 );
+                    /* The value of each individual byte indicates its UTF-8 function, as follows:
+                     *
+                     * 00 to 7F hex (0 to 127): first and only byte of a sequence.
+                     * 80 to BF hex (128 to 191): continuing byte in a multi-byte sequence.
+                     * C2 to DF hex (194 to 223): first byte of a two-byte sequence.
+                     * E0 to EF hex (224 to 239): first byte of a three-byte sequence.
+                     * F0 to FF hex (240 to 255): first byte of a four-byte sequence.
+                     */
+                    if ( c <= 0x07 ) {
+                        count = 1;
+                    } else if ( c >= '0xc2' && c <= '0xdf' ) {
+                        count = 2;
+                    } else if ( c >= '0xe0' && c <= '0xef' ) {
+                        count = 3;
+                    } else if ( c >= '0xf0' && c <= '0xff' ) {
+                        count = 4;
+                    }
+
+                    if ( count > 1 ) {
+                        url_fgets( cbuff, --count, input );
+                    }
+                    mbstowcs( wbuff, cbuff, 1 );  //(char *)(&input->buffer[input->buffer_pos]), 1 );
+                    result = wbuff[0];
+                    use_one_wide( input );
+
+                    free( wbuff );
+                    free( cbuff );
+                }
+                break;
+            case CFTYPE_NONE:
+                break;
+        }
     }
 
-    debug_printf( DEBUG_IO, L"url_fgetwc returning %d (%C)\n", result, result);
+    debug_printf( DEBUG_IO, L"url_fgetwc returning %d (%C)\n", result,
+                  result );
     return result;
 }
 
@@ -482,22 +526,23 @@ wint_t url_ungetwc( wint_t wc, URL_FILE * input ) {
     switch ( input->type ) {
         case CFTYPE_FILE:
             fwide( input->handle.file, 1 ); /* wide characters */
-            result = ungetwc( wc, input->handle.file );  /* passthrough */
+            result = ungetwc( wc, input->handle.file ); /* passthrough */
             break;
 
         case CFTYPE_CURL:{
-                wchar_t *wbuff = calloc( 2, sizeof( wchar_t ) );
-                char *cbuff = calloc( 5, sizeof( char ) );
-
-                wbuff[0] = wc;
-                result = wcstombs( cbuff, wbuff, 1 );
-
-                input->buffer_pos -= strlen( cbuff );
-
-                free( cbuff );
-                free( wbuff );
-
-                result = result > 0 ? wc : result;
+                ungotten = wc;
+//                wchar_t *wbuff = calloc( 2, sizeof( wchar_t ) );
+//                char *cbuff = calloc( 5, sizeof( char ) );
+//
+//                wbuff[0] = wc;
+//                result = wcstombs( cbuff, wbuff, 1 );
+//
+//                input->buffer_pos -= strlen( cbuff );
+//
+//                free( cbuff );
+//                free( wbuff );
+//
+//                result = result > 0 ? wc : result;
                 break;
         case CFTYPE_NONE:
                 break;
diff --git a/src/io/io.c b/src/io/io.c
index e510580..4577a11 100644
--- a/src/io/io.c
+++ b/src/io/io.c
@@ -31,7 +31,7 @@ char *lisp_string_to_c_string( struct cons_pointer s ) {
         int len = 0;
 
         for ( struct cons_pointer c = s; !nilp( c );
-            c = pointer2cell( c ).payload.string.cdr ) {
+              c = pointer2cell( c ).payload.string.cdr ) {
             len++;
         }
 
@@ -49,9 +49,9 @@ char *lisp_string_to_c_string( struct cons_pointer s ) {
         free( buffer );
     }
 
-    debug_print(L"lisp_string_to_c_string( ", DEBUG_IO);
-    debug_print_object( s, DEBUG_IO);
-    debug_printf( DEBUG_IO, L") => '%s'\n", result);
+    debug_print( L"lisp_string_to_c_string( ", DEBUG_IO );
+    debug_print_object( s, DEBUG_IO );
+    debug_printf( DEBUG_IO, L") => '%s'\n", result );
 
     return result;
 }
@@ -115,7 +115,7 @@ lisp_open( struct stack_frame *frame, struct cons_pointer frame_pointer,
 
         free( url );
 
-        if ( pointer2cell(result).payload.stream.stream == NULL) {
+        if ( pointer2cell( result ).payload.stream.stream == NULL ) {
             result = NIL;
         }
     }
@@ -169,19 +169,19 @@ lisp_slurp( struct stack_frame *frame, struct cons_pointer frame_pointer,
 
     if ( readp( frame->arg[0] ) ) {
         URL_FILE *stream = pointer2cell( frame->arg[0] ).payload.stream.stream;
-        struct cons_pointer cursor = make_string( url_fgetwc( stream ), NIL);
+        struct cons_pointer cursor = make_string( url_fgetwc( stream ), NIL );
         result = cursor;
 
-        for ( wint_t c = url_fgetwc( stream ); !url_feof(stream);
+        for ( wint_t c = url_fgetwc( stream ); !url_feof( stream );
               c = url_fgetwc( stream ) ) {
-            debug_print(L"slurp: cursor is: ", DEBUG_IO);
-            debug_dump_object( cursor, DEBUG_IO);
-            debug_print(L"; result is: ", DEBUG_IO);
-            debug_dump_object( result, DEBUG_IO);
-            debug_println( DEBUG_IO);
+            debug_print( L"slurp: cursor is: ", DEBUG_IO );
+            debug_dump_object( cursor, DEBUG_IO );
+            debug_print( L"; result is: ", DEBUG_IO );
+            debug_dump_object( result, DEBUG_IO );
+            debug_println( DEBUG_IO );
 
-            struct cons_space_object * cell = &pointer2cell(cursor);
-            cursor = make_string( ( wchar_t ) c , NIL);
+            struct cons_space_object *cell = &pointer2cell( cursor );
+            cursor = make_string( ( wchar_t ) c, NIL );
             cell->payload.string.cdr = cursor;
         }
     }

From a640c9dff9c076190a7e83cea9ecb84aba35aaa5 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Mon, 28 Jan 2019 18:46:24 +0000
Subject: [PATCH 09/31] It works!

---
 .gitignore            |   2 +
 lisp/slurp.lisp       |   1 +
 src/debug.c           |   2 +-
 src/io/fopen.c        | 855 +++++++++++++++++++++---------------------
 src/io/fopen.h        |   4 -
 src/io/io.c           | 131 ++++++-
 src/io/io.h           |   4 +
 src/memory/conspage.c |   4 +
 src/ops/lispops.c     |   2 +-
 src/ops/read.c        |   1 +
 10 files changed, 568 insertions(+), 438 deletions(-)
 create mode 100644 lisp/slurp.lisp

diff --git a/.gitignore b/.gitignore
index 6fa1cd9..ec1281e 100644
--- a/.gitignore
+++ b/.gitignore
@@ -34,3 +34,5 @@ utils_src/readprintwc/out
 *.dump
 
 *.bak
+
+src/io/fopen
diff --git a/lisp/slurp.lisp b/lisp/slurp.lisp
new file mode 100644
index 0000000..e927bcb
--- /dev/null
+++ b/lisp/slurp.lisp
@@ -0,0 +1 @@
+(slurp (set! f (open "http://www.journeyman.cc/")))
diff --git a/src/debug.c b/src/debug.c
index 14881f9..c8b9771 100644
--- a/src/debug.c
+++ b/src/debug.c
@@ -19,9 +19,9 @@
 #include <wctype.h>
 
 #include "consspaceobject.h"
-#include "fopen.h"
 #include "debug.h"
 #include "dump.h"
+#include "io.h"
 #include "print.h"
 
 /**
diff --git a/src/io/fopen.c b/src/io/fopen.c
index 3c26cd9..f0ea012 100644
--- a/src/io/fopen.c
+++ b/src/io/fopen.c
@@ -37,517 +37,510 @@
  * This example requires libcurl 7.9.7 or later.
  */
 
-#include <errno.h>
 #include <stdio.h>
-#include <stdlib.h>
 #include <string.h>
 #ifndef WIN32
 #include <sys/time.h>
 #endif
+#include <stdlib.h>
+#include <errno.h>
 
 #include <curl/curl.h>
 
-#include "debug.h"
-#include "fopen.h"
+enum fcurl_type_e {
+  CFTYPE_NONE = 0,
+  CFTYPE_FILE = 1,
+  CFTYPE_CURL = 2
+};
+
+struct fcurl_data
+{
+  enum fcurl_type_e type;     /* type of handle */
+  union {
+    CURL *curl;
+    FILE *file;
+  } handle;                   /* handle */
+
+  char *buffer;               /* buffer to store cached data*/
+  size_t buffer_len;          /* currently allocated buffers length */
+  size_t buffer_pos;          /* end of data in buffer*/
+  int still_running;          /* Is background url fetch still in progress */
+};
+
+typedef struct fcurl_data URL_FILE;
+
+/* exported functions */
+URL_FILE *url_fopen(const char *url, const char *operation);
+int url_fclose(URL_FILE *file);
+int url_feof(URL_FILE *file);
+size_t url_fread(void *ptr, size_t size, size_t nmemb, URL_FILE *file);
+char *url_fgets(char *ptr, size_t size, URL_FILE *file);
+void url_rewind(URL_FILE *file);
 
 /* we use a global one for convenience */
 static CURLM *multi_handle;
 
-wint_t ungotten = 0;
-
 /* curl calls this routine to get more data */
-static size_t write_callback( char *buffer,
-                              size_t size, size_t nitems, void *userp ) {
-    char *newbuff;
-    size_t rembuff;
+static size_t write_callback(char *buffer,
+                             size_t size,
+                             size_t nitems,
+                             void *userp)
+{
+  char *newbuff;
+  size_t rembuff;
 
-    URL_FILE *url = ( URL_FILE * ) userp;
-    size *= nitems;
+  URL_FILE *url = (URL_FILE *)userp;
+  size *= nitems;
 
-    rembuff = url->buffer_len - url->buffer_pos;  /* remaining space in buffer */
+  rembuff = url->buffer_len - url->buffer_pos; /* remaining space in buffer */
 
-    if ( size > rembuff ) {
-        /* not enough space in buffer */
-        newbuff = realloc( url->buffer, url->buffer_len + ( size - rembuff ) );
-        if ( newbuff == NULL ) {
-            fprintf( stderr, "callback buffer grow failed\n" );
-            size = rembuff;
-        } else {
-            /* realloc succeeded increase buffer size */
-            url->buffer_len += size - rembuff;
-            url->buffer = newbuff;
-        }
+  if(size > rembuff) {
+    /* not enough space in buffer */
+    newbuff = realloc(url->buffer, url->buffer_len + (size - rembuff));
+    if(newbuff == NULL) {
+      fprintf(stderr, "callback buffer grow failed\n");
+      size = rembuff;
     }
+    else {
+      /* realloc succeeded increase buffer size*/
+      url->buffer_len += size - rembuff;
+      url->buffer = newbuff;
+    }
+  }
 
-    memcpy( &url->buffer[url->buffer_pos], buffer, size );
-    url->buffer_pos += size;
+  memcpy(&url->buffer[url->buffer_pos], buffer, size);
+  url->buffer_pos += size;
 
-    return size;
+  return size;
 }
 
 /* use to attempt to fill the read buffer up to requested number of bytes */
-static int fill_buffer( URL_FILE * file, size_t want ) {
-    fd_set fdread;
-    fd_set fdwrite;
-    fd_set fdexcep;
-    struct timeval timeout;
-    int rc;
-    CURLMcode mc;               /* curl_multi_fdset() return code */
+static int fill_buffer(URL_FILE *file, size_t want)
+{
+  fd_set fdread;
+  fd_set fdwrite;
+  fd_set fdexcep;
+  struct timeval timeout;
+  int rc;
+  CURLMcode mc; /* curl_multi_fdset() return code */
 
-    /* only attempt to fill buffer if transactions still running and buffer
-     * doesn't exceed required size already
-     */
-    if ( ( !file->still_running ) || ( file->buffer_pos > want ) )
-        return 0;
+  /* only attempt to fill buffer if transactions still running and buffer
+   * doesn't exceed required size already
+   */
+  if((!file->still_running) || (file->buffer_pos > want))
+    return 0;
 
-    /* attempt to fill buffer */
-    do {
-        int maxfd = -1;
-        long curl_timeo = -1;
+  /* attempt to fill buffer */
+  do {
+    int maxfd = -1;
+    long curl_timeo = -1;
 
-        FD_ZERO( &fdread );
-        FD_ZERO( &fdwrite );
-        FD_ZERO( &fdexcep );
+    FD_ZERO(&fdread);
+    FD_ZERO(&fdwrite);
+    FD_ZERO(&fdexcep);
 
-        /* set a suitable timeout to fail on */
-        timeout.tv_sec = 60;    /* 1 minute */
-        timeout.tv_usec = 0;
+    /* set a suitable timeout to fail on */
+    timeout.tv_sec = 60; /* 1 minute */
+    timeout.tv_usec = 0;
 
-        curl_multi_timeout( multi_handle, &curl_timeo );
-        if ( curl_timeo >= 0 ) {
-            timeout.tv_sec = curl_timeo / 1000;
-            if ( timeout.tv_sec > 1 )
-                timeout.tv_sec = 1;
-            else
-                timeout.tv_usec = ( curl_timeo % 1000 ) * 1000;
-        }
+    curl_multi_timeout(multi_handle, &curl_timeo);
+    if(curl_timeo >= 0) {
+      timeout.tv_sec = curl_timeo / 1000;
+      if(timeout.tv_sec > 1)
+        timeout.tv_sec = 1;
+      else
+        timeout.tv_usec = (curl_timeo % 1000) * 1000;
+    }
 
-        /* get file descriptors from the transfers */
-        mc = curl_multi_fdset( multi_handle, &fdread, &fdwrite, &fdexcep,
-                               &maxfd );
+    /* get file descriptors from the transfers */
+    mc = curl_multi_fdset(multi_handle, &fdread, &fdwrite, &fdexcep, &maxfd);
 
-        if ( mc != CURLM_OK ) {
-            fprintf( stderr, "curl_multi_fdset() failed, code %d.\n", mc );
-            break;
-        }
+    if(mc != CURLM_OK) {
+      fprintf(stderr, "curl_multi_fdset() failed, code %d.\n", mc);
+      break;
+    }
 
-        /* On success the value of maxfd is guaranteed to be >= -1. We call
-           select(maxfd + 1, ...); specially in case of (maxfd == -1) there are
-           no fds ready yet so we call select(0, ...) --or Sleep() on Windows--
-           to sleep 100ms, which is the minimum suggested value in the
-           curl_multi_fdset() doc. */
+    /* On success the value of maxfd is guaranteed to be >= -1. We call
+       select(maxfd + 1, ...); specially in case of (maxfd == -1) there are
+       no fds ready yet so we call select(0, ...) --or Sleep() on Windows--
+       to sleep 100ms, which is the minimum suggested value in the
+       curl_multi_fdset() doc. */
 
-        if ( maxfd == -1 ) {
+    if(maxfd == -1) {
 #ifdef _WIN32
-            Sleep( 100 );
-            rc = 0;
+      Sleep(100);
+      rc = 0;
 #else
-            /* Portable sleep for platforms other than Windows. */
-            struct timeval wait = { 0, 100 * 1000 };  /* 100ms */
-            rc = select( 0, NULL, NULL, NULL, &wait );
+      /* Portable sleep for platforms other than Windows. */
+      struct timeval wait = { 0, 100 * 1000 }; /* 100ms */
+      rc = select(0, NULL, NULL, NULL, &wait);
 #endif
-        } else {
-            /* Note that on some platforms 'timeout' may be modified by select().
-               If you need access to the original value save a copy beforehand. */
-            rc = select( maxfd + 1, &fdread, &fdwrite, &fdexcep, &timeout );
-        }
+    }
+    else {
+      /* Note that on some platforms 'timeout' may be modified by select().
+         If you need access to the original value save a copy beforehand. */
+      rc = select(maxfd + 1, &fdread, &fdwrite, &fdexcep, &timeout);
+    }
 
-        switch ( rc ) {
-            case -1:
-                /* select error */
-                break;
+    switch(rc) {
+    case -1:
+      /* select error */
+      break;
 
-            case 0:
-            default:
-                /* timeout or readable/writable sockets */
-                curl_multi_perform( multi_handle, &file->still_running );
-                break;
-        }
-    } while ( file->still_running && ( file->buffer_pos < want ) );
-
-    return 1;
+    case 0:
+    default:
+      /* timeout or readable/writable sockets */
+      curl_multi_perform(multi_handle, &file->still_running);
+      break;
+    }
+  } while(file->still_running && (file->buffer_pos < want));
+  return 1;
 }
 
 /* use to remove want bytes from the front of a files buffer */
-static int use_buffer( URL_FILE * file, size_t want ) {
-    /* sort out buffer */
-    if ( ( file->buffer_pos - want ) <= 0 ) {
-        /* ditch buffer - write will recreate */
-        free( file->buffer );
-        file->buffer = NULL;
-        file->buffer_pos = 0;
-        file->buffer_len = 0;
-    } else {
-        /* move rest down make it available for later */
-        memmove( file->buffer,
-                 &file->buffer[want], ( file->buffer_pos - want ) );
+static int use_buffer(URL_FILE *file, size_t want)
+{
+  /* sort out buffer */
+  if((file->buffer_pos - want) <= 0) {
+    /* ditch buffer - write will recreate */
+    free(file->buffer);
+    file->buffer = NULL;
+    file->buffer_pos = 0;
+    file->buffer_len = 0;
+  }
+  else {
+    /* move rest down make it available for later */
+    memmove(file->buffer,
+            &file->buffer[want],
+            (file->buffer_pos - want));
 
-        file->buffer_pos -= want;
-    }
-    return 0;
+    file->buffer_pos -= want;
+  }
+  return 0;
 }
 
-/**
- * consume one wide character on the buffer of this file.
- *
- * @param file the url or file from which the character is consumed.
- */
-static int use_one_wide( URL_FILE * file ) {
-    int c = ( int ) file->buffer[file->buffer_pos];
-    size_t count = 0;
+URL_FILE *url_fopen(const char *url, const char *operation)
+{
+  /* this code could check for URLs or types in the 'url' and
+     basically use the real fopen() for standard files */
 
-    /* The value of each individual byte indicates its UTF-8 function, as follows:
-     *
-     * 00 to 7F hex (0 to 127): first and only byte of a sequence.
-     * 80 to BF hex (128 to 191): continuing byte in a multi-byte sequence.
-     * C2 to DF hex (194 to 223): first byte of a two-byte sequence.
-     * E0 to EF hex (224 to 239): first byte of a three-byte sequence.
-     * F0 to FF hex (240 to 255): first byte of a four-byte sequence.
-     */
-    if ( c <= '0x07' ) {
-        count = 1;
-    } else if ( c >= '0xc2' && c <= '0xdf' ) {
-        count = 2;
-    } else if ( c >= '0xe0' && c <= '0xef' ) {
-        count = 3;
-    } else if ( c >= '0xf0' && c <= '0xff' ) {
-        count = 4;
+  URL_FILE *file;
+  (void)operation;
+
+  file = calloc(1, sizeof(URL_FILE));
+  if(!file)
+    return NULL;
+
+  file->handle.file = fopen(url, operation);
+  if(file->handle.file)
+    file->type = CFTYPE_FILE; /* marked as URL */
+
+  else {
+    file->type = CFTYPE_CURL; /* marked as URL */
+    file->handle.curl = curl_easy_init();
+
+    curl_easy_setopt(file->handle.curl, CURLOPT_URL, url);
+    curl_easy_setopt(file->handle.curl, CURLOPT_WRITEDATA, file);
+    curl_easy_setopt(file->handle.curl, CURLOPT_VERBOSE, 0L);
+    curl_easy_setopt(file->handle.curl, CURLOPT_WRITEFUNCTION, write_callback);
+
+    if(!multi_handle)
+      multi_handle = curl_multi_init();
+
+    curl_multi_add_handle(multi_handle, file->handle.curl);
+
+    /* lets start the fetch */
+    curl_multi_perform(multi_handle, &file->still_running);
+
+    if((file->buffer_pos == 0) && (!file->still_running)) {
+      /* if still_running is 0 now, we should return NULL */
+
+      /* make sure the easy handle is not in the multi handle anymore */
+      curl_multi_remove_handle(multi_handle, file->handle.curl);
+
+      /* cleanup */
+      curl_easy_cleanup(file->handle.curl);
+
+      free(file);
+
+      file = NULL;
     }
-
-    return use_buffer( file, c );
+  }
+  return file;
 }
 
-URL_FILE *url_fopen( const char *url, const char *operation ) {
-    /* this code could check for URLs or types in the 'url' and
-       basically use the real fopen() for standard files */
+int url_fclose(URL_FILE *file)
+{
+  int ret = 0;/* default is good return */
 
-    URL_FILE *file;
-    ( void ) operation;
+  switch(file->type) {
+  case CFTYPE_FILE:
+    ret = fclose(file->handle.file); /* passthrough */
+    break;
 
-    file = calloc( 1, sizeof( URL_FILE ) );
-    if ( !file )
-        return NULL;
+  case CFTYPE_CURL:
+    /* make sure the easy handle is not in the multi handle anymore */
+    curl_multi_remove_handle(multi_handle, file->handle.curl);
 
-    file->handle.file = fopen( url, operation );
-    if ( file->handle.file )
-        file->type = CFTYPE_FILE; /* marked as URL */
+    /* cleanup */
+    curl_easy_cleanup(file->handle.curl);
+    break;
 
-    else {
-        file->type = CFTYPE_CURL; /* marked as URL */
-        file->handle.curl = curl_easy_init(  );
+  default: /* unknown or supported type - oh dear */
+    ret = EOF;
+    errno = EBADF;
+    break;
+  }
 
-        curl_easy_setopt( file->handle.curl, CURLOPT_URL, url );
-        curl_easy_setopt( file->handle.curl, CURLOPT_WRITEDATA, file );
-        curl_easy_setopt( file->handle.curl, CURLOPT_VERBOSE, 0L );
-        curl_easy_setopt( file->handle.curl, CURLOPT_WRITEFUNCTION,
-                          write_callback );
+  free(file->buffer);/* free any allocated buffer space */
+  free(file);
 
-        if ( !multi_handle )
-            multi_handle = curl_multi_init(  );
-
-        curl_multi_add_handle( multi_handle, file->handle.curl );
-
-        /* lets start the fetch */
-        curl_multi_perform( multi_handle, &file->still_running );
-
-        if ( ( file->buffer_pos == 0 ) && ( !file->still_running ) ) {
-            /* if still_running is 0 now, we should return NULL */
-
-            /* make sure the easy handle is not in the multi handle anymore */
-            curl_multi_remove_handle( multi_handle, file->handle.curl );
-
-            /* cleanup */
-            curl_easy_cleanup( file->handle.curl );
-
-            free( file );
-
-            file = NULL;
-        }
-    }
-    return file;
+  return ret;
 }
 
-int url_fclose( URL_FILE * file ) {
-    int ret = 0;                /* default is good return */
+int url_feof(URL_FILE *file)
+{
+  int ret = 0;
 
-    switch ( file->type ) {
-        case CFTYPE_FILE:
-            ret = fclose( file->handle.file );  /* passthrough */
-            break;
+  switch(file->type) {
+  case CFTYPE_FILE:
+    ret = feof(file->handle.file);
+    break;
 
-        case CFTYPE_CURL:
-            /* make sure the easy handle is not in the multi handle anymore */
-            curl_multi_remove_handle( multi_handle, file->handle.curl );
+  case CFTYPE_CURL:
+    if((file->buffer_pos == 0) && (!file->still_running))
+      ret = 1;
+    break;
 
-            /* cleanup */
-            curl_easy_cleanup( file->handle.curl );
-            break;
-
-        default:               /* unknown or supported type - oh dear */
-            ret = EOF;
-            errno = EBADF;
-            break;
-    }
-
-    free( file->buffer );       /* free any allocated buffer space */
-    free( file );
-
-    return ret;
+  default: /* unknown or supported type - oh dear */
+    ret = -1;
+    errno = EBADF;
+    break;
+  }
+  return ret;
 }
 
-int url_feof( URL_FILE * file ) {
-    int ret = 0;
+size_t url_fread(void *ptr, size_t size, size_t nmemb, URL_FILE *file)
+{
+  size_t want;
 
-    switch ( file->type ) {
-        case CFTYPE_FILE:
-            ret = feof( file->handle.file );
-            break;
+  switch(file->type) {
+  case CFTYPE_FILE:
+    want = fread(ptr, size, nmemb, file->handle.file);
+    break;
 
-        case CFTYPE_CURL:
-            if ( ( file->buffer_pos == 0 ) && ( !file->still_running ) )
-                ret = 1;
-            break;
+  case CFTYPE_CURL:
+    want = nmemb * size;
 
-        default:               /* unknown or supported type - oh dear */
-            ret = -1;
-            errno = EBADF;
-            break;
-    }
-    return ret;
+    fill_buffer(file, want);
+
+    /* check if there's data in the buffer - if not fill_buffer()
+     * either errored or EOF */
+    if(!file->buffer_pos)
+      return 0;
+
+    /* ensure only available data is considered */
+    if(file->buffer_pos < want)
+      want = file->buffer_pos;
+
+    /* xfer data to caller */
+    memcpy(ptr, file->buffer, want);
+
+    use_buffer(file, want);
+
+    want = want / size;     /* number of items */
+    break;
+
+  default: /* unknown or supported type - oh dear */
+    want = 0;
+    errno = EBADF;
+    break;
+
+  }
+  return want;
 }
 
-size_t url_fread( void *ptr, size_t size, size_t nmemb, URL_FILE * file ) {
-    size_t want;
+char *url_fgets(char *ptr, size_t size, URL_FILE *file)
+{
+  size_t want = size - 1;/* always need to leave room for zero termination */
+  size_t loop;
 
-    switch ( file->type ) {
-        case CFTYPE_FILE:
-            want = fread( ptr, size, nmemb, file->handle.file );
-            break;
+  switch(file->type) {
+  case CFTYPE_FILE:
+    ptr = fgets(ptr, (int)size, file->handle.file);
+    break;
 
-        case CFTYPE_CURL:
-            want = nmemb * size;
+  case CFTYPE_CURL:
+    fill_buffer(file, want);
 
-            fill_buffer( file, want );
+    /* check if there's data in the buffer - if not fill either errored or
+     * EOF */
+    if(!file->buffer_pos)
+      return NULL;
 
-            /* check if there's data in the buffer - if not fill_buffer()
-             * either errored or EOF */
-            if ( !file->buffer_pos )
-                return 0;
+    /* ensure only available data is considered */
+    if(file->buffer_pos < want)
+      want = file->buffer_pos;
 
-            /* ensure only available data is considered */
-            if ( file->buffer_pos < want )
-                want = file->buffer_pos;
-
-            /* xfer data to caller */
-            memcpy( ptr, file->buffer, want );
-
-            use_buffer( file, want );
-
-            want = want / size; /* number of items */
-            break;
-
-        default:               /* unknown or supported type - oh dear */
-            want = 0;
-            errno = EBADF;
-            break;
-
-    }
-    return want;
-}
-
-char *url_fgets( char *ptr, size_t size, URL_FILE * file ) {
-    size_t want = size - 1;     /* always need to leave room for zero termination */
-    size_t loop;
-
-    switch ( file->type ) {
-        case CFTYPE_FILE:
-            ptr = fgets( ptr, ( int ) size, file->handle.file );
-            break;
-
-        case CFTYPE_CURL:
-            fill_buffer( file, want );
-
-            /* check if there's data in the buffer - if not fill either errored or
-             * EOF */
-            if ( !file->buffer_pos )
-                return NULL;
-
-            /* ensure only available data is considered */
-            if ( file->buffer_pos < want )
-                want = file->buffer_pos;
-
-            /*buffer contains data */
-            /* look for newline or eof */
-            for ( loop = 0; loop < want; loop++ ) {
-                if ( file->buffer[loop] == '\n' ) {
-                    want = loop + 1;  /* include newline */
-                    break;
-                }
-            }
-
-            /* xfer data to caller */
-            memcpy( ptr, file->buffer, want );
-            ptr[want] = 0;      /* always null terminate */
-
-            use_buffer( file, want );
-
-            break;
-
-        default:               /* unknown or supported type - oh dear */
-            ptr = NULL;
-            errno = EBADF;
-            break;
+    /*buffer contains data */
+    /* look for newline or eof */
+    for(loop = 0; loop < want; loop++) {
+      if(file->buffer[loop] == '\n') {
+        want = loop + 1;/* include newline */
+        break;
+      }
     }
 
-    return ptr;                 /*success */
+    /* xfer data to caller */
+    memcpy(ptr, file->buffer, want);
+    ptr[want] = 0;/* always null terminate */
+
+    use_buffer(file, want);
+
+    break;
+
+  default: /* unknown or supported type - oh dear */
+    ptr = NULL;
+    errno = EBADF;
+    break;
+  }
+
+  return ptr;/*success */
 }
 
-void url_rewind( URL_FILE * file ) {
-    switch ( file->type ) {
-        case CFTYPE_FILE:
-            rewind( file->handle.file );  /* passthrough */
-            break;
+void url_rewind(URL_FILE *file)
+{
+  switch(file->type) {
+  case CFTYPE_FILE:
+    rewind(file->handle.file); /* passthrough */
+    break;
 
-        case CFTYPE_CURL:
-            /* halt transaction */
-            curl_multi_remove_handle( multi_handle, file->handle.curl );
+  case CFTYPE_CURL:
+    /* halt transaction */
+    curl_multi_remove_handle(multi_handle, file->handle.curl);
 
-            /* restart */
-            curl_multi_add_handle( multi_handle, file->handle.curl );
+    /* restart */
+    curl_multi_add_handle(multi_handle, file->handle.curl);
 
-            /* ditch buffer - write will recreate - resets stream pos */
-            free( file->buffer );
-            file->buffer = NULL;
-            file->buffer_pos = 0;
-            file->buffer_len = 0;
+    /* ditch buffer - write will recreate - resets stream pos*/
+    free(file->buffer);
+    file->buffer = NULL;
+    file->buffer_pos = 0;
+    file->buffer_len = 0;
 
-            break;
+    break;
 
-        default:               /* unknown or supported type - oh dear */
-            break;
-    }
+  default: /* unknown or supported type - oh dear */
+    break;
+  }
 }
 
-/**
- * given this file handle f, return a new url_file handle wrapping it.
- *
- * @param f the file to be wrapped;
- * @return the new handle, or null if no such handle could be allocated.
- */
-URL_FILE *file_to_url_file( FILE * f ) {
-    URL_FILE *result = ( URL_FILE * ) malloc( sizeof( URL_FILE ) );
+#ifdef FOPEN_STANDALONE
+#define FGETSFILE "fgets.test"
+#define FREADFILE "fread.test"
+#define REWINDFILE "rewind.test"
 
-    if ( result != NULL ) {
-        result->type = CFTYPE_FILE, result->handle.file = f;
-    }
+/* Small main program to retrieve from a url using fgets and fread saving the
+ * output to two test files (note the fgets method will corrupt binary files if
+ * they contain 0 chars */
+int main(int argc, char *argv[])
+{
+  URL_FILE *handle;
+  FILE *outf;
 
-    return result;
-}
-
-
-/**
- * get one wide character from the buffer.
- *
- * @param file the stream to read from;
- * @return the next wide character on the stream, or zero if no more.
- */
-wint_t url_fgetwc( URL_FILE * input ) {
-    wint_t result = -1;
-
-    debug_printf( DEBUG_IO, L"url_fgetwc: ungotten = %d\n", ungotten );
-
-    if ( ungotten != 0 ) {
-        /* TODO: not thread safe */
-        result = ungotten;
-        ungotten = 0;
-    } else {
-        switch ( input->type ) {
-            case CFTYPE_FILE:
-                fwide( input->handle.file, 1 ); /* wide characters */
-                result = fgetwc( input->handle.file );  /* passthrough */
-                break;
-
-            case CFTYPE_CURL:{
-                    debug_print( L"url_fgetwc: stream is URL\n", DEBUG_IO );
-
-                    char *cbuff =
-                        calloc( sizeof( wchar_t ) + 1, sizeof( char ) );
-                    wchar_t *wbuff = calloc( 2, sizeof( wchar_t ) );
-
-                    size_t count = 0;
-
-                    debug_print( L"url_fgetwc: about to call url_fgets\n", DEBUG_IO );
-                    url_fgets( cbuff, 1, input );
-                    debug_print( L"url_fgetwc: back from url_fgets\n", DEBUG_IO );
-                    int c = ( int ) cbuff[0];
-    debug_printf( DEBUG_IO, L"url_fgetwc: (first) character = %d (%c)\n", c, c & 0xf7 );
-                    /* The value of each individual byte indicates its UTF-8 function, as follows:
-                     *
-                     * 00 to 7F hex (0 to 127): first and only byte of a sequence.
-                     * 80 to BF hex (128 to 191): continuing byte in a multi-byte sequence.
-                     * C2 to DF hex (194 to 223): first byte of a two-byte sequence.
-                     * E0 to EF hex (224 to 239): first byte of a three-byte sequence.
-                     * F0 to FF hex (240 to 255): first byte of a four-byte sequence.
-                     */
-                    if ( c <= 0x07 ) {
-                        count = 1;
-                    } else if ( c >= '0xc2' && c <= '0xdf' ) {
-                        count = 2;
-                    } else if ( c >= '0xe0' && c <= '0xef' ) {
-                        count = 3;
-                    } else if ( c >= '0xf0' && c <= '0xff' ) {
-                        count = 4;
-                    }
-
-                    if ( count > 1 ) {
-                        url_fgets( cbuff, --count, input );
-                    }
-                    mbstowcs( wbuff, cbuff, 1 );  //(char *)(&input->buffer[input->buffer_pos]), 1 );
-                    result = wbuff[0];
-                    use_one_wide( input );
-
-                    free( wbuff );
-                    free( cbuff );
-                }
-                break;
-            case CFTYPE_NONE:
-                break;
-        }
-    }
-
-    debug_printf( DEBUG_IO, L"url_fgetwc returning %d (%C)\n", result,
-                  result );
-    return result;
-}
-
-wint_t url_ungetwc( wint_t wc, URL_FILE * input ) {
-    wint_t result = -1;
-
-    switch ( input->type ) {
-        case CFTYPE_FILE:
-            fwide( input->handle.file, 1 ); /* wide characters */
-            result = ungetwc( wc, input->handle.file ); /* passthrough */
-            break;
-
-        case CFTYPE_CURL:{
-                ungotten = wc;
-//                wchar_t *wbuff = calloc( 2, sizeof( wchar_t ) );
-//                char *cbuff = calloc( 5, sizeof( char ) );
-//
-//                wbuff[0] = wc;
-//                result = wcstombs( cbuff, wbuff, 1 );
-//
-//                input->buffer_pos -= strlen( cbuff );
-//
-//                free( cbuff );
-//                free( wbuff );
-//
-//                result = result > 0 ? wc : result;
-                break;
-        case CFTYPE_NONE:
-                break;
-            }
-    }
-
-    return result;
+  size_t nread;
+  char buffer[256];
+  const char *url;
+
+  CURL *curl;
+  CURLcode res;
+
+  curl_global_init(CURL_GLOBAL_DEFAULT);
+
+  curl = curl_easy_init();
+
+
+  if(argc < 2)
+    url = "http://192.168.7.3/testfile";/* default to testurl */
+  else
+    url = argv[1];/* use passed url */
+
+  /* copy from url line by line with fgets */
+  outf = fopen(FGETSFILE, "wb+");
+  if(!outf) {
+    perror("couldn't open fgets output file\n");
+    return 1;
+  }
+
+  handle = url_fopen(url, "r");
+  if(!handle) {
+    printf("couldn't url_fopen() %s\n", url);
+    fclose(outf);
+    return 2;
+  }
+
+  while(!url_feof(handle)) {
+    url_fgets(buffer, sizeof(buffer), handle);
+    fwrite(buffer, 1, strlen(buffer), outf);
+  }
+
+  url_fclose(handle);
+
+  fclose(outf);
+
+
+  /* Copy from url with fread */
+  outf = fopen(FREADFILE, "wb+");
+  if(!outf) {
+    perror("couldn't open fread output file\n");
+    return 1;
+  }
+
+  handle = url_fopen("testfile", "r");
+  if(!handle) {
+    printf("couldn't url_fopen() testfile\n");
+    fclose(outf);
+    return 2;
+  }
+
+  do {
+    nread = url_fread(buffer, 1, sizeof(buffer), handle);
+    fwrite(buffer, 1, nread, outf);
+  } while(nread);
+
+  url_fclose(handle);
+
+  fclose(outf);
+
+
+  /* Test rewind */
+  outf = fopen(REWINDFILE, "wb+");
+  if(!outf) {
+    perror("couldn't open fread output file\n");
+    return 1;
+  }
+
+  handle = url_fopen("testfile", "r");
+  if(!handle) {
+    printf("couldn't url_fopen() testfile\n");
+    fclose(outf);
+    return 2;
+  }
+
+  nread = url_fread(buffer, 1, sizeof(buffer), handle);
+  fwrite(buffer, 1, nread, outf);
+  url_rewind(handle);
+
+  buffer[0]='\n';
+  fwrite(buffer, 1, 1, outf);
+
+  nread = url_fread(buffer, 1, sizeof(buffer), handle);
+  fwrite(buffer, 1, nread, outf);
+
+  url_fclose(handle);
+
+  fclose(outf);
+
+  return 0;/* all done */
 }
+#endif
diff --git a/src/io/fopen.h b/src/io/fopen.h
index f952a65..5f87bd2 100644
--- a/src/io/fopen.h
+++ b/src/io/fopen.h
@@ -80,8 +80,4 @@ size_t url_fread( void *ptr, size_t size, size_t nmemb, URL_FILE * file );
 char *url_fgets( char *ptr, size_t size, URL_FILE * file );
 void url_rewind( URL_FILE * file );
 
-wint_t url_fgetwc( URL_FILE * file );
-wint_t url_ungetwc( wint_t wc, URL_FILE * input );
-URL_FILE *file_to_url_file( FILE * f );
-
 #endif
diff --git a/src/io/io.c b/src/io/io.c
index 4577a11..d7c2024 100644
--- a/src/io/io.c
+++ b/src/io/io.c
@@ -15,6 +15,12 @@
 #include "fopen.h"
 #include "lispops.h"
 
+/**
+ * Allow a one-character unget facility. This may not be enough - we may need
+ * to allocate a buffer.
+ */
+wint_t ungotten = 0;
+
 /**
  * Convert this lisp string-like-thing (also works for symbols, and, later
  * keywords) into a UTF-8 string. NOTE that the returned value has been
@@ -56,6 +62,129 @@ char *lisp_string_to_c_string( struct cons_pointer s ) {
     return result;
 }
 
+
+/**
+ * given this file handle f, return a new url_file handle wrapping it.
+ *
+ * @param f the file to be wrapped;
+ * @return the new handle, or null if no such handle could be allocated.
+ */
+URL_FILE *file_to_url_file( FILE * f ) {
+    URL_FILE *result = ( URL_FILE * ) malloc( sizeof( URL_FILE ) );
+
+    if ( result != NULL ) {
+        result->type = CFTYPE_FILE, result->handle.file = f;
+    }
+
+    return result;
+}
+
+
+/**
+ * get one wide character from the buffer.
+ *
+ * @param file the stream to read from;
+ * @return the next wide character on the stream, or zero if no more.
+ */
+wint_t url_fgetwc( URL_FILE * input ) {
+    wint_t result = -1;
+
+    if ( ungotten != 0 ) {
+        /* TODO: not thread safe */
+        result = ungotten;
+        ungotten = 0;
+    } else {
+        switch ( input->type ) {
+            case CFTYPE_FILE:
+                fwide( input->handle.file, 1 ); /* wide characters */
+                result = fgetwc( input->handle.file );  /* passthrough */
+                break;
+
+            case CFTYPE_CURL:{
+                    char *cbuff =
+                        calloc( sizeof( wchar_t ) + 2, sizeof( char ) );
+                    wchar_t *wbuff = calloc( 2, sizeof( wchar_t ) );
+
+                    size_t count = 0;
+
+                    debug_print( L"url_fgetwc: about to call url_fgets\n", DEBUG_IO );
+                    url_fgets( cbuff, 2, input );
+                    debug_print( L"url_fgetwc: back from url_fgets\n", DEBUG_IO );
+                    int c = ( int ) cbuff[0];
+                    debug_printf( DEBUG_IO,
+                                 L"url_fgetwc: cbuff is '%s'; (first) character = %d (%c)\n",
+                                 cbuff, c, c & 0xf7 );
+                    /* The value of each individual byte indicates its UTF-8 function, as follows:
+                     *
+                     * 00 to 7F hex (0 to 127): first and only byte of a sequence.
+                     * 80 to BF hex (128 to 191): continuing byte in a multi-byte sequence.
+                     * C2 to DF hex (194 to 223): first byte of a two-byte sequence.
+                     * E0 to EF hex (224 to 239): first byte of a three-byte sequence.
+                     * F0 to FF hex (240 to 255): first byte of a four-byte sequence.
+                     */
+                    if ( c <= 0x07 ) {
+                        count = 1;
+                    } else if ( c >= '0xc2' && c <= '0xdf' ) {
+                        count = 2;
+                    } else if ( c >= '0xe0' && c <= '0xef' ) {
+                        count = 3;
+                    } else if ( c >= '0xf0' && c <= '0xff' ) {
+                        count = 4;
+                    }
+
+                    if ( count > 1 ) {
+                        url_fgets( (char *)&cbuff[1], count, input );
+                    }
+                    mbstowcs( wbuff, cbuff, 1 );  //(char *)(&input->buffer[input->buffer_pos]), 1 );
+                    result = wbuff[0];
+
+                    free( wbuff );
+                    free( cbuff );
+                }
+                break;
+            case CFTYPE_NONE:
+                break;
+        }
+    }
+
+    debug_printf( DEBUG_IO, L"url_fgetwc returning %d (%C)\n", result,
+                  result );
+    return result;
+}
+
+wint_t url_ungetwc( wint_t wc, URL_FILE * input ) {
+    wint_t result = -1;
+
+    switch ( input->type ) {
+        case CFTYPE_FILE:
+            fwide( input->handle.file, 1 ); /* wide characters */
+            result = ungetwc( wc, input->handle.file ); /* passthrough */
+            break;
+
+        case CFTYPE_CURL:{
+                ungotten = wc;
+//                wchar_t *wbuff = calloc( 2, sizeof( wchar_t ) );
+//                char *cbuff = calloc( 5, sizeof( char ) );
+//
+//                wbuff[0] = wc;
+//                result = wcstombs( cbuff, wbuff, 1 );
+//
+//                input->buffer_pos -= strlen( cbuff );
+//
+//                free( cbuff );
+//                free( wbuff );
+//
+//                result = result > 0 ? wc : result;
+                break;
+        case CFTYPE_NONE:
+                break;
+            }
+    }
+
+    return result;
+}
+
+
 /**
  * Function, sort-of: close the file indicated by my first arg, and return
  * nil. If the first arg is not a stream, does nothing. All other args are
@@ -172,7 +301,7 @@ lisp_slurp( struct stack_frame *frame, struct cons_pointer frame_pointer,
         struct cons_pointer cursor = make_string( url_fgetwc( stream ), NIL );
         result = cursor;
 
-        for ( wint_t c = url_fgetwc( stream ); !url_feof( stream );
+        for ( wint_t c = url_fgetwc( stream ); !url_feof( stream ) && c != 0;
               c = url_fgetwc( stream ) ) {
             debug_print( L"slurp: cursor is: ", DEBUG_IO );
             debug_dump_object( cursor, DEBUG_IO );
diff --git a/src/io/io.h b/src/io/io.h
index 06dcaed..d46f8b1 100644
--- a/src/io/io.h
+++ b/src/io/io.h
@@ -11,6 +11,10 @@
 #ifndef __psse_io_h
 #define __psse_io_h
 
+URL_FILE *file_to_url_file( FILE * f );
+wint_t url_fgetwc( URL_FILE * input );
+wint_t url_ungetwc( wint_t wc, URL_FILE * input );
+
 struct cons_pointer
 lisp_close( struct stack_frame *frame, struct cons_pointer frame_pointer,
             struct cons_pointer env );
diff --git a/src/memory/conspage.c b/src/memory/conspage.c
index 7a1a0d8..54d14e9 100644
--- a/src/memory/conspage.c
+++ b/src/memory/conspage.c
@@ -166,6 +166,10 @@ void free_cell( struct cons_pointer pointer ) {
                     dec_ref( cell->payload.ratio.dividend );
                     dec_ref( cell->payload.ratio.divisor );
                     break;
+                case READTV:
+                case WRITETV:
+                    url_fclose( cell->payload.stream.stream);
+                    break;
                 case SPECIALTV:
                     dec_ref( cell->payload.special.source );
                     break;
diff --git a/src/ops/lispops.c b/src/ops/lispops.c
index 4bfe6f0..1220835 100644
--- a/src/ops/lispops.c
+++ b/src/ops/lispops.c
@@ -29,9 +29,9 @@
 #include "debug.h"
 #include "dump.h"
 #include "equal.h"
-#include "fopen.h"
 #include "integer.h"
 #include "intern.h"
+#include "io.h"
 #include "lispops.h"
 #include "print.h"
 #include "read.h"
diff --git a/src/ops/read.c b/src/ops/read.c
index 989aa67..69899c0 100644
--- a/src/ops/read.c
+++ b/src/ops/read.c
@@ -22,6 +22,7 @@
 #include "dump.h"
 #include "integer.h"
 #include "intern.h"
+#include "io.h"
 #include "lispops.h"
 #include "peano.h"
 #include "print.h"

From 10098a83bf8d9e1e21ab8ee1d68c1f912f38e236 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Mon, 28 Jan 2019 19:00:29 +0000
Subject: [PATCH 10/31] Made the slurp unit test more robust.

---
 hi                  | 1 -
 unit-tests/slurp.sh | 7 +++++--
 2 files changed, 5 insertions(+), 3 deletions(-)
 delete mode 100644 hi

diff --git a/hi b/hi
deleted file mode 100644
index cf57f2a..0000000
--- a/hi
+++ /dev/null
@@ -1 +0,0 @@
-Hello, this is used by `slurp.sh` test, please do not remove.
diff --git a/unit-tests/slurp.sh b/unit-tests/slurp.sh
index e285988..b389143 100755
--- a/unit-tests/slurp.sh
+++ b/unit-tests/slurp.sh
@@ -1,11 +1,14 @@
 #!/bin/bash
 
-expected='"Hello, this is used by `slurp.sh` test, please do not remove.'
-actual=`echo '(slurp (open "hi"))' | target/psse | tail -2 | head -1`
+tmp=hi$$
+echo "Hello, there." > ${tmp}
+expected='"Hello, there.'
+actual=`echo "(slurp (open \"${tmp}\"))" | target/psse | tail -2 | head -1`
 
 if [ "${expected}" = "${actual}" ]
 then
     echo "OK"
+    rm ${tmp}
     exit 0
 else
     echo "Fail: expected '$expected', got '$actual'"

From eb394d153f6a4e586d5f975d89114fbb6668ab8b Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Tue, 29 Jan 2019 18:31:30 +0000
Subject: [PATCH 11/31] Setting up medatata works...

And the `inspect` function correctly shows it. However, the `metadata` function segfaults.
---
 src/init.c                   |  76 ++--
 src/io/fopen.c               | 774 +++++++++++++++++------------------
 src/io/io.c                  | 192 +++++++--
 src/io/io.h                  |   6 +
 src/memory/conspage.c        |   7 +-
 src/memory/conspage.h        |  18 +-
 src/memory/consspaceobject.c | 102 ++++-
 src/memory/consspaceobject.h |  56 ++-
 src/memory/dump.c            |  16 +-
 src/ops/equal.c              |   5 +-
 src/ops/lispops.c            |  59 +--
 src/ops/lispops.h            |  21 +-
 src/ops/meta.c               |  47 +++
 src/ops/meta.h               |  17 +
 src/ops/print.c              |   9 +-
 src/ops/read.c               |  41 +-
 16 files changed, 866 insertions(+), 580 deletions(-)
 create mode 100644 src/ops/meta.c
 create mode 100644 src/ops/meta.h

diff --git a/src/init.c b/src/init.c
index c180b10..6cceadd 100644
--- a/src/init.c
+++ b/src/init.c
@@ -26,6 +26,7 @@
 #include "intern.h"
 #include "io.h"
 #include "lispops.h"
+#include "meta.h"
 #include "peano.h"
 #include "print.h"
 #include "repl.h"
@@ -40,14 +41,17 @@
  * more readable and aid debugging generally.
  */
 void bind_function( wchar_t *name, struct cons_pointer ( *executable )
-                     ( struct stack_frame *,
-                       struct cons_pointer, struct cons_pointer ) ) {
-    struct cons_pointer n = c_string_to_lisp_symbol( name );
-    inc_ref( n );
+                   ( struct stack_frame *,
+                    struct cons_pointer, struct cons_pointer ) ) {
+  struct cons_pointer n = c_string_to_lisp_symbol( name );
+  struct cons_pointer meta = make_cons(
+    make_cons(c_string_to_lisp_keyword(L"primitive"), TRUE),
+              make_cons( make_cons(
+                c_string_to_lisp_keyword(L"name"),
+                n),
+              NIL));
 
-    deep_bind( n, make_function( NIL, executable ) );
-
-    dec_ref( n );
+  deep_bind( n, make_function( meta, executable ) );
 }
 
 /**
@@ -58,11 +62,14 @@ void bind_special( wchar_t *name, struct cons_pointer ( *executable )
                     ( struct stack_frame *,
                       struct cons_pointer, struct cons_pointer ) ) {
     struct cons_pointer n = c_string_to_lisp_symbol( name );
-    inc_ref( n );
+    struct cons_pointer meta = make_cons(
+      make_cons(c_string_to_lisp_keyword(L"primitive"), TRUE),
+                make_cons( make_cons(
+                  c_string_to_lisp_keyword(L"name"),
+                  n),
+                NIL));
 
     deep_bind( n, make_special( NIL, executable ) );
-
-    dec_ref( n );
 }
 
 /**
@@ -87,7 +94,10 @@ int main( int argc, char *argv[] ) {
     bool show_prompt = false;
 
     setlocale( LC_ALL, "" );
-    curl_global_init( CURL_GLOBAL_DEFAULT );
+    if (io_init() != 0) {
+      fputs("Failed to initialise I/O subsystem\n", stderr);
+      exit(1);
+    }
 
     while ( ( option = getopt( argc, argv, "cpdv:" ) ) != -1 ) {
         switch ( option ) {
@@ -136,17 +146,40 @@ int main( int argc, char *argv[] ) {
     fwide( stdout, 1 );
     fwide( stderr, 1 );
     fwide( sink->handle.file, 1 );
-    bind_value( L"*in*", make_read_stream( file_to_url_file( stdin ) ) );
-    bind_value( L"*out*", make_write_stream( file_to_url_file( stdout ) ) );
-    bind_value( L"*log*", make_write_stream( file_to_url_file( stderr ) ) );
-    bind_value( L"*sink*", make_write_stream( sink ) );
-
+    bind_value( L"*in*", make_read_stream( file_to_url_file( stdin ),
+                                           make_cons( make_cons
+                                                      ( c_string_to_lisp_keyword
+                                                        ( L"url" ),
+                                                        c_string_to_lisp_string
+                                                        ( L"system:standard input" ) ),
+                                                      NIL ) ) );
+    bind_value( L"*out*",
+                make_write_stream( file_to_url_file( stdout ),
+                                   make_cons( make_cons
+                                              ( c_string_to_lisp_keyword
+                                                ( L"url" ),
+                                                c_string_to_lisp_string
+                                                ( L"system:standard output]" ) ),
+                                              NIL ) ) );
+    bind_value( L"*log*", make_write_stream( file_to_url_file( stderr ),
+                                             make_cons( make_cons
+                                                        ( c_string_to_lisp_keyword
+                                                          ( L"url" ),
+                                                          c_string_to_lisp_string
+                                                          ( L"system:standard log" ) ),
+                                                        NIL ) ) );
+    bind_value( L"*sink*", make_write_stream( sink,
+                                              make_cons( make_cons
+                                                         ( c_string_to_lisp_keyword
+                                                           ( L"url" ),
+                                                           c_string_to_lisp_string
+                                                           ( L"system:standard sink" ) ),
+                                                         NIL ) ) );
     /*
      * the default prompt
      */
     bind_value( L"*prompt*",
                 show_prompt ? c_string_to_lisp_symbol( L":: " ) : NIL );
-
     /*
      * primitive function operations
      */
@@ -164,6 +197,8 @@ int main( int argc, char *argv[] ) {
     bind_function( L"eval", &lisp_eval );
     bind_function( L"exception", &lisp_exception );
     bind_function( L"inspect", &lisp_inspect );
+    bind_function( L"meta", &lisp_metadata );
+    bind_function( L"metadata", &lisp_metadata );
     bind_function( L"multiply", &lisp_multiply );
     bind_function( L"negative?", &lisp_is_negative );
     bind_function( L"oblist", &lisp_oblist );
@@ -180,13 +215,11 @@ int main( int argc, char *argv[] ) {
     bind_function( L"subtract", &lisp_subtract );
     bind_function( L"throw", &lisp_exception );
     bind_function( L"type", &lisp_type );
-
     bind_function( L"+", &lisp_add );
     bind_function( L"*", &lisp_multiply );
     bind_function( L"-", &lisp_subtract );
     bind_function( L"/", &lisp_divide );
     bind_function( L"=", &lisp_equal );
-
     /*
      * primitive special forms
      */
@@ -198,19 +231,16 @@ int main( int argc, char *argv[] ) {
     bind_special( L"progn", &lisp_progn );
     bind_special( L"quote", &lisp_quote );
     bind_special( L"set!", &lisp_set_shriek );
-
     debug_print( L"Initialised oblist\n", DEBUG_BOOTSTRAP );
     debug_dump_object( oblist, DEBUG_BOOTSTRAP );
-
     repl( show_prompt );
-
     debug_print( L"Freeing oblist\n", DEBUG_BOOTSTRAP );
     dec_ref( oblist );
     debug_dump_object( oblist, DEBUG_BOOTSTRAP );
-
     if ( dump_at_end ) {
         dump_pages( file_to_url_file( stdout ) );
     }
 
+    curl_global_cleanup(  );
     return ( 0 );
 }
diff --git a/src/io/fopen.c b/src/io/fopen.c
index f0ea012..50c09b5 100644
--- a/src/io/fopen.c
+++ b/src/io/fopen.c
@@ -47,392 +47,369 @@
 
 #include <curl/curl.h>
 
-enum fcurl_type_e {
-  CFTYPE_NONE = 0,
-  CFTYPE_FILE = 1,
-  CFTYPE_CURL = 2
-};
+#include "fopen.h"
+#ifdef FOPEN_STANDALONE
+CURLSH *io_share;
+#else
+#include "io.h"
+#include "consspaceobject.h"
+#endif
 
-struct fcurl_data
-{
-  enum fcurl_type_e type;     /* type of handle */
-  union {
-    CURL *curl;
-    FILE *file;
-  } handle;                   /* handle */
-
-  char *buffer;               /* buffer to store cached data*/
-  size_t buffer_len;          /* currently allocated buffers length */
-  size_t buffer_pos;          /* end of data in buffer*/
-  int still_running;          /* Is background url fetch still in progress */
-};
-
-typedef struct fcurl_data URL_FILE;
 
 /* exported functions */
-URL_FILE *url_fopen(const char *url, const char *operation);
-int url_fclose(URL_FILE *file);
-int url_feof(URL_FILE *file);
-size_t url_fread(void *ptr, size_t size, size_t nmemb, URL_FILE *file);
-char *url_fgets(char *ptr, size_t size, URL_FILE *file);
-void url_rewind(URL_FILE *file);
+URL_FILE *url_fopen( const char *url, const char *operation );
+int url_fclose( URL_FILE * file );
+int url_feof( URL_FILE * file );
+size_t url_fread( void *ptr, size_t size, size_t nmemb, URL_FILE * file );
+char *url_fgets( char *ptr, size_t size, URL_FILE * file );
+void url_rewind( URL_FILE * file );
 
 /* we use a global one for convenience */
 static CURLM *multi_handle;
 
 /* curl calls this routine to get more data */
-static size_t write_callback(char *buffer,
-                             size_t size,
-                             size_t nitems,
-                             void *userp)
-{
-  char *newbuff;
-  size_t rembuff;
+static size_t write_callback( char *buffer,
+                              size_t size, size_t nitems, void *userp ) {
+    char *newbuff;
+    size_t rembuff;
 
-  URL_FILE *url = (URL_FILE *)userp;
-  size *= nitems;
+    URL_FILE *url = ( URL_FILE * ) userp;
+    size *= nitems;
 
-  rembuff = url->buffer_len - url->buffer_pos; /* remaining space in buffer */
+    rembuff = url->buffer_len - url->buffer_pos;  /* remaining space in buffer */
 
-  if(size > rembuff) {
-    /* not enough space in buffer */
-    newbuff = realloc(url->buffer, url->buffer_len + (size - rembuff));
-    if(newbuff == NULL) {
-      fprintf(stderr, "callback buffer grow failed\n");
-      size = rembuff;
+    if ( size > rembuff ) {
+        /* not enough space in buffer */
+        newbuff = realloc( url->buffer, url->buffer_len + ( size - rembuff ) );
+        if ( newbuff == NULL ) {
+            fprintf( stderr, "callback buffer grow failed\n" );
+            size = rembuff;
+        } else {
+            /* realloc succeeded increase buffer size */
+            url->buffer_len += size - rembuff;
+            url->buffer = newbuff;
+        }
     }
-    else {
-      /* realloc succeeded increase buffer size*/
-      url->buffer_len += size - rembuff;
-      url->buffer = newbuff;
-    }
-  }
 
-  memcpy(&url->buffer[url->buffer_pos], buffer, size);
-  url->buffer_pos += size;
+    memcpy( &url->buffer[url->buffer_pos], buffer, size );
+    url->buffer_pos += size;
 
-  return size;
+    return size;
 }
 
 /* use to attempt to fill the read buffer up to requested number of bytes */
-static int fill_buffer(URL_FILE *file, size_t want)
-{
-  fd_set fdread;
-  fd_set fdwrite;
-  fd_set fdexcep;
-  struct timeval timeout;
-  int rc;
-  CURLMcode mc; /* curl_multi_fdset() return code */
+static int fill_buffer( URL_FILE * file, size_t want ) {
+    fd_set fdread;
+    fd_set fdwrite;
+    fd_set fdexcep;
+    struct timeval timeout;
+    int rc;
+    CURLMcode mc;               /* curl_multi_fdset() return code */
 
-  /* only attempt to fill buffer if transactions still running and buffer
-   * doesn't exceed required size already
-   */
-  if((!file->still_running) || (file->buffer_pos > want))
-    return 0;
+    /* only attempt to fill buffer if transactions still running and buffer
+     * doesn't exceed required size already
+     */
+    if ( ( !file->still_running ) || ( file->buffer_pos > want ) )
+        return 0;
 
-  /* attempt to fill buffer */
-  do {
-    int maxfd = -1;
-    long curl_timeo = -1;
+    /* attempt to fill buffer */
+    do {
+        int maxfd = -1;
+        long curl_timeo = -1;
 
-    FD_ZERO(&fdread);
-    FD_ZERO(&fdwrite);
-    FD_ZERO(&fdexcep);
+        FD_ZERO( &fdread );
+        FD_ZERO( &fdwrite );
+        FD_ZERO( &fdexcep );
 
-    /* set a suitable timeout to fail on */
-    timeout.tv_sec = 60; /* 1 minute */
-    timeout.tv_usec = 0;
+        /* set a suitable timeout to fail on */
+        timeout.tv_sec = 60;    /* 1 minute */
+        timeout.tv_usec = 0;
 
-    curl_multi_timeout(multi_handle, &curl_timeo);
-    if(curl_timeo >= 0) {
-      timeout.tv_sec = curl_timeo / 1000;
-      if(timeout.tv_sec > 1)
-        timeout.tv_sec = 1;
-      else
-        timeout.tv_usec = (curl_timeo % 1000) * 1000;
-    }
+        curl_multi_timeout( multi_handle, &curl_timeo );
+        if ( curl_timeo >= 0 ) {
+            timeout.tv_sec = curl_timeo / 1000;
+            if ( timeout.tv_sec > 1 )
+                timeout.tv_sec = 1;
+            else
+                timeout.tv_usec = ( curl_timeo % 1000 ) * 1000;
+        }
 
-    /* get file descriptors from the transfers */
-    mc = curl_multi_fdset(multi_handle, &fdread, &fdwrite, &fdexcep, &maxfd);
+        /* get file descriptors from the transfers */
+        mc = curl_multi_fdset( multi_handle, &fdread, &fdwrite, &fdexcep,
+                               &maxfd );
 
-    if(mc != CURLM_OK) {
-      fprintf(stderr, "curl_multi_fdset() failed, code %d.\n", mc);
-      break;
-    }
+        if ( mc != CURLM_OK ) {
+            fprintf( stderr, "curl_multi_fdset() failed, code %d.\n", mc );
+            break;
+        }
 
-    /* On success the value of maxfd is guaranteed to be >= -1. We call
-       select(maxfd + 1, ...); specially in case of (maxfd == -1) there are
-       no fds ready yet so we call select(0, ...) --or Sleep() on Windows--
-       to sleep 100ms, which is the minimum suggested value in the
-       curl_multi_fdset() doc. */
+        /* On success the value of maxfd is guaranteed to be >= -1. We call
+           select(maxfd + 1, ...); specially in case of (maxfd == -1) there are
+           no fds ready yet so we call select(0, ...) --or Sleep() on Windows--
+           to sleep 100ms, which is the minimum suggested value in the
+           curl_multi_fdset() doc. */
 
-    if(maxfd == -1) {
+        if ( maxfd == -1 ) {
 #ifdef _WIN32
-      Sleep(100);
-      rc = 0;
+            Sleep( 100 );
+            rc = 0;
 #else
-      /* Portable sleep for platforms other than Windows. */
-      struct timeval wait = { 0, 100 * 1000 }; /* 100ms */
-      rc = select(0, NULL, NULL, NULL, &wait);
+            /* Portable sleep for platforms other than Windows. */
+            struct timeval wait = { 0, 100 * 1000 };  /* 100ms */
+            rc = select( 0, NULL, NULL, NULL, &wait );
 #endif
-    }
-    else {
-      /* Note that on some platforms 'timeout' may be modified by select().
-         If you need access to the original value save a copy beforehand. */
-      rc = select(maxfd + 1, &fdread, &fdwrite, &fdexcep, &timeout);
-    }
+        } else {
+            /* Note that on some platforms 'timeout' may be modified by select().
+               If you need access to the original value save a copy beforehand. */
+            rc = select( maxfd + 1, &fdread, &fdwrite, &fdexcep, &timeout );
+        }
 
-    switch(rc) {
-    case -1:
-      /* select error */
-      break;
+        switch ( rc ) {
+            case -1:
+                /* select error */
+                break;
 
-    case 0:
-    default:
-      /* timeout or readable/writable sockets */
-      curl_multi_perform(multi_handle, &file->still_running);
-      break;
-    }
-  } while(file->still_running && (file->buffer_pos < want));
-  return 1;
+            case 0:
+            default:
+                /* timeout or readable/writable sockets */
+                curl_multi_perform( multi_handle, &file->still_running );
+                break;
+        }
+    } while ( file->still_running && ( file->buffer_pos < want ) );
+    return 1;
 }
 
 /* use to remove want bytes from the front of a files buffer */
-static int use_buffer(URL_FILE *file, size_t want)
-{
-  /* sort out buffer */
-  if((file->buffer_pos - want) <= 0) {
-    /* ditch buffer - write will recreate */
-    free(file->buffer);
-    file->buffer = NULL;
-    file->buffer_pos = 0;
-    file->buffer_len = 0;
-  }
-  else {
-    /* move rest down make it available for later */
-    memmove(file->buffer,
-            &file->buffer[want],
-            (file->buffer_pos - want));
+static int use_buffer( URL_FILE * file, size_t want ) {
+    /* sort out buffer */
+    if ( ( file->buffer_pos - want ) <= 0 ) {
+        /* ditch buffer - write will recreate */
+        free( file->buffer );
+        file->buffer = NULL;
+        file->buffer_pos = 0;
+        file->buffer_len = 0;
+    } else {
+        /* move rest down make it available for later */
+        memmove( file->buffer,
+                 &file->buffer[want], ( file->buffer_pos - want ) );
 
-    file->buffer_pos -= want;
-  }
-  return 0;
-}
-
-URL_FILE *url_fopen(const char *url, const char *operation)
-{
-  /* this code could check for URLs or types in the 'url' and
-     basically use the real fopen() for standard files */
-
-  URL_FILE *file;
-  (void)operation;
-
-  file = calloc(1, sizeof(URL_FILE));
-  if(!file)
-    return NULL;
-
-  file->handle.file = fopen(url, operation);
-  if(file->handle.file)
-    file->type = CFTYPE_FILE; /* marked as URL */
-
-  else {
-    file->type = CFTYPE_CURL; /* marked as URL */
-    file->handle.curl = curl_easy_init();
-
-    curl_easy_setopt(file->handle.curl, CURLOPT_URL, url);
-    curl_easy_setopt(file->handle.curl, CURLOPT_WRITEDATA, file);
-    curl_easy_setopt(file->handle.curl, CURLOPT_VERBOSE, 0L);
-    curl_easy_setopt(file->handle.curl, CURLOPT_WRITEFUNCTION, write_callback);
-
-    if(!multi_handle)
-      multi_handle = curl_multi_init();
-
-    curl_multi_add_handle(multi_handle, file->handle.curl);
-
-    /* lets start the fetch */
-    curl_multi_perform(multi_handle, &file->still_running);
-
-    if((file->buffer_pos == 0) && (!file->still_running)) {
-      /* if still_running is 0 now, we should return NULL */
-
-      /* make sure the easy handle is not in the multi handle anymore */
-      curl_multi_remove_handle(multi_handle, file->handle.curl);
-
-      /* cleanup */
-      curl_easy_cleanup(file->handle.curl);
-
-      free(file);
-
-      file = NULL;
+        file->buffer_pos -= want;
     }
-  }
-  return file;
+    return 0;
 }
 
-int url_fclose(URL_FILE *file)
-{
-  int ret = 0;/* default is good return */
+URL_FILE *url_fopen( const char *url, const char *operation ) {
+    /* this code could check for URLs or types in the 'url' and
+       basically use the real fopen() for standard files */
 
-  switch(file->type) {
-  case CFTYPE_FILE:
-    ret = fclose(file->handle.file); /* passthrough */
-    break;
+    URL_FILE *file;
+    ( void ) operation;
 
-  case CFTYPE_CURL:
-    /* make sure the easy handle is not in the multi handle anymore */
-    curl_multi_remove_handle(multi_handle, file->handle.curl);
+    file = calloc( 1, sizeof( URL_FILE ) );
+    if ( !file )
+        return NULL;
 
-    /* cleanup */
-    curl_easy_cleanup(file->handle.curl);
-    break;
+    file->handle.file = fopen( url, operation );
+    if ( file->handle.file )
+        file->type = CFTYPE_FILE; /* marked as URL */
 
-  default: /* unknown or supported type - oh dear */
-    ret = EOF;
-    errno = EBADF;
-    break;
-  }
+    else {
+        file->type = CFTYPE_CURL; /* marked as URL */
+        file->handle.curl = curl_easy_init(  );
 
-  free(file->buffer);/* free any allocated buffer space */
-  free(file);
+        curl_easy_setopt( file->handle.curl, CURLOPT_URL, url );
+        curl_easy_setopt( file->handle.curl, CURLOPT_WRITEDATA, file );
+        curl_easy_setopt( file->handle.curl, CURLOPT_VERBOSE, 0L );
+        curl_easy_setopt( file->handle.curl, CURLOPT_WRITEFUNCTION,
+                          write_callback );
+        /* use the share object */
+        curl_easy_setopt(file->handle.curl, CURLOPT_SHARE, io_share);
 
-  return ret;
+
+        if ( !multi_handle )
+            multi_handle = curl_multi_init(  );
+
+        curl_multi_add_handle( multi_handle, file->handle.curl );
+
+        /* lets start the fetch */
+        curl_multi_perform( multi_handle, &file->still_running );
+
+        if ( ( file->buffer_pos == 0 ) && ( !file->still_running ) ) {
+            /* if still_running is 0 now, we should return NULL */
+
+            /* make sure the easy handle is not in the multi handle anymore */
+            curl_multi_remove_handle( multi_handle, file->handle.curl );
+
+            /* cleanup */
+            curl_easy_cleanup( file->handle.curl );
+
+            free( file );
+
+            file = NULL;
+        }
+    }
+    return file;
 }
 
-int url_feof(URL_FILE *file)
-{
-  int ret = 0;
+int url_fclose( URL_FILE * file ) {
+    int ret = 0;                /* default is good return */
 
-  switch(file->type) {
-  case CFTYPE_FILE:
-    ret = feof(file->handle.file);
-    break;
+    switch ( file->type ) {
+        case CFTYPE_FILE:
+            ret = fclose( file->handle.file );  /* passthrough */
+            break;
 
-  case CFTYPE_CURL:
-    if((file->buffer_pos == 0) && (!file->still_running))
-      ret = 1;
-    break;
+        case CFTYPE_CURL:
+            /* make sure the easy handle is not in the multi handle anymore */
+            curl_multi_remove_handle( multi_handle, file->handle.curl );
 
-  default: /* unknown or supported type - oh dear */
-    ret = -1;
-    errno = EBADF;
-    break;
-  }
-  return ret;
-}
+            /* cleanup */
+            curl_easy_cleanup( file->handle.curl );
+            break;
 
-size_t url_fread(void *ptr, size_t size, size_t nmemb, URL_FILE *file)
-{
-  size_t want;
-
-  switch(file->type) {
-  case CFTYPE_FILE:
-    want = fread(ptr, size, nmemb, file->handle.file);
-    break;
-
-  case CFTYPE_CURL:
-    want = nmemb * size;
-
-    fill_buffer(file, want);
-
-    /* check if there's data in the buffer - if not fill_buffer()
-     * either errored or EOF */
-    if(!file->buffer_pos)
-      return 0;
-
-    /* ensure only available data is considered */
-    if(file->buffer_pos < want)
-      want = file->buffer_pos;
-
-    /* xfer data to caller */
-    memcpy(ptr, file->buffer, want);
-
-    use_buffer(file, want);
-
-    want = want / size;     /* number of items */
-    break;
-
-  default: /* unknown or supported type - oh dear */
-    want = 0;
-    errno = EBADF;
-    break;
-
-  }
-  return want;
-}
-
-char *url_fgets(char *ptr, size_t size, URL_FILE *file)
-{
-  size_t want = size - 1;/* always need to leave room for zero termination */
-  size_t loop;
-
-  switch(file->type) {
-  case CFTYPE_FILE:
-    ptr = fgets(ptr, (int)size, file->handle.file);
-    break;
-
-  case CFTYPE_CURL:
-    fill_buffer(file, want);
-
-    /* check if there's data in the buffer - if not fill either errored or
-     * EOF */
-    if(!file->buffer_pos)
-      return NULL;
-
-    /* ensure only available data is considered */
-    if(file->buffer_pos < want)
-      want = file->buffer_pos;
-
-    /*buffer contains data */
-    /* look for newline or eof */
-    for(loop = 0; loop < want; loop++) {
-      if(file->buffer[loop] == '\n') {
-        want = loop + 1;/* include newline */
-        break;
-      }
+        default:               /* unknown or supported type - oh dear */
+            ret = EOF;
+            errno = EBADF;
+            break;
     }
 
-    /* xfer data to caller */
-    memcpy(ptr, file->buffer, want);
-    ptr[want] = 0;/* always null terminate */
+    free( file->buffer );       /* free any allocated buffer space */
+    free( file );
 
-    use_buffer(file, want);
-
-    break;
-
-  default: /* unknown or supported type - oh dear */
-    ptr = NULL;
-    errno = EBADF;
-    break;
-  }
-
-  return ptr;/*success */
+    return ret;
 }
 
-void url_rewind(URL_FILE *file)
-{
-  switch(file->type) {
-  case CFTYPE_FILE:
-    rewind(file->handle.file); /* passthrough */
-    break;
+int url_feof( URL_FILE * file ) {
+    int ret = 0;
 
-  case CFTYPE_CURL:
-    /* halt transaction */
-    curl_multi_remove_handle(multi_handle, file->handle.curl);
+    switch ( file->type ) {
+        case CFTYPE_FILE:
+            ret = feof( file->handle.file );
+            break;
 
-    /* restart */
-    curl_multi_add_handle(multi_handle, file->handle.curl);
+        case CFTYPE_CURL:
+            if ( ( file->buffer_pos == 0 ) && ( !file->still_running ) )
+                ret = 1;
+            break;
 
-    /* ditch buffer - write will recreate - resets stream pos*/
-    free(file->buffer);
-    file->buffer = NULL;
-    file->buffer_pos = 0;
-    file->buffer_len = 0;
+        default:               /* unknown or supported type - oh dear */
+            ret = -1;
+            errno = EBADF;
+            break;
+    }
+    return ret;
+}
 
-    break;
+size_t url_fread( void *ptr, size_t size, size_t nmemb, URL_FILE * file ) {
+    size_t want;
 
-  default: /* unknown or supported type - oh dear */
-    break;
-  }
+    switch ( file->type ) {
+        case CFTYPE_FILE:
+            want = fread( ptr, size, nmemb, file->handle.file );
+            break;
+
+        case CFTYPE_CURL:
+            want = nmemb * size;
+
+            fill_buffer( file, want );
+
+            /* check if there's data in the buffer - if not fill_buffer()
+             * either errored or EOF */
+            if ( !file->buffer_pos )
+                return 0;
+
+            /* ensure only available data is considered */
+            if ( file->buffer_pos < want )
+                want = file->buffer_pos;
+
+            /* xfer data to caller */
+            memcpy( ptr, file->buffer, want );
+
+            use_buffer( file, want );
+
+            want = want / size; /* number of items */
+            break;
+
+        default:               /* unknown or supported type - oh dear */
+            want = 0;
+            errno = EBADF;
+            break;
+
+    }
+    return want;
+}
+
+char *url_fgets( char *ptr, size_t size, URL_FILE * file ) {
+    size_t want = size - 1;     /* always need to leave room for zero termination */
+    size_t loop;
+
+    switch ( file->type ) {
+        case CFTYPE_FILE:
+            ptr = fgets( ptr, ( int ) size, file->handle.file );
+            break;
+
+        case CFTYPE_CURL:
+            fill_buffer( file, want );
+
+            /* check if there's data in the buffer - if not fill either errored or
+             * EOF */
+            if ( !file->buffer_pos )
+                return NULL;
+
+            /* ensure only available data is considered */
+            if ( file->buffer_pos < want )
+                want = file->buffer_pos;
+
+            /*buffer contains data */
+            /* look for newline or eof */
+            for ( loop = 0; loop < want; loop++ ) {
+                if ( file->buffer[loop] == '\n' ) {
+                    want = loop + 1;  /* include newline */
+                    break;
+                }
+            }
+
+            /* xfer data to caller */
+            memcpy( ptr, file->buffer, want );
+            ptr[want] = 0;      /* always null terminate */
+
+            use_buffer( file, want );
+
+            break;
+
+        default:               /* unknown or supported type - oh dear */
+            ptr = NULL;
+            errno = EBADF;
+            break;
+    }
+
+    return ptr;                 /*success */
+}
+
+void url_rewind( URL_FILE * file ) {
+    switch ( file->type ) {
+        case CFTYPE_FILE:
+            rewind( file->handle.file );  /* passthrough */
+            break;
+
+        case CFTYPE_CURL:
+            /* halt transaction */
+            curl_multi_remove_handle( multi_handle, file->handle.curl );
+
+            /* restart */
+            curl_multi_add_handle( multi_handle, file->handle.curl );
+
+            /* ditch buffer - write will recreate - resets stream pos */
+            free( file->buffer );
+            file->buffer = NULL;
+            file->buffer_pos = 0;
+            file->buffer_len = 0;
+
+            break;
+
+        default:               /* unknown or supported type - oh dear */
+            break;
+    }
 }
 
 #ifdef FOPEN_STANDALONE
@@ -443,104 +420,103 @@ void url_rewind(URL_FILE *file)
 /* Small main program to retrieve from a url using fgets and fread saving the
  * output to two test files (note the fgets method will corrupt binary files if
  * they contain 0 chars */
-int main(int argc, char *argv[])
-{
-  URL_FILE *handle;
-  FILE *outf;
+int main( int argc, char *argv[] ) {
+    URL_FILE *handle;
+    FILE *outf;
 
-  size_t nread;
-  char buffer[256];
-  const char *url;
+    size_t nread;
+    char buffer[256];
+    const char *url;
 
-  CURL *curl;
-  CURLcode res;
+    CURL *curl;
+    CURLcode res;
 
-  curl_global_init(CURL_GLOBAL_DEFAULT);
+    curl_global_init( CURL_GLOBAL_DEFAULT );
 
-  curl = curl_easy_init();
+    curl = curl_easy_init(  );
 
 
-  if(argc < 2)
-    url = "http://192.168.7.3/testfile";/* default to testurl */
-  else
-    url = argv[1];/* use passed url */
+    if ( argc < 2 )
+        url = "http://192.168.7.3/testfile";  /* default to testurl */
+    else
+        url = argv[1];          /* use passed url */
 
-  /* copy from url line by line with fgets */
-  outf = fopen(FGETSFILE, "wb+");
-  if(!outf) {
-    perror("couldn't open fgets output file\n");
-    return 1;
-  }
+    /* copy from url line by line with fgets */
+    outf = fopen( FGETSFILE, "wb+" );
+    if ( !outf ) {
+        perror( "couldn't open fgets output file\n" );
+        return 1;
+    }
 
-  handle = url_fopen(url, "r");
-  if(!handle) {
-    printf("couldn't url_fopen() %s\n", url);
-    fclose(outf);
-    return 2;
-  }
+    handle = url_fopen( url, "r" );
+    if ( !handle ) {
+        printf( "couldn't url_fopen() %s\n", url );
+        fclose( outf );
+        return 2;
+    }
 
-  while(!url_feof(handle)) {
-    url_fgets(buffer, sizeof(buffer), handle);
-    fwrite(buffer, 1, strlen(buffer), outf);
-  }
+    while ( !url_feof( handle ) ) {
+        url_fgets( buffer, sizeof( buffer ), handle );
+        fwrite( buffer, 1, strlen( buffer ), outf );
+    }
 
-  url_fclose(handle);
+    url_fclose( handle );
 
-  fclose(outf);
+    fclose( outf );
 
 
-  /* Copy from url with fread */
-  outf = fopen(FREADFILE, "wb+");
-  if(!outf) {
-    perror("couldn't open fread output file\n");
-    return 1;
-  }
+    /* Copy from url with fread */
+    outf = fopen( FREADFILE, "wb+" );
+    if ( !outf ) {
+        perror( "couldn't open fread output file\n" );
+        return 1;
+    }
 
-  handle = url_fopen("testfile", "r");
-  if(!handle) {
-    printf("couldn't url_fopen() testfile\n");
-    fclose(outf);
-    return 2;
-  }
+    handle = url_fopen( "testfile", "r" );
+    if ( !handle ) {
+        printf( "couldn't url_fopen() testfile\n" );
+        fclose( outf );
+        return 2;
+    }
 
-  do {
-    nread = url_fread(buffer, 1, sizeof(buffer), handle);
-    fwrite(buffer, 1, nread, outf);
-  } while(nread);
+    do {
+        nread = url_fread( buffer, 1, sizeof( buffer ), handle );
+        fwrite( buffer, 1, nread, outf );
+    } while ( nread );
 
-  url_fclose(handle);
+    url_fclose( handle );
 
-  fclose(outf);
+    fclose( outf );
 
 
-  /* Test rewind */
-  outf = fopen(REWINDFILE, "wb+");
-  if(!outf) {
-    perror("couldn't open fread output file\n");
-    return 1;
-  }
+    /* Test rewind */
+    outf = fopen( REWINDFILE, "wb+" );
+    if ( !outf ) {
+        perror( "couldn't open fread output file\n" );
+        return 1;
+    }
 
-  handle = url_fopen("testfile", "r");
-  if(!handle) {
-    printf("couldn't url_fopen() testfile\n");
-    fclose(outf);
-    return 2;
-  }
+    handle = url_fopen( "testfile", "r" );
+    if ( !handle ) {
+        printf( "couldn't url_fopen() testfile\n" );
+        fclose( outf );
+        return 2;
+    }
 
-  nread = url_fread(buffer, 1, sizeof(buffer), handle);
-  fwrite(buffer, 1, nread, outf);
-  url_rewind(handle);
+    nread = url_fread( buffer, 1, sizeof( buffer ), handle );
+    fwrite( buffer, 1, nread, outf );
+    url_rewind( handle );
 
-  buffer[0]='\n';
-  fwrite(buffer, 1, 1, outf);
+    buffer[0] = '\n';
+    fwrite( buffer, 1, 1, outf );
 
-  nread = url_fread(buffer, 1, sizeof(buffer), handle);
-  fwrite(buffer, 1, nread, outf);
+    nread = url_fread( buffer, 1, sizeof( buffer ), handle );
+    fwrite( buffer, 1, nread, outf );
 
-  url_fclose(handle);
+    url_fclose( handle );
 
-  fclose(outf);
+    fclose( outf );
 
-  return 0;/* all done */
+    return 0;                   /* all done */
 }
 #endif
diff --git a/src/io/io.c b/src/io/io.c
index d7c2024..3d9eb36 100644
--- a/src/io/io.c
+++ b/src/io/io.c
@@ -8,6 +8,17 @@
  */
 
 #include <stdlib.h>
+#include <string.h>
+#include <sys/stat.h>
+#include <sys/types.h>
+#include <unistd.h>
+/*
+ * wide characters
+ */
+#include <wchar.h>
+#include <wctype.h>
+
+#include <curl/curl.h>
 
 #include "conspage.h"
 #include "consspaceobject.h"
@@ -15,12 +26,42 @@
 #include "fopen.h"
 #include "lispops.h"
 
+/**
+ * The sharing hub for all connections. TODO: Ultimately this probably doesn't
+ * work for a multi-user environment and we will need one sharing hub for each
+ * user, or else we will need to not share at least cookies and ssl sessions.
+ */
+CURLSH *io_share;
+
 /**
  * Allow a one-character unget facility. This may not be enough - we may need
  * to allocate a buffer.
  */
 wint_t ungotten = 0;
 
+/**
+ * Initialise the I/O subsystem.
+ *
+ * @return 0 on success; any other value means failure.
+ */
+int io_init() {
+  CURL *curl;
+  CURLcode res;
+  int result = curl_global_init( CURL_GLOBAL_SSL );
+
+  io_share = curl_share_init();
+
+  if (result == 0) {
+      curl_share_setopt(io_share, CURLSHOPT_SHARE, CURL_LOCK_DATA_CONNECT);
+      curl_share_setopt(io_share, CURLSHOPT_SHARE, CURL_LOCK_DATA_COOKIE );
+      curl_share_setopt(io_share, CURLSHOPT_SHARE, CURL_LOCK_DATA_DNS );
+      curl_share_setopt(io_share, CURLSHOPT_SHARE, CURL_LOCK_DATA_SSL_SESSION );
+      curl_share_setopt(io_share, CURLSHOPT_SHARE, CURL_LOCK_DATA_PSL );
+  }
+
+  return result;
+}
+
 /**
  * Convert this lisp string-like-thing (also works for symbols, and, later
  * keywords) into a UTF-8 string. NOTE that the returned value has been
@@ -107,13 +148,15 @@ wint_t url_fgetwc( URL_FILE * input ) {
 
                     size_t count = 0;
 
-                    debug_print( L"url_fgetwc: about to call url_fgets\n", DEBUG_IO );
+                    debug_print( L"url_fgetwc: about to call url_fgets\n",
+                                 DEBUG_IO );
                     url_fgets( cbuff, 2, input );
-                    debug_print( L"url_fgetwc: back from url_fgets\n", DEBUG_IO );
+                    debug_print( L"url_fgetwc: back from url_fgets\n",
+                                 DEBUG_IO );
                     int c = ( int ) cbuff[0];
                     debug_printf( DEBUG_IO,
-                                 L"url_fgetwc: cbuff is '%s'; (first) character = %d (%c)\n",
-                                 cbuff, c, c & 0xf7 );
+                                  L"url_fgetwc: cbuff is '%s'; (first) character = %d (%c)\n",
+                                  cbuff, c, c & 0xf7 );
                     /* The value of each individual byte indicates its UTF-8 function, as follows:
                      *
                      * 00 to 7F hex (0 to 127): first and only byte of a sequence.
@@ -133,7 +176,7 @@ wint_t url_fgetwc( URL_FILE * input ) {
                     }
 
                     if ( count > 1 ) {
-                        url_fgets( (char *)&cbuff[1], count, input );
+                        url_fgets( ( char * ) &cbuff[1], count, input );
                     }
                     mbstowcs( wbuff, cbuff, 1 );  //(char *)(&input->buffer[input->buffer_pos]), 1 );
                     result = wbuff[0];
@@ -163,18 +206,6 @@ wint_t url_ungetwc( wint_t wc, URL_FILE * input ) {
 
         case CFTYPE_CURL:{
                 ungotten = wc;
-//                wchar_t *wbuff = calloc( 2, sizeof( wchar_t ) );
-//                char *cbuff = calloc( 5, sizeof( char ) );
-//
-//                wbuff[0] = wc;
-//                result = wcstombs( cbuff, wbuff, 1 );
-//
-//                input->buffer_pos -= strlen( cbuff );
-//
-//                free( cbuff );
-//                free( wbuff );
-//
-//                result = result > 0 ? wc : result;
                 break;
         case CFTYPE_NONE:
                 break;
@@ -212,6 +243,85 @@ lisp_close( struct stack_frame *frame, struct cons_pointer frame_pointer,
     return result;
 }
 
+int index_of( char c, char * s) {
+  int i;
+
+  for (i = 0; s[i] != c && s[i] != 0; i++);
+
+  return s[i] == c ? i : -1;
+}
+
+char * trim(char *s) {
+  int i;
+
+  for (i = strlen(s); (isblank(s[i]) || iscntrl(s[i])) && i > -1; i--) {
+    s[i] = (char) 0;
+  }
+  for (i = 0; isblank(s[i]) && s[i] != 0; i++);
+
+  return (char *)&s[i];
+}
+
+/**
+ * Callback to assemble metadata for a URL stream. This is naughty because
+ * it modifies data, but it's really the only way to create metadata.
+ */
+static size_t write_meta_callback(void *ptr, size_t size, size_t nmemb, struct cons_pointer stream)
+{
+  struct cons_space_object * cell = &pointer2cell(stream);
+
+  if (strncmp(&cell->tag.bytes[0], READTAG, 4) ||
+      strncmp(&cell->tag.bytes[0], WRITETAG, 4)) {
+    char * s = (char *)ptr;
+    int offset = index_of (':', ptr);
+
+    if (offset != -1) {
+      s[offset] = (char)0;
+      char * name = s;
+      char * value = trim( &s[++offset]);
+      wchar_t * wname = calloc(strlen(name), sizeof(wchar_t));
+      wchar_t * wvalue = calloc(strlen(value), sizeof(wchar_t));
+
+      mbstowcs(wname, name, strlen(name));
+      mbstowcs(wvalue, value, strlen(value));
+
+      cell->payload.stream.meta = make_cons(
+        make_cons(
+          c_string_to_lisp_keyword( wname),
+          c_string_to_lisp_string(wvalue)),
+        cell->payload.stream.meta);
+
+      debug_printf( DEBUG_IO, L"write_meta_callback: added header '%s': value '%s'\n", name, value);
+    }
+  } else {
+    debug_print( L"Pointer passed to write_meta_callback did not point to a stream: ", DEBUG_IO);
+    debug_dump_object(stream, DEBUG_IO);
+  }
+
+  return nmemb;
+}
+
+
+void collect_meta( struct cons_pointer stream, struct cons_pointer url ) {
+    URL_FILE * s = pointer2cell(stream).payload.stream.stream;
+
+    switch ( s->type ) {
+        case CFTYPE_NONE:
+            break;
+        case CFTYPE_FILE:
+            /* don't know whether you can get metadata on an open stream in C,
+             * although we could of course get it from the URL */
+            break;
+        case CFTYPE_CURL:
+            curl_easy_setopt( s->handle.curl, CURLOPT_VERBOSE, 1L );
+            curl_easy_setopt( s->handle.curl, CURLOPT_HEADER, 1L );
+            curl_easy_setopt( s->handle.curl, CURLOPT_HEADERFUNCTION, write_meta_callback);
+            curl_easy_setopt( s->handle.curl, CURLOPT_HEADERDATA, stream);
+            break;
+    }
+}
+
+
 /**
  * Function: return a stream open on the URL indicated by the first argument;
  * if a second argument is present and is non-nil, open it for reading. At
@@ -228,28 +338,38 @@ lisp_close( struct stack_frame *frame, struct cons_pointer frame_pointer,
  * on my stream, if any, else NIL.
  */
 struct cons_pointer
-lisp_open( struct stack_frame *frame, struct cons_pointer frame_pointer,
-           struct cons_pointer env ) {
-    struct cons_pointer result = NIL;
+  lisp_open( struct stack_frame *frame, struct cons_pointer frame_pointer,
+            struct cons_pointer env ) {
+  struct cons_pointer result = NIL;
 
-    if ( stringp( frame->arg[0] ) ) {
-        char *url = lisp_string_to_c_string( frame->arg[0] );
+  if ( stringp( frame->arg[0] ) ) {
+    struct cons_pointer meta =
+      make_cons( make_cons(
+        c_string_to_lisp_keyword( L"url" ),
+        frame->arg[0] ),
+                NIL );
 
-        if ( nilp( frame->arg[1] ) ) {
-            result = make_read_stream( url_fopen( url, "r" ) );
-        } else {
-            // TODO: anything more complex is a problem for another day.
-            result = make_write_stream( url_fopen( url, "w" ) );
-        }
+    char *url = lisp_string_to_c_string( frame->arg[0] );
 
-        free( url );
-
-        if ( pointer2cell( result ).payload.stream.stream == NULL ) {
-            result = NIL;
-        }
+    if ( nilp( frame->arg[1] ) ) {
+      URL_FILE *stream = url_fopen( url, "r" );
+      result = make_read_stream( stream, meta );
+    } else {
+      // TODO: anything more complex is a problem for another day.
+      URL_FILE *stream = url_fopen( url, "w" );
+      result = make_write_stream( stream, meta);
     }
 
-    return result;
+    free( url );
+
+    if ( pointer2cell( result ).payload.stream.stream == NULL ) {
+      result = NIL;
+    } else {
+      collect_meta( result, frame->arg[0]);
+    }
+  }
+
+  return result;
 }
 
 /**
@@ -272,8 +392,8 @@ lisp_read_char( struct stack_frame *frame, struct cons_pointer frame_pointer,
     if ( readp( frame->arg[0] ) ) {
         result =
             make_string( url_fgetwc
-                         ( pointer2cell( frame->arg[0] ).payload.stream.
-                           stream ), NIL );
+                         ( pointer2cell( frame->arg[0] ).payload.
+                           stream.stream ), NIL );
     }
 
     return result;
diff --git a/src/io/io.h b/src/io/io.h
index d46f8b1..167660b 100644
--- a/src/io/io.h
+++ b/src/io/io.h
@@ -10,6 +10,12 @@
 
 #ifndef __psse_io_h
 #define __psse_io_h
+#include <curl/curl.h>
+#include "consspaceobject.h"
+
+extern CURLSH *io_share;
+
+int io_init();
 
 URL_FILE *file_to_url_file( FILE * f );
 wint_t url_fgetwc( URL_FILE * input );
diff --git a/src/memory/conspage.c b/src/memory/conspage.c
index 54d14e9..5f8c3a8 100644
--- a/src/memory/conspage.c
+++ b/src/memory/conspage.c
@@ -152,7 +152,7 @@ void free_cell( struct cons_pointer pointer ) {
                     dec_ref( cell->payload.exception.frame );
                     break;
                 case FUNCTIONTV:
-                    dec_ref( cell->payload.function.source );
+                    dec_ref( cell->payload.function.meta );
                     break;
                 case INTEGERTV:
                     dec_ref( cell->payload.integer.more );
@@ -168,10 +168,11 @@ void free_cell( struct cons_pointer pointer ) {
                     break;
                 case READTV:
                 case WRITETV:
-                    url_fclose( cell->payload.stream.stream);
+                    dec_ref(cell->payload.stream.meta);
+                    url_fclose( cell->payload.stream.stream );
                     break;
                 case SPECIALTV:
-                    dec_ref( cell->payload.special.source );
+                    dec_ref( cell->payload.special.meta );
                     break;
                 case STRINGTV:
                 case SYMBOLTV:
diff --git a/src/memory/conspage.h b/src/memory/conspage.h
index fa11da9..f13a46b 100644
--- a/src/memory/conspage.h
+++ b/src/memory/conspage.h
@@ -1,7 +1,19 @@
-#include "consspaceobject.h"
+/*
+ * conspage.h
+ *
+ * Setup and tear down cons pages, and (FOR NOW) do primitive
+ * allocation/deallocation of cells.
+ * NOTE THAT before we go multi-threaded, these functions must be
+ * aggressively
+ * thread safe.
+ *
+ * (c) 2017 Simon Brooke <simon@journeyman.cc>
+ * Licensed under GPL version 2.0, or, at your option, any later version.
+ */
+#ifndef __psse_conspage_h
+#define __psse_conspage_h
 
-#ifndef __conspage_h
-#define __conspage_h
+#include "consspaceobject.h"
 
 /**
  * the number of cons cells on a cons page. The maximum value this can
diff --git a/src/memory/consspaceobject.c b/src/memory/consspaceobject.c
index 9edbf66..f7b5ca9 100644
--- a/src/memory/consspaceobject.c
+++ b/src/memory/consspaceobject.c
@@ -21,6 +21,7 @@
 #include "conspage.h"
 #include "consspaceobject.h"
 #include "debug.h"
+#include "intern.h"
 #include "print.h"
 #include "stack.h"
 
@@ -65,6 +66,48 @@ void dec_ref( struct cons_pointer pointer ) {
 }
 
 
+/**
+ * Get the Lisp type of the single argument.
+ * @param pointer a pointer to the object whose type is requested.
+ * @return As a Lisp string, the tag of the object which is at that pointer.
+ */
+struct cons_pointer c_type( struct cons_pointer pointer ) {
+    struct cons_pointer result = NIL;
+    struct cons_space_object cell = pointer2cell( pointer );
+
+    for ( int i = TAGLENGTH - 1; i >= 0; i-- ) {
+        result = make_string( ( wchar_t ) cell.tag.bytes[i], result );
+    }
+
+    return result;
+}
+
+/**
+ * Implementation of car in C. If arg is not a cons, does not error but returns nil.
+ */
+struct cons_pointer c_car( struct cons_pointer arg ) {
+    struct cons_pointer result = NIL;
+
+    if ( consp( arg ) ) {
+        result = pointer2cell( arg ).payload.cons.car;
+    }
+
+    return result;
+}
+
+/**
+ * Implementation of cdr in C. If arg is not a cons, does not error but returns nil.
+ */
+struct cons_pointer c_cdr( struct cons_pointer arg ) {
+    struct cons_pointer result = NIL;
+
+    if ( consp( arg ) || stringp( arg ) || symbolp( arg ) ) {
+        result = pointer2cell( arg ).payload.cons.cdr;
+    }
+
+    return result;
+}
+
 /**
  * Construct a cons cell from this pair of pointers.
  */
@@ -107,16 +150,17 @@ struct cons_pointer make_exception( struct cons_pointer message,
 
 
 /**
- * Construct a cell which points to an executable Lisp special form.
+ * Construct a cell which points to an executable Lisp function.
  */
 struct cons_pointer
-make_function( struct cons_pointer src, struct cons_pointer ( *executable )
+make_function( struct cons_pointer meta, struct cons_pointer ( *executable )
                 ( struct stack_frame *,
                   struct cons_pointer, struct cons_pointer ) ) {
     struct cons_pointer pointer = allocate_cell( FUNCTIONTAG );
     struct cons_space_object *cell = &pointer2cell( pointer );
+    inc_ref( meta);
 
-    cell->payload.function.source = src;
+    cell->payload.function.meta = meta;
     cell->payload.function.executable = executable;
 
     return pointer;
@@ -203,27 +247,42 @@ struct cons_pointer make_string( wint_t c, struct cons_pointer tail ) {
 }
 
 /**
- * Construct a symbol from the character `c` and this `tail`. A symbol is
- * internally identical to a string except for having a different tag.
+ * Construct a symbol or keyword from the character `c` and this `tail`.
+ * Each is internally identical to a string except for having a different tag.
  *
  * @param c the character to add (prepend);
  * @param tail the symbol which is being built.
+ * @param tag the tag to use: expected to be "SYMB" or "KEYW"
  */
-struct cons_pointer make_symbol( wint_t c, struct cons_pointer tail ) {
-    return make_string_like_thing( c, tail, SYMBOLTAG );
+struct cons_pointer make_symbol_or_key( wint_t c, struct cons_pointer tail,
+                                        char *tag ) {
+    struct cons_pointer result = make_string_like_thing( c, tail, tag );
+
+    if ( strncmp( tag, KEYTAG, 4 ) == 0 ) {
+        struct cons_pointer r = internedp( result, oblist );
+
+      if ( nilp(r)) {
+        intern(result, oblist);
+      } else {
+        result = r;
+      }
+    }
+
+    return result;
 }
 
 /**
  * Construct a cell which points to an executable Lisp special form.
  */
 struct cons_pointer
-make_special( struct cons_pointer src, struct cons_pointer ( *executable )
+make_special( struct cons_pointer meta, struct cons_pointer ( *executable )
                ( struct stack_frame * frame,
                  struct cons_pointer, struct cons_pointer env ) ) {
     struct cons_pointer pointer = allocate_cell( SPECIALTAG );
     struct cons_space_object *cell = &pointer2cell( pointer );
+    inc_ref( meta);
 
-    cell->payload.special.source = src;
+    cell->payload.special.meta = meta;
     cell->payload.special.executable = executable;
 
     return pointer;
@@ -232,12 +291,16 @@ make_special( struct cons_pointer src, struct cons_pointer ( *executable )
 /**
  * Construct a cell which points to a stream open for reading.
  * @param input the C stream to wrap.
+ * @param metadata a pointer to an associaton containing metadata on the stream.
+ * @return a pointer to the new read stream.
  */
-struct cons_pointer make_read_stream( URL_FILE * input ) {
+struct cons_pointer make_read_stream( URL_FILE * input,
+                                      struct cons_pointer metadata ) {
     struct cons_pointer pointer = allocate_cell( READTAG );
     struct cons_space_object *cell = &pointer2cell( pointer );
 
     cell->payload.stream.stream = input;
+    cell->payload.stream.meta = metadata;
 
     return pointer;
 }
@@ -245,16 +308,33 @@ struct cons_pointer make_read_stream( URL_FILE * input ) {
 /**
  * Construct a cell which points to a stream open for writing.
  * @param output the C stream to wrap.
+ * @param metadata a pointer to an associaton containing metadata on the stream.
+ * @return a pointer to the new read stream.
  */
-struct cons_pointer make_write_stream( URL_FILE * output ) {
+struct cons_pointer make_write_stream( URL_FILE * output,
+                                       struct cons_pointer metadata ) {
     struct cons_pointer pointer = allocate_cell( WRITETAG );
     struct cons_space_object *cell = &pointer2cell( pointer );
 
     cell->payload.stream.stream = output;
+    cell->payload.stream.meta = metadata;
 
     return pointer;
 }
 
+/**
+ * Return a lisp keyword representation of this wide character string.
+ */
+struct cons_pointer c_string_to_lisp_keyword( wchar_t *symbol ) {
+    struct cons_pointer result = NIL;
+
+    for ( int i = wcslen( symbol ); i > 0; i-- ) {
+        result = make_keyword( symbol[i - 1], result );
+    }
+
+    return result;
+}
+
 /**
  * Return a lisp string representation of this wide character string.
  */
diff --git a/src/memory/consspaceobject.h b/src/memory/consspaceobject.h
index 6230e64..1bbbcd1 100644
--- a/src/memory/consspaceobject.h
+++ b/src/memory/consspaceobject.h
@@ -8,6 +8,9 @@
  *  Licensed under GPL version 2.0, or, at your option, any later version.
  */
 
+#ifndef __psse_consspaceobject_h
+#define __psse_consspaceobject_h
+
 #include <stdbool.h>
 #include <stdint.h>
 #include <stdio.h>
@@ -19,8 +22,6 @@
 
 #include "fopen.h"
 
-#ifndef __consspaceobject_h
-#define __consspaceobject_h
 
 /**
  * The length of a tag, in bytes.
@@ -39,6 +40,7 @@
 
 /**
  * The string `CONS`, considered as an `unsigned int`.
+ * @todo tag values should be collected into an enum.
  */
 #define CONSTV      1397641027
 
@@ -85,6 +87,16 @@
  */
 #define INTEGERTV   1381256777
 
+/**
+ * A keyword - an interned, self-evaluating string.
+ */
+#define KEYTAG	    "KEYW"
+
+/**
+ * The string `KEYW`, considered as an `unsigned int`.
+ */
+#define KEYTV       1465468235
+
 /**
  * A lambda cell. Lambdas are the interpretable (source) versions of functions.
  * \see FUNCTIONTAG.
@@ -258,6 +270,11 @@
  */
 #define functionp(conspoint) (check_tag(conspoint,FUNCTIONTAG))
 
+/**
+ * true if `conspoint` points to a keyword, else false
+ */
+#define keywordp(conspoint) (check_tag(conspoint,KEYTAG))
+
 /**
  * true if `conspoint` points to a special Lambda cell, else false
  */
@@ -320,6 +337,8 @@
  */
 #define writep(conspoint) (check_tag(conspoint,WRITETAG))
 
+#define streamp(conspoint) (check_tag(conspoint,READTAG)||check_tag(conspoint,WRITETAG))
+
 /**
  * true if `conspoint` points to a true cell, else false
  * (there should only be one of these so it's slightly redundant).
@@ -397,10 +416,9 @@ struct exception_payload {
  */
 struct function_payload {
     /**
-     * pointer to the source from which the function was compiled, or NIL
-     * if it is a primitive.
+     * pointer to metadata (e.g. the source from which the function was compiled).
      */
-    struct cons_pointer source;
+    struct cons_pointer meta;
     /**  pointer to a function which takes a cons pointer (representing
      * its argument list) and a cons pointer (representing its environment) and a
      * stack frame (representing the previous stack frame) as arguments and returns
@@ -475,7 +493,7 @@ struct special_payload {
      * pointer to the source from which the special form was compiled, or NIL
      * if it is a primitive.
      */
-    struct cons_pointer source;
+    struct cons_pointer meta;
     /**  pointer to a function which takes a cons pointer (representing
      * its argument list) and a cons pointer (representing its environment) and a
      * stack frame (representing the previous stack frame) as arguments and returns
@@ -500,8 +518,9 @@ struct stream_payload {
 /**
  * payload of a string cell. At least at first, only one UTF character will
  * be stored in each cell. The doctrine that 'a symbol is just a string'
- * didn't work; however, the payload of a symbol cell is identical to the
- * payload of a string cell.
+ * didn't work; however, the payload of a symbol or keyword cell is identical
+ * to the payload of a string cell, except that a keyword may store a hash
+ * of its own value in the padding.
  */
 struct string_payload {
     /** the actual character stored in this cell */
@@ -614,6 +633,12 @@ void inc_ref( struct cons_pointer pointer );
 
 void dec_ref( struct cons_pointer pointer );
 
+struct cons_pointer c_type( struct cons_pointer pointer );
+
+struct cons_pointer c_car( struct cons_pointer arg );
+
+struct cons_pointer c_cdr( struct cons_pointer arg );
+
 struct cons_pointer make_cons( struct cons_pointer car,
                                struct cons_pointer cdr );
 
@@ -626,6 +651,8 @@ struct cons_pointer make_function( struct cons_pointer src,
                                       struct cons_pointer,
                                       struct cons_pointer ) );
 
+struct cons_pointer c_string_to_lisp_keyword( wchar_t *symbol );
+
 struct cons_pointer make_lambda( struct cons_pointer args,
                                  struct cons_pointer body );
 
@@ -640,11 +667,18 @@ struct cons_pointer make_special( struct cons_pointer src,
 
 struct cons_pointer make_string( wint_t c, struct cons_pointer tail );
 
-struct cons_pointer make_symbol( wint_t c, struct cons_pointer tail );
+struct cons_pointer make_symbol_or_key( wint_t c, struct cons_pointer tail,
+                                        char *tag );
 
-struct cons_pointer make_read_stream( URL_FILE * input );
+#define make_symbol(c, t) (make_symbol_or_key( c, t, SYMBOLTAG))
 
-struct cons_pointer make_write_stream( URL_FILE * output );
+#define make_keyword(c, t) (make_symbol_or_key( c, t, KEYTAG))
+
+struct cons_pointer make_read_stream( URL_FILE * input,
+                                      struct cons_pointer metadata );
+
+struct cons_pointer make_write_stream( URL_FILE * output,
+                                       struct cons_pointer metadata );
 
 struct cons_pointer c_string_to_lisp_string( wchar_t *string );
 
diff --git a/src/memory/dump.c b/src/memory/dump.c
index e99d306..7f7701f 100644
--- a/src/memory/dump.c
+++ b/src/memory/dump.c
@@ -108,13 +108,15 @@ void dump_object( URL_FILE * output, struct cons_pointer pointer ) {
         case RATIOTV:
             url_fwprintf( output,
                           L"\t\tRational cell: value %ld/%ld, count %u\n",
-                          pointer2cell( cell.payload.ratio.dividend ).
-                          payload.integer.value,
-                          pointer2cell( cell.payload.ratio.divisor ).
-                          payload.integer.value, cell.count );
+                          pointer2cell( cell.payload.ratio.dividend ).payload.
+                          integer.value,
+                          pointer2cell( cell.payload.ratio.divisor ).payload.
+                          integer.value, cell.count );
             break;
         case READTV:
-            url_fwprintf( output, L"\t\tInput stream\n" );
+            url_fputws(  L"\t\tInput stream; metadata: ", output );
+            print(output, cell.payload.stream.meta);
+            url_fputws( L"\n", output );
             break;
         case REALTV:
             url_fwprintf( output, L"\t\tReal cell: value %Lf, count %u\n",
@@ -148,7 +150,9 @@ void dump_object( URL_FILE * output, struct cons_pointer pointer ) {
             }
             break;
         case WRITETV:
-            url_fwprintf( output, L"\t\tOutput stream\n" );
+            url_fputws(  L"\t\tOutput stream; metadata: ", output );
+            print(output, cell.payload.stream.meta);
+            url_fputws( L"\n", output );
             break;
     }
 }
diff --git a/src/ops/equal.c b/src/ops/equal.c
index 2775218..c4d7f54 100644
--- a/src/ops/equal.c
+++ b/src/ops/equal.c
@@ -67,6 +67,7 @@ bool equal( struct cons_pointer a, struct cons_pointer b ) {
                     && equal( cell_a->payload.cons.cdr,
                               cell_b->payload.cons.cdr );
                 break;
+            case KEYTV:
             case STRINGTV:
             case SYMBOLTV:
                 /*
@@ -80,8 +81,8 @@ bool equal( struct cons_pointer a, struct cons_pointer b ) {
                     && ( equal( cell_a->payload.string.cdr,
                                 cell_b->payload.string.cdr )
                          || ( end_of_string( cell_a->payload.string.cdr )
-                              && end_of_string( cell_b->payload.
-                                                string.cdr ) ) );
+                              && end_of_string( cell_b->payload.string.
+                                                cdr ) ) );
                 break;
             case INTEGERTV:
                 result =
diff --git a/src/ops/lispops.c b/src/ops/lispops.c
index 1220835..91ec2cf 100644
--- a/src/ops/lispops.c
+++ b/src/ops/lispops.c
@@ -47,32 +47,6 @@
  * and others I haven't thought of yet.
  */
 
-/**
- * Implementation of car in C. If arg is not a cons, does not error but returns nil.
- */
-struct cons_pointer c_car( struct cons_pointer arg ) {
-    struct cons_pointer result = NIL;
-
-    if ( consp( arg ) ) {
-        result = pointer2cell( arg ).payload.cons.car;
-    }
-
-    return result;
-}
-
-/**
- * Implementation of cdr in C. If arg is not a cons, does not error but returns nil.
- */
-struct cons_pointer c_cdr( struct cons_pointer arg ) {
-    struct cons_pointer result = NIL;
-
-    if ( consp( arg ) || stringp( arg ) || symbolp( arg ) ) {
-        result = pointer2cell( arg ).payload.cons.cdr;
-    }
-
-    return result;
-}
-
 
 /**
  * Useful building block; evaluate this single form in the context of this
@@ -378,9 +352,10 @@ c_apply( struct stack_frame *frame, struct cons_pointer frame_pointer,
                         result = next_pointer;
                     } else {
                         result =
-                            ( *fn_cell.payload.special.
-                              executable ) ( get_stack_frame( next_pointer ),
-                                             next_pointer, env );
+                            ( *fn_cell.payload.
+                              special.executable ) ( get_stack_frame
+                                                     ( next_pointer ),
+                                                     next_pointer, env );
                         debug_print( L"Special form returning: ", DEBUG_EVAL );
                         debug_print_object( result, DEBUG_EVAL );
                         debug_println( DEBUG_EVAL );
@@ -411,24 +386,6 @@ c_apply( struct stack_frame *frame, struct cons_pointer frame_pointer,
     return result;
 }
 
-
-/**
- * Get the Lisp type of the single argument.
- * @param pointer a pointer to the object whose type is requested.
- * @return As a Lisp string, the tag of the object which is at that pointer.
- */
-struct cons_pointer c_type( struct cons_pointer pointer ) {
-    struct cons_pointer result = NIL;
-    struct cons_space_object cell = pointer2cell( pointer );
-
-    for ( int i = TAGLENGTH - 1; i >= 0; i-- ) {
-        result = make_string( ( wchar_t ) cell.tag.bytes[i], result );
-    }
-
-    return result;
-}
-
-
 /**
  * Function; evaluate the expression which is the first argument in the frame;
  * further arguments are ignored.
@@ -885,7 +842,7 @@ struct cons_pointer c_reverse( struct cons_pointer arg ) {
                 result = make_string( o.payload.string.character, result );
                 break;
             case SYMBOLTV:
-                result = make_symbol( o.payload.string.character, result );
+                result = make_symbol_or_key( o.payload.string.character, result, SYMBOLTAG );
                 break;
         }
     }
@@ -1251,13 +1208,13 @@ struct cons_pointer lisp_source( struct stack_frame *frame,
                                  struct cons_pointer env ) {
     struct cons_pointer result = NIL;
     struct cons_space_object cell = pointer2cell( frame->arg[0] );
-
+    struct cons_pointer source_key = c_string_to_lisp_keyword(L"source");
     switch ( cell.tag.value ) {
         case FUNCTIONTV:
-            result = cell.payload.function.source;
+            result = c_assoc( source_key, cell.payload.function.meta);
             break;
         case SPECIALTV:
-            result = cell.payload.special.source;
+            result = c_assoc( source_key, cell.payload.special.meta);
             break;
         case LAMBDATV:
             result = make_cons( c_string_to_lisp_symbol( L"lambda" ),
diff --git a/src/ops/lispops.h b/src/ops/lispops.h
index 1aff486..ea8a883 100644
--- a/src/ops/lispops.h
+++ b/src/ops/lispops.h
@@ -19,26 +19,13 @@
  * Licensed under GPL version 2.0, or, at your option, any later version.
  */
 
+#ifndef __psse_lispops_h
+#define __psse_lispops_h
+
 /*
  * utilities
  */
 
-/**
- * Get the Lisp type of the single argument.
- * @param pointer a pointer to the object whose type is requested.
- * @return As a Lisp string, the tag of the object which is at that pointer.
- */
-struct cons_pointer c_type( struct cons_pointer pointer );
-
-/**
- * Implementation of car in C. If arg is not a cons, does not error but returns nil.
- */
-struct cons_pointer c_car( struct cons_pointer arg );
-
-/**
- * Implementation of cdr in C. If arg is not a cons, does not error but returns nil.
- */
-struct cons_pointer c_cdr( struct cons_pointer arg );
 
 struct cons_pointer c_reverse( struct cons_pointer arg );
 
@@ -205,3 +192,5 @@ struct cons_pointer lisp_source( struct stack_frame *frame,
 struct cons_pointer lisp_inspect( struct stack_frame *frame,
                                   struct cons_pointer frame_pointer,
                                   struct cons_pointer env );
+
+#endif
diff --git a/src/ops/meta.c b/src/ops/meta.c
new file mode 100644
index 0000000..5e48709
--- /dev/null
+++ b/src/ops/meta.c
@@ -0,0 +1,47 @@
+/*
+ * meta.c
+ *
+ * Get metadata from a cell which has it.
+ *
+ * (c) 2019 Simon Brooke <simon@journeyman.cc>
+ * Licensed under GPL version 2.0, or, at your option, any later version.
+ */
+
+#include "conspage.h"
+#include "debug.h"
+
+/**
+ * Function: get metadata describing my first argument.
+ *
+ * * (metadata any)
+ *
+ * @return a pointer to the metadata of my first argument, or nil if none.
+ */
+struct cons_pointer lisp_metadata( struct stack_frame *frame, struct cons_pointer frame_pointer,
+                                  struct cons_pointer env ) {
+  debug_print(L"lisp_metadata: entered\n", DEBUG_EVAL);
+  debug_dump_object(frame->arg[0], DEBUG_EVAL);
+  struct cons_pointer result = NIL;
+  struct cons_space_object cell = pointer2cell(frame->arg[0]);
+
+  switch( cell.tag.value) {
+    case FUNCTIONTV:
+    result = cell.payload.function.meta;
+    break;
+    case SPECIALTV:
+    result = cell.payload.special.meta;
+    break;
+    case READTV:
+    case WRITETV:
+    result = cell.payload.special.meta;
+    break;
+  }
+
+  return make_cons(
+    make_cons(
+      c_string_to_lisp_keyword( L"type"),
+      c_type(frame->arg[0])),
+    result);
+
+//  return result;
+}
diff --git a/src/ops/meta.h b/src/ops/meta.h
new file mode 100644
index 0000000..2c6ccf2
--- /dev/null
+++ b/src/ops/meta.h
@@ -0,0 +1,17 @@
+/*
+ * meta.h
+ *
+ * Get metadata from a cell which has it.
+ *
+ * (c) 2019 Simon Brooke <simon@journeyman.cc>
+ * Licensed under GPL version 2.0, or, at your option, any later version.
+ */
+
+#ifndef __psse_meta_h
+#define __psse_meta_h
+
+
+struct cons_pointer lisp_metadata( struct stack_frame *frame, struct cons_pointer frame_pointer,
+                                  struct cons_pointer env ) ;
+
+#endif
diff --git a/src/ops/print.c b/src/ops/print.c
index 8cb137e..e13f17a 100644
--- a/src/ops/print.c
+++ b/src/ops/print.c
@@ -35,7 +35,7 @@ int print_use_colours = 0;
  * don't print anything but just return.
  */
 void print_string_contents( URL_FILE * output, struct cons_pointer pointer ) {
-    while ( stringp( pointer ) || symbolp( pointer ) ) {
+    while ( stringp( pointer ) || symbolp( pointer ) || keywordp(pointer)) {
         struct cons_space_object *cell = &pointer2cell( pointer );
         wchar_t c = cell->payload.string.character;
 
@@ -134,6 +134,13 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
                 dec_ref( s );
             }
             break;
+        case KEYTV:
+            if ( print_use_colours ) {
+                url_fputws( L"\x1B[1;33m", output );
+            }
+            url_fputws( L":", output );
+            print_string_contents( output, pointer );
+            break;
         case LAMBDATV:{
                 struct cons_pointer to_print =
                     make_cons( c_string_to_lisp_symbol( L"lambda" ),
diff --git a/src/ops/read.c b/src/ops/read.c
index 69899c0..7362ecb 100644
--- a/src/ops/read.c
+++ b/src/ops/read.c
@@ -45,7 +45,8 @@ struct cons_pointer read_list( struct stack_frame *frame,
                                struct cons_pointer frame_pointer,
                                URL_FILE * input, wint_t initial );
 struct cons_pointer read_string( URL_FILE * input, wint_t initial );
-struct cons_pointer read_symbol( URL_FILE * input, wint_t initial );
+struct cons_pointer read_symbol_or_key( URL_FILE * input, char *tag,
+                                        wint_t initial );
 
 /**
  * quote reader macro in C (!)
@@ -110,7 +111,7 @@ struct cons_pointer read_continuation( struct stack_frame *frame,
                             read_number( frame, frame_pointer, input, c,
                                          false );
                     } else {
-                        result = read_symbol( input, c );
+                        result = read_symbol_or_key( input, SYMBOLTAG, c );
                     }
                 }
                 break;
@@ -129,17 +130,20 @@ struct cons_pointer read_continuation( struct stack_frame *frame,
                             read_continuation( frame, frame_pointer, input,
                                                url_fgetwc( input ) );
                     } else {
-                        read_symbol( input, c );
+                        read_symbol_or_key( input, SYMBOLTAG, c );
                     }
                 }
                 break;
-                //case ':': reserved for keywords and paths
+            case ':':
+                result =
+                    read_symbol_or_key( input, KEYTAG, url_fgetwc( input ) );
+                break;
             default:
                 if ( iswdigit( c ) ) {
                     result =
                         read_number( frame, frame_pointer, input, c, false );
                 } else if ( iswprint( c ) ) {
-                    result = read_symbol( input, c );
+                    result = read_symbol_or_key( input, SYMBOLTAG, c );
                 } else {
                     result =
                         throw_exception( make_cons( c_string_to_lisp_string
@@ -321,24 +325,22 @@ struct cons_pointer read_string( URL_FILE * input, wint_t initial ) {
     return result;
 }
 
-struct cons_pointer read_symbol( URL_FILE * input, wint_t initial ) {
+struct cons_pointer read_symbol_or_key( URL_FILE * input, char *tag,
+                                        wint_t initial ) {
     struct cons_pointer cdr = NIL;
     struct cons_pointer result;
     switch ( initial ) {
         case '\0':
-            result = make_symbol( initial, NIL );
+            result = make_symbol_or_key( initial, NIL, tag );
             break;
         case '"':
-            /*
-             * THIS IS NOT A GOOD IDEA, but is legal
-             */
-            result =
-                make_symbol( initial,
-                             read_symbol( input, url_fgetwc( input ) ) );
-            break;
+        case '\'':
+            /* unwise to allow embedded quotation marks in symbols */
         case ')':
+        case ':':
             /*
-             * symbols may not include right-parenthesis;
+             * symbols and keywords may not include right-parenthesis
+             * or colons.
              */
             result = NIL;
             /*
@@ -350,8 +352,11 @@ struct cons_pointer read_symbol( URL_FILE * input, wint_t initial ) {
             if ( iswprint( initial )
                  && !iswblank( initial ) ) {
                 result =
-                    make_symbol( initial,
-                                 read_symbol( input, url_fgetwc( input ) ) );
+                    make_symbol_or_key( initial,
+                                        read_symbol_or_key( input,
+                                                            tag,
+                                                            url_fgetwc( input ) ),
+                                        tag );
             } else {
                 result = NIL;
                 /*
@@ -362,7 +367,7 @@ struct cons_pointer read_symbol( URL_FILE * input, wint_t initial ) {
             break;
     }
 
-    debug_print( L"read_symbol returning\n", DEBUG_IO );
+    debug_print( L"read_symbol_or_key returning\n", DEBUG_IO );
     debug_dump_object( result, DEBUG_IO );
 
     return result;

From f9bcac10e7765edfad479276b549a11783612207 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Tue, 29 Jan 2019 22:36:20 +0000
Subject: [PATCH 12/31] Fixed, working.

---
 src/init.c                   |  36 ++++----
 src/io/fopen.c               |   2 +-
 src/io/io.c                  | 170 ++++++++++++++++++-----------------
 src/io/io.h                  |   2 +-
 src/{ops => io}/print.c      |   2 +-
 src/{ops => io}/print.h      |   0
 src/{ops => io}/read.c       |   4 +-
 src/{ops => io}/read.h       |   0
 src/memory/conspage.c        |   2 +-
 src/memory/consspaceobject.c |  14 +--
 src/memory/dump.c            |  16 ++--
 src/ops/lispops.c            |  17 ++--
 src/ops/meta.c               |  44 +++++----
 src/ops/meta.h               |   5 +-
 14 files changed, 159 insertions(+), 155 deletions(-)
 rename src/{ops => io}/print.c (99%)
 rename src/{ops => io}/print.h (100%)
 rename src/{ops => io}/read.c (99%)
 rename src/{ops => io}/read.h (100%)

diff --git a/src/init.c b/src/init.c
index 6cceadd..47ba772 100644
--- a/src/init.c
+++ b/src/init.c
@@ -41,17 +41,16 @@
  * more readable and aid debugging generally.
  */
 void bind_function( wchar_t *name, struct cons_pointer ( *executable )
-                   ( struct stack_frame *,
-                    struct cons_pointer, struct cons_pointer ) ) {
-  struct cons_pointer n = c_string_to_lisp_symbol( name );
-  struct cons_pointer meta = make_cons(
-    make_cons(c_string_to_lisp_keyword(L"primitive"), TRUE),
-              make_cons( make_cons(
-                c_string_to_lisp_keyword(L"name"),
-                n),
-              NIL));
+                     ( struct stack_frame *,
+                       struct cons_pointer, struct cons_pointer ) ) {
+    struct cons_pointer n = c_string_to_lisp_symbol( name );
+    struct cons_pointer meta =
+        make_cons( make_cons( c_string_to_lisp_keyword( L"primitive" ), TRUE ),
+                   make_cons( make_cons( c_string_to_lisp_keyword( L"name" ),
+                                         n ),
+                              NIL ) );
 
-  deep_bind( n, make_function( meta, executable ) );
+    deep_bind( n, make_function( meta, executable ) );
 }
 
 /**
@@ -62,12 +61,11 @@ void bind_special( wchar_t *name, struct cons_pointer ( *executable )
                     ( struct stack_frame *,
                       struct cons_pointer, struct cons_pointer ) ) {
     struct cons_pointer n = c_string_to_lisp_symbol( name );
-    struct cons_pointer meta = make_cons(
-      make_cons(c_string_to_lisp_keyword(L"primitive"), TRUE),
-                make_cons( make_cons(
-                  c_string_to_lisp_keyword(L"name"),
-                  n),
-                NIL));
+    struct cons_pointer meta =
+        make_cons( make_cons( c_string_to_lisp_keyword( L"primitive" ), TRUE ),
+                   make_cons( make_cons( c_string_to_lisp_keyword( L"name" ),
+                                         n ),
+                              NIL ) );
 
     deep_bind( n, make_special( NIL, executable ) );
 }
@@ -94,9 +92,9 @@ int main( int argc, char *argv[] ) {
     bool show_prompt = false;
 
     setlocale( LC_ALL, "" );
-    if (io_init() != 0) {
-      fputs("Failed to initialise I/O subsystem\n", stderr);
-      exit(1);
+    if ( io_init(  ) != 0 ) {
+        fputs( "Failed to initialise I/O subsystem\n", stderr );
+        exit( 1 );
     }
 
     while ( ( option = getopt( argc, argv, "cpdv:" ) ) != -1 ) {
diff --git a/src/io/fopen.c b/src/io/fopen.c
index 50c09b5..d5e4cd6 100644
--- a/src/io/fopen.c
+++ b/src/io/fopen.c
@@ -223,7 +223,7 @@ URL_FILE *url_fopen( const char *url, const char *operation ) {
         curl_easy_setopt( file->handle.curl, CURLOPT_WRITEFUNCTION,
                           write_callback );
         /* use the share object */
-        curl_easy_setopt(file->handle.curl, CURLOPT_SHARE, io_share);
+        curl_easy_setopt( file->handle.curl, CURLOPT_SHARE, io_share );
 
 
         if ( !multi_handle )
diff --git a/src/io/io.c b/src/io/io.c
index 3d9eb36..82a6b32 100644
--- a/src/io/io.c
+++ b/src/io/io.c
@@ -44,22 +44,23 @@ wint_t ungotten = 0;
  *
  * @return 0 on success; any other value means failure.
  */
-int io_init() {
-  CURL *curl;
-  CURLcode res;
-  int result = curl_global_init( CURL_GLOBAL_SSL );
+int io_init(  ) {
+    CURL *curl;
+    CURLcode res;
+    int result = curl_global_init( CURL_GLOBAL_SSL );
 
-  io_share = curl_share_init();
+    io_share = curl_share_init(  );
 
-  if (result == 0) {
-      curl_share_setopt(io_share, CURLSHOPT_SHARE, CURL_LOCK_DATA_CONNECT);
-      curl_share_setopt(io_share, CURLSHOPT_SHARE, CURL_LOCK_DATA_COOKIE );
-      curl_share_setopt(io_share, CURLSHOPT_SHARE, CURL_LOCK_DATA_DNS );
-      curl_share_setopt(io_share, CURLSHOPT_SHARE, CURL_LOCK_DATA_SSL_SESSION );
-      curl_share_setopt(io_share, CURLSHOPT_SHARE, CURL_LOCK_DATA_PSL );
-  }
+    if ( result == 0 ) {
+        curl_share_setopt( io_share, CURLSHOPT_SHARE, CURL_LOCK_DATA_CONNECT );
+        curl_share_setopt( io_share, CURLSHOPT_SHARE, CURL_LOCK_DATA_COOKIE );
+        curl_share_setopt( io_share, CURLSHOPT_SHARE, CURL_LOCK_DATA_DNS );
+        curl_share_setopt( io_share, CURLSHOPT_SHARE,
+                           CURL_LOCK_DATA_SSL_SESSION );
+        curl_share_setopt( io_share, CURLSHOPT_SHARE, CURL_LOCK_DATA_PSL );
+    }
 
-  return result;
+    return result;
 }
 
 /**
@@ -243,67 +244,72 @@ lisp_close( struct stack_frame *frame, struct cons_pointer frame_pointer,
     return result;
 }
 
-int index_of( char c, char * s) {
-  int i;
+int index_of( char c, char *s ) {
+    int i;
 
-  for (i = 0; s[i] != c && s[i] != 0; i++);
+    for ( i = 0; s[i] != c && s[i] != 0; i++ );
 
-  return s[i] == c ? i : -1;
+    return s[i] == c ? i : -1;
 }
 
-char * trim(char *s) {
-  int i;
+char *trim( char *s ) {
+    int i;
 
-  for (i = strlen(s); (isblank(s[i]) || iscntrl(s[i])) && i > -1; i--) {
-    s[i] = (char) 0;
-  }
-  for (i = 0; isblank(s[i]) && s[i] != 0; i++);
+    for ( i = strlen( s ); ( isblank( s[i] ) || iscntrl( s[i] ) ) && i > -1;
+          i-- ) {
+        s[i] = ( char ) 0;
+    }
+    for ( i = 0; isblank( s[i] ) && s[i] != 0; i++ );
 
-  return (char *)&s[i];
+    return ( char * ) &s[i];
 }
 
 /**
  * Callback to assemble metadata for a URL stream. This is naughty because
  * it modifies data, but it's really the only way to create metadata.
  */
-static size_t write_meta_callback(void *ptr, size_t size, size_t nmemb, struct cons_pointer stream)
-{
-  struct cons_space_object * cell = &pointer2cell(stream);
+static size_t write_meta_callback( void *ptr, size_t size, size_t nmemb,
+                                   struct cons_pointer stream ) {
+    struct cons_space_object *cell = &pointer2cell( stream );
 
-  if (strncmp(&cell->tag.bytes[0], READTAG, 4) ||
-      strncmp(&cell->tag.bytes[0], WRITETAG, 4)) {
-    char * s = (char *)ptr;
-    int offset = index_of (':', ptr);
+    if ( strncmp( &cell->tag.bytes[0], READTAG, 4 ) ||
+         strncmp( &cell->tag.bytes[0], WRITETAG, 4 ) ) {
+        char *s = ( char * ) ptr;
+        int offset = index_of( ':', ptr );
 
-    if (offset != -1) {
-      s[offset] = (char)0;
-      char * name = s;
-      char * value = trim( &s[++offset]);
-      wchar_t * wname = calloc(strlen(name), sizeof(wchar_t));
-      wchar_t * wvalue = calloc(strlen(value), sizeof(wchar_t));
+        if ( offset != -1 ) {
+            s[offset] = ( char ) 0;
+            char *name = s;
+            char *value = trim( &s[++offset] );
+            wchar_t *wname = calloc( strlen( name ), sizeof( wchar_t ) );
+            wchar_t *wvalue = calloc( strlen( value ), sizeof( wchar_t ) );
 
-      mbstowcs(wname, name, strlen(name));
-      mbstowcs(wvalue, value, strlen(value));
+            mbstowcs( wname, name, strlen( name ) );
+            mbstowcs( wvalue, value, strlen( value ) );
 
-      cell->payload.stream.meta = make_cons(
-        make_cons(
-          c_string_to_lisp_keyword( wname),
-          c_string_to_lisp_string(wvalue)),
-        cell->payload.stream.meta);
+            cell->payload.stream.meta =
+                make_cons( make_cons
+                           ( c_string_to_lisp_keyword( wname ),
+                             c_string_to_lisp_string( wvalue ) ),
+                           cell->payload.stream.meta );
 
-      debug_printf( DEBUG_IO, L"write_meta_callback: added header '%s': value '%s'\n", name, value);
+            debug_printf( DEBUG_IO,
+                          L"write_meta_callback: added header '%s': value '%s'\n",
+                          name, value );
+        }
+    } else {
+        debug_print
+            ( L"Pointer passed to write_meta_callback did not point to a stream: ",
+              DEBUG_IO );
+        debug_dump_object( stream, DEBUG_IO );
     }
-  } else {
-    debug_print( L"Pointer passed to write_meta_callback did not point to a stream: ", DEBUG_IO);
-    debug_dump_object(stream, DEBUG_IO);
-  }
 
-  return nmemb;
+    return nmemb;
 }
 
 
 void collect_meta( struct cons_pointer stream, struct cons_pointer url ) {
-    URL_FILE * s = pointer2cell(stream).payload.stream.stream;
+    URL_FILE *s = pointer2cell( stream ).payload.stream.stream;
 
     switch ( s->type ) {
         case CFTYPE_NONE:
@@ -315,8 +321,9 @@ void collect_meta( struct cons_pointer stream, struct cons_pointer url ) {
         case CFTYPE_CURL:
             curl_easy_setopt( s->handle.curl, CURLOPT_VERBOSE, 1L );
             curl_easy_setopt( s->handle.curl, CURLOPT_HEADER, 1L );
-            curl_easy_setopt( s->handle.curl, CURLOPT_HEADERFUNCTION, write_meta_callback);
-            curl_easy_setopt( s->handle.curl, CURLOPT_HEADERDATA, stream);
+            curl_easy_setopt( s->handle.curl, CURLOPT_HEADERFUNCTION,
+                              write_meta_callback );
+            curl_easy_setopt( s->handle.curl, CURLOPT_HEADERDATA, stream );
             break;
     }
 }
@@ -338,38 +345,37 @@ void collect_meta( struct cons_pointer stream, struct cons_pointer url ) {
  * on my stream, if any, else NIL.
  */
 struct cons_pointer
-  lisp_open( struct stack_frame *frame, struct cons_pointer frame_pointer,
-            struct cons_pointer env ) {
-  struct cons_pointer result = NIL;
+lisp_open( struct stack_frame *frame, struct cons_pointer frame_pointer,
+           struct cons_pointer env ) {
+    struct cons_pointer result = NIL;
 
-  if ( stringp( frame->arg[0] ) ) {
-    struct cons_pointer meta =
-      make_cons( make_cons(
-        c_string_to_lisp_keyword( L"url" ),
-        frame->arg[0] ),
-                NIL );
+    if ( stringp( frame->arg[0] ) ) {
+        struct cons_pointer meta =
+            make_cons( make_cons( c_string_to_lisp_keyword( L"url" ),
+                                  frame->arg[0] ),
+                       NIL );
 
-    char *url = lisp_string_to_c_string( frame->arg[0] );
+        char *url = lisp_string_to_c_string( frame->arg[0] );
 
-    if ( nilp( frame->arg[1] ) ) {
-      URL_FILE *stream = url_fopen( url, "r" );
-      result = make_read_stream( stream, meta );
-    } else {
-      // TODO: anything more complex is a problem for another day.
-      URL_FILE *stream = url_fopen( url, "w" );
-      result = make_write_stream( stream, meta);
+        if ( nilp( frame->arg[1] ) ) {
+            URL_FILE *stream = url_fopen( url, "r" );
+            result = make_read_stream( stream, meta );
+        } else {
+            // TODO: anything more complex is a problem for another day.
+            URL_FILE *stream = url_fopen( url, "w" );
+            result = make_write_stream( stream, meta );
+        }
+
+        free( url );
+
+        if ( pointer2cell( result ).payload.stream.stream == NULL ) {
+            result = NIL;
+        } else {
+            collect_meta( result, frame->arg[0] );
+        }
     }
 
-    free( url );
-
-    if ( pointer2cell( result ).payload.stream.stream == NULL ) {
-      result = NIL;
-    } else {
-      collect_meta( result, frame->arg[0]);
-    }
-  }
-
-  return result;
+    return result;
 }
 
 /**
@@ -392,8 +398,8 @@ lisp_read_char( struct stack_frame *frame, struct cons_pointer frame_pointer,
     if ( readp( frame->arg[0] ) ) {
         result =
             make_string( url_fgetwc
-                         ( pointer2cell( frame->arg[0] ).payload.
-                           stream.stream ), NIL );
+                         ( pointer2cell( frame->arg[0] ).payload.stream.
+                           stream ), NIL );
     }
 
     return result;
diff --git a/src/io/io.h b/src/io/io.h
index 167660b..33f733f 100644
--- a/src/io/io.h
+++ b/src/io/io.h
@@ -15,7 +15,7 @@
 
 extern CURLSH *io_share;
 
-int io_init();
+int io_init(  );
 
 URL_FILE *file_to_url_file( FILE * f );
 wint_t url_fgetwc( URL_FILE * input );
diff --git a/src/ops/print.c b/src/io/print.c
similarity index 99%
rename from src/ops/print.c
rename to src/io/print.c
index e13f17a..854c63a 100644
--- a/src/ops/print.c
+++ b/src/io/print.c
@@ -35,7 +35,7 @@ int print_use_colours = 0;
  * don't print anything but just return.
  */
 void print_string_contents( URL_FILE * output, struct cons_pointer pointer ) {
-    while ( stringp( pointer ) || symbolp( pointer ) || keywordp(pointer)) {
+    while ( stringp( pointer ) || symbolp( pointer ) || keywordp( pointer ) ) {
         struct cons_space_object *cell = &pointer2cell( pointer );
         wchar_t c = cell->payload.string.character;
 
diff --git a/src/ops/print.h b/src/io/print.h
similarity index 100%
rename from src/ops/print.h
rename to src/io/print.h
diff --git a/src/ops/read.c b/src/io/read.c
similarity index 99%
rename from src/ops/read.c
rename to src/io/read.c
index 7362ecb..c49d043 100644
--- a/src/ops/read.c
+++ b/src/io/read.c
@@ -355,8 +355,8 @@ struct cons_pointer read_symbol_or_key( URL_FILE * input, char *tag,
                     make_symbol_or_key( initial,
                                         read_symbol_or_key( input,
                                                             tag,
-                                                            url_fgetwc( input ) ),
-                                        tag );
+                                                            url_fgetwc
+                                                            ( input ) ), tag );
             } else {
                 result = NIL;
                 /*
diff --git a/src/ops/read.h b/src/io/read.h
similarity index 100%
rename from src/ops/read.h
rename to src/io/read.h
diff --git a/src/memory/conspage.c b/src/memory/conspage.c
index 5f8c3a8..2d0958d 100644
--- a/src/memory/conspage.c
+++ b/src/memory/conspage.c
@@ -168,7 +168,7 @@ void free_cell( struct cons_pointer pointer ) {
                     break;
                 case READTV:
                 case WRITETV:
-                    dec_ref(cell->payload.stream.meta);
+                    dec_ref( cell->payload.stream.meta );
                     url_fclose( cell->payload.stream.stream );
                     break;
                 case SPECIALTV:
diff --git a/src/memory/consspaceobject.c b/src/memory/consspaceobject.c
index f7b5ca9..816618f 100644
--- a/src/memory/consspaceobject.c
+++ b/src/memory/consspaceobject.c
@@ -158,7 +158,7 @@ make_function( struct cons_pointer meta, struct cons_pointer ( *executable )
                   struct cons_pointer, struct cons_pointer ) ) {
     struct cons_pointer pointer = allocate_cell( FUNCTIONTAG );
     struct cons_space_object *cell = &pointer2cell( pointer );
-    inc_ref( meta);
+    inc_ref( meta );
 
     cell->payload.function.meta = meta;
     cell->payload.function.executable = executable;
@@ -261,11 +261,11 @@ struct cons_pointer make_symbol_or_key( wint_t c, struct cons_pointer tail,
     if ( strncmp( tag, KEYTAG, 4 ) == 0 ) {
         struct cons_pointer r = internedp( result, oblist );
 
-      if ( nilp(r)) {
-        intern(result, oblist);
-      } else {
-        result = r;
-      }
+        if ( nilp( r ) ) {
+            intern( result, oblist );
+        } else {
+            result = r;
+        }
     }
 
     return result;
@@ -280,7 +280,7 @@ make_special( struct cons_pointer meta, struct cons_pointer ( *executable )
                  struct cons_pointer, struct cons_pointer env ) ) {
     struct cons_pointer pointer = allocate_cell( SPECIALTAG );
     struct cons_space_object *cell = &pointer2cell( pointer );
-    inc_ref( meta);
+    inc_ref( meta );
 
     cell->payload.special.meta = meta;
     cell->payload.special.executable = executable;
diff --git a/src/memory/dump.c b/src/memory/dump.c
index 7f7701f..28bd36a 100644
--- a/src/memory/dump.c
+++ b/src/memory/dump.c
@@ -108,14 +108,14 @@ void dump_object( URL_FILE * output, struct cons_pointer pointer ) {
         case RATIOTV:
             url_fwprintf( output,
                           L"\t\tRational cell: value %ld/%ld, count %u\n",
-                          pointer2cell( cell.payload.ratio.dividend ).payload.
-                          integer.value,
-                          pointer2cell( cell.payload.ratio.divisor ).payload.
-                          integer.value, cell.count );
+                          pointer2cell( cell.payload.ratio.dividend ).
+                          payload.integer.value,
+                          pointer2cell( cell.payload.ratio.divisor ).
+                          payload.integer.value, cell.count );
             break;
         case READTV:
-            url_fputws(  L"\t\tInput stream; metadata: ", output );
-            print(output, cell.payload.stream.meta);
+            url_fputws( L"\t\tInput stream; metadata: ", output );
+            print( output, cell.payload.stream.meta );
             url_fputws( L"\n", output );
             break;
         case REALTV:
@@ -150,8 +150,8 @@ void dump_object( URL_FILE * output, struct cons_pointer pointer ) {
             }
             break;
         case WRITETV:
-            url_fputws(  L"\t\tOutput stream; metadata: ", output );
-            print(output, cell.payload.stream.meta);
+            url_fputws( L"\t\tOutput stream; metadata: ", output );
+            print( output, cell.payload.stream.meta );
             url_fputws( L"\n", output );
             break;
     }
diff --git a/src/ops/lispops.c b/src/ops/lispops.c
index 91ec2cf..e390ac0 100644
--- a/src/ops/lispops.c
+++ b/src/ops/lispops.c
@@ -352,10 +352,9 @@ c_apply( struct stack_frame *frame, struct cons_pointer frame_pointer,
                         result = next_pointer;
                     } else {
                         result =
-                            ( *fn_cell.payload.
-                              special.executable ) ( get_stack_frame
-                                                     ( next_pointer ),
-                                                     next_pointer, env );
+                            ( *fn_cell.payload.special.
+                              executable ) ( get_stack_frame( next_pointer ),
+                                             next_pointer, env );
                         debug_print( L"Special form returning: ", DEBUG_EVAL );
                         debug_print_object( result, DEBUG_EVAL );
                         debug_println( DEBUG_EVAL );
@@ -842,7 +841,9 @@ struct cons_pointer c_reverse( struct cons_pointer arg ) {
                 result = make_string( o.payload.string.character, result );
                 break;
             case SYMBOLTV:
-                result = make_symbol_or_key( o.payload.string.character, result, SYMBOLTAG );
+                result =
+                    make_symbol_or_key( o.payload.string.character, result,
+                                        SYMBOLTAG );
                 break;
         }
     }
@@ -1208,13 +1209,13 @@ struct cons_pointer lisp_source( struct stack_frame *frame,
                                  struct cons_pointer env ) {
     struct cons_pointer result = NIL;
     struct cons_space_object cell = pointer2cell( frame->arg[0] );
-    struct cons_pointer source_key = c_string_to_lisp_keyword(L"source");
+    struct cons_pointer source_key = c_string_to_lisp_keyword( L"source" );
     switch ( cell.tag.value ) {
         case FUNCTIONTV:
-            result = c_assoc( source_key, cell.payload.function.meta);
+            result = c_assoc( source_key, cell.payload.function.meta );
             break;
         case SPECIALTV:
-            result = c_assoc( source_key, cell.payload.special.meta);
+            result = c_assoc( source_key, cell.payload.special.meta );
             break;
         case LAMBDATV:
             result = make_cons( c_string_to_lisp_symbol( L"lambda" ),
diff --git a/src/ops/meta.c b/src/ops/meta.c
index 5e48709..a27d2af 100644
--- a/src/ops/meta.c
+++ b/src/ops/meta.c
@@ -17,31 +17,29 @@
  *
  * @return a pointer to the metadata of my first argument, or nil if none.
  */
-struct cons_pointer lisp_metadata( struct stack_frame *frame, struct cons_pointer frame_pointer,
-                                  struct cons_pointer env ) {
-  debug_print(L"lisp_metadata: entered\n", DEBUG_EVAL);
-  debug_dump_object(frame->arg[0], DEBUG_EVAL);
-  struct cons_pointer result = NIL;
-  struct cons_space_object cell = pointer2cell(frame->arg[0]);
+struct cons_pointer lisp_metadata( struct stack_frame *frame,
+                                   struct cons_pointer frame_pointer,
+                                   struct cons_pointer env ) {
+    debug_print( L"lisp_metadata: entered\n", DEBUG_EVAL );
+    debug_dump_object( frame->arg[0], DEBUG_EVAL );
+    struct cons_pointer result = NIL;
+    struct cons_space_object cell = pointer2cell( frame->arg[0] );
 
-  switch( cell.tag.value) {
-    case FUNCTIONTV:
-    result = cell.payload.function.meta;
-    break;
-    case SPECIALTV:
-    result = cell.payload.special.meta;
-    break;
-    case READTV:
-    case WRITETV:
-    result = cell.payload.special.meta;
-    break;
-  }
+    switch ( cell.tag.value ) {
+        case FUNCTIONTV:
+            result = cell.payload.function.meta;
+            break;
+        case SPECIALTV:
+            result = cell.payload.special.meta;
+            break;
+        case READTV:
+        case WRITETV:
+            result = cell.payload.stream.meta;
+            break;
+    }
 
-  return make_cons(
-    make_cons(
-      c_string_to_lisp_keyword( L"type"),
-      c_type(frame->arg[0])),
-    result);
+    return make_cons( make_cons( c_string_to_lisp_keyword( L"type" ),
+                                 c_type( frame->arg[0] ) ), result );
 
 //  return result;
 }
diff --git a/src/ops/meta.h b/src/ops/meta.h
index 2c6ccf2..f441a50 100644
--- a/src/ops/meta.h
+++ b/src/ops/meta.h
@@ -11,7 +11,8 @@
 #define __psse_meta_h
 
 
-struct cons_pointer lisp_metadata( struct stack_frame *frame, struct cons_pointer frame_pointer,
-                                  struct cons_pointer env ) ;
+struct cons_pointer lisp_metadata( struct stack_frame *frame,
+                                   struct cons_pointer frame_pointer,
+                                   struct cons_pointer env );
 
 #endif

From eb49ca4e2d112ea76a764117108888496e76da16 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Wed, 30 Jan 2019 00:32:55 +0000
Subject: [PATCH 13/31] Improvements to URL metadata collection

Still not perfect - some corruption of data.
---
 src/io/io.c                  | 77 +++++++++++++++++++++++++++++++-----
 src/memory/consspaceobject.c |  6 +++
 2 files changed, 74 insertions(+), 9 deletions(-)

diff --git a/src/io/io.c b/src/io/io.c
index 82a6b32..1ff53db 100644
--- a/src/io/io.c
+++ b/src/io/io.c
@@ -1,7 +1,10 @@
 /*
  * io.c
  *
- * Communication between PSSE and the outside world, via libcurl.
+ * Communication between PSSE and the outside world, via libcurl. NOTE
+ * that this file destructively changes metadata on URL connections,
+ * because the metadata is not available until the stream has been read
+ * from. It would be better to find a workaround!
  *
  * (c) 2019 Simon Brooke <simon@journeyman.cc>
  * Licensed under GPL version 2.0, or, at your option, any later version.
@@ -24,6 +27,8 @@
 #include "consspaceobject.h"
 #include "debug.h"
 #include "fopen.h"
+#include "integer.h"
+#include "intern.h"
 #include "lispops.h"
 
 /**
@@ -264,18 +269,47 @@ char *trim( char *s ) {
     return ( char * ) &s[i];
 }
 
+
+void maybe_add_status_meta(struct cons_space_object *cell) {
+    struct cons_pointer status_key = c_string_to_lisp_keyword( L"status-code" );
+
+    debug_print(L"maybe_add_status_meta: entered\n", DEBUG_IO);
+
+    if (cell->payload.stream.stream->type == CFTYPE_CURL &&
+        nilp(c_assoc( status_key, cell->payload.stream.meta))) {
+        long status = 0;
+        curl_easy_getinfo(cell->payload.stream.stream->handle.curl,
+                          CURLINFO_RESPONSE_CODE,
+                          &status);
+
+        debug_printf( DEBUG_IO, L"maybe_add_status_meta: read HTTP status %d\n", status);
+
+        if (status > 0) {
+            cell->payload.stream.meta = make_cons(
+                make_cons(status_key,
+                          make_integer(status, NIL)),
+                cell->payload.stream.meta);
+        }
+    }
+}
+
+
 /**
  * Callback to assemble metadata for a URL stream. This is naughty because
  * it modifies data, but it's really the only way to create metadata.
  */
-static size_t write_meta_callback( void *ptr, size_t size, size_t nmemb,
+static size_t write_meta_callback( char *string, size_t size, size_t nmemb,
                                    struct cons_pointer stream ) {
     struct cons_space_object *cell = &pointer2cell( stream );
 
+    /* make a copy of the string that we can destructively change */
+    char * s = calloc(strlen(string), sizeof(char));
+
+    strcpy( s, string);
+
     if ( strncmp( &cell->tag.bytes[0], READTAG, 4 ) ||
          strncmp( &cell->tag.bytes[0], WRITETAG, 4 ) ) {
-        char *s = ( char * ) ptr;
-        int offset = index_of( ':', ptr );
+        int offset = index_of( ':', s );
 
         if ( offset != -1 ) {
             s[offset] = ( char ) 0;
@@ -293,18 +327,43 @@ static size_t write_meta_callback( void *ptr, size_t size, size_t nmemb,
                              c_string_to_lisp_string( wvalue ) ),
                            cell->payload.stream.meta );
 
+            free(wname);
+            free(wvalue);
+
             debug_printf( DEBUG_IO,
                           L"write_meta_callback: added header '%s': value '%s'\n",
                           name, value );
+        } else if (strncmp( "HTTP", s, 4) == 0) {
+            int offset = index_of( ' ', s );
+            char *value = trim( &s[offset] );
+            wchar_t *wvalue = calloc( strlen( value ), sizeof( wchar_t ) );
+            mbstowcs( wvalue, value, strlen( value ) );
+
+            cell->payload.stream.meta =
+                make_cons( make_cons
+                           ( c_string_to_lisp_keyword( L"status" ),
+                             c_string_to_lisp_string( wvalue ) ),
+                           cell->payload.stream.meta );
+
+            maybe_add_status_meta( cell);
+
+            debug_printf( DEBUG_IO,
+                          L"write_meta_callback: added header 'status': value '%s'\n",
+                          value );
+        } else {
+            debug_printf( DEBUG_IO,
+                          L"write_meta_callback: header passed with no colon: '%s'\n",
+                          s );
         }
-    } else {
+      } else {
         debug_print
             ( L"Pointer passed to write_meta_callback did not point to a stream: ",
               DEBUG_IO );
         debug_dump_object( stream, DEBUG_IO );
     }
 
-    return nmemb;
+    free(s);
+    return strlen(string);
 }
 
 
@@ -351,7 +410,7 @@ lisp_open( struct stack_frame *frame, struct cons_pointer frame_pointer,
 
     if ( stringp( frame->arg[0] ) ) {
         struct cons_pointer meta =
-            make_cons( make_cons( c_string_to_lisp_keyword( L"url" ),
+              make_cons(make_cons( c_string_to_lisp_keyword( L"url" ),
                                   frame->arg[0] ),
                        NIL );
 
@@ -366,13 +425,13 @@ lisp_open( struct stack_frame *frame, struct cons_pointer frame_pointer,
             result = make_write_stream( stream, meta );
         }
 
-        free( url );
-
         if ( pointer2cell( result ).payload.stream.stream == NULL ) {
             result = NIL;
         } else {
             collect_meta( result, frame->arg[0] );
         }
+
+        free( url );
     }
 
     return result;
diff --git a/src/memory/consspaceobject.c b/src/memory/consspaceobject.c
index 816618f..0baba69 100644
--- a/src/memory/consspaceobject.c
+++ b/src/memory/consspaceobject.c
@@ -328,6 +328,12 @@ struct cons_pointer make_write_stream( URL_FILE * output,
 struct cons_pointer c_string_to_lisp_keyword( wchar_t *symbol ) {
     struct cons_pointer result = NIL;
 
+    for (int i = 0; symbol[i] != '\0'; i++) {
+        if(iswalpha(symbol[i] && !iswlower(symbol[i]))) {
+            symbol[i] = towlower(symbol[i]);
+        }
+    }
+
     for ( int i = wcslen( symbol ); i > 0; i-- ) {
         result = make_keyword( symbol[i - 1], result );
     }

From 45af898f5e37771b84acf22a7042313f0c84956a Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Wed, 30 Jan 2019 00:39:43 +0000
Subject: [PATCH 14/31] That seems to fix it!

---
 src/io/io.c | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/io/io.c b/src/io/io.c
index 1ff53db..e7554ec 100644
--- a/src/io/io.c
+++ b/src/io/io.c
@@ -260,11 +260,11 @@ int index_of( char c, char *s ) {
 char *trim( char *s ) {
     int i;
 
-    for ( i = strlen( s ); ( isblank( s[i] ) || iscntrl( s[i] ) ) && i > -1;
+    for ( i = strlen( s ); ( isblank( s[i] ) || iscntrl( s[i] ) ) && i >= 0;
           i-- ) {
         s[i] = ( char ) 0;
     }
-    for ( i = 0; isblank( s[i] ) && s[i] != 0; i++ );
+    for ( i = 0; ( isblank( s[i] ) || iscntrl( s[i] ) ) && s[i] != 0; i++ );
 
     return ( char * ) &s[i];
 }
@@ -313,7 +313,7 @@ static size_t write_meta_callback( char *string, size_t size, size_t nmemb,
 
         if ( offset != -1 ) {
             s[offset] = ( char ) 0;
-            char *name = s;
+            char *name = trim( s );
             char *value = trim( &s[++offset] );
             wchar_t *wname = calloc( strlen( name ), sizeof( wchar_t ) );
             wchar_t *wvalue = calloc( strlen( value ), sizeof( wchar_t ) );

From 86319fd1c32ab1accd109e0bfa5b79cfc6ba1446 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Wed, 30 Jan 2019 00:39:43 +0000
Subject: [PATCH 15/31] That seems to fix it!

---
 src/io/io.c                  |  6 +++---
 src/memory/consspaceobject.c | 21 +++++++++++----------
 2 files changed, 14 insertions(+), 13 deletions(-)

diff --git a/src/io/io.c b/src/io/io.c
index 1ff53db..e7554ec 100644
--- a/src/io/io.c
+++ b/src/io/io.c
@@ -260,11 +260,11 @@ int index_of( char c, char *s ) {
 char *trim( char *s ) {
     int i;
 
-    for ( i = strlen( s ); ( isblank( s[i] ) || iscntrl( s[i] ) ) && i > -1;
+    for ( i = strlen( s ); ( isblank( s[i] ) || iscntrl( s[i] ) ) && i >= 0;
           i-- ) {
         s[i] = ( char ) 0;
     }
-    for ( i = 0; isblank( s[i] ) && s[i] != 0; i++ );
+    for ( i = 0; ( isblank( s[i] ) || iscntrl( s[i] ) ) && s[i] != 0; i++ );
 
     return ( char * ) &s[i];
 }
@@ -313,7 +313,7 @@ static size_t write_meta_callback( char *string, size_t size, size_t nmemb,
 
         if ( offset != -1 ) {
             s[offset] = ( char ) 0;
-            char *name = s;
+            char *name = trim( s );
             char *value = trim( &s[++offset] );
             wchar_t *wname = calloc( strlen( name ), sizeof( wchar_t ) );
             wchar_t *wvalue = calloc( strlen( value ), sizeof( wchar_t ) );
diff --git a/src/memory/consspaceobject.c b/src/memory/consspaceobject.c
index 0baba69..aa1cece 100644
--- a/src/memory/consspaceobject.c
+++ b/src/memory/consspaceobject.c
@@ -323,19 +323,18 @@ struct cons_pointer make_write_stream( URL_FILE * output,
 }
 
 /**
- * Return a lisp keyword representation of this wide character string.
+ * Return a lisp keyword representation of this wide character string. In keywords,
+ * I am accepting only lower case characters and numbers.
  */
 struct cons_pointer c_string_to_lisp_keyword( wchar_t *symbol ) {
     struct cons_pointer result = NIL;
 
-    for (int i = 0; symbol[i] != '\0'; i++) {
-        if(iswalpha(symbol[i] && !iswlower(symbol[i]))) {
-            symbol[i] = towlower(symbol[i]);
-        }
-    }
+    for ( int i = wcslen( symbol ) -1; i >= 0; i-- ) {
+      wchar_t c = towlower(symbol[i]);
 
-    for ( int i = wcslen( symbol ); i > 0; i-- ) {
-        result = make_keyword( symbol[i - 1], result );
+      if (iswalnum(c) || c == L'-') {
+        result = make_keyword( c, result );
+      }
     }
 
     return result;
@@ -347,8 +346,10 @@ struct cons_pointer c_string_to_lisp_keyword( wchar_t *symbol ) {
 struct cons_pointer c_string_to_lisp_string( wchar_t *string ) {
     struct cons_pointer result = NIL;
 
-    for ( int i = wcslen( string ); i > 0; i-- ) {
-        result = make_string( string[i - 1], result );
+    for ( int i = wcslen( string ) - 1; i >= 0; i-- ) {
+      if (iswprint(string[i]) && string[i] != '"') {
+        result = make_string( string[i], result );
+      }
     }
 
     return result;

From bd4d65536247bbf50c3bba268da45bffdfba2193 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Thu, 31 Jan 2019 13:24:06 +0000
Subject: [PATCH 16/31] Metadata for file streams

---
 src/io/io.c       | 137 ++++++++++++++++++++++++++--------------------
 src/ops/lispops.c |   8 +--
 2 files changed, 82 insertions(+), 63 deletions(-)

diff --git a/src/io/io.c b/src/io/io.c
index e7554ec..58ee88d 100644
--- a/src/io/io.c
+++ b/src/io/io.c
@@ -10,11 +10,15 @@
  * Licensed under GPL version 2.0, or, at your option, any later version.
  */
 
+#include <grp.h>
+#include <langinfo.h>
+#include <pwd.h>
 #include <stdlib.h>
 #include <string.h>
 #include <sys/stat.h>
 #include <sys/types.h>
 #include <unistd.h>
+#include <uuid/uuid.h>
 /*
  * wide characters
  */
@@ -270,29 +274,33 @@ char *trim( char *s ) {
 }
 
 
-void maybe_add_status_meta(struct cons_space_object *cell) {
-    struct cons_pointer status_key = c_string_to_lisp_keyword( L"status-code" );
-
-    debug_print(L"maybe_add_status_meta: entered\n", DEBUG_IO);
-
-    if (cell->payload.stream.stream->type == CFTYPE_CURL &&
-        nilp(c_assoc( status_key, cell->payload.stream.meta))) {
-        long status = 0;
-        curl_easy_getinfo(cell->payload.stream.stream->handle.curl,
-                          CURLINFO_RESPONSE_CODE,
-                          &status);
-
-        debug_printf( DEBUG_IO, L"maybe_add_status_meta: read HTTP status %d\n", status);
-
-        if (status > 0) {
-            cell->payload.stream.meta = make_cons(
-                make_cons(status_key,
-                          make_integer(status, NIL)),
-                cell->payload.stream.meta);
-        }
-    }
+struct cons_pointer add_meta_integer( struct cons_pointer meta, wchar_t *key,
+                                      long int value ) {
+    return
+        make_cons( make_cons
+                   ( c_string_to_lisp_keyword( key ),
+                     make_integer( value, NIL ) ), meta );
 }
 
+struct cons_pointer add_meta_string( struct cons_pointer meta, wchar_t *key,
+                                     char *value ) {
+    wchar_t buffer[strlen( value ) + 1];
+    mbstowcs( buffer, value, strlen( value ) );
+    return make_cons( make_cons( c_string_to_lisp_keyword( key ),
+                                 c_string_to_lisp_string( buffer ) ), meta );
+}
+
+struct cons_pointer add_meta_time( struct cons_pointer meta, wchar_t *key,
+                                   time_t * value ) {
+    /* I don't yet have a concept of a date-time object, which is a
+     * bit of an oversight! */
+    char datestring[256];
+    struct tm *tm = localtime( value );
+
+    strftime( datestring, sizeof( datestring ), nl_langinfo( D_T_FMT ), tm );
+
+    return add_meta_string( meta, key, datestring );
+}
 
 /**
  * Callback to assemble metadata for a URL stream. This is naughty because
@@ -303,9 +311,9 @@ static size_t write_meta_callback( char *string, size_t size, size_t nmemb,
     struct cons_space_object *cell = &pointer2cell( stream );
 
     /* make a copy of the string that we can destructively change */
-    char * s = calloc(strlen(string), sizeof(char));
+    char *s = calloc( strlen( string ), sizeof( char ) );
 
-    strcpy( s, string);
+    strcpy( s, string );
 
     if ( strncmp( &cell->tag.bytes[0], READTAG, 4 ) ||
          strncmp( &cell->tag.bytes[0], WRITETAG, 4 ) ) {
@@ -315,37 +323,26 @@ static size_t write_meta_callback( char *string, size_t size, size_t nmemb,
             s[offset] = ( char ) 0;
             char *name = trim( s );
             char *value = trim( &s[++offset] );
-            wchar_t *wname = calloc( strlen( name ), sizeof( wchar_t ) );
-            wchar_t *wvalue = calloc( strlen( value ), sizeof( wchar_t ) );
+            wchar_t wname[strlen( name )];
 
             mbstowcs( wname, name, strlen( name ) );
-            mbstowcs( wvalue, value, strlen( value ) );
 
             cell->payload.stream.meta =
-                make_cons( make_cons
-                           ( c_string_to_lisp_keyword( wname ),
-                             c_string_to_lisp_string( wvalue ) ),
-                           cell->payload.stream.meta );
-
-            free(wname);
-            free(wvalue);
+                add_meta_string( cell->payload.stream.meta, wname, value );
 
             debug_printf( DEBUG_IO,
                           L"write_meta_callback: added header '%s': value '%s'\n",
                           name, value );
-        } else if (strncmp( "HTTP", s, 4) == 0) {
+        } else if ( strncmp( "HTTP", s, 4 ) == 0 ) {
             int offset = index_of( ' ', s );
             char *value = trim( &s[offset] );
-            wchar_t *wvalue = calloc( strlen( value ), sizeof( wchar_t ) );
-            mbstowcs( wvalue, value, strlen( value ) );
 
             cell->payload.stream.meta =
-                make_cons( make_cons
-                           ( c_string_to_lisp_keyword( L"status" ),
-                             c_string_to_lisp_string( wvalue ) ),
-                           cell->payload.stream.meta );
-
-            maybe_add_status_meta( cell);
+                add_meta_integer( add_meta_string
+                                  ( cell->payload.stream.meta, L"status",
+                                    value ), L"status-code", strtol( value,
+                                                                     NULL,
+                                                                     10 ) );
 
             debug_printf( DEBUG_IO,
                           L"write_meta_callback: added header 'status': value '%s'\n",
@@ -355,27 +352,54 @@ static size_t write_meta_callback( char *string, size_t size, size_t nmemb,
                           L"write_meta_callback: header passed with no colon: '%s'\n",
                           s );
         }
-      } else {
+    } else {
         debug_print
             ( L"Pointer passed to write_meta_callback did not point to a stream: ",
               DEBUG_IO );
         debug_dump_object( stream, DEBUG_IO );
     }
 
-    free(s);
-    return strlen(string);
+    free( s );
+    return strlen( string );
 }
 
-
-void collect_meta( struct cons_pointer stream, struct cons_pointer url ) {
+void collect_meta( struct cons_pointer stream, char *url ) {
+    struct cons_space_object *cell = &pointer2cell( stream );
     URL_FILE *s = pointer2cell( stream ).payload.stream.stream;
+    struct cons_pointer meta =
+        add_meta_string( cell->payload.stream.meta, L"url", url );
+    struct stat statbuf;
+    int result = stat( url, &statbuf );
+    struct passwd *pwd;
+    struct group *grp;
 
     switch ( s->type ) {
         case CFTYPE_NONE:
             break;
         case CFTYPE_FILE:
-            /* don't know whether you can get metadata on an open stream in C,
-             * although we could of course get it from the URL */
+            if ( result == 0 ) {
+                if ( ( pwd = getpwuid( statbuf.st_uid ) ) != NULL ) {
+                    meta = add_meta_string( meta, L"owner", pwd->pw_name );
+                } else {
+                    meta = add_meta_integer( meta, L"owner", statbuf.st_uid );
+                }
+
+                if ( ( grp = getgrgid( statbuf.st_gid ) ) != NULL ) {
+                    meta = add_meta_string( meta, L"group", grp->gr_name );
+                } else {
+                    meta = add_meta_integer( meta, L"group", statbuf.st_gid );
+                }
+
+                meta =
+                    add_meta_integer( meta, L"size",
+                                      ( intmax_t ) statbuf.st_size );
+
+                meta = add_meta_time( meta, L"modified", &statbuf.st_mtime );
+
+                /* this is destructive change before the cell is released into the
+                 * wild, and consequently permissible, just. */
+                cell->payload.stream.meta = meta;
+            }
             break;
         case CFTYPE_CURL:
             curl_easy_setopt( s->handle.curl, CURLOPT_VERBOSE, 1L );
@@ -409,26 +433,21 @@ lisp_open( struct stack_frame *frame, struct cons_pointer frame_pointer,
     struct cons_pointer result = NIL;
 
     if ( stringp( frame->arg[0] ) ) {
-        struct cons_pointer meta =
-              make_cons(make_cons( c_string_to_lisp_keyword( L"url" ),
-                                  frame->arg[0] ),
-                       NIL );
-
         char *url = lisp_string_to_c_string( frame->arg[0] );
 
         if ( nilp( frame->arg[1] ) ) {
             URL_FILE *stream = url_fopen( url, "r" );
-            result = make_read_stream( stream, meta );
+            result = make_read_stream( stream, NIL );
         } else {
             // TODO: anything more complex is a problem for another day.
             URL_FILE *stream = url_fopen( url, "w" );
-            result = make_write_stream( stream, meta );
+            result = make_write_stream( stream, NIL );
         }
 
         if ( pointer2cell( result ).payload.stream.stream == NULL ) {
             result = NIL;
         } else {
-            collect_meta( result, frame->arg[0] );
+            collect_meta( result, url );
         }
 
         free( url );
@@ -457,8 +476,8 @@ lisp_read_char( struct stack_frame *frame, struct cons_pointer frame_pointer,
     if ( readp( frame->arg[0] ) ) {
         result =
             make_string( url_fgetwc
-                         ( pointer2cell( frame->arg[0] ).payload.stream.
-                           stream ), NIL );
+                         ( pointer2cell( frame->arg[0] ).payload.
+                           stream.stream ), NIL );
     }
 
     return result;
diff --git a/src/ops/lispops.c b/src/ops/lispops.c
index e390ac0..5471c3f 100644
--- a/src/ops/lispops.c
+++ b/src/ops/lispops.c
@@ -646,12 +646,12 @@ lisp_car( struct stack_frame *frame, struct cons_pointer frame_pointer,
         case CONSTV:
             result = cell.payload.cons.car;
             break;
+        case NILTV:
+            break;
         case READTV:
             result =
                 make_string( url_fgetwc( cell.payload.stream.stream ), NIL );
             break;
-        case NILTV:
-            break;
         case STRINGTV:
             result = make_string( cell.payload.string.character, NIL );
             break;
@@ -690,6 +690,8 @@ lisp_cdr( struct stack_frame *frame, struct cons_pointer frame_pointer,
         case CONSTV:
             result = cell.payload.cons.cdr;
             break;
+        case NILTV:
+            break;
         case READTV:
             url_fgetwc( cell.payload.stream.stream );
             result = frame->arg[0];
@@ -697,8 +699,6 @@ lisp_cdr( struct stack_frame *frame, struct cons_pointer frame_pointer,
         case STRINGTV:
             result = cell.payload.string.cdr;
             break;
-        case NILTV:
-            break;
         default:
             result =
                 throw_exception( c_string_to_lisp_string

From 0fea9580fa3a59bc73da17d5d7973a26e8f30766 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Thu, 31 Jan 2019 14:17:29 +0000
Subject: [PATCH 17/31] Investigating the junk character problem.

---
 src/io/io.c | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/src/io/io.c b/src/io/io.c
index 58ee88d..1f7191c 100644
--- a/src/io/io.c
+++ b/src/io/io.c
@@ -266,9 +266,9 @@ char *trim( char *s ) {
 
     for ( i = strlen( s ); ( isblank( s[i] ) || iscntrl( s[i] ) ) && i >= 0;
           i-- ) {
-        s[i] = ( char ) 0;
+        s[i] = '\0';
     }
-    for ( i = 0; ( isblank( s[i] ) || iscntrl( s[i] ) ) && s[i] != 0; i++ );
+    for ( i = 0; ( isblank( s[i] ) || iscntrl( s[i] ) ) && s[i] != '\0'; i++ );
 
     return ( char * ) &s[i];
 }
@@ -284,7 +284,10 @@ struct cons_pointer add_meta_integer( struct cons_pointer meta, wchar_t *key,
 
 struct cons_pointer add_meta_string( struct cons_pointer meta, wchar_t *key,
                                      char *value ) {
+    value = trim( value);
     wchar_t buffer[strlen( value ) + 1];
+    /* \todo something goes wrong here: I sometimes get junk characters on the
+     * end of the string. */
     mbstowcs( buffer, value, strlen( value ) );
     return make_cons( make_cons( c_string_to_lisp_keyword( key ),
                                  c_string_to_lisp_string( buffer ) ), meta );

From 83accb2be4ca526ce763d7bdf0f0debfb7d0c0b6 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Thu, 31 Jan 2019 22:39:32 +0000
Subject: [PATCH 18/31] #13: Fixed

---
 src/io/fopen.c | 14 +++++++-----
 src/io/io.c    | 60 +++++++++++++++++++++++++++++---------------------
 src/utils.c    | 33 +++++++++++++++++++++++++++
 src/utils.h    | 15 +++++++++++++
 4 files changed, 92 insertions(+), 30 deletions(-)
 create mode 100644 src/utils.c
 create mode 100644 src/utils.h

diff --git a/src/io/fopen.c b/src/io/fopen.c
index d5e4cd6..d3ece5c 100644
--- a/src/io/fopen.c
+++ b/src/io/fopen.c
@@ -51,8 +51,9 @@
 #ifdef FOPEN_STANDALONE
 CURLSH *io_share;
 #else
-#include "io.h"
 #include "consspaceobject.h"
+#include "io.h"
+#include "utils.h"
 #endif
 
 
@@ -210,10 +211,9 @@ URL_FILE *url_fopen( const char *url, const char *operation ) {
         return NULL;
 
     file->handle.file = fopen( url, operation );
-    if ( file->handle.file )
-        file->type = CFTYPE_FILE; /* marked as URL */
-
-    else {
+    if ( file->handle.file ) {
+        file->type = CFTYPE_FILE; /* marked as file */
+    } else if ( index_of(':', url ) > -1 ) {
         file->type = CFTYPE_CURL; /* marked as URL */
         file->handle.curl = curl_easy_init(  );
 
@@ -247,7 +247,11 @@ URL_FILE *url_fopen( const char *url, const char *operation ) {
 
             file = NULL;
         }
+    } else {
+        file->type = CFTYPE_NONE;
+        /* not a file, and doesn't look like a URL. */
     }
+
     return file;
 }
 
diff --git a/src/io/io.c b/src/io/io.c
index 1f7191c..1cf3c9e 100644
--- a/src/io/io.c
+++ b/src/io/io.c
@@ -34,6 +34,7 @@
 #include "integer.h"
 #include "intern.h"
 #include "lispops.h"
+#include "utils.h"
 
 /**
  * The sharing hub for all connections. TODO: Ultimately this probably doesn't
@@ -253,27 +254,6 @@ lisp_close( struct stack_frame *frame, struct cons_pointer frame_pointer,
     return result;
 }
 
-int index_of( char c, char *s ) {
-    int i;
-
-    for ( i = 0; s[i] != c && s[i] != 0; i++ );
-
-    return s[i] == c ? i : -1;
-}
-
-char *trim( char *s ) {
-    int i;
-
-    for ( i = strlen( s ); ( isblank( s[i] ) || iscntrl( s[i] ) ) && i >= 0;
-          i-- ) {
-        s[i] = '\0';
-    }
-    for ( i = 0; ( isblank( s[i] ) || iscntrl( s[i] ) ) && s[i] != '\0'; i++ );
-
-    return ( char * ) &s[i];
-}
-
-
 struct cons_pointer add_meta_integer( struct cons_pointer meta, wchar_t *key,
                                       long int value ) {
     return
@@ -289,6 +269,13 @@ struct cons_pointer add_meta_string( struct cons_pointer meta, wchar_t *key,
     /* \todo something goes wrong here: I sometimes get junk characters on the
      * end of the string. */
     mbstowcs( buffer, value, strlen( value ) );
+
+    /* hack: get rid of 32766 as a junk character, to see whether there are
+     * others. */
+    for (int i = 0; i < wcslen( buffer); i++) {
+      if (buffer[i] == (wchar_t)32766) buffer[i] = (wchar_t)0;
+    }
+
     return make_cons( make_cons( c_string_to_lisp_keyword( key ),
                                  c_string_to_lisp_string( buffer ) ), meta );
 }
@@ -398,10 +385,6 @@ void collect_meta( struct cons_pointer stream, char *url ) {
                                       ( intmax_t ) statbuf.st_size );
 
                 meta = add_meta_time( meta, L"modified", &statbuf.st_mtime );
-
-                /* this is destructive change before the cell is released into the
-                 * wild, and consequently permissible, just. */
-                cell->payload.stream.meta = meta;
             }
             break;
         case CFTYPE_CURL:
@@ -412,6 +395,10 @@ void collect_meta( struct cons_pointer stream, char *url ) {
             curl_easy_setopt( s->handle.curl, CURLOPT_HEADERDATA, stream );
             break;
     }
+
+    /* this is destructive change before the cell is released into the
+                   * wild, and consequently permissible, just. */
+    cell->payload.stream.meta = meta;
 }
 
 
@@ -440,6 +427,29 @@ lisp_open( struct stack_frame *frame, struct cons_pointer frame_pointer,
 
         if ( nilp( frame->arg[1] ) ) {
             URL_FILE *stream = url_fopen( url, "r" );
+
+            debug_printf( DEBUG_IO,
+                         L"lisp_open: stream @ %d, stream type = %d, stream handle = %d\n",
+                         (int) &stream, (int)stream->type, (int)stream->handle.file);
+
+            switch (stream->type) {
+                case CFTYPE_NONE:
+                    return make_exception(
+                        c_string_to_lisp_string( L"Could not open stream"),
+                        frame_pointer);
+                    break;
+                case CFTYPE_FILE:
+                    if (stream->handle.file == NULL) {
+                      return make_exception(
+                          c_string_to_lisp_string( L"Could not open file"),
+                          frame_pointer);
+                    }
+                    break;
+                case CFTYPE_CURL:
+                    /* can't tell whether a URL is bad without reading it */
+                    break;
+            }
+
             result = make_read_stream( stream, NIL );
         } else {
             // TODO: anything more complex is a problem for another day.
diff --git a/src/utils.c b/src/utils.c
new file mode 100644
index 0000000..5b22516
--- /dev/null
+++ b/src/utils.c
@@ -0,0 +1,33 @@
+/*
+ * utils.c
+ *
+ * little generally useful functions which aren't in any way special to PSSE.
+ *
+ * (c) 2019 Simon Brooke <simon@journeyman.cc>
+ * Licensed under GPL version 2.0, or, at your option, any later version.
+ */
+
+#include <ctype.h>
+#include <stdlib.h>
+#include <string.h>
+
+
+int index_of( char c, char *s ) {
+    int i;
+
+    for ( i = 0; s[i] != c && s[i] != 0; i++ );
+
+    return s[i] == c ? i : -1;
+}
+
+char *trim( char *s ) {
+    int i;
+
+    for ( i = strlen( s ); ( isblank( s[i] ) || iscntrl( s[i] ) ) && i >= 0;
+          i-- ) {
+        s[i] = '\0';
+    }
+    for ( i = 0; ( isblank( s[i] ) || iscntrl( s[i] ) ) && s[i] != '\0'; i++ );
+
+    return ( char * ) &s[i];
+}
diff --git a/src/utils.h b/src/utils.h
new file mode 100644
index 0000000..e56fd6e
--- /dev/null
+++ b/src/utils.h
@@ -0,0 +1,15 @@
+/*
+ * utils.h
+ *
+ * little generally useful functions which aren't in any way special to PSSE.
+ *
+ * (c) 2019 Simon Brooke <simon@journeyman.cc>
+ * Licensed under GPL version 2.0, or, at your option, any later version.
+ */
+
+#ifndef __psse_utils_h
+#define __psse_utils_h
+
+int index_of( char c, char *s );
+char *trim( char *s );
+#endif

From 8cab28f6c84a46825095402b7cc1f391b1b76291 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Thu, 31 Jan 2019 22:49:25 +0000
Subject: [PATCH 19/31] Proper fix for the junk characters bug.

---
 src/io/io.c | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/src/io/io.c b/src/io/io.c
index 1cf3c9e..dd41190 100644
--- a/src/io/io.c
+++ b/src/io/io.c
@@ -189,7 +189,7 @@ wint_t url_fgetwc( URL_FILE * input ) {
                     if ( count > 1 ) {
                         url_fgets( ( char * ) &cbuff[1], count, input );
                     }
-                    mbstowcs( wbuff, cbuff, 1 );  //(char *)(&input->buffer[input->buffer_pos]), 1 );
+                    mbstowcs( wbuff, cbuff, 2 );  //(char *)(&input->buffer[input->buffer_pos]), 1 );
                     result = wbuff[0];
 
                     free( wbuff );
@@ -268,13 +268,13 @@ struct cons_pointer add_meta_string( struct cons_pointer meta, wchar_t *key,
     wchar_t buffer[strlen( value ) + 1];
     /* \todo something goes wrong here: I sometimes get junk characters on the
      * end of the string. */
-    mbstowcs( buffer, value, strlen( value ) );
+    mbstowcs( buffer, value, strlen( value ) + 1 );
 
     /* hack: get rid of 32766 as a junk character, to see whether there are
-     * others. */
+     * others.
     for (int i = 0; i < wcslen( buffer); i++) {
       if (buffer[i] == (wchar_t)32766) buffer[i] = (wchar_t)0;
-    }
+    } */
 
     return make_cons( make_cons( c_string_to_lisp_keyword( key ),
                                  c_string_to_lisp_string( buffer ) ), meta );
@@ -315,7 +315,7 @@ static size_t write_meta_callback( char *string, size_t size, size_t nmemb,
             char *value = trim( &s[++offset] );
             wchar_t wname[strlen( name )];
 
-            mbstowcs( wname, name, strlen( name ) );
+            mbstowcs( wname, name, strlen( name ) + 1 );
 
             cell->payload.stream.meta =
                 add_meta_string( cell->payload.stream.meta, wname, value );

From 23e4f0befa0497b3fcb21c2ea3cd322291c685ba Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Tue, 5 Feb 2019 09:59:05 +0000
Subject: [PATCH 20/31] A bit of work on time, but it doesn't actually work
 yet.

---
 src/arith/integer.c          |  6 ---
 src/init.c                   |  2 +
 src/io/io.c                  |  8 ---
 src/io/print.c               |  4 ++
 src/memory/consspaceobject.h | 32 +++++++++++-
 src/time/time.c              | 98 ++++++++++++++++++++++++++++++++++++
 src/time/time.h              | 20 ++++++++
 src/utils.c                  |  2 +-
 8 files changed, 155 insertions(+), 17 deletions(-)
 create mode 100644 src/time/time.c
 create mode 100644 src/time/time.h

diff --git a/src/arith/integer.c b/src/arith/integer.c
index 1195c53..48992ca 100644
--- a/src/arith/integer.c
+++ b/src/arith/integer.c
@@ -12,12 +12,6 @@
 #include <math.h>
 #include <stdio.h>
 #include <stdlib.h>
-/* safe_iop, as available in the Ubuntu repository, is this one:
- * https://code.google.com/archive/p/safe-iop/wikis/README.wiki
- * which is installed as `libsafe-iop-dev`. There is an alternate
- * implementation here: https://github.com/redpig/safe-iop/
- * which shares the same version number but is not compatible. */
-#include <safe_iop.h>
 /*
  * wide characters
  */
diff --git a/src/init.c b/src/init.c
index 47ba772..06494e9 100644
--- a/src/init.c
+++ b/src/init.c
@@ -30,6 +30,7 @@
 #include "peano.h"
 #include "print.h"
 #include "repl.h"
+#include "time.h"
 
 // extern char *optarg; /* defined in unistd.h */
 
@@ -212,6 +213,7 @@ int main( int argc, char *argv[] ) {
     bind_function( L"source", &lisp_source );
     bind_function( L"subtract", &lisp_subtract );
     bind_function( L"throw", &lisp_exception );
+    bind_function( L"time", &lisp_time );
     bind_function( L"type", &lisp_type );
     bind_function( L"+", &lisp_add );
     bind_function( L"*", &lisp_multiply );
diff --git a/src/io/io.c b/src/io/io.c
index dd41190..b82c6ba 100644
--- a/src/io/io.c
+++ b/src/io/io.c
@@ -266,16 +266,8 @@ struct cons_pointer add_meta_string( struct cons_pointer meta, wchar_t *key,
                                      char *value ) {
     value = trim( value);
     wchar_t buffer[strlen( value ) + 1];
-    /* \todo something goes wrong here: I sometimes get junk characters on the
-     * end of the string. */
     mbstowcs( buffer, value, strlen( value ) + 1 );
 
-    /* hack: get rid of 32766 as a junk character, to see whether there are
-     * others.
-    for (int i = 0; i < wcslen( buffer); i++) {
-      if (buffer[i] == (wchar_t)32766) buffer[i] = (wchar_t)0;
-    } */
-
     return make_cons( make_cons( c_string_to_lisp_keyword( key ),
                                  c_string_to_lisp_string( buffer ) ), meta );
 }
diff --git a/src/io/print.c b/src/io/print.c
index 854c63a..fb0d8a1 100644
--- a/src/io/print.c
+++ b/src/io/print.c
@@ -22,6 +22,7 @@
 #include "integer.h"
 #include "stack.h"
 #include "print.h"
+#include "time.h"
 
 /**
  * Whether or not we colorise output.
@@ -210,6 +211,9 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
         case SPECIALTV:
             url_fwprintf( output, L"<Special form>" );
             break;
+        case TIMETV:
+            print_string(output, time_to_string( pointer));
+            break;
         case TRUETV:
             url_fwprintf( output, L"t" );
             break;
diff --git a/src/memory/consspaceobject.h b/src/memory/consspaceobject.h
index 1bbbcd1..91ba3c3 100644
--- a/src/memory/consspaceobject.h
+++ b/src/memory/consspaceobject.h
@@ -193,6 +193,16 @@
  */
 #define SYMBOLTV    1112365395
 
+/**
+ * A time stamp.
+ */
+#define TIMETAG     "TIME"
+
+/**
+ * The string `TIME`, considered as an `unsigned int`.
+ */
+#define TIMETV      1162692948
+
 /**
  * The special cons cell at address {0,1} which is canonically different
  * from NIL.
@@ -344,13 +354,18 @@
  * (there should only be one of these so it's slightly redundant).
  * Also note that anything that is not NIL is truthy.
  */
-#define tp(conspoint) (checktag(conspoint,TRUETAG))
+#define tp(conspoint) (check_tag(conspoint,TRUETAG))
+
+/**
+ * true if `conspoint` points to a time cell, else false.
+ */
+#define timep(conspoint) (check_tag(conspoint,TIMETAG))
 
 /**
  * true if `conspoint` points to something that is truthy, i.e.
  * anything but NIL.
  */
-#define truep(conspoint) (!checktag(conspoint,NILTAG))
+#define truep(conspoint) (!check_tag(conspoint,NILTAG))
 
 /**
  * An indirect pointer to a cons cell
@@ -531,6 +546,15 @@ struct string_payload {
     struct cons_pointer cdr;
 };
 
+/**
+ * The payload of a time cell: an unsigned 128 bit value representing micro-
+ * seconds since the estimated date of the Big Bang (actually, for
+ * convenience, 14Bn years before 1st Jan 1970 (the UNIX epoch))
+ */
+struct time_payload {
+    unsigned __int128 value;
+};
+
 /**
  * payload of a vector pointer cell.
  */
@@ -616,6 +640,10 @@ struct cons_space_object {
          * if tag == STRINGTAG || tag == SYMBOLTAG
          */
         struct string_payload string;
+        /**
+         * if tag == TIMETAG
+         */
+        struct time_payload time;
         /**
          * if tag == TRUETAG; we'll treat the special cell T as just a cons
          */
diff --git a/src/time/time.c b/src/time/time.c
new file mode 100644
index 0000000..146f296
--- /dev/null
+++ b/src/time/time.c
@@ -0,0 +1,98 @@
+/*
+ * time.h
+ *
+ * Bare bones of PSSE time. See issue #16.
+ *
+ * (c) 2019 Simon Brooke <simon@journeyman.cc>
+ * Licensed under GPL version 2.0, or, at your option, any later version.
+ */
+
+#include <stdlib.h>
+#include <time.h>
+/*
+ * wide characters
+ */
+#include <wchar.h>
+#include <wctype.h>
+
+#include "conspage.h"
+#include "consspaceobject.h"
+#include "integer.h"
+#include "time.h"
+#define _GNU_SOURCE
+
+#define seconds_per_year 31557600L
+
+/**
+ * PSSE Lisp epoch is 14 Bn years, or 441,806,400,000,000,000 seconds, before
+ * the UNIX epoch; the value in microseconds will break the C reader.
+ */
+unsigned __int128 epoch_offset = ((__int128)(seconds_per_year * 1000000000L) *
+                                  (__int128)(14L * 1000000000L));
+
+/**
+ * Return the UNIX time value which represents this time, if it falls within
+ * the period representable in UNIX time, or zero otherwise.
+ */
+long int lisp_time_to_unix_time(struct cons_pointer t) {
+    long int result = 0;
+
+    if (timep( t)) {
+        unsigned __int128 value = pointer2cell(t).payload.time.value;
+
+        if (value > epoch_offset) { // \todo && value < UNIX time rollover
+            result = ((value - epoch_offset) / 1000000000);
+        }
+    }
+
+    return result;
+}
+
+unsigned __int128 unix_time_to_lisp_time( time_t t) {
+    unsigned __int128 result = epoch_offset + (t * 1000000000);
+
+    return result;
+}
+
+struct cons_pointer make_time( struct cons_pointer integer_or_nil) {
+    struct cons_pointer pointer = allocate_cell( TIMETAG );
+    struct cons_space_object *cell = &pointer2cell( pointer );
+
+    if (integerp(integer_or_nil)) {
+        cell->payload.time.value = pointer2cell(integer_or_nil).payload.integer.value;
+        // \todo: if integer is a bignum, deal with it.
+    } else {
+        cell->payload.time.value = unix_time_to_lisp_time( time(NULL));
+    }
+
+    return pointer;
+}
+
+/**
+ * Function; return a time representation of the first argument in the frame;
+ * further arguments are ignored.
+ *
+ * * (time integer_or_nil)
+ *
+ * @param frame my stack_frame.
+ * @param frame_pointer a pointer to my stack_frame.
+ * @param env my environment.
+ * @return a lisp time; if `integer_or_nil` is an integer, return a time which
+ * is that number of microseconds after the notional big bang; else the current
+ * time.
+ */
+struct cons_pointer lisp_time( struct stack_frame *frame, struct cons_pointer frame_pointer,
+           struct cons_pointer env ) {
+    return make_time( frame->arg[0]);
+}
+
+/**
+ * This is temporary, for bootstrapping.
+ */
+struct cons_pointer time_to_string( struct cons_pointer pointer) {
+    long int t = lisp_time_to_unix_time(pointer);
+
+    return c_string_to_lisp_string( t == 0 ?
+                                         L"Not yet implemented: cannot print times outside UNIX time\n" :
+                                         ctime(&t));
+}
diff --git a/src/time/time.h b/src/time/time.h
new file mode 100644
index 0000000..661decf
--- /dev/null
+++ b/src/time/time.h
@@ -0,0 +1,20 @@
+/*
+ * time.h
+ *
+ * Bare bones of PSSE time. See issue #16.
+ *
+ * (c) 2019 Simon Brooke <simon@journeyman.cc>
+ * Licensed under GPL version 2.0, or, at your option, any later version.
+ */
+
+#ifndef __psse_time_h
+#define __psse_time_h
+
+#define _GNU_SOURCE
+#include "consspaceobject.h"
+
+struct cons_pointer lisp_time( struct stack_frame *frame, struct cons_pointer frame_pointer,
+           struct cons_pointer env );
+struct cons_pointer time_to_string( struct cons_pointer pointer);
+
+#endif
diff --git a/src/utils.c b/src/utils.c
index 5b22516..ea3919f 100644
--- a/src/utils.c
+++ b/src/utils.c
@@ -27,7 +27,7 @@ char *trim( char *s ) {
           i-- ) {
         s[i] = '\0';
     }
-    for ( i = 0; ( isblank( s[i] ) || iscntrl( s[i] ) ) && s[i] != '\0'; i++ );
+    for ( i = 0; s[i] != '\0' && ( isblank( s[i] ) || iscntrl( s[i] ) ); i++ );
 
     return ( char * ) &s[i];
 }

From 2bebee60027b5104ebbfc327330573da639cbc97 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Tue, 5 Feb 2019 10:27:16 +0000
Subject: [PATCH 21/31] #8: Bare bones

---
 src/memory/map.c   |  8 ++++++
 src/memory/map.h   | 65 ++++++++++++++++++++++++++++++++++++++++++++++
 src/memory/stack.h |  6 ++---
 3 files changed, 76 insertions(+), 3 deletions(-)
 create mode 100644 src/memory/map.c
 create mode 100644 src/memory/map.h

diff --git a/src/memory/map.c b/src/memory/map.c
new file mode 100644
index 0000000..e897647
--- /dev/null
+++ b/src/memory/map.c
@@ -0,0 +1,8 @@
+/*
+ * map.c
+ *
+ * An immutable hashmap in vector space.
+ *
+ * (c) 2019 Simon Brooke <simon@journeyman.cc>
+ * Licensed under GPL version 2.0, or, at your option, any later version.
+ */
diff --git a/src/memory/map.h b/src/memory/map.h
new file mode 100644
index 0000000..d7a65c5
--- /dev/null
+++ b/src/memory/map.h
@@ -0,0 +1,65 @@
+/*
+ * map.h
+ *
+ * An immutable hashmap in vector space.
+ *
+ * (c) 2019 Simon Brooke <simon@journeyman.cc>
+ * Licensed under GPL version 2.0, or, at your option, any later version.
+ */
+
+#ifndef __psse_map_h
+#define __psse_map_h
+
+#include "consspaceobject.h"
+#include "conspage.h"
+
+/**
+ * macros for the tag of a mutable map.
+ */
+#define MAPTAG "IMAP"
+#define MAPTV 1346456905
+
+/**
+ * Number of buckets in a single tier map.
+ */
+#define BUCKETSINMAP 256
+
+/**
+ * Maximum number of entries in an association-list bucket.
+ */
+#define MAXENTRIESINASSOC 16
+
+/**
+ * The vector-space payload of a map object.
+ */
+struct map_payload {
+    /**
+     * There is a default hash function, which is used if `hash_function` is
+     * `nil` (which it normally should be); and keywords will probably carry
+     * their own hash values. But it will be possible to override the hash
+     * function by putting a function of one argument returning an integer
+     * here. */
+    struct cons_pointer hash_function = NIL;
+
+    /**
+     * Obviously the number of buckets in a map is a trade off, and this may need
+     * tuning - or it may even be necessary to have different sized base maps. The
+     * idea here is that the value of a bucket is
+     *
+     * 1. `nil`; or
+     * 2. an association list; or
+     * 3. a map.
+     *
+     * All buckets are initially `nil`. Adding a value to a `nil` bucket returns
+     * a map with a new bucket in the form of an assoc list. Subsequent additions
+     * cons new key/value pairs onto the assoc list, until there are
+     * `MAXENTRIESINASSOC` pairs, at which point if a further value is added to
+     * the same bucket the bucket returned will be in the form of a second level
+     * map. My plan is that buckets the first level map will be indexed on the
+     * first sixteen bits of the hash value, those in the second on the second
+     * sixteen, and, potentially, so on.
+     */
+    struct cons_pointer buckets[BUCKETSINMAP];
+};
+
+#endif
diff --git a/src/memory/stack.h b/src/memory/stack.h
index 0ea903c..f132c69 100644
--- a/src/memory/stack.h
+++ b/src/memory/stack.h
@@ -18,12 +18,12 @@
  * Licensed under GPL version 2.0, or, at your option, any later version.
  */
 
+#ifndef __psse_stack_h
+#define __psse_stack_h
+
 #include "consspaceobject.h"
 #include "conspage.h"
 
-#ifndef __stack_h
-#define __stack_h
-
 /**
  * macros for the tag of a stack frame.
  */

From e7ef82d23f3910726648e60245e71891378e4799 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Tue, 5 Feb 2019 11:02:04 +0000
Subject: [PATCH 22/31] #8: keywords as functions on associations working

---
 src/ops/intern.c  |  6 ++++
 src/ops/lispops.c | 71 ++++++++++++++++++++++++++---------------------
 2 files changed, 45 insertions(+), 32 deletions(-)

diff --git a/src/ops/intern.c b/src/ops/intern.c
index 87d116e..8ce5d71 100644
--- a/src/ops/intern.c
+++ b/src/ops/intern.c
@@ -91,6 +91,12 @@ struct cons_pointer c_assoc( struct cons_pointer key,
                              struct cons_pointer store ) {
     struct cons_pointer result = NIL;
 
+    debug_print( L"c_assoc; key is `", DEBUG_BIND);
+    debug_print_object( key, DEBUG_BIND);
+    debug_print( L"`; store is \n", DEBUG_BIND);
+    debug_dump_object( store, DEBUG_BIND);
+    debug_println(DEBUG_BIND);
+
     for ( struct cons_pointer next = store;
           consp( next ); next = pointer2cell( next ).payload.cons.cdr ) {
         struct cons_space_object entry =
diff --git a/src/ops/lispops.c b/src/ops/lispops.c
index 5471c3f..14724a1 100644
--- a/src/ops/lispops.c
+++ b/src/ops/lispops.c
@@ -269,8 +269,8 @@ eval_lambda( struct cons_space_object cell, struct stack_frame *frame,
  * @return the result of evaluating the function with its arguments.
  */
 struct cons_pointer
-c_apply( struct stack_frame *frame, struct cons_pointer frame_pointer,
-         struct cons_pointer env ) {
+    c_apply( struct stack_frame *frame, struct cons_pointer frame_pointer,
+            struct cons_pointer env ) {
     debug_print( L"Entering c_apply\n", DEBUG_EVAL );
     struct cons_pointer result = NIL;
 
@@ -285,38 +285,47 @@ c_apply( struct stack_frame *frame, struct cons_pointer frame_pointer,
 
         switch ( fn_cell.tag.value ) {
             case EXCEPTIONTV:
-                /* just pass exceptions straight back */
-                result = fn_pointer;
-                break;
+            /* just pass exceptions straight back */
+            result = fn_pointer;
+            break;
             case FUNCTIONTV:
-                {
-                    struct cons_pointer exep = NIL;
-                    struct cons_pointer next_pointer =
-                        make_stack_frame( frame_pointer, args, env );
-                    inc_ref( next_pointer );
-                    if ( exceptionp( next_pointer ) ) {
-                        result = next_pointer;
-                    } else {
-                        struct stack_frame *next =
-                            get_stack_frame( next_pointer );
+            {
+                struct cons_pointer exep = NIL;
+                struct cons_pointer next_pointer =
+                    make_stack_frame( frame_pointer, args, env );
+                inc_ref( next_pointer );
+                if ( exceptionp( next_pointer ) ) {
+                    result = next_pointer;
+                } else {
+                    struct stack_frame *next =
+                        get_stack_frame( next_pointer );
 
-                        result =
-                            ( *fn_cell.payload.function.executable ) ( next,
-                                                                       next_pointer,
-                                                                       env );
-                        dec_ref( next_pointer );
-                    }
+                    result =
+                        ( *fn_cell.payload.function.executable ) ( next,
+                                                                  next_pointer,
+                                                                  env );
+                    dec_ref( next_pointer );
                 }
-                break;
+            }
+            break;
+
+            case KEYTV:
+            result = c_assoc( fn_pointer,
+                             eval_form(frame,
+                                       frame_pointer,
+                                       c_car( c_cdr( frame->arg[0])),
+                                       env));
+            break;
+
             case LAMBDATV:
-                {
-                    struct cons_pointer exep = NIL;
-                    struct cons_pointer next_pointer =
-                        make_stack_frame( frame_pointer, args, env );
-                    inc_ref( next_pointer );
-                    if ( exceptionp( next_pointer ) ) {
-                        result = next_pointer;
-                    } else {
+            {
+                struct cons_pointer exep = NIL;
+                struct cons_pointer next_pointer =
+                    make_stack_frame( frame_pointer, args, env );
+                inc_ref( next_pointer );
+                if ( exceptionp( next_pointer ) ) {
+                    result = next_pointer;
+                } else {
                         struct stack_frame *next =
                             get_stack_frame( next_pointer );
                         result =
@@ -416,9 +425,7 @@ lisp_eval( struct stack_frame *frame, struct cons_pointer frame_pointer,
 
     switch ( cell.tag.value ) {
         case CONSTV:
-            {
                 result = c_apply( frame, frame_pointer, env );
-            }
             break;
 
         case SYMBOLTV:

From b6958bbf6516791a32bf048b3876fc287b027078 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Tue, 5 Feb 2019 13:46:46 +0000
Subject: [PATCH 23/31] #8: compiles, but most tests fail.

---
 src/memory/consspaceobject.c |   27 +-
 src/memory/consspaceobject.h |    2 +
 src/memory/lookup3.c         | 1001 ++++++++++++++++++++++++++++++++++
 src/memory/lookup3.h         |   19 +
 src/memory/map.c             |  243 +++++++++
 src/memory/map.h             |   29 +-
 src/ops/intern.c             |   35 +-
 src/ops/lispops.c            |   16 +
 src/ops/lispops.h            |    4 +-
 9 files changed, 1360 insertions(+), 16 deletions(-)
 create mode 100644 src/memory/lookup3.c
 create mode 100644 src/memory/lookup3.h

diff --git a/src/memory/consspaceobject.c b/src/memory/consspaceobject.c
index aa1cece..344f4ae 100644
--- a/src/memory/consspaceobject.c
+++ b/src/memory/consspaceobject.c
@@ -96,18 +96,41 @@ struct cons_pointer c_car( struct cons_pointer arg ) {
 }
 
 /**
- * Implementation of cdr in C. If arg is not a cons, does not error but returns nil.
+ * Implementation of cdr in C. If arg is not a sequence, does not error but returns nil.
  */
 struct cons_pointer c_cdr( struct cons_pointer arg ) {
     struct cons_pointer result = NIL;
 
-    if ( consp( arg ) || stringp( arg ) || symbolp( arg ) ) {
+    struct cons_space_object cell = pointer2cell( arg );
+
+    switch (cell.tag.value) {
+        case CONSTV:
         result = pointer2cell( arg ).payload.cons.cdr;
+        break;
+        case KEYTV:
+        case STRINGTV:
+        case SYMBOLTV:
+        result = pointer2cell( arg ).payload.string.cdr;
+        break;
     }
 
     return result;
 }
 
+/**
+ * Implementation of `length` in C. If arg is not a cons, does not error but returns 0.
+ */
+int c_length( struct cons_pointer arg) {
+    int result = 0;
+
+    for (struct cons_pointer c = arg; !nilp(c); c = c_cdr(c)) {
+        result ++;
+    }
+
+    return result;
+}
+
+
 /**
  * Construct a cons cell from this pair of pointers.
  */
diff --git a/src/memory/consspaceobject.h b/src/memory/consspaceobject.h
index 91ba3c3..9197172 100644
--- a/src/memory/consspaceobject.h
+++ b/src/memory/consspaceobject.h
@@ -667,6 +667,8 @@ struct cons_pointer c_car( struct cons_pointer arg );
 
 struct cons_pointer c_cdr( struct cons_pointer arg );
 
+int c_length( struct cons_pointer arg);
+
 struct cons_pointer make_cons( struct cons_pointer car,
                                struct cons_pointer cdr );
 
diff --git a/src/memory/lookup3.c b/src/memory/lookup3.c
new file mode 100644
index 0000000..006d513
--- /dev/null
+++ b/src/memory/lookup3.c
@@ -0,0 +1,1001 @@
+/*
+-------------------------------------------------------------------------------
+lookup3.c, by Bob Jenkins, May 2006, Public Domain.
+
+These are functions for producing 32-bit hashes for hash table lookup.
+hashword(), hashlittle(), hashlittle2(), hashbig(), mix(), and final()
+are externally useful functions.  Routines to test the hash are included
+if SELF_TEST is defined.  You can use this free for any purpose.  It's in
+the public domain.  It has no warranty.
+
+You probably want to use hashlittle().  hashlittle() and hashbig()
+hash byte arrays.  hashlittle() is is faster than hashbig() on
+little-endian machines.  Intel and AMD are little-endian machines.
+On second thought, you probably want hashlittle2(), which is identical to
+hashlittle() except it returns two 32-bit hashes for the price of one.
+You could implement hashbig2() if you wanted but I haven't bothered here.
+
+If you want to find a hash of, say, exactly 7 integers, do
+  a = i1;  b = i2;  c = i3;
+  mix(a,b,c);
+  a += i4; b += i5; c += i6;
+  mix(a,b,c);
+  a += i7;
+  final(a,b,c);
+then use c as the hash value.  If you have a variable length array of
+4-byte integers to hash, use hashword().  If you have a byte array (like
+a character string), use hashlittle().  If you have several byte arrays, or
+a mix of things, see the comments above hashlittle().
+
+Why is this so big?  I read 12 bytes at a time into 3 4-byte integers,
+then mix those integers.  This is fast (you can do a lot more thorough
+mixing with 12*3 instructions on 3 integers than you can with 3 instructions
+on 1 byte), but shoehorning those bytes into integers efficiently is messy.
+-------------------------------------------------------------------------------
+*/
+// #define SELF_TEST 1
+
+#include <stdio.h>      /* defines printf for tests */
+#include <time.h>       /* defines time_t for timings in the test */
+#include <stdint.h>     /* defines uint32_t etc */
+#include <sys/param.h>  /* attempt to define endianness */
+#ifdef linux
+# include <endian.h>    /* attempt to define endianness */
+#endif
+
+/*
+ * My best guess at if you are big-endian or little-endian.  This may
+ * need adjustment.
+ */
+#if (defined(__BYTE_ORDER) && defined(__LITTLE_ENDIAN) && \
+     __BYTE_ORDER == __LITTLE_ENDIAN) || \
+    (defined(i386) || defined(__i386__) || defined(__i486__) || \
+     defined(__i586__) || defined(__i686__) || defined(vax) || defined(MIPSEL))
+# define HASH_LITTLE_ENDIAN 1
+# define HASH_BIG_ENDIAN 0
+#elif (defined(__BYTE_ORDER) && defined(__BIG_ENDIAN) && \
+       __BYTE_ORDER == __BIG_ENDIAN) || \
+      (defined(sparc) || defined(POWERPC) || defined(mc68000) || defined(sel))
+# define HASH_LITTLE_ENDIAN 0
+# define HASH_BIG_ENDIAN 1
+#else
+# define HASH_LITTLE_ENDIAN 0
+# define HASH_BIG_ENDIAN 0
+#endif
+
+#define hashsize(n) ((uint32_t)1<<(n))
+#define hashmask(n) (hashsize(n)-1)
+#define rot(x,k) (((x)<<(k)) | ((x)>>(32-(k))))
+
+/*
+-------------------------------------------------------------------------------
+mix -- mix 3 32-bit values reversibly.
+
+This is reversible, so any information in (a,b,c) before mix() is
+still in (a,b,c) after mix().
+
+If four pairs of (a,b,c) inputs are run through mix(), or through
+mix() in reverse, there are at least 32 bits of the output that
+are sometimes the same for one pair and different for another pair.
+This was tested for:
+* pairs that differed by one bit, by two bits, in any combination
+  of top bits of (a,b,c), or in any combination of bottom bits of
+  (a,b,c).
+* "differ" is defined as +, -, ^, or ~^.  For + and -, I transformed
+  the output delta to a Gray code (a^(a>>1)) so a string of 1's (as
+  is commonly produced by subtraction) look like a single 1-bit
+  difference.
+* the base values were pseudorandom, all zero but one bit set, or
+  all zero plus a counter that starts at zero.
+
+Some k values for my "a-=c; a^=rot(c,k); c+=b;" arrangement that
+satisfy this are
+    4  6  8 16 19  4
+    9 15  3 18 27 15
+   14  9  3  7 17  3
+Well, "9 15 3 18 27 15" didn't quite get 32 bits diffing
+for "differ" defined as + with a one-bit base and a two-bit delta.  I
+used http://burtleburtle.net/bob/hash/avalanche.html to choose
+the operations, constants, and arrangements of the variables.
+
+This does not achieve avalanche.  There are input bits of (a,b,c)
+that fail to affect some output bits of (a,b,c), especially of a.  The
+most thoroughly mixed value is c, but it doesn't really even achieve
+avalanche in c.
+
+This allows some parallelism.  Read-after-writes are good at doubling
+the number of bits affected, so the goal of mixing pulls in the opposite
+direction as the goal of parallelism.  I did what I could.  Rotates
+seem to cost as much as shifts on every machine I could lay my hands
+on, and rotates are much kinder to the top and bottom bits, so I used
+rotates.
+-------------------------------------------------------------------------------
+*/
+#define mix(a,b,c) \
+{ \
+  a -= c;  a ^= rot(c, 4);  c += b; \
+  b -= a;  b ^= rot(a, 6);  a += c; \
+  c -= b;  c ^= rot(b, 8);  b += a; \
+  a -= c;  a ^= rot(c,16);  c += b; \
+  b -= a;  b ^= rot(a,19);  a += c; \
+  c -= b;  c ^= rot(b, 4);  b += a; \
+}
+
+/*
+-------------------------------------------------------------------------------
+final -- final mixing of 3 32-bit values (a,b,c) into c
+
+Pairs of (a,b,c) values differing in only a few bits will usually
+produce values of c that look totally different.  This was tested for
+* pairs that differed by one bit, by two bits, in any combination
+  of top bits of (a,b,c), or in any combination of bottom bits of
+  (a,b,c).
+* "differ" is defined as +, -, ^, or ~^.  For + and -, I transformed
+  the output delta to a Gray code (a^(a>>1)) so a string of 1's (as
+  is commonly produced by subtraction) look like a single 1-bit
+  difference.
+* the base values were pseudorandom, all zero but one bit set, or
+  all zero plus a counter that starts at zero.
+
+These constants passed:
+ 14 11 25 16 4 14 24
+ 12 14 25 16 4 14 24
+and these came close:
+  4  8 15 26 3 22 24
+ 10  8 15 26 3 22 24
+ 11  8 15 26 3 22 24
+-------------------------------------------------------------------------------
+*/
+#define final(a,b,c) \
+{ \
+  c ^= b; c -= rot(b,14); \
+  a ^= c; a -= rot(c,11); \
+  b ^= a; b -= rot(a,25); \
+  c ^= b; c -= rot(b,16); \
+  a ^= c; a -= rot(c,4);  \
+  b ^= a; b -= rot(a,14); \
+  c ^= b; c -= rot(b,24); \
+}
+
+/*
+--------------------------------------------------------------------
+ This works on all machines.  To be useful, it requires
+ -- that the key be an array of uint32_t's, and
+ -- that the length be the number of uint32_t's in the key
+
+ The function hashword() is identical to hashlittle() on little-endian
+ machines, and identical to hashbig() on big-endian machines,
+ except that the length has to be measured in uint32_ts rather than in
+ bytes.  hashlittle() is more complicated than hashword() only because
+ hashlittle() has to dance around fitting the key bytes into registers.
+--------------------------------------------------------------------
+*/
+uint32_t hashword(
+const uint32_t *k,                   /* the key, an array of uint32_t values */
+size_t          length,               /* the length of the key, in uint32_ts */
+uint32_t        initval)         /* the previous hash, or an arbitrary value */
+{
+  uint32_t a,b,c;
+
+  /* Set up the internal state */
+  a = b = c = 0xdeadbeef + (((uint32_t)length)<<2) + initval;
+
+  /*------------------------------------------------- handle most of the key */
+  while (length > 3)
+  {
+    a += k[0];
+    b += k[1];
+    c += k[2];
+    mix(a,b,c);
+    length -= 3;
+    k += 3;
+  }
+
+  /*------------------------------------------- handle the last 3 uint32_t's */
+  switch(length)                     /* all the case statements fall through */
+  {
+  case 3 : c+=k[2];
+  case 2 : b+=k[1];
+  case 1 : a+=k[0];
+    final(a,b,c);
+  case 0:     /* case 0: nothing left to add */
+    break;
+  }
+  /*------------------------------------------------------ report the result */
+  return c;
+}
+
+
+/*
+--------------------------------------------------------------------
+hashword2() -- same as hashword(), but take two seeds and return two
+32-bit values.  pc and pb must both be nonnull, and *pc and *pb must
+both be initialized with seeds.  If you pass in (*pb)==0, the output
+(*pc) will be the same as the return value from hashword().
+--------------------------------------------------------------------
+*/
+void hashword2 (
+const uint32_t *k,                   /* the key, an array of uint32_t values */
+size_t          length,               /* the length of the key, in uint32_ts */
+uint32_t       *pc,                      /* IN: seed OUT: primary hash value */
+uint32_t       *pb)               /* IN: more seed OUT: secondary hash value */
+{
+  uint32_t a,b,c;
+
+  /* Set up the internal state */
+  a = b = c = 0xdeadbeef + ((uint32_t)(length<<2)) + *pc;
+  c += *pb;
+
+  /*------------------------------------------------- handle most of the key */
+  while (length > 3)
+  {
+    a += k[0];
+    b += k[1];
+    c += k[2];
+    mix(a,b,c);
+    length -= 3;
+    k += 3;
+  }
+
+  /*------------------------------------------- handle the last 3 uint32_t's */
+  switch(length)                     /* all the case statements fall through */
+  {
+  case 3 : c+=k[2];
+  case 2 : b+=k[1];
+  case 1 : a+=k[0];
+    final(a,b,c);
+  case 0:     /* case 0: nothing left to add */
+    break;
+  }
+  /*------------------------------------------------------ report the result */
+  *pc=c; *pb=b;
+}
+
+
+/*
+-------------------------------------------------------------------------------
+hashlittle() -- hash a variable-length key into a 32-bit value
+  k       : the key (the unaligned variable-length array of bytes)
+  length  : the length of the key, counting by bytes
+  initval : can be any 4-byte value
+Returns a 32-bit value.  Every bit of the key affects every bit of
+the return value.  Two keys differing by one or two bits will have
+totally different hash values.
+
+The best hash table sizes are powers of 2.  There is no need to do
+mod a prime (mod is sooo slow!).  If you need less than 32 bits,
+use a bitmask.  For example, if you need only 10 bits, do
+  h = (h & hashmask(10));
+In which case, the hash table should have hashsize(10) elements.
+
+If you are hashing n strings (uint8_t **)k, do it like this:
+  for (i=0, h=0; i<n; ++i) h = hashlittle( k[i], len[i], h);
+
+By Bob Jenkins, 2006.  bob_jenkins@burtleburtle.net.  You may use this
+code any way you wish, private, educational, or commercial.  It's free.
+
+Use for hash table lookup, or anything where one collision in 2^^32 is
+acceptable.  Do NOT use for cryptographic purposes.
+-------------------------------------------------------------------------------
+*/
+
+uint32_t hashlittle( const void *key, size_t length, uint32_t initval)
+{
+  uint32_t a,b,c;                                          /* internal state */
+  union { const void *ptr; size_t i; } u;     /* needed for Mac Powerbook G4 */
+
+  /* Set up the internal state */
+  a = b = c = 0xdeadbeef + ((uint32_t)length) + initval;
+
+  u.ptr = key;
+  if (HASH_LITTLE_ENDIAN && ((u.i & 0x3) == 0)) {
+    const uint32_t *k = (const uint32_t *)key;         /* read 32-bit chunks */
+    const uint8_t  *k8;
+
+    /*------ all but last block: aligned reads and affect 32 bits of (a,b,c) */
+    while (length > 12)
+    {
+      a += k[0];
+      b += k[1];
+      c += k[2];
+      mix(a,b,c);
+      length -= 12;
+      k += 3;
+    }
+
+    /*----------------------------- handle the last (probably partial) block */
+    /*
+     * "k[2]&0xffffff" actually reads beyond the end of the string, but
+     * then masks off the part it's not allowed to read.  Because the
+     * string is aligned, the masked-off tail is in the same word as the
+     * rest of the string.  Every machine with memory protection I've seen
+     * does it on word boundaries, so is OK with this.  But VALGRIND will
+     * still catch it and complain.  The masking trick does make the hash
+     * noticably faster for short strings (like English words).
+     */
+#ifndef VALGRIND
+
+    switch(length)
+    {
+    case 12: c+=k[2]; b+=k[1]; a+=k[0]; break;
+    case 11: c+=k[2]&0xffffff; b+=k[1]; a+=k[0]; break;
+    case 10: c+=k[2]&0xffff; b+=k[1]; a+=k[0]; break;
+    case 9 : c+=k[2]&0xff; b+=k[1]; a+=k[0]; break;
+    case 8 : b+=k[1]; a+=k[0]; break;
+    case 7 : b+=k[1]&0xffffff; a+=k[0]; break;
+    case 6 : b+=k[1]&0xffff; a+=k[0]; break;
+    case 5 : b+=k[1]&0xff; a+=k[0]; break;
+    case 4 : a+=k[0]; break;
+    case 3 : a+=k[0]&0xffffff; break;
+    case 2 : a+=k[0]&0xffff; break;
+    case 1 : a+=k[0]&0xff; break;
+    case 0 : return c;              /* zero length strings require no mixing */
+    }
+
+#else /* make valgrind happy */
+
+    k8 = (const uint8_t *)k;
+    switch(length)
+    {
+    case 12: c+=k[2]; b+=k[1]; a+=k[0]; break;
+    case 11: c+=((uint32_t)k8[10])<<16;  /* fall through */
+    case 10: c+=((uint32_t)k8[9])<<8;    /* fall through */
+    case 9 : c+=k8[8];                   /* fall through */
+    case 8 : b+=k[1]; a+=k[0]; break;
+    case 7 : b+=((uint32_t)k8[6])<<16;   /* fall through */
+    case 6 : b+=((uint32_t)k8[5])<<8;    /* fall through */
+    case 5 : b+=k8[4];                   /* fall through */
+    case 4 : a+=k[0]; break;
+    case 3 : a+=((uint32_t)k8[2])<<16;   /* fall through */
+    case 2 : a+=((uint32_t)k8[1])<<8;    /* fall through */
+    case 1 : a+=k8[0]; break;
+    case 0 : return c;
+    }
+
+#endif /* !valgrind */
+
+  } else if (HASH_LITTLE_ENDIAN && ((u.i & 0x1) == 0)) {
+    const uint16_t *k = (const uint16_t *)key;         /* read 16-bit chunks */
+    const uint8_t  *k8;
+
+    /*--------------- all but last block: aligned reads and different mixing */
+    while (length > 12)
+    {
+      a += k[0] + (((uint32_t)k[1])<<16);
+      b += k[2] + (((uint32_t)k[3])<<16);
+      c += k[4] + (((uint32_t)k[5])<<16);
+      mix(a,b,c);
+      length -= 12;
+      k += 6;
+    }
+
+    /*----------------------------- handle the last (probably partial) block */
+    k8 = (const uint8_t *)k;
+    switch(length)
+    {
+    case 12: c+=k[4]+(((uint32_t)k[5])<<16);
+             b+=k[2]+(((uint32_t)k[3])<<16);
+             a+=k[0]+(((uint32_t)k[1])<<16);
+             break;
+    case 11: c+=((uint32_t)k8[10])<<16;     /* fall through */
+    case 10: c+=k[4];
+             b+=k[2]+(((uint32_t)k[3])<<16);
+             a+=k[0]+(((uint32_t)k[1])<<16);
+             break;
+    case 9 : c+=k8[8];                      /* fall through */
+    case 8 : b+=k[2]+(((uint32_t)k[3])<<16);
+             a+=k[0]+(((uint32_t)k[1])<<16);
+             break;
+    case 7 : b+=((uint32_t)k8[6])<<16;      /* fall through */
+    case 6 : b+=k[2];
+             a+=k[0]+(((uint32_t)k[1])<<16);
+             break;
+    case 5 : b+=k8[4];                      /* fall through */
+    case 4 : a+=k[0]+(((uint32_t)k[1])<<16);
+             break;
+    case 3 : a+=((uint32_t)k8[2])<<16;      /* fall through */
+    case 2 : a+=k[0];
+             break;
+    case 1 : a+=k8[0];
+             break;
+    case 0 : return c;                     /* zero length requires no mixing */
+    }
+
+  } else {                        /* need to read the key one byte at a time */
+    const uint8_t *k = (const uint8_t *)key;
+
+    /*--------------- all but the last block: affect some 32 bits of (a,b,c) */
+    while (length > 12)
+    {
+      a += k[0];
+      a += ((uint32_t)k[1])<<8;
+      a += ((uint32_t)k[2])<<16;
+      a += ((uint32_t)k[3])<<24;
+      b += k[4];
+      b += ((uint32_t)k[5])<<8;
+      b += ((uint32_t)k[6])<<16;
+      b += ((uint32_t)k[7])<<24;
+      c += k[8];
+      c += ((uint32_t)k[9])<<8;
+      c += ((uint32_t)k[10])<<16;
+      c += ((uint32_t)k[11])<<24;
+      mix(a,b,c);
+      length -= 12;
+      k += 12;
+    }
+
+    /*-------------------------------- last block: affect all 32 bits of (c) */
+    switch(length)                   /* all the case statements fall through */
+    {
+    case 12: c+=((uint32_t)k[11])<<24;
+    case 11: c+=((uint32_t)k[10])<<16;
+    case 10: c+=((uint32_t)k[9])<<8;
+    case 9 : c+=k[8];
+    case 8 : b+=((uint32_t)k[7])<<24;
+    case 7 : b+=((uint32_t)k[6])<<16;
+    case 6 : b+=((uint32_t)k[5])<<8;
+    case 5 : b+=k[4];
+    case 4 : a+=((uint32_t)k[3])<<24;
+    case 3 : a+=((uint32_t)k[2])<<16;
+    case 2 : a+=((uint32_t)k[1])<<8;
+    case 1 : a+=k[0];
+             break;
+    case 0 : return c;
+    }
+  }
+
+  final(a,b,c);
+  return c;
+}
+
+
+/*
+ * hashlittle2: return 2 32-bit hash values
+ *
+ * This is identical to hashlittle(), except it returns two 32-bit hash
+ * values instead of just one.  This is good enough for hash table
+ * lookup with 2^^64 buckets, or if you want a second hash if you're not
+ * happy with the first, or if you want a probably-unique 64-bit ID for
+ * the key.  *pc is better mixed than *pb, so use *pc first.  If you want
+ * a 64-bit value do something like "*pc + (((uint64_t)*pb)<<32)".
+ */
+void hashlittle2(
+  const void *key,       /* the key to hash */
+  size_t      length,    /* length of the key */
+  uint32_t   *pc,        /* IN: primary initval, OUT: primary hash */
+  uint32_t   *pb)        /* IN: secondary initval, OUT: secondary hash */
+{
+  uint32_t a,b,c;                                          /* internal state */
+  union { const void *ptr; size_t i; } u;     /* needed for Mac Powerbook G4 */
+
+  /* Set up the internal state */
+  a = b = c = 0xdeadbeef + ((uint32_t)length) + *pc;
+  c += *pb;
+
+  u.ptr = key;
+  if (HASH_LITTLE_ENDIAN && ((u.i & 0x3) == 0)) {
+    const uint32_t *k = (const uint32_t *)key;         /* read 32-bit chunks */
+    const uint8_t  *k8;
+
+    /*------ all but last block: aligned reads and affect 32 bits of (a,b,c) */
+    while (length > 12)
+    {
+      a += k[0];
+      b += k[1];
+      c += k[2];
+      mix(a,b,c);
+      length -= 12;
+      k += 3;
+    }
+
+    /*----------------------------- handle the last (probably partial) block */
+    /*
+     * "k[2]&0xffffff" actually reads beyond the end of the string, but
+     * then masks off the part it's not allowed to read.  Because the
+     * string is aligned, the masked-off tail is in the same word as the
+     * rest of the string.  Every machine with memory protection I've seen
+     * does it on word boundaries, so is OK with this.  But VALGRIND will
+     * still catch it and complain.  The masking trick does make the hash
+     * noticably faster for short strings (like English words).
+     */
+#ifndef VALGRIND
+
+    switch(length)
+    {
+    case 12: c+=k[2]; b+=k[1]; a+=k[0]; break;
+    case 11: c+=k[2]&0xffffff; b+=k[1]; a+=k[0]; break;
+    case 10: c+=k[2]&0xffff; b+=k[1]; a+=k[0]; break;
+    case 9 : c+=k[2]&0xff; b+=k[1]; a+=k[0]; break;
+    case 8 : b+=k[1]; a+=k[0]; break;
+    case 7 : b+=k[1]&0xffffff; a+=k[0]; break;
+    case 6 : b+=k[1]&0xffff; a+=k[0]; break;
+    case 5 : b+=k[1]&0xff; a+=k[0]; break;
+    case 4 : a+=k[0]; break;
+    case 3 : a+=k[0]&0xffffff; break;
+    case 2 : a+=k[0]&0xffff; break;
+    case 1 : a+=k[0]&0xff; break;
+    case 0 : *pc=c; *pb=b; return;  /* zero length strings require no mixing */
+    }
+
+#else /* make valgrind happy */
+
+    k8 = (const uint8_t *)k;
+    switch(length)
+    {
+    case 12: c+=k[2]; b+=k[1]; a+=k[0]; break;
+    case 11: c+=((uint32_t)k8[10])<<16;  /* fall through */
+    case 10: c+=((uint32_t)k8[9])<<8;    /* fall through */
+    case 9 : c+=k8[8];                   /* fall through */
+    case 8 : b+=k[1]; a+=k[0]; break;
+    case 7 : b+=((uint32_t)k8[6])<<16;   /* fall through */
+    case 6 : b+=((uint32_t)k8[5])<<8;    /* fall through */
+    case 5 : b+=k8[4];                   /* fall through */
+    case 4 : a+=k[0]; break;
+    case 3 : a+=((uint32_t)k8[2])<<16;   /* fall through */
+    case 2 : a+=((uint32_t)k8[1])<<8;    /* fall through */
+    case 1 : a+=k8[0]; break;
+    case 0 : *pc=c; *pb=b; return;  /* zero length strings require no mixing */
+    }
+
+#endif /* !valgrind */
+
+  } else if (HASH_LITTLE_ENDIAN && ((u.i & 0x1) == 0)) {
+    const uint16_t *k = (const uint16_t *)key;         /* read 16-bit chunks */
+    const uint8_t  *k8;
+
+    /*--------------- all but last block: aligned reads and different mixing */
+    while (length > 12)
+    {
+      a += k[0] + (((uint32_t)k[1])<<16);
+      b += k[2] + (((uint32_t)k[3])<<16);
+      c += k[4] + (((uint32_t)k[5])<<16);
+      mix(a,b,c);
+      length -= 12;
+      k += 6;
+    }
+
+    /*----------------------------- handle the last (probably partial) block */
+    k8 = (const uint8_t *)k;
+    switch(length)
+    {
+    case 12: c+=k[4]+(((uint32_t)k[5])<<16);
+             b+=k[2]+(((uint32_t)k[3])<<16);
+             a+=k[0]+(((uint32_t)k[1])<<16);
+             break;
+    case 11: c+=((uint32_t)k8[10])<<16;     /* fall through */
+    case 10: c+=k[4];
+             b+=k[2]+(((uint32_t)k[3])<<16);
+             a+=k[0]+(((uint32_t)k[1])<<16);
+             break;
+    case 9 : c+=k8[8];                      /* fall through */
+    case 8 : b+=k[2]+(((uint32_t)k[3])<<16);
+             a+=k[0]+(((uint32_t)k[1])<<16);
+             break;
+    case 7 : b+=((uint32_t)k8[6])<<16;      /* fall through */
+    case 6 : b+=k[2];
+             a+=k[0]+(((uint32_t)k[1])<<16);
+             break;
+    case 5 : b+=k8[4];                      /* fall through */
+    case 4 : a+=k[0]+(((uint32_t)k[1])<<16);
+             break;
+    case 3 : a+=((uint32_t)k8[2])<<16;      /* fall through */
+    case 2 : a+=k[0];
+             break;
+    case 1 : a+=k8[0];
+             break;
+    case 0 : *pc=c; *pb=b; return;  /* zero length strings require no mixing */
+    }
+
+  } else {                        /* need to read the key one byte at a time */
+    const uint8_t *k = (const uint8_t *)key;
+
+    /*--------------- all but the last block: affect some 32 bits of (a,b,c) */
+    while (length > 12)
+    {
+      a += k[0];
+      a += ((uint32_t)k[1])<<8;
+      a += ((uint32_t)k[2])<<16;
+      a += ((uint32_t)k[3])<<24;
+      b += k[4];
+      b += ((uint32_t)k[5])<<8;
+      b += ((uint32_t)k[6])<<16;
+      b += ((uint32_t)k[7])<<24;
+      c += k[8];
+      c += ((uint32_t)k[9])<<8;
+      c += ((uint32_t)k[10])<<16;
+      c += ((uint32_t)k[11])<<24;
+      mix(a,b,c);
+      length -= 12;
+      k += 12;
+    }
+
+    /*-------------------------------- last block: affect all 32 bits of (c) */
+    switch(length)                   /* all the case statements fall through */
+    {
+    case 12: c+=((uint32_t)k[11])<<24;
+    case 11: c+=((uint32_t)k[10])<<16;
+    case 10: c+=((uint32_t)k[9])<<8;
+    case 9 : c+=k[8];
+    case 8 : b+=((uint32_t)k[7])<<24;
+    case 7 : b+=((uint32_t)k[6])<<16;
+    case 6 : b+=((uint32_t)k[5])<<8;
+    case 5 : b+=k[4];
+    case 4 : a+=((uint32_t)k[3])<<24;
+    case 3 : a+=((uint32_t)k[2])<<16;
+    case 2 : a+=((uint32_t)k[1])<<8;
+    case 1 : a+=k[0];
+             break;
+    case 0 : *pc=c; *pb=b; return;  /* zero length strings require no mixing */
+    }
+  }
+
+  final(a,b,c);
+  *pc=c; *pb=b;
+}
+
+
+
+/*
+ * hashbig():
+ * This is the same as hashword() on big-endian machines.  It is different
+ * from hashlittle() on all machines.  hashbig() takes advantage of
+ * big-endian byte ordering.
+ */
+uint32_t hashbig( const void *key, size_t length, uint32_t initval)
+{
+  uint32_t a,b,c;
+  union { const void *ptr; size_t i; } u; /* to cast key to (size_t) happily */
+
+  /* Set up the internal state */
+  a = b = c = 0xdeadbeef + ((uint32_t)length) + initval;
+
+  u.ptr = key;
+  if (HASH_BIG_ENDIAN && ((u.i & 0x3) == 0)) {
+    const uint32_t *k = (const uint32_t *)key;         /* read 32-bit chunks */
+    const uint8_t  *k8;
+
+    /*------ all but last block: aligned reads and affect 32 bits of (a,b,c) */
+    while (length > 12)
+    {
+      a += k[0];
+      b += k[1];
+      c += k[2];
+      mix(a,b,c);
+      length -= 12;
+      k += 3;
+    }
+
+    /*----------------------------- handle the last (probably partial) block */
+    /*
+     * "k[2]<<8" actually reads beyond the end of the string, but
+     * then shifts out the part it's not allowed to read.  Because the
+     * string is aligned, the illegal read is in the same word as the
+     * rest of the string.  Every machine with memory protection I've seen
+     * does it on word boundaries, so is OK with this.  But VALGRIND will
+     * still catch it and complain.  The masking trick does make the hash
+     * noticably faster for short strings (like English words).
+     */
+#ifndef VALGRIND
+
+    switch(length)
+    {
+    case 12: c+=k[2]; b+=k[1]; a+=k[0]; break;
+    case 11: c+=k[2]&0xffffff00; b+=k[1]; a+=k[0]; break;
+    case 10: c+=k[2]&0xffff0000; b+=k[1]; a+=k[0]; break;
+    case 9 : c+=k[2]&0xff000000; b+=k[1]; a+=k[0]; break;
+    case 8 : b+=k[1]; a+=k[0]; break;
+    case 7 : b+=k[1]&0xffffff00; a+=k[0]; break;
+    case 6 : b+=k[1]&0xffff0000; a+=k[0]; break;
+    case 5 : b+=k[1]&0xff000000; a+=k[0]; break;
+    case 4 : a+=k[0]; break;
+    case 3 : a+=k[0]&0xffffff00; break;
+    case 2 : a+=k[0]&0xffff0000; break;
+    case 1 : a+=k[0]&0xff000000; break;
+    case 0 : return c;              /* zero length strings require no mixing */
+    }
+
+#else  /* make valgrind happy */
+
+    k8 = (const uint8_t *)k;
+    switch(length)                   /* all the case statements fall through */
+    {
+    case 12: c+=k[2]; b+=k[1]; a+=k[0]; break;
+    case 11: c+=((uint32_t)k8[10])<<8;  /* fall through */
+    case 10: c+=((uint32_t)k8[9])<<16;  /* fall through */
+    case 9 : c+=((uint32_t)k8[8])<<24;  /* fall through */
+    case 8 : b+=k[1]; a+=k[0]; break;
+    case 7 : b+=((uint32_t)k8[6])<<8;   /* fall through */
+    case 6 : b+=((uint32_t)k8[5])<<16;  /* fall through */
+    case 5 : b+=((uint32_t)k8[4])<<24;  /* fall through */
+    case 4 : a+=k[0]; break;
+    case 3 : a+=((uint32_t)k8[2])<<8;   /* fall through */
+    case 2 : a+=((uint32_t)k8[1])<<16;  /* fall through */
+    case 1 : a+=((uint32_t)k8[0])<<24; break;
+    case 0 : return c;
+    }
+
+#endif /* !VALGRIND */
+
+  } else {                        /* need to read the key one byte at a time */
+    const uint8_t *k = (const uint8_t *)key;
+
+    /*--------------- all but the last block: affect some 32 bits of (a,b,c) */
+    while (length > 12)
+    {
+      a += ((uint32_t)k[0])<<24;
+      a += ((uint32_t)k[1])<<16;
+      a += ((uint32_t)k[2])<<8;
+      a += ((uint32_t)k[3]);
+      b += ((uint32_t)k[4])<<24;
+      b += ((uint32_t)k[5])<<16;
+      b += ((uint32_t)k[6])<<8;
+      b += ((uint32_t)k[7]);
+      c += ((uint32_t)k[8])<<24;
+      c += ((uint32_t)k[9])<<16;
+      c += ((uint32_t)k[10])<<8;
+      c += ((uint32_t)k[11]);
+      mix(a,b,c);
+      length -= 12;
+      k += 12;
+    }
+
+    /*-------------------------------- last block: affect all 32 bits of (c) */
+    switch(length)                   /* all the case statements fall through */
+    {
+    case 12: c+=k[11];
+    case 11: c+=((uint32_t)k[10])<<8;
+    case 10: c+=((uint32_t)k[9])<<16;
+    case 9 : c+=((uint32_t)k[8])<<24;
+    case 8 : b+=k[7];
+    case 7 : b+=((uint32_t)k[6])<<8;
+    case 6 : b+=((uint32_t)k[5])<<16;
+    case 5 : b+=((uint32_t)k[4])<<24;
+    case 4 : a+=k[3];
+    case 3 : a+=((uint32_t)k[2])<<8;
+    case 2 : a+=((uint32_t)k[1])<<16;
+    case 1 : a+=((uint32_t)k[0])<<24;
+             break;
+    case 0 : return c;
+    }
+  }
+
+  final(a,b,c);
+  return c;
+}
+
+
+#ifdef SELF_TEST
+
+/* used for timings */
+void driver1()
+{
+  uint8_t buf[256];
+  uint32_t i;
+  uint32_t h=0;
+  time_t a,z;
+
+  time(&a);
+  for (i=0; i<256; ++i) buf[i] = 'x';
+  for (i=0; i<1; ++i)
+  {
+    h = hashlittle(&buf[0],1,h);
+  }
+  time(&z);
+  if (z-a > 0) printf("time %d %.8x\n", z-a, h);
+}
+
+/* check that every input bit changes every output bit half the time */
+#define HASHSTATE 1
+#define HASHLEN   1
+#define MAXPAIR 60
+#define MAXLEN  70
+void driver2()
+{
+  uint8_t qa[MAXLEN+1], qb[MAXLEN+2], *a = &qa[0], *b = &qb[1];
+  uint32_t c[HASHSTATE], d[HASHSTATE], i=0, j=0, k, l, m=0, z;
+  uint32_t e[HASHSTATE],f[HASHSTATE],g[HASHSTATE],h[HASHSTATE];
+  uint32_t x[HASHSTATE],y[HASHSTATE];
+  uint32_t hlen;
+
+  printf("No more than %d trials should ever be needed \n",MAXPAIR/2);
+  for (hlen=0; hlen < MAXLEN; ++hlen)
+  {
+    z=0;
+    for (i=0; i<hlen; ++i)  /*----------------------- for each input byte, */
+    {
+      for (j=0; j<8; ++j)   /*------------------------ for each input bit, */
+      {
+	for (m=1; m<8; ++m) /*------------ for serveral possible initvals, */
+	{
+	  for (l=0; l<HASHSTATE; ++l)
+	    e[l]=f[l]=g[l]=h[l]=x[l]=y[l]=~((uint32_t)0);
+
+      	  /*---- check that every output bit is affected by that input bit */
+	  for (k=0; k<MAXPAIR; k+=2)
+	  {
+	    uint32_t finished=1;
+	    /* keys have one bit different */
+	    for (l=0; l<hlen+1; ++l) {a[l] = b[l] = (uint8_t)0;}
+	    /* have a and b be two keys differing in only one bit */
+	    a[i] ^= (k<<j);
+	    a[i] ^= (k>>(8-j));
+	     c[0] = hashlittle(a, hlen, m);
+	    b[i] ^= ((k+1)<<j);
+	    b[i] ^= ((k+1)>>(8-j));
+	     d[0] = hashlittle(b, hlen, m);
+	    /* check every bit is 1, 0, set, and not set at least once */
+	    for (l=0; l<HASHSTATE; ++l)
+	    {
+	      e[l] &= (c[l]^d[l]);
+	      f[l] &= ~(c[l]^d[l]);
+	      g[l] &= c[l];
+	      h[l] &= ~c[l];
+	      x[l] &= d[l];
+	      y[l] &= ~d[l];
+	      if (e[l]|f[l]|g[l]|h[l]|x[l]|y[l]) finished=0;
+	    }
+	    if (finished) break;
+	  }
+	  if (k>z) z=k;
+	  if (k==MAXPAIR)
+	  {
+	     printf("Some bit didn't change: ");
+	     printf("%.8x %.8x %.8x %.8x %.8x %.8x  ",
+	            e[0],f[0],g[0],h[0],x[0],y[0]);
+	     printf("i %d j %d m %d len %d\n", i, j, m, hlen);
+	  }
+	  if (z==MAXPAIR) goto done;
+	}
+      }
+    }
+   done:
+    if (z < MAXPAIR)
+    {
+      printf("Mix success  %2d bytes  %2d initvals  ",i,m);
+      printf("required  %d  trials\n", z/2);
+    }
+  }
+  printf("\n");
+}
+
+/* Check for reading beyond the end of the buffer and alignment problems */
+void driver3()
+{
+  uint8_t buf[MAXLEN+20], *b;
+  uint32_t len;
+  uint8_t q[] = "This is the time for all good men to come to the aid of their country...";
+  uint32_t h;
+  uint8_t qq[] = "xThis is the time for all good men to come to the aid of their country...";
+  uint32_t i;
+  uint8_t qqq[] = "xxThis is the time for all good men to come to the aid of their country...";
+  uint32_t j;
+  uint8_t qqqq[] = "xxxThis is the time for all good men to come to the aid of their country...";
+  uint32_t ref,x,y;
+  uint8_t *p;
+
+  printf("Endianness.  These lines should all be the same (for values filled in):\n");
+  printf("%.8x                            %.8x                            %.8x\n",
+         hashword((const uint32_t *)q, (sizeof(q)-1)/4, 13),
+         hashword((const uint32_t *)q, (sizeof(q)-5)/4, 13),
+         hashword((const uint32_t *)q, (sizeof(q)-9)/4, 13));
+  p = q;
+  printf("%.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x\n",
+         hashlittle(p, sizeof(q)-1, 13), hashlittle(p, sizeof(q)-2, 13),
+         hashlittle(p, sizeof(q)-3, 13), hashlittle(p, sizeof(q)-4, 13),
+         hashlittle(p, sizeof(q)-5, 13), hashlittle(p, sizeof(q)-6, 13),
+         hashlittle(p, sizeof(q)-7, 13), hashlittle(p, sizeof(q)-8, 13),
+         hashlittle(p, sizeof(q)-9, 13), hashlittle(p, sizeof(q)-10, 13),
+         hashlittle(p, sizeof(q)-11, 13), hashlittle(p, sizeof(q)-12, 13));
+  p = &qq[1];
+  printf("%.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x\n",
+         hashlittle(p, sizeof(q)-1, 13), hashlittle(p, sizeof(q)-2, 13),
+         hashlittle(p, sizeof(q)-3, 13), hashlittle(p, sizeof(q)-4, 13),
+         hashlittle(p, sizeof(q)-5, 13), hashlittle(p, sizeof(q)-6, 13),
+         hashlittle(p, sizeof(q)-7, 13), hashlittle(p, sizeof(q)-8, 13),
+         hashlittle(p, sizeof(q)-9, 13), hashlittle(p, sizeof(q)-10, 13),
+         hashlittle(p, sizeof(q)-11, 13), hashlittle(p, sizeof(q)-12, 13));
+  p = &qqq[2];
+  printf("%.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x\n",
+         hashlittle(p, sizeof(q)-1, 13), hashlittle(p, sizeof(q)-2, 13),
+         hashlittle(p, sizeof(q)-3, 13), hashlittle(p, sizeof(q)-4, 13),
+         hashlittle(p, sizeof(q)-5, 13), hashlittle(p, sizeof(q)-6, 13),
+         hashlittle(p, sizeof(q)-7, 13), hashlittle(p, sizeof(q)-8, 13),
+         hashlittle(p, sizeof(q)-9, 13), hashlittle(p, sizeof(q)-10, 13),
+         hashlittle(p, sizeof(q)-11, 13), hashlittle(p, sizeof(q)-12, 13));
+  p = &qqqq[3];
+  printf("%.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x %.8x\n",
+         hashlittle(p, sizeof(q)-1, 13), hashlittle(p, sizeof(q)-2, 13),
+         hashlittle(p, sizeof(q)-3, 13), hashlittle(p, sizeof(q)-4, 13),
+         hashlittle(p, sizeof(q)-5, 13), hashlittle(p, sizeof(q)-6, 13),
+         hashlittle(p, sizeof(q)-7, 13), hashlittle(p, sizeof(q)-8, 13),
+         hashlittle(p, sizeof(q)-9, 13), hashlittle(p, sizeof(q)-10, 13),
+         hashlittle(p, sizeof(q)-11, 13), hashlittle(p, sizeof(q)-12, 13));
+  printf("\n");
+
+  /* check that hashlittle2 and hashlittle produce the same results */
+  i=47; j=0;
+  hashlittle2(q, sizeof(q), &i, &j);
+  if (hashlittle(q, sizeof(q), 47) != i)
+    printf("hashlittle2 and hashlittle mismatch\n");
+
+  /* check that hashword2 and hashword produce the same results */
+  len = 0xdeadbeef;
+  i=47, j=0;
+  hashword2(&len, 1, &i, &j);
+  if (hashword(&len, 1, 47) != i)
+    printf("hashword2 and hashword mismatch %x %x\n",
+	   i, hashword(&len, 1, 47));
+
+  /* check hashlittle doesn't read before or after the ends of the string */
+  for (h=0, b=buf+1; h<8; ++h, ++b)
+  {
+    for (i=0; i<MAXLEN; ++i)
+    {
+      len = i;
+      for (j=0; j<i; ++j) *(b+j)=0;
+
+      /* these should all be equal */
+      ref = hashlittle(b, len, (uint32_t)1);
+      *(b+i)=(uint8_t)~0;
+      *(b-1)=(uint8_t)~0;
+      x = hashlittle(b, len, (uint32_t)1);
+      y = hashlittle(b, len, (uint32_t)1);
+      if ((ref != x) || (ref != y))
+      {
+	printf("alignment error: %.8x %.8x %.8x %d %d\n",ref,x,y,
+               h, i);
+      }
+    }
+  }
+}
+
+/* check for problems with nulls */
+ void driver4()
+{
+  uint8_t buf[1];
+  uint32_t h,i,state[HASHSTATE];
+
+
+  buf[0] = ~0;
+  for (i=0; i<HASHSTATE; ++i) state[i] = 1;
+  printf("These should all be different\n");
+  for (i=0, h=0; i<8; ++i)
+  {
+    h = hashlittle(buf, 0, h);
+    printf("%2ld  0-byte strings, hash is  %.8x\n", i, h);
+  }
+}
+
+void driver5()
+{
+  uint32_t b,c;
+  b=0, c=0, hashlittle2("", 0, &c, &b);
+  printf("hash is %.8lx %.8lx\n", c, b);   /* deadbeef deadbeef */
+  b=0xdeadbeef, c=0, hashlittle2("", 0, &c, &b);
+  printf("hash is %.8lx %.8lx\n", c, b);   /* bd5b7dde deadbeef */
+  b=0xdeadbeef, c=0xdeadbeef, hashlittle2("", 0, &c, &b);
+  printf("hash is %.8lx %.8lx\n", c, b);   /* 9c093ccd bd5b7dde */
+  b=0, c=0, hashlittle2("Four score and seven years ago", 30, &c, &b);
+  printf("hash is %.8lx %.8lx\n", c, b);   /* 17770551 ce7226e6 */
+  b=1, c=0, hashlittle2("Four score and seven years ago", 30, &c, &b);
+  printf("hash is %.8lx %.8lx\n", c, b);   /* e3607cae bd371de4 */
+  b=0, c=1, hashlittle2("Four score and seven years ago", 30, &c, &b);
+  printf("hash is %.8lx %.8lx\n", c, b);   /* cd628161 6cbea4b3 */
+  c = hashlittle("Four score and seven years ago", 30, 0);
+  printf("hash is %.8lx\n", c);   /* 17770551 */
+  c = hashlittle("Four score and seven years ago", 30, 1);
+  printf("hash is %.8lx\n", c);   /* cd628161 */
+}
+
+
+int main()
+{
+  driver1();   /* test that the key is hashed: used for timings */
+  driver2();   /* test that whole key is hashed thoroughly */
+  driver3();   /* test that nothing but the key is hashed */
+  driver4();   /* test hashing multiple buffers (all buffers are null) */
+  driver5();   /* test the hash against known vectors */
+  return 1;
+}
+
+#endif  /* SELF_TEST */
diff --git a/src/memory/lookup3.h b/src/memory/lookup3.h
new file mode 100644
index 0000000..6033da2
--- /dev/null
+++ b/src/memory/lookup3.h
@@ -0,0 +1,19 @@
+/**
+ * lookup3.h
+ *
+ * Minimal header file wrapping Bob Jenkins' lookup3.c
+ *
+ *
+ * (c) 2019 Simon Brooke <simon@journeyman.cc>
+ * Public domain.
+ */
+
+#ifndef __lookup3_h
+#define __lookup3_h
+
+uint32_t hashword(
+const uint32_t *k,
+size_t          length,
+uint32_t        initval);
+
+#endif
diff --git a/src/memory/map.c b/src/memory/map.c
index e897647..358b2e4 100644
--- a/src/memory/map.c
+++ b/src/memory/map.c
@@ -6,3 +6,246 @@
  * (c) 2019 Simon Brooke <simon@journeyman.cc>
  * Licensed under GPL version 2.0, or, at your option, any later version.
  */
+
+#include <stdlib.h>
+
+#include "consspaceobject.h"
+#include "conspage.h"
+#include "debug.h"
+#include "dump.h"
+#include "fopen.h"
+#include "intern.h"
+#include "lookup3.h"
+#include "map.h"
+#include "print.h"
+#include "vectorspace.h"
+
+/* \todo: a lot of this will be inherited by namespaces, regularities and
+ * homogeneities. Exactly how I don't yet know. */
+
+/**
+ * Get a hash value for this key.
+ */
+uint32_t get_hash_32(struct cons_pointer f, struct cons_pointer key) {
+    uint32_t result = 0;
+    int l =  c_length(key);
+
+    if (keywordp(key) || stringp(key)) {
+        if ( l > 0) {
+            uint32_t buffer[l];
+
+            if (!nilp(f)) {
+                fputws(L"Custom hashing functions are not yet implemented.\n", stderr);
+            }
+            for (int i = 0; i < l; i++) {
+                buffer[i] = (uint32_t)pointer2cell(key).payload.string.character;
+            }
+
+            result = hashword( buffer, l, 0);
+        }
+    } else {
+        fputws(L"Hashing is thud far implemented only for keys and strings.\n", stderr);
+    }
+
+    return result;
+}
+
+/**
+ * get the actual map object from this `pointer`, or NULL if
+ * `pointer` is not a map pointer.
+ */
+struct map_payload *get_map_payload( struct cons_pointer pointer ) {
+    struct map_payload *result = NULL;
+    struct vector_space_object *vso =
+        pointer2cell( pointer ).payload.vectorp.address;
+
+    if (vectorpointp(pointer) && mapp( vso ) ) {
+        result = ( struct map_payload * ) &( vso->payload );
+        debug_printf( DEBUG_STACK,
+                      L"get_map_payload: all good, returning %p\n", result );
+    } else {
+        debug_print( L"get_map_payload: fail, returning NULL\n", DEBUG_STACK );
+    }
+
+    return result;
+}
+
+
+/**
+ * Make an empty immutable map, and return it.
+ *
+ * @param hash_function a pointer to a function of one argument, which
+ * returns an integer; or (more usually) `nil`.
+ * @return the new map, or NULL if memory is exhausted.
+ */
+struct cons_pointer make_empty_map( struct cons_pointer hash_function ) {
+    debug_print( L"Entering make_empty_map\n", DEBUG_ALLOC );
+    struct cons_pointer result =
+        make_vso( MAPTAG, sizeof( struct map_payload ) );
+
+    if ( !nilp( result ) ) {
+        struct map_payload *payload = get_map_payload( result );
+
+        payload->hash_function = functionp( hash_function) ? hash_function : NIL;
+        inc_ref(hash_function);
+
+        for ( int i = 0; i < BUCKETSINMAP; i++) {
+            payload->buckets[i] = NIL;
+        }
+    }
+
+    return result;
+}
+
+
+struct cons_pointer make_duplicate_map( struct cons_pointer parent) {
+    struct cons_pointer result = NIL;
+    struct map_payload * parent_payload = get_map_payload(parent);
+
+    if (parent_payload != NULL) {
+        result =
+            make_vso( MAPTAG, sizeof( struct map_payload ) );
+
+        if ( !nilp( result ) ) {
+            struct map_payload *payload = get_map_payload( result );
+
+            payload->hash_function = parent_payload->hash_function;
+            inc_ref(payload->hash_function);
+
+            for ( int i = 0; i < BUCKETSINMAP; i++) {
+                payload->buckets[i] = parent_payload->buckets[i];
+                inc_ref(payload->buckets[i]);
+            }
+        }
+    }
+
+    return result;
+}
+
+
+struct cons_pointer bind_in_map( struct cons_pointer parent,
+                                struct cons_pointer key,
+                                struct cons_pointer value) {
+    struct cons_pointer result = make_duplicate_map(parent);
+
+    if ( !nilp( result)) {
+        struct map_payload * payload = get_map_payload( result );
+        int bucket = get_hash_32(payload->hash_function, key) % BUCKETSINMAP;
+
+        payload->buckets[bucket] = make_cons(
+            make_cons(key, value), payload->buckets[bucket]);
+
+        inc_ref(payload->buckets[bucket]);
+    }
+
+    return result;
+}
+
+
+struct cons_pointer keys( struct cons_pointer store) {
+    struct cons_pointer result = NIL;
+
+    struct cons_space_object cell = pointer2cell( store );
+
+    switch (pointer2cell( store ).tag.value) {
+        case CONSTV:
+        for (struct cons_pointer c = store; !nilp(c); c = c_cdr(c)) {
+            result = make_cons( c_car( c_car( c)), result);
+        }
+        break;
+        case VECTORPOINTTV: {
+            struct vector_space_object *vso =
+                pointer2cell( store ).payload.vectorp.address;
+
+            if ( mapp( vso ) ) {
+                struct map_payload * payload = get_map_payload( result );
+
+                for (int bucket = 0; bucket < BUCKETSINMAP; bucket++) {
+                    for (struct cons_pointer c = payload->buckets[bucket];
+                         !nilp(c); c = c_cdr(c)) {
+                        result = make_cons( c_car( c_car( c)), result);
+                    }
+                }
+            }
+        }
+        break;
+    }
+
+    return result;
+}
+
+/**
+ * Return a new map which represents the merger of `to_merge` into
+ * `parent`. `parent` must be a map, but `to_merge` may be a map or
+ * an assoc list.
+ *
+ * @param parent a map;
+ * @param to_merge an association from which key/value pairs will be merged.
+ * @result a new map, containing all key/value pairs from `to_merge`
+ * together with those key/value pairs from `parent` whose keys did not
+ * collide.
+ */
+struct cons_pointer merge_into_map( struct cons_pointer parent,
+                                   struct cons_pointer to_merge) {
+    struct cons_pointer result = make_duplicate_map(parent);
+
+    if (!nilp(result)) {
+        struct map_payload *payload = get_map_payload( result );
+        for (struct cons_pointer c = keys(to_merge);
+             !nilp(c); c = c_cdr(c)) {
+            struct cons_pointer key = c_car( c);
+            int bucket = get_hash_32(payload->hash_function, key) % BUCKETSINMAP;
+
+            payload->buckets[bucket] = make_cons(
+                make_cons( key, c_assoc( key, to_merge)),
+                payload->buckets[bucket]);
+        }
+    }
+
+    return result;
+}
+
+
+struct cons_pointer assoc_in_map( struct cons_pointer map,
+                                  struct cons_pointer key) {
+    struct cons_pointer result = NIL;
+    struct map_payload *payload = get_map_payload( map );
+
+    if (payload != NULL) {
+        int bucket = get_hash_32(payload->hash_function, key) % BUCKETSINMAP;
+
+        result = c_assoc(key, payload->buckets[bucket]);
+    }
+
+    return result;
+}
+
+/**
+ * Dump a map to this stream for debugging
+ * @param output the stream
+ * @param map_pointer the pointer to the frame
+ */
+void dump_map( URL_FILE * output, struct cons_pointer map_pointer ) {
+    struct vector_space_object *vso =
+        pointer2cell( map_pointer ).payload.vectorp.address;
+
+    if (vectorpointp(map_pointer) && mapp( vso ) ) {
+        struct map_payload *payload = get_map_payload( map_pointer );
+
+        if ( payload != NULL ) {
+            url_fputws( L"Immutable map; hash function:", output );
+
+            if (nilp(payload->hash_function)) {
+                url_fputws( L"default", output);
+            } else {
+                dump_object( output, payload->hash_function);
+            }
+
+            for (int i = 0; i < BUCKETSINMAP; i++) {
+                url_fwprintf(output, L"\n\tBucket %d: ", i);
+                print( output, payload->buckets[i]);
+            }
+        }
+    }
+}
+
diff --git a/src/memory/map.h b/src/memory/map.h
index d7a65c5..143c7b9 100644
--- a/src/memory/map.h
+++ b/src/memory/map.h
@@ -30,7 +30,14 @@
 #define MAXENTRIESINASSOC 16
 
 /**
- * The vector-space payload of a map object.
+ * true if this vector_space_object is a map, else false.
+ */
+#define mapp( vso) (((struct vector_space_object *)vso)->header.tag.value == MAPTV)
+
+/**
+ * The vector-space payload of a map object. Essentially a vector of
+ * `BUCKETSINMAP` + 1 `cons_pointer`s, but the first one is considered
+ * special.
  */
 struct map_payload {
     /**
@@ -39,7 +46,7 @@ struct map_payload {
      * their own hash values. But it will be possible to override the hash
      * function by putting a function of one argument returning an integer
      * here. */
-    struct cons_pointer hash_function = NIL;
+    struct cons_pointer hash_function;
 
     /**
      * Obviously the number of buckets in a map is a trade off, and this may need
@@ -62,4 +69,22 @@ struct map_payload {
     struct cons_pointer buckets[BUCKETSINMAP];
 };
 
+uint32_t get_hash_32(struct cons_pointer f, struct cons_pointer key);
+
+struct map_payload *get_map_payload( struct cons_pointer pointer );
+
+struct cons_pointer bind_in_map( struct cons_pointer parent,
+                                struct cons_pointer key,
+                                struct cons_pointer value);
+
+struct cons_pointer keys( struct cons_pointer store);
+
+struct cons_pointer merge_into_map( struct cons_pointer parent,
+                                   struct cons_pointer to_merge);
+
+struct cons_pointer assoc_in_map( struct cons_pointer map,
+                                  struct cons_pointer key);
+
+void dump_map( URL_FILE * output, struct cons_pointer map_pointer );
+
 #endif
diff --git a/src/ops/intern.c b/src/ops/intern.c
index 8ce5d71..b4eafd2 100644
--- a/src/ops/intern.c
+++ b/src/ops/intern.c
@@ -24,6 +24,7 @@
 #include "debug.h"
 #include "equal.h"
 #include "lispops.h"
+#include "map.h"
 #include "print.h"
 
 /**
@@ -88,7 +89,7 @@ internedp( struct cons_pointer key, struct cons_pointer store ) {
  * of that key from the store; otherwise return NIL.
  */
 struct cons_pointer c_assoc( struct cons_pointer key,
-                             struct cons_pointer store ) {
+                            struct cons_pointer store ) {
     struct cons_pointer result = NIL;
 
     debug_print( L"c_assoc; key is `", DEBUG_BIND);
@@ -97,15 +98,19 @@ struct cons_pointer c_assoc( struct cons_pointer key,
     debug_dump_object( store, DEBUG_BIND);
     debug_println(DEBUG_BIND);
 
-    for ( struct cons_pointer next = store;
-          consp( next ); next = pointer2cell( next ).payload.cons.cdr ) {
-        struct cons_space_object entry =
-            pointer2cell( pointer2cell( next ).payload.cons.car );
+    if (consp(store)) {
+        for ( struct cons_pointer next = store;
+             consp( next ); next = pointer2cell( next ).payload.cons.cdr ) {
+            struct cons_space_object entry =
+                pointer2cell( pointer2cell( next ).payload.cons.car );
 
-        if ( equal( key, entry.payload.cons.car ) ) {
-            result = entry.payload.cons.cdr;
-            break;
+            if ( equal( key, entry.payload.cons.car ) ) {
+                result = entry.payload.cons.cdr;
+                break;
+            }
         }
+    } else if (vectorpointp( store)) {
+        result = assoc_in_map( key, store);
     }
 
     return result;
@@ -116,15 +121,23 @@ struct cons_pointer c_assoc( struct cons_pointer key,
  * with this key/value pair added to the front.
  */
 struct cons_pointer
-set( struct cons_pointer key, struct cons_pointer value,
-     struct cons_pointer store ) {
+    set( struct cons_pointer key, struct cons_pointer value,
+        struct cons_pointer store ) {
+    struct cons_pointer result = NIL;
+
     debug_print( L"Binding ", DEBUG_BIND );
     debug_print_object( key, DEBUG_BIND );
     debug_print( L" to ", DEBUG_BIND );
     debug_print_object( value, DEBUG_BIND );
     debug_println( DEBUG_BIND );
 
-    return make_cons( make_cons( key, value ), store );
+    if (consp(store)) {
+        result = make_cons( make_cons( key, value ), store );
+    } else if (vectorpointp( store)) {
+        result = bind_in_map( store, key, value);
+    }
+
+    return result;
 }
 
 /**
diff --git a/src/ops/lispops.c b/src/ops/lispops.c
index 14724a1..1624261 100644
--- a/src/ops/lispops.c
+++ b/src/ops/lispops.c
@@ -716,6 +716,22 @@ lisp_cdr( struct stack_frame *frame, struct cons_pointer frame_pointer,
     return result;
 }
 
+/**
+ * Function: return, as an integer, the length of the sequence indicated by
+ * the first argument, or zero if it is not a sequence.
+ *
+ * * (length any)
+ *
+ * @param frame my stack_frame.
+ * @param frame_pointer a pointer to my stack_frame.
+ * @param env my environment (ignored).
+ * @return the length of `any`, if it is a sequence, or zero otherwise.
+ */
+struct cons_pointer lisp_length( struct stack_frame *frame, struct cons_pointer frame_pointer,
+            struct cons_pointer env ) {
+    return make_integer( c_length( frame->arg[0]), NIL);
+}
+
 /**
  * Function; look up the value of a `key` in a `store`.
  *
diff --git a/src/ops/lispops.h b/src/ops/lispops.h
index ea8a883..122635f 100644
--- a/src/ops/lispops.h
+++ b/src/ops/lispops.h
@@ -85,7 +85,9 @@ lisp_set_shriek( struct stack_frame *frame, struct cons_pointer frame_pointer,
 struct cons_pointer lisp_lambda( struct stack_frame *frame,
                                  struct cons_pointer frame_pointer,
                                  struct cons_pointer env );
-
+struct cons_pointer lisp_length( struct stack_frame *frame,
+                                struct cons_pointer frame_pointer,
+            struct cons_pointer env );
 /**
  * Construct an interpretable special form.
  *

From 0687b0baebacc2940922c74f31f8b3133a388ddd Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Wed, 6 Feb 2019 11:17:31 +0000
Subject: [PATCH 24/31] #8: Buggy, but a lot of it works.

---
 src/init.c        |  2 ++
 src/io/print.c    | 42 ++++++++++++++++++++++++++++++++++++++++++
 src/memory/dump.c |  5 +++++
 src/memory/map.c  | 22 ++++++++++++++++++++--
 src/memory/map.h  |  6 +++++-
 src/ops/intern.c  | 30 ++++++++++++++++++++++++------
 6 files changed, 98 insertions(+), 9 deletions(-)

diff --git a/src/init.c b/src/init.c
index 06494e9..82b497a 100644
--- a/src/init.c
+++ b/src/init.c
@@ -26,6 +26,7 @@
 #include "intern.h"
 #include "io.h"
 #include "lispops.h"
+#include "map.h"
 #include "meta.h"
 #include "peano.h"
 #include "print.h"
@@ -196,6 +197,7 @@ int main( int argc, char *argv[] ) {
     bind_function( L"eval", &lisp_eval );
     bind_function( L"exception", &lisp_exception );
     bind_function( L"inspect", &lisp_inspect );
+    bind_function( L"make-map", &lisp_make_map);
     bind_function( L"meta", &lisp_metadata );
     bind_function( L"metadata", &lisp_metadata );
     bind_function( L"multiply", &lisp_multiply );
diff --git a/src/io/print.c b/src/io/print.c
index fb0d8a1..f4c98aa 100644
--- a/src/io/print.c
+++ b/src/io/print.c
@@ -20,9 +20,12 @@
 #include "conspage.h"
 #include "consspaceobject.h"
 #include "integer.h"
+#include "intern.h"
+#include "map.h"
 #include "stack.h"
 #include "print.h"
 #include "time.h"
+#include "vectorspace.h"
 
 /**
  * Whether or not we colorise output.
@@ -98,7 +101,43 @@ void print_list( URL_FILE * output, struct cons_pointer pointer ) {
     } else {
         url_fputws( L")", output );
     }
+}
 
+
+void print_map( URL_FILE * output, struct cons_pointer pointer) {
+    if ( vectorpointp( pointer)) {
+        struct vector_space_object *vso = pointer_to_vso( pointer);
+
+        if ( mapp( vso ) ) {
+            url_fputwc( btowc( '{' ), output );
+
+            for ( struct cons_pointer ks = keys(pointer);
+                 !nilp(ks); ks = c_cdr(ks)) {
+                print( output, c_car(ks));
+                url_fputwc( btowc( ' ' ), output );
+                print( output, c_assoc( pointer, c_car(ks)));
+
+                if ( !nilp( c_cdr( ks))) {
+                    url_fputws( L", ", output );
+                }
+            }
+
+            url_fputwc( btowc( '}' ), output );
+        }
+    }
+}
+
+
+void print_vso( URL_FILE * output, struct cons_pointer pointer) {
+    struct vector_space_object *vso =
+        pointer2cell( pointer ).payload.vectorp.address;
+
+    switch ( vso->header.tag.value) {
+        case MAPTV:
+            print_map( output, pointer);
+            break;
+        // \todo: others.
+    }
 }
 
 /**
@@ -217,6 +256,9 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
         case TRUETV:
             url_fwprintf( output, L"t" );
             break;
+        case VECTORPOINTTV:
+            print_vso( output, pointer);
+            break;
         case WRITETV:
             url_fwprintf( output, L"<Output stream>" );
             break;
diff --git a/src/memory/dump.c b/src/memory/dump.c
index 28bd36a..074d1c4 100644
--- a/src/memory/dump.c
+++ b/src/memory/dump.c
@@ -21,6 +21,8 @@
 #include "conspage.h"
 #include "consspaceobject.h"
 #include "debug.h"
+#include "intern.h"
+#include "map.h"
 #include "print.h"
 #include "stack.h"
 #include "vectorspace.h"
@@ -146,6 +148,9 @@ void dump_object( URL_FILE * output, struct cons_pointer pointer ) {
                     case STACKFRAMETV:
                         dump_frame( output, pointer );
                         break;
+                    case MAPTV:
+                        dump_map( output, pointer);
+                        break;
                 }
             }
             break;
diff --git a/src/memory/map.c b/src/memory/map.c
index 358b2e4..7224a12 100644
--- a/src/memory/map.c
+++ b/src/memory/map.c
@@ -30,7 +30,7 @@ uint32_t get_hash_32(struct cons_pointer f, struct cons_pointer key) {
     uint32_t result = 0;
     int l =  c_length(key);
 
-    if (keywordp(key) || stringp(key)) {
+    if (keywordp(key) || stringp(key) || symbolp( key)) {
         if ( l > 0) {
             uint32_t buffer[l];
 
@@ -44,7 +44,7 @@ uint32_t get_hash_32(struct cons_pointer f, struct cons_pointer key) {
             result = hashword( buffer, l, 0);
         }
     } else {
-        fputws(L"Hashing is thud far implemented only for keys and strings.\n", stderr);
+        fputws(L"Hashing is thus far implemented only for keys, strings and symbols.\n", stderr);
     }
 
     return result;
@@ -220,6 +220,24 @@ struct cons_pointer assoc_in_map( struct cons_pointer map,
     return result;
 }
 
+/**
+ * Function: create a map initialised with key/value pairs from my
+ * first argument.
+ *
+ * * (make-map)
+ * * (make-map store)
+ *
+ * @param frame the stack frame in which the expression is to be interpreted;
+ * @param frame_pointer a pointer to my stack_frame.
+ * @param env the environment in which it is to be intepreted.
+ * @return a new containing all the key/value pairs from store.
+ */
+struct cons_pointer
+lisp_make_map( struct stack_frame *frame, struct cons_pointer frame_pointer,
+             struct cons_pointer env ) {
+    return merge_into_map( make_empty_map( NIL), frame->arg[0]);
+}
+
 /**
  * Dump a map to this stream for debugging
  * @param output the stream
diff --git a/src/memory/map.h b/src/memory/map.h
index 143c7b9..76a7193 100644
--- a/src/memory/map.h
+++ b/src/memory/map.h
@@ -83,7 +83,11 @@ struct cons_pointer merge_into_map( struct cons_pointer parent,
                                    struct cons_pointer to_merge);
 
 struct cons_pointer assoc_in_map( struct cons_pointer map,
-                                  struct cons_pointer key);
+                                 struct cons_pointer key);
+
+struct cons_pointer lisp_make_map( struct stack_frame *frame,
+                                  struct cons_pointer frame_pointer,
+                                  struct cons_pointer env );
 
 void dump_map( URL_FILE * output, struct cons_pointer map_pointer );
 
diff --git a/src/ops/intern.c b/src/ops/intern.c
index b4eafd2..02deb23 100644
--- a/src/ops/intern.c
+++ b/src/ops/intern.c
@@ -52,7 +52,7 @@ struct cons_pointer
 internedp( struct cons_pointer key, struct cons_pointer store ) {
     struct cons_pointer result = NIL;
 
-    if ( symbolp( key ) ) {
+    if ( symbolp( key ) || keywordp( key ) ) {
         for ( struct cons_pointer next = store;
               nilp( result ) && consp( next );
               next = pointer2cell( next ).payload.cons.cdr ) {
@@ -74,7 +74,7 @@ internedp( struct cons_pointer key, struct cons_pointer store ) {
         debug_print_object( key, DEBUG_BIND );
         debug_print( L"` is a ", DEBUG_BIND );
         debug_print_object( c_type( key ), DEBUG_BIND );
-        debug_print( L", not a SYMB", DEBUG_BIND );
+        debug_print( L", not a KEYW or SYMB", DEBUG_BIND );
     }
 
     return result;
@@ -113,6 +113,10 @@ struct cons_pointer c_assoc( struct cons_pointer key,
         result = assoc_in_map( key, store);
     }
 
+    debug_print( L"c_assoc returning ", DEBUG_BIND);
+    debug_print_object( result, DEBUG_BIND);
+    debug_println( DEBUG_BIND);
+
     return result;
 }
 
@@ -125,18 +129,24 @@ struct cons_pointer
         struct cons_pointer store ) {
     struct cons_pointer result = NIL;
 
-    debug_print( L"Binding ", DEBUG_BIND );
+    debug_print( L"set: binding `", DEBUG_BIND );
     debug_print_object( key, DEBUG_BIND );
-    debug_print( L" to ", DEBUG_BIND );
+    debug_print( L"` to `", DEBUG_BIND );
     debug_print_object( value, DEBUG_BIND );
+    debug_print( L"` in store ", DEBUG_BIND );
+    debug_dump_object( store, DEBUG_BIND);
     debug_println( DEBUG_BIND );
 
-    if (consp(store)) {
+    if (nilp( store) || consp(store)) {
         result = make_cons( make_cons( key, value ), store );
     } else if (vectorpointp( store)) {
         result = bind_in_map( store, key, value);
     }
 
+    debug_print( L"set returning ", DEBUG_BIND);
+    debug_print_object( result, DEBUG_BIND);
+    debug_println( DEBUG_BIND);
+
     return result;
 }
 
@@ -150,11 +160,19 @@ deep_bind( struct cons_pointer key, struct cons_pointer value ) {
     debug_print( L"Entering deep_bind\n", DEBUG_BIND );
     struct cons_pointer old = oblist;
 
+    debug_print( L"deep_bind: binding `", DEBUG_BIND );
+    debug_print_object( key, DEBUG_BIND );
+    debug_print( L"` to ", DEBUG_BIND );
+    debug_print_object( value, DEBUG_BIND );
+    debug_println( DEBUG_BIND );
+
     oblist = set( key, value, oblist );
     inc_ref( oblist );
     dec_ref( old );
 
-    debug_print( L"Leaving deep_bind\n", DEBUG_BIND );
+    debug_print( L"deep_bind returning ", DEBUG_BIND );
+    debug_print_object( oblist, DEBUG_BIND );
+    debug_println( DEBUG_BIND );
 
     return oblist;
 }

From f36436a9e145740ae937064298f9b2f6156313cf Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Thu, 7 Feb 2019 09:02:28 +0000
Subject: [PATCH 25/31] #8: Done

I'm now of the opinion that this is done at the wrong level in the stack and needs to be redone later; but it works for now.

There's a regression in `open`, but I can't see why.
---
 src/init.c                      |  2 +-
 src/io/io.c                     |  7 ++-
 src/io/print.c                  | 30 ++++++++-----
 src/io/read.c                   | 79 ++++++++++++++++++++++++++++-----
 src/memory/map.c                | 36 +++++++++++----
 src/memory/map.h                |  6 ++-
 src/ops/intern.c                |  4 +-
 src/ops/lispops.c               |  1 +
 src/utils.c                     |  2 +-
 src/utils.h                     |  4 +-
 unit-tests/eval-quote-symbol.sh |  2 +-
 unit-tests/slurp.sh             |  2 +-
 12 files changed, 134 insertions(+), 41 deletions(-)

diff --git a/src/init.c b/src/init.c
index 82b497a..275cc40 100644
--- a/src/init.c
+++ b/src/init.c
@@ -69,7 +69,7 @@ void bind_special( wchar_t *name, struct cons_pointer ( *executable )
                                          n ),
                               NIL ) );
 
-    deep_bind( n, make_special( NIL, executable ) );
+    deep_bind( n, make_special( meta, executable ) );
 }
 
 /**
diff --git a/src/io/io.c b/src/io/io.c
index b82c6ba..7e6a3c0 100644
--- a/src/io/io.c
+++ b/src/io/io.c
@@ -15,6 +15,7 @@
 #include <pwd.h>
 #include <stdlib.h>
 #include <string.h>
+#include <time.h>
 #include <sys/stat.h>
 #include <sys/types.h>
 #include <unistd.h>
@@ -277,9 +278,11 @@ struct cons_pointer add_meta_time( struct cons_pointer meta, wchar_t *key,
     /* I don't yet have a concept of a date-time object, which is a
      * bit of an oversight! */
     char datestring[256];
-    struct tm *tm = localtime( value );
 
-    strftime( datestring, sizeof( datestring ), nl_langinfo( D_T_FMT ), tm );
+    strftime( datestring,
+             sizeof( datestring ),
+             nl_langinfo( D_T_FMT ),
+             localtime( value ) );
 
     return add_meta_string( meta, key, datestring );
 }
diff --git a/src/io/print.c b/src/io/print.c
index f4c98aa..343160e 100644
--- a/src/io/print.c
+++ b/src/io/print.c
@@ -104,18 +104,18 @@ void print_list( URL_FILE * output, struct cons_pointer pointer ) {
 }
 
 
-void print_map( URL_FILE * output, struct cons_pointer pointer) {
-    if ( vectorpointp( pointer)) {
-        struct vector_space_object *vso = pointer_to_vso( pointer);
+void print_map( URL_FILE * output, struct cons_pointer map) {
+    if ( vectorpointp( map)) {
+        struct vector_space_object *vso = pointer_to_vso( map);
 
         if ( mapp( vso ) ) {
             url_fputwc( btowc( '{' ), output );
 
-            for ( struct cons_pointer ks = keys(pointer);
-                 !nilp(ks); ks = c_cdr(ks)) {
-                print( output, c_car(ks));
+            for ( struct cons_pointer ks = keys( map);
+                 !nilp( ks); ks = c_cdr( ks)) {
+                print( output, c_car( ks));
                 url_fputwc( btowc( ' ' ), output );
-                print( output, c_assoc( pointer, c_car(ks)));
+                print( output, c_assoc( c_car( ks), map));
 
                 if ( !nilp( c_cdr( ks))) {
                     url_fputws( L", ", output );
@@ -162,7 +162,9 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
             dump_stack_trace( output, pointer );
             break;
         case FUNCTIONTV:
-            url_fwprintf( output, L"<Function>" );
+            url_fputws( L"<Function: ", output);
+            print( output, cell.payload.function.meta);
+            url_fputwc( L'>', output);
             break;
         case INTEGERTV:{
                 struct cons_pointer s = integer_to_string( pointer, 10 );
@@ -214,7 +216,9 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
             print( output, cell.payload.ratio.divisor );
             break;
         case READTV:
-            url_fwprintf( output, L"<Input stream>" );
+            url_fwprintf( output, L"<Input stream: " );
+            print( output, cell.payload.stream.meta);
+            url_fputwc( L'>', output);
             break;
         case REALTV:
             /* \todo using the C heap is a bad plan because it will fragment.
@@ -248,7 +252,9 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
             print_string_contents( output, pointer );
             break;
         case SPECIALTV:
-            url_fwprintf( output, L"<Special form>" );
+            url_fwprintf( output, L"<Special form: " );
+            print( output, cell.payload.special.meta);
+            url_fputwc( L'>', output);
             break;
         case TIMETV:
             print_string(output, time_to_string( pointer));
@@ -260,7 +266,9 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
             print_vso( output, pointer);
             break;
         case WRITETV:
-            url_fwprintf( output, L"<Output stream>" );
+            url_fwprintf( output, L"<Output stream: " );
+            print( output, cell.payload.stream.meta);
+            url_fputwc( L'>', output);
             break;
         default:
             fwprintf( stderr,
diff --git a/src/io/read.c b/src/io/read.c
index c49d043..4f3ed0a 100644
--- a/src/io/read.c
+++ b/src/io/read.c
@@ -24,6 +24,7 @@
 #include "intern.h"
 #include "io.h"
 #include "lispops.h"
+#include "map.h"
 #include "peano.h"
 #include "print.h"
 #include "ratio.h"
@@ -44,6 +45,9 @@ struct cons_pointer read_number( struct stack_frame *frame,
 struct cons_pointer read_list( struct stack_frame *frame,
                                struct cons_pointer frame_pointer,
                                URL_FILE * input, wint_t initial );
+struct cons_pointer read_map( struct stack_frame *frame,
+                               struct cons_pointer frame_pointer,
+                               URL_FILE * input, wint_t initial );
 struct cons_pointer read_string( URL_FILE * input, wint_t initial );
 struct cons_pointer read_symbol_or_key( URL_FILE * input, char *tag,
                                         wint_t initial );
@@ -100,6 +104,10 @@ struct cons_pointer read_continuation( struct stack_frame *frame,
                     read_list( frame, frame_pointer, input,
                                url_fgetwc( input ) );
                 break;
+            case '{':
+                result = read_map( frame, frame_pointer, input,
+                               url_fgetwc( input ) );
+                break;
             case '"':
                 result = read_string( input, url_fgetwc( input ) );
                 break;
@@ -126,9 +134,10 @@ struct cons_pointer read_continuation( struct stack_frame *frame,
                     } else if ( iswblank( next ) ) {
                         /* dotted pair. \todo this isn't right, we
                          * really need to backtrack up a level. */
-                        result =
-                            read_continuation( frame, frame_pointer, input,
+                        result = read_continuation( frame, frame_pointer, input,
                                                url_fgetwc( input ) );
+                        debug_print( L"read_continuation: dotted pair; read cdr ",
+                                    DEBUG_IO);
                     } else {
                         read_symbol_or_key( input, SYMBOLTAG, c );
                     }
@@ -275,19 +284,38 @@ struct cons_pointer read_number( struct stack_frame *frame,
  * left parenthesis.
  */
 struct cons_pointer read_list( struct stack_frame *frame,
-                               struct cons_pointer frame_pointer,
-                               URL_FILE * input, wint_t initial ) {
+                              struct cons_pointer frame_pointer,
+                              URL_FILE * input, wint_t initial ) {
     struct cons_pointer result = NIL;
+    wint_t c;
+
     if ( initial != ')' ) {
         debug_printf( DEBUG_IO,
-                      L"read_list starting '%C' (%d)\n", initial, initial );
+                     L"read_list starting '%C' (%d)\n", initial, initial );
         struct cons_pointer car =
             read_continuation( frame, frame_pointer, input,
-                               initial );
-        result =
-            make_cons( car,
-                       read_list( frame, frame_pointer, input,
-                                  url_fgetwc( input ) ) );
+                              initial );
+
+        /* skip whitespace */
+        for (c = url_fgetwc( input );
+             iswblank( c ) || iswcntrl( c );
+             c = url_fgetwc( input ));
+
+        if ( c == L'.') {
+            /* might be a dotted pair; indeed, if we rule out numbers with
+             * initial periods, it must be a dotted pair. \todo Ought to check,
+             * howerver, that there's only one form after the period. */
+            result =
+                make_cons( car,
+                          c_car( read_list( frame,
+                                           frame_pointer,
+                                           input,
+                                           url_fgetwc( input ) ) ) );
+        } else {
+            result =
+                make_cons( car,
+                          read_list( frame, frame_pointer, input, c ) );
+        }
     } else {
         debug_print( L"End of list detected\n", DEBUG_IO );
     }
@@ -295,6 +323,37 @@ struct cons_pointer read_list( struct stack_frame *frame,
     return result;
 }
 
+
+struct cons_pointer read_map( struct stack_frame *frame,
+                               struct cons_pointer frame_pointer,
+                             URL_FILE * input, wint_t initial ) {
+    struct cons_pointer result = make_empty_map( NIL);
+    wint_t c = initial;
+
+    while ( c != L'}' ) {
+        struct cons_pointer key =
+            read_continuation( frame, frame_pointer, input, c );
+
+        /* skip whitespace */
+        for (c = url_fgetwc( input );
+             iswblank( c ) || iswcntrl( c );
+             c = url_fgetwc( input ));
+
+        struct cons_pointer value =
+            read_continuation( frame, frame_pointer, input, c );
+
+        /* skip commaa and whitespace at this point. */
+        for (c = url_fgetwc( input );
+             c == L',' || iswblank( c ) || iswcntrl( c );
+             c = url_fgetwc( input ));
+
+        result = merge_into_map( result, make_cons( make_cons( key, value), NIL));
+    }
+
+    return result;
+}
+
+
 /**
  * Read a string. This means either a string delimited by double quotes
  * (is_quoted == true), in which case it may contain whitespace but may
diff --git a/src/memory/map.c b/src/memory/map.c
index 7224a12..cbad3df 100644
--- a/src/memory/map.c
+++ b/src/memory/map.c
@@ -15,6 +15,7 @@
 #include "dump.h"
 #include "fopen.h"
 #include "intern.h"
+#include "io.h"
 #include "lookup3.h"
 #include "map.h"
 #include "print.h"
@@ -61,10 +62,10 @@ struct map_payload *get_map_payload( struct cons_pointer pointer ) {
 
     if (vectorpointp(pointer) && mapp( vso ) ) {
         result = ( struct map_payload * ) &( vso->payload );
-        debug_printf( DEBUG_STACK,
+        debug_printf( DEBUG_BIND,
                       L"get_map_payload: all good, returning %p\n", result );
     } else {
-        debug_print( L"get_map_payload: fail, returning NULL\n", DEBUG_STACK );
+        debug_print( L"get_map_payload: fail, returning NULL\n", DEBUG_BIND );
     }
 
     return result;
@@ -79,7 +80,7 @@ struct map_payload *get_map_payload( struct cons_pointer pointer ) {
  * @return the new map, or NULL if memory is exhausted.
  */
 struct cons_pointer make_empty_map( struct cons_pointer hash_function ) {
-    debug_print( L"Entering make_empty_map\n", DEBUG_ALLOC );
+    debug_print( L"Entering make_empty_map\n", DEBUG_BIND );
     struct cons_pointer result =
         make_vso( MAPTAG, sizeof( struct map_payload ) );
 
@@ -94,6 +95,7 @@ struct cons_pointer make_empty_map( struct cons_pointer hash_function ) {
         }
     }
 
+    debug_print( L"Leaving make_empty_map\n", DEBUG_BIND );
     return result;
 }
 
@@ -143,6 +145,7 @@ struct cons_pointer bind_in_map( struct cons_pointer parent,
 
 
 struct cons_pointer keys( struct cons_pointer store) {
+    debug_print( L"Entering keys\n", DEBUG_BIND );
     struct cons_pointer result = NIL;
 
     struct cons_space_object cell = pointer2cell( store );
@@ -158,18 +161,27 @@ struct cons_pointer keys( struct cons_pointer store) {
                 pointer2cell( store ).payload.vectorp.address;
 
             if ( mapp( vso ) ) {
-                struct map_payload * payload = get_map_payload( result );
+                struct map_payload * payload = get_map_payload( store );
 
                 for (int bucket = 0; bucket < BUCKETSINMAP; bucket++) {
                     for (struct cons_pointer c = payload->buckets[bucket];
                          !nilp(c); c = c_cdr(c)) {
+                        debug_print( L"keys: c is ", DEBUG_BIND);
+                        debug_print_object( c, DEBUG_BIND);
+
                         result = make_cons( c_car( c_car( c)), result);
+                        debug_print( L"; result is ", DEBUG_BIND);
+                        debug_print_object( result, DEBUG_BIND);
+                        debug_println( DEBUG_BIND);
                     }
                 }
             }
         }
         break;
     }
+    debug_print( L"keys returning ", DEBUG_BIND );
+    debug_print_object( result, DEBUG_BIND );
+    debug_println( DEBUG_BIND);
 
     return result;
 }
@@ -187,6 +199,7 @@ struct cons_pointer keys( struct cons_pointer store) {
  */
 struct cons_pointer merge_into_map( struct cons_pointer parent,
                                    struct cons_pointer to_merge) {
+    debug_print( L"Entering merge_into_map\n", DEBUG_BIND );
     struct cons_pointer result = make_duplicate_map(parent);
 
     if (!nilp(result)) {
@@ -202,24 +215,31 @@ struct cons_pointer merge_into_map( struct cons_pointer parent,
         }
     }
 
+    debug_print( L"Leaving merge_into_map\n", DEBUG_BIND );
+
     return result;
 }
 
 
-struct cons_pointer assoc_in_map( struct cons_pointer map,
-                                  struct cons_pointer key) {
+struct cons_pointer assoc_in_map( struct cons_pointer key,
+                                  struct cons_pointer map) {
+    debug_print( L"Entering assoc_in_map\n", DEBUG_BIND );
     struct cons_pointer result = NIL;
     struct map_payload *payload = get_map_payload( map );
 
     if (payload != NULL) {
         int bucket = get_hash_32(payload->hash_function, key) % BUCKETSINMAP;
-
         result = c_assoc(key, payload->buckets[bucket]);
     }
 
+    debug_print( L"assoc_in_map returning ", DEBUG_BIND );
+    debug_print_object( result, DEBUG_BIND);
+    debug_println( DEBUG_BIND);
+
     return result;
 }
 
+
 /**
  * Function: create a map initialised with key/value pairs from my
  * first argument.
@@ -251,7 +271,7 @@ void dump_map( URL_FILE * output, struct cons_pointer map_pointer ) {
         struct map_payload *payload = get_map_payload( map_pointer );
 
         if ( payload != NULL ) {
-            url_fputws( L"Immutable map; hash function:", output );
+            url_fputws( L"Immutable map; hash function: ", output );
 
             if (nilp(payload->hash_function)) {
                 url_fputws( L"default", output);
diff --git a/src/memory/map.h b/src/memory/map.h
index 76a7193..c9b5cfc 100644
--- a/src/memory/map.h
+++ b/src/memory/map.h
@@ -73,6 +73,8 @@ uint32_t get_hash_32(struct cons_pointer f, struct cons_pointer key);
 
 struct map_payload *get_map_payload( struct cons_pointer pointer );
 
+struct cons_pointer make_empty_map( struct cons_pointer hash_function );
+
 struct cons_pointer bind_in_map( struct cons_pointer parent,
                                 struct cons_pointer key,
                                 struct cons_pointer value);
@@ -82,8 +84,8 @@ struct cons_pointer keys( struct cons_pointer store);
 struct cons_pointer merge_into_map( struct cons_pointer parent,
                                    struct cons_pointer to_merge);
 
-struct cons_pointer assoc_in_map( struct cons_pointer map,
-                                 struct cons_pointer key);
+struct cons_pointer assoc_in_map( struct cons_pointer key,
+                                  struct cons_pointer map);
 
 struct cons_pointer lisp_make_map( struct stack_frame *frame,
                                   struct cons_pointer frame_pointer,
diff --git a/src/ops/intern.c b/src/ops/intern.c
index 02deb23..cf86e6b 100644
--- a/src/ops/intern.c
+++ b/src/ops/intern.c
@@ -94,9 +94,7 @@ struct cons_pointer c_assoc( struct cons_pointer key,
 
     debug_print( L"c_assoc; key is `", DEBUG_BIND);
     debug_print_object( key, DEBUG_BIND);
-    debug_print( L"`; store is \n", DEBUG_BIND);
-    debug_dump_object( store, DEBUG_BIND);
-    debug_println(DEBUG_BIND);
+    debug_print( L"`\n", DEBUG_BIND);
 
     if (consp(store)) {
         for ( struct cons_pointer next = store;
diff --git a/src/ops/lispops.c b/src/ops/lispops.c
index 1624261..cb58cf9 100644
--- a/src/ops/lispops.c
+++ b/src/ops/lispops.c
@@ -1288,6 +1288,7 @@ struct cons_pointer lisp_inspect( struct stack_frame *frame,
     }
 
     dump_object( output, frame->arg[0] );
+    url_fputws( L"\n", output );
 
     if ( writep( out_stream ) ) {
         dec_ref( out_stream );
diff --git a/src/utils.c b/src/utils.c
index ea3919f..9919dbe 100644
--- a/src/utils.c
+++ b/src/utils.c
@@ -12,7 +12,7 @@
 #include <string.h>
 
 
-int index_of( char c, char *s ) {
+int index_of( char c, const char *s ) {
     int i;
 
     for ( i = 0; s[i] != c && s[i] != 0; i++ );
diff --git a/src/utils.h b/src/utils.h
index e56fd6e..456e4d0 100644
--- a/src/utils.h
+++ b/src/utils.h
@@ -10,6 +10,8 @@
 #ifndef __psse_utils_h
 #define __psse_utils_h
 
-int index_of( char c, char *s );
+int index_of( char c, const char *s );
+
 char *trim( char *s );
+
 #endif
diff --git a/unit-tests/eval-quote-symbol.sh b/unit-tests/eval-quote-symbol.sh
index 7e80c48..e977461 100755
--- a/unit-tests/eval-quote-symbol.sh
+++ b/unit-tests/eval-quote-symbol.sh
@@ -1,6 +1,6 @@
 #!/bin/bash
 
-expected='<Special form>'
+expected='<Special form: ((:primitive . t) (:name . cond))>'
 actual=`echo "(eval 'cond)" | target/psse | tail -1`
 
 if [ "${expected}" = "${actual}" ]
diff --git a/unit-tests/slurp.sh b/unit-tests/slurp.sh
index b389143..0a9bc7c 100755
--- a/unit-tests/slurp.sh
+++ b/unit-tests/slurp.sh
@@ -1,6 +1,6 @@
 #!/bin/bash
 
-tmp=hi$$
+tmp=hi.$$
 echo "Hello, there." > ${tmp}
 expected='"Hello, there.'
 actual=`echo "(slurp (open \"${tmp}\"))" | target/psse | tail -2 | head -1`

From e35bc643a7246d60c8dfe507d81e633127fb993a Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Thu, 7 Feb 2019 10:28:20 +0000
Subject: [PATCH 26/31] Ignore unit test detritus

---
 .gitignore | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/.gitignore b/.gitignore
index ec1281e..1968658 100644
--- a/.gitignore
+++ b/.gitignore
@@ -36,3 +36,5 @@ utils_src/readprintwc/out
 *.bak
 
 src/io/fopen
+
+hi\.*

From 30438297452cb29641e60a8b46244b66152844de Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Thu, 7 Feb 2019 13:40:34 +0000
Subject: [PATCH 27/31] #17: Fixed

---
 src/io/io.c            |  4 ++--
 where-does-it-break.sh | 29 -----------------------------
 2 files changed, 2 insertions(+), 31 deletions(-)
 delete mode 100755 where-does-it-break.sh

diff --git a/src/io/io.c b/src/io/io.c
index 7e6a3c0..e9990e9 100644
--- a/src/io/io.c
+++ b/src/io/io.c
@@ -378,13 +378,13 @@ void collect_meta( struct cons_pointer stream, char *url ) {
                 meta =
                     add_meta_integer( meta, L"size",
                                       ( intmax_t ) statbuf.st_size );
-
+/*
                 meta = add_meta_time( meta, L"modified", &statbuf.st_mtime );
+*/
             }
             break;
         case CFTYPE_CURL:
             curl_easy_setopt( s->handle.curl, CURLOPT_VERBOSE, 1L );
-            curl_easy_setopt( s->handle.curl, CURLOPT_HEADER, 1L );
             curl_easy_setopt( s->handle.curl, CURLOPT_HEADERFUNCTION,
                               write_meta_callback );
             curl_easy_setopt( s->handle.curl, CURLOPT_HEADERDATA, stream );
diff --git a/where-does-it-break.sh b/where-does-it-break.sh
deleted file mode 100755
index 4d70041..0000000
--- a/where-does-it-break.sh
+++ /dev/null
@@ -1,29 +0,0 @@
-#!/bin/bash
-
-# Not really a unit test, but a check to see where bignum addition breaks
-
-broken=0
-i=11529215046068469750
-# we've already proven we can successfullu get up to here
-increment=1
-
-while [ $broken -eq "0" ]
-do
-  expr="(+ $i $increment)"
-  # Use sbcl as our reference implementation...
-  expected=`echo "$expr" | sbcl --noinform | grep -v '*'`
-  actual=`echo "$expr" | target/psse | tail -1 | sed 's/\,//g'`
-
-  echo -n "adding $increment to $i: "
-
-  if [ "${expected}" = "${actual}" ]
-  then
-      echo "OK"
-  else
-      echo "Fail: expected '${expected}', got '${actual}'"
-      broken=1
-      exit 1
-  fi
-
-  i=$expected
-done

From 897d5d267027fef2b7c30b91e15e612b2dd66c55 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Thu, 7 Feb 2019 13:57:37 +0000
Subject: [PATCH 28/31] Map in function position

---
 src/ops/lispops.c | 119 +++++++++++++++++++++++++++-------------------
 1 file changed, 69 insertions(+), 50 deletions(-)

diff --git a/src/ops/lispops.c b/src/ops/lispops.c
index cb58cf9..4e2ddbf 100644
--- a/src/ops/lispops.c
+++ b/src/ops/lispops.c
@@ -33,9 +33,11 @@
 #include "intern.h"
 #include "io.h"
 #include "lispops.h"
+#include "map.h"
 #include "print.h"
 #include "read.h"
 #include "stack.h"
+#include "vectorspace.h"
 
 /*
  * also to create in this section:
@@ -288,6 +290,7 @@ struct cons_pointer
             /* just pass exceptions straight back */
             result = fn_pointer;
             break;
+
             case FUNCTIONTV:
             {
                 struct cons_pointer exep = NIL;
@@ -326,64 +329,80 @@ struct cons_pointer
                 if ( exceptionp( next_pointer ) ) {
                     result = next_pointer;
                 } else {
-                        struct stack_frame *next =
-                            get_stack_frame( next_pointer );
-                        result =
-                            eval_lambda( fn_cell, next, next_pointer, env );
-                        if ( !exceptionp( result ) ) {
-                            dec_ref( next_pointer );
-                        }
+                    struct stack_frame *next =
+                        get_stack_frame( next_pointer );
+                    result =
+                        eval_lambda( fn_cell, next, next_pointer, env );
+                    if ( !exceptionp( result ) ) {
+                        dec_ref( next_pointer );
                     }
                 }
+            }
+            break;
+
+            case VECTORPOINTTV:
+            switch ( pointer_to_vso(fn_pointer)->header.tag.value) {
+                case MAPTV:
+                /* \todo: if arg[0] is a CONS, treat it as a path */
+                result = c_assoc( eval_form(frame,
+                                            frame_pointer,
+                                            c_car( c_cdr( frame->arg[0])),
+                                            env),
+                                 fn_pointer);
                 break;
+            }
+            break;
+
             case NLAMBDATV:
-                {
-                    struct cons_pointer next_pointer =
-                        make_special_frame( frame_pointer, args, env );
-                    inc_ref( next_pointer );
-                    if ( exceptionp( next_pointer ) ) {
-                        result = next_pointer;
-                    } else {
-                        struct stack_frame *next =
-                            get_stack_frame( next_pointer );
-                        result =
-                            eval_lambda( fn_cell, next, next_pointer, env );
-                        dec_ref( next_pointer );
-                    }
+            {
+                struct cons_pointer next_pointer =
+                    make_special_frame( frame_pointer, args, env );
+                inc_ref( next_pointer );
+                if ( exceptionp( next_pointer ) ) {
+                    result = next_pointer;
+                } else {
+                    struct stack_frame *next =
+                        get_stack_frame( next_pointer );
+                    result =
+                        eval_lambda( fn_cell, next, next_pointer, env );
+                    dec_ref( next_pointer );
                 }
-                break;
+            }
+            break;
+
             case SPECIALTV:
-                {
-                    struct cons_pointer next_pointer =
-                        make_special_frame( frame_pointer, args, env );
-                    inc_ref( next_pointer );
-                    if ( exceptionp( next_pointer ) ) {
-                        result = next_pointer;
-                    } else {
-                        result =
-                            ( *fn_cell.payload.special.
-                              executable ) ( get_stack_frame( next_pointer ),
-                                             next_pointer, env );
-                        debug_print( L"Special form returning: ", DEBUG_EVAL );
-                        debug_print_object( result, DEBUG_EVAL );
-                        debug_println( DEBUG_EVAL );
-                        dec_ref( next_pointer );
-                    }
+            {
+                struct cons_pointer next_pointer =
+                    make_special_frame( frame_pointer, args, env );
+                inc_ref( next_pointer );
+                if ( exceptionp( next_pointer ) ) {
+                    result = next_pointer;
+                } else {
+                    result =
+                        ( *fn_cell.payload.special.
+                         executable ) ( get_stack_frame( next_pointer ),
+                                       next_pointer, env );
+                    debug_print( L"Special form returning: ", DEBUG_EVAL );
+                    debug_print_object( result, DEBUG_EVAL );
+                    debug_println( DEBUG_EVAL );
+                    dec_ref( next_pointer );
                 }
-                break;
+            }
+            break;
+
             default:
-                {
-                    int bs = sizeof( wchar_t ) * 1024;
-                    wchar_t *buffer = malloc( bs );
-                    memset( buffer, '\0', bs );
-                    swprintf( buffer, bs,
-                              L"Unexpected cell with tag %d (%4.4s) in function position",
-                              fn_cell.tag.value, &fn_cell.tag.bytes[0] );
-                    struct cons_pointer message =
-                        c_string_to_lisp_string( buffer );
-                    free( buffer );
-                    result = throw_exception( message, frame_pointer );
-                }
+            {
+                int bs = sizeof( wchar_t ) * 1024;
+                wchar_t *buffer = malloc( bs );
+                memset( buffer, '\0', bs );
+                swprintf( buffer, bs,
+                         L"Unexpected cell with tag %d (%4.4s) in function position",
+                         fn_cell.tag.value, &fn_cell.tag.bytes[0] );
+                struct cons_pointer message =
+                    c_string_to_lisp_string( buffer );
+                free( buffer );
+                result = throw_exception( message, frame_pointer );
+            }
         }
     }
 

From b35eb8f5c75791244c29152c1049b1341b7d4e24 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Thu, 7 Feb 2019 14:19:49 +0000
Subject: [PATCH 29/31] Unit tests for maps

---
 unit-tests/map.sh | 89 +++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 89 insertions(+)
 create mode 100755 unit-tests/map.sh

diff --git a/unit-tests/map.sh b/unit-tests/map.sh
new file mode 100755
index 0000000..f40c321
--- /dev/null
+++ b/unit-tests/map.sh
@@ -0,0 +1,89 @@
+#!/bin/bash
+
+#####################################################################
+# Create an empty map using map notation
+expected='{}'
+actual=`echo "$expected" | target/psse | tail -1`
+
+if [ "${expected}" = "${actual}" ]
+then
+    echo "OK"
+else
+    echo "Fail: expected '${expected}', got '${actual}'"
+    exit 1
+fi
+
+#####################################################################
+# Create an empty map using make-map
+expected='{}'
+actual=`echo "(make-map)" | target/psse | tail -1`
+
+echo -n "Empty map using (make-map): "
+if [ "${expected}" = "${actual}" ]
+then
+    echo "OK"
+else
+    echo "Fail: expected '${expected}', got '${actual}'"
+    exit 1
+fi
+
+#####################################################################
+# Create a map using map notation: order of keys in output is not
+# significant at this stage, but in the long term should be sorted
+# alphanumerically
+expected='{:two 2, :one 1, :three 3}'
+actual=`echo "{:one 1 :two 2 :three 3}" | target/psse | tail -1`
+
+echo -n "Map using map notation: "
+if [ "${expected}" = "${actual}" ]
+then
+    echo "OK"
+else
+    echo "Fail: expected '${expected}', got '${actual}'"
+    exit 1
+fi
+
+#####################################################################
+# Create a map using make-map: order of keys in output is not
+# significant at this stage, but in the long term should be sorted
+# alphanumerically
+expected='{:two 2, :one 1, :three 3}'
+actual=`echo "(make-map '((:one . 1)(:two . 2)(:three . 3)))" | target/psse | tail -1`
+
+echo -n "Map using (make-map): "
+if [ "${expected}" = "${actual}" ]
+then
+    echo "OK"
+else
+    echo "Fail: expected '${expected}', got '${actual}'"
+    exit 1
+fi
+
+#####################################################################
+# Keyword in function position
+expected='2'
+actual=`echo "(:two {:one 1 :two 2 :three 3})" | target/psse | tail -1`
+
+echo -n "Keyword in function position: "
+if [ "${expected}" = "${actual}" ]
+then
+    echo "OK"
+else
+    echo "Fail: expected '${expected}', got '${actual}'"
+    exit 1
+fi
+
+
+#####################################################################
+# Map in function position
+expected='2'
+actual=`echo "({:one 1 :two 2 :three 3} :two)" | target/psse | tail -1`
+
+echo -n "Map in function position: "
+if [ "${expected}" = "${actual}" ]
+then
+    echo "OK"
+else
+    echo "Fail: expected '${expected}', got '${actual}'"
+    exit 1
+fi

From af814d8f03a4095ab549c53757eec2f9a593b713 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Thu, 7 Feb 2019 15:32:06 +0000
Subject: [PATCH 30/31] #time: Fixed

Major (unexpected) problem was collision between the name of my header file and that of the system header file!
---
 src/init.c                       |  2 +-
 src/io/io.c                      |  3 +--
 src/io/print.c                   | 29 +++++++++++++++++++++++++++--
 src/time/{time.c => psse_time.c} | 19 ++++++++++++++-----
 src/time/{time.h => psse_time.h} |  2 +-
 5 files changed, 44 insertions(+), 11 deletions(-)
 rename src/time/{time.c => psse_time.c} (88%)
 rename src/time/{time.h => psse_time.h} (96%)

diff --git a/src/init.c b/src/init.c
index 275cc40..538ede3 100644
--- a/src/init.c
+++ b/src/init.c
@@ -31,7 +31,7 @@
 #include "peano.h"
 #include "print.h"
 #include "repl.h"
-#include "time.h"
+#include "psse_time.h"
 
 // extern char *optarg; /* defined in unistd.h */
 
diff --git a/src/io/io.c b/src/io/io.c
index e9990e9..5065044 100644
--- a/src/io/io.c
+++ b/src/io/io.c
@@ -378,9 +378,8 @@ void collect_meta( struct cons_pointer stream, char *url ) {
                 meta =
                     add_meta_integer( meta, L"size",
                                       ( intmax_t ) statbuf.st_size );
-/*
+
                 meta = add_meta_time( meta, L"modified", &statbuf.st_mtime );
-*/
             }
             break;
         case CFTYPE_CURL:
diff --git a/src/io/print.c b/src/io/print.c
index 343160e..dd92606 100644
--- a/src/io/print.c
+++ b/src/io/print.c
@@ -24,7 +24,7 @@
 #include "map.h"
 #include "stack.h"
 #include "print.h"
-#include "time.h"
+#include "psse_time.h"
 #include "vectorspace.h"
 
 /**
@@ -140,6 +140,27 @@ void print_vso( URL_FILE * output, struct cons_pointer pointer) {
     }
 }
 
+/**
+ * stolen from https://stackoverflow.com/questions/11656241/how-to-print-uint128-t-number-using-gcc
+ */
+void print_128bit( URL_FILE * output, __int128_t n ) {
+    if ( n == 0 ) {
+        fwprintf( stderr, L"0" );
+    } else {
+        char str[40] = { 0 }; // log10(1 << 128) + '\0'
+        char *s = str + sizeof( str ) - 1;  // start at the end
+        while ( n != 0 ) {
+            if ( s == str )
+                return;     // never happens
+
+            *--s = "0123456789"[n % 10];  // save last digit
+            n /= 10;        // drop it
+        }
+        url_fwprintf( output, L"%s", s );
+    }
+}
+
+
 /**
  * Print the cons-space object indicated by `pointer` to the stream indicated
  * by `output`.
@@ -257,7 +278,11 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
             url_fputwc( L'>', output);
             break;
         case TIMETV:
-            print_string(output, time_to_string( pointer));
+            url_fwprintf( output, L"<Time: " );
+            print_string( output, time_to_string( pointer));
+            url_fputws( L"; ", output);
+            print_128bit( output, pointer2cell(pointer).payload.time.value);
+            url_fputwc( L'>', output);
             break;
         case TRUETV:
             url_fwprintf( output, L"t" );
diff --git a/src/time/time.c b/src/time/psse_time.c
similarity index 88%
rename from src/time/time.c
rename to src/time/psse_time.c
index 146f296..76f52a9 100644
--- a/src/time/time.c
+++ b/src/time/psse_time.c
@@ -1,5 +1,5 @@
 /*
- * time.h
+ * psse_time.c
  *
  * Bare bones of PSSE time. See issue #16.
  *
@@ -8,6 +8,7 @@
  */
 
 #include <stdlib.h>
+#include <string.h>
 #include <time.h>
 /*
  * wide characters
@@ -18,7 +19,7 @@
 #include "conspage.h"
 #include "consspaceobject.h"
 #include "integer.h"
-#include "time.h"
+#include "psse_time.h"
 #define _GNU_SOURCE
 
 #define seconds_per_year 31557600L
@@ -90,9 +91,17 @@ struct cons_pointer lisp_time( struct stack_frame *frame, struct cons_pointer fr
  * This is temporary, for bootstrapping.
  */
 struct cons_pointer time_to_string( struct cons_pointer pointer) {
+    struct cons_pointer result = NIL;
     long int t = lisp_time_to_unix_time(pointer);
 
-    return c_string_to_lisp_string( t == 0 ?
-                                         L"Not yet implemented: cannot print times outside UNIX time\n" :
-                                         ctime(&t));
+    if ( t != 0) {
+        char * bytes = ctime(&t);
+        int l = strlen(bytes) + 1;
+        wchar_t buffer[ l];
+
+        mbstowcs( buffer, bytes, l);
+        result = c_string_to_lisp_string( buffer);
+    }
+
+    return result;
 }
diff --git a/src/time/time.h b/src/time/psse_time.h
similarity index 96%
rename from src/time/time.h
rename to src/time/psse_time.h
index 661decf..af70966 100644
--- a/src/time/time.h
+++ b/src/time/psse_time.h
@@ -1,5 +1,5 @@
 /*
- * time.h
+ * psse_time.h
  *
  * Bare bones of PSSE time. See issue #16.
  *

From 27411689c9a04c96af5bd95622dac275922ae9b2 Mon Sep 17 00:00:00 2001
From: Simon Brooke <simon@journeyman.cc>
Date: Thu, 7 Feb 2019 15:42:01 +0000
Subject: [PATCH 31/31] Removed the `print_use_colours` feature.

More nuisance than help at this stage; removed.
---
 src/init.c     |  5 +----
 src/io/print.c | 47 +++++------------------------------------------
 src/io/print.h |  1 -
 3 files changed, 6 insertions(+), 47 deletions(-)

diff --git a/src/init.c b/src/init.c
index 538ede3..6074ba5 100644
--- a/src/init.c
+++ b/src/init.c
@@ -99,11 +99,8 @@ int main( int argc, char *argv[] ) {
         exit( 1 );
     }
 
-    while ( ( option = getopt( argc, argv, "cpdv:" ) ) != -1 ) {
+    while ( ( option = getopt( argc, argv, "pdv:" ) ) != -1 ) {
         switch ( option ) {
-            case 'c':
-                print_use_colours = true;
-                break;
             case 'd':
                 dump_at_end = true;
                 break;
diff --git a/src/io/print.c b/src/io/print.c
index dd92606..c886981 100644
--- a/src/io/print.c
+++ b/src/io/print.c
@@ -27,12 +27,6 @@
 #include "psse_time.h"
 #include "vectorspace.h"
 
-/**
- * Whether or not we colorise output.
- * \todo this should be a Lisp symbol binding, not a C variable.
- */
-int print_use_colours = 0;
-
 /**
  * print all the characters in the symbol or string indicated by `pointer`
  * onto this `output`; if `pointer` does not indicate a string or symbol,
@@ -89,18 +83,9 @@ print_list_contents( URL_FILE * output, struct cons_pointer pointer,
 }
 
 void print_list( URL_FILE * output, struct cons_pointer pointer ) {
-    if ( print_use_colours ) {
-        url_fwprintf( output, L"%s(%s", "\x1B[31m", "\x1B[39m" );
-    } else {
-        url_fputws( L"(", output );
-    };
-
+    url_fputws( L"(", output );
     print_list_contents( output, pointer, false );
-    if ( print_use_colours ) {
-        url_fwprintf( output, L"%s)%s", "\x1B[31m", "\x1B[39m" );
-    } else {
-        url_fputws( L")", output );
-    }
+    url_fputws( L")", output );
 }
 
 
@@ -178,8 +163,7 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
             print_list( output, pointer );
             break;
         case EXCEPTIONTV:
-            url_fwprintf( output, L"\n%sException: ",
-                          print_use_colours ? "\x1B[31m" : "" );
+            url_fwuts( L"\nException: ", output );
             dump_stack_trace( output, pointer );
             break;
         case FUNCTIONTV:
@@ -190,17 +174,11 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
         case INTEGERTV:{
                 struct cons_pointer s = integer_to_string( pointer, 10 );
                 inc_ref( s );
-                if ( print_use_colours ) {
-                    url_fputws( L"\x1B[34m", output );
-                }
                 print_string_contents( output, s );
                 dec_ref( s );
             }
             break;
         case KEYTV:
-            if ( print_use_colours ) {
-                url_fputws( L"\x1B[1;33m", output );
-            }
             url_fputws( L":", output );
             print_string_contents( output, pointer );
             break;
@@ -254,22 +232,13 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
                     buffer[i] = '\0';
                 }
             }
-            if ( print_use_colours ) {
-                url_fputws( L"\x1B[34m", output );
-            }
             url_fwprintf( output, L"%s", buffer );
             free( buffer );
             break;
         case STRINGTV:
-            if ( print_use_colours ) {
-                url_fputws( L"\x1B[36m", output );
-            }
             print_string( output, pointer );
             break;
         case SYMBOLTV:
-            if ( print_use_colours ) {
-                url_fputws( L"\x1B[1;33m", output );
-            }
             print_string_contents( output, pointer );
             break;
         case SPECIALTV:
@@ -297,17 +266,11 @@ struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer ) {
             break;
         default:
             fwprintf( stderr,
-                      L"%sError: Unrecognised tag value %d (%c%c%c%c)\n",
-                      print_use_colours ? "\x1B[31m" : "",
-                      cell.tag.value, cell.tag.bytes[0], cell.tag.bytes[1],
-                      cell.tag.bytes[2], cell.tag.bytes[3] );
+                      L"Error: Unrecognised tag value %d (%4.4s)\n",
+                      cell.tag.value, &cell.tag.bytes[0] );
             break;
     }
 
-    if ( print_use_colours ) {
-        url_fputws( L"\x1B[39m", output );
-    }
-
     return pointer;
 }
 
diff --git a/src/io/print.h b/src/io/print.h
index f59f090..006ef80 100644
--- a/src/io/print.h
+++ b/src/io/print.h
@@ -16,6 +16,5 @@
 
 struct cons_pointer print( URL_FILE * output, struct cons_pointer pointer );
 void println( URL_FILE * output );
-extern int print_use_colours;
 
 #endif