513 lines
13 KiB
C
513 lines
13 KiB
C
|
/* $Id$
|
||
|
|
||
|
Part of SWI-Prolog
|
||
|
|
||
|
Author: Jan Wielemaker
|
||
|
E-mail: J.Wielemaker@uva.nl
|
||
|
WWW: http://www.swi-prolog.org
|
||
|
Copyright (C): 1985-2009, University of Amsterdam
|
||
|
|
||
|
This library is free software; you can redistribute it and/or
|
||
|
modify it under the terms of the GNU Lesser General Public
|
||
|
License as published by the Free Software Foundation; either
|
||
|
version 2.1 of the License, or (at your option) any later version.
|
||
|
|
||
|
This library is distributed in the hope that it will be useful,
|
||
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
||
|
Lesser General Public License for more details.
|
||
|
|
||
|
You should have received a copy of the GNU Lesser General Public
|
||
|
License along with this library; if not, write to the Free Software
|
||
|
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
||
|
*/
|
||
|
|
||
|
#include <SWI-Stream.h>
|
||
|
#include <SWI-Prolog.h>
|
||
|
#include <string.h>
|
||
|
#include <stdlib.h>
|
||
|
#include <assert.h>
|
||
|
#include <errno.h>
|
||
|
#include "error.h"
|
||
|
|
||
|
#define streq(s,q) (strcmp((s), (q)) == 0)
|
||
|
|
||
|
/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
|
||
|
Memory-files
|
||
|
|
||
|
make_memory_file(-Handle)
|
||
|
free_memory_file(+Handle)
|
||
|
open_memory_file(+Handle, +Mode, -Stream)
|
||
|
size_memory_file(+Handle, -Size)
|
||
|
memory_file_to_codes(+Handle, -Codes)
|
||
|
memory_file_to_atom(+Handle, -Atom)
|
||
|
atom_to_memory_file(+Atom, -Handle)
|
||
|
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */
|
||
|
|
||
|
static functor_t FUNCTOR_memory_file1;
|
||
|
static atom_t ATOM_encoding;
|
||
|
static atom_t ATOM_unknown;
|
||
|
static atom_t ATOM_octet;
|
||
|
static atom_t ATOM_ascii;
|
||
|
static atom_t ATOM_iso_latin_1;
|
||
|
static atom_t ATOM_text;
|
||
|
static atom_t ATOM_utf8;
|
||
|
static atom_t ATOM_unicode_be;
|
||
|
static atom_t ATOM_unicode_le;
|
||
|
static atom_t ATOM_wchar_t;
|
||
|
static atom_t ATOM_read;
|
||
|
static atom_t ATOM_write;
|
||
|
static atom_t ATOM_free_on_close;
|
||
|
|
||
|
#define MEMFILE_MAGIC 0x5624a6b3L
|
||
|
#define NOSIZE ((size_t)-1)
|
||
|
|
||
|
typedef struct
|
||
|
{ long magic; /* MEMFILE_MAGIC */
|
||
|
IOENC encoding; /* encoding of the data */
|
||
|
int free_on_close; /* free if it is closed */
|
||
|
char *data; /* data of the file */
|
||
|
size_t data_size; /* byte-size of data */
|
||
|
size_t size; /* size in characters */
|
||
|
IOSTREAM *stream; /* Stream hanging onto it */
|
||
|
atom_t atom; /* Created from atom */
|
||
|
} memfile;
|
||
|
|
||
|
|
||
|
static int
|
||
|
unify_memfile(term_t handle, memfile *f)
|
||
|
{ return PL_unify_term(handle,
|
||
|
PL_FUNCTOR, FUNCTOR_memory_file1,
|
||
|
PL_POINTER, f);
|
||
|
}
|
||
|
|
||
|
|
||
|
static int
|
||
|
get_memfile(term_t handle, memfile **f)
|
||
|
{ if ( PL_is_functor(handle, FUNCTOR_memory_file1) )
|
||
|
{ term_t a = PL_new_term_ref();
|
||
|
void *ptr;
|
||
|
|
||
|
_PL_get_arg(1, handle, a);
|
||
|
if ( PL_get_pointer(a, &ptr) )
|
||
|
{ memfile *m = ptr;
|
||
|
|
||
|
if ( m->magic == MEMFILE_MAGIC )
|
||
|
{ *f = ptr;
|
||
|
return TRUE;
|
||
|
}
|
||
|
return pl_error(NULL, 0, NULL, ERR_EXISTENCE,
|
||
|
"memory_file", handle);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
return pl_error(NULL, 0, NULL, ERR_ARGTYPE, 1,
|
||
|
handle, "memory_file");
|
||
|
}
|
||
|
|
||
|
|
||
|
static foreign_t
|
||
|
new_memory_file(term_t handle)
|
||
|
{ memfile *m = calloc(1, sizeof(*m));
|
||
|
|
||
|
if ( !m )
|
||
|
return pl_error(NULL, 0, NULL, ERR_ERRNO, errno,
|
||
|
"create", "memory_file", handle);
|
||
|
|
||
|
m->magic = MEMFILE_MAGIC;
|
||
|
m->encoding = ENC_UTF8;
|
||
|
m->data = 0;
|
||
|
m->size = 0;
|
||
|
|
||
|
if ( unify_memfile(handle, m) )
|
||
|
return TRUE;
|
||
|
|
||
|
m->magic = 0;
|
||
|
free(m);
|
||
|
return FALSE;
|
||
|
}
|
||
|
|
||
|
|
||
|
static int
|
||
|
destroy_memory_file(memfile *m)
|
||
|
{ if ( m->stream )
|
||
|
Sclose(m->stream);
|
||
|
if ( m->atom )
|
||
|
PL_unregister_atom(m->atom);
|
||
|
else if ( m->data )
|
||
|
Sfree(m->data); /* MS-Windows: malloc by other DLL! */
|
||
|
m->magic = 0;
|
||
|
free(m);
|
||
|
|
||
|
return TRUE;
|
||
|
}
|
||
|
|
||
|
|
||
|
static foreign_t
|
||
|
free_memory_file(term_t handle)
|
||
|
{ memfile *m;
|
||
|
|
||
|
if ( get_memfile(handle, &m) )
|
||
|
return destroy_memory_file(m);
|
||
|
|
||
|
return FALSE;
|
||
|
}
|
||
|
|
||
|
|
||
|
static void
|
||
|
closehook(void *closure)
|
||
|
{ memfile *m = closure;
|
||
|
|
||
|
m->stream = NULL;
|
||
|
if ( m->free_on_close )
|
||
|
destroy_memory_file(m);
|
||
|
}
|
||
|
|
||
|
|
||
|
static foreign_t
|
||
|
alreadyOpen(term_t handle, const char *op)
|
||
|
{ return pl_error(NULL, 0, "already open",
|
||
|
ERR_PERMISSION, handle, op, "memory_file");
|
||
|
}
|
||
|
|
||
|
|
||
|
static struct encname
|
||
|
{ IOENC code;
|
||
|
atom_t *name;
|
||
|
} encoding_names[] =
|
||
|
{ { ENC_UNKNOWN, &ATOM_unknown },
|
||
|
{ ENC_OCTET, &ATOM_octet },
|
||
|
{ ENC_ASCII, &ATOM_ascii },
|
||
|
{ ENC_ISO_LATIN_1, &ATOM_iso_latin_1 },
|
||
|
{ ENC_ANSI, &ATOM_text },
|
||
|
{ ENC_UTF8, &ATOM_utf8 },
|
||
|
{ ENC_UNICODE_BE, &ATOM_unicode_be },
|
||
|
{ ENC_UNICODE_LE, &ATOM_unicode_le },
|
||
|
{ ENC_WCHAR, &ATOM_wchar_t },
|
||
|
{ ENC_UNKNOWN, NULL },
|
||
|
};
|
||
|
|
||
|
|
||
|
IOENC
|
||
|
atom_to_encoding(atom_t a)
|
||
|
{ struct encname *en;
|
||
|
|
||
|
for(en=encoding_names; en->name; en++)
|
||
|
{ if ( *en->name == a )
|
||
|
return en->code;
|
||
|
}
|
||
|
|
||
|
return ENC_UNKNOWN;
|
||
|
}
|
||
|
|
||
|
|
||
|
static int
|
||
|
get_encoding(term_t t, IOENC *enc)
|
||
|
{ atom_t en;
|
||
|
|
||
|
if ( PL_get_atom(t, &en) )
|
||
|
{ IOENC encoding;
|
||
|
|
||
|
if ( (encoding = atom_to_encoding(en)) == ENC_UNKNOWN )
|
||
|
return pl_error(NULL, 0, NULL, ERR_DOMAIN, t, "encoding");
|
||
|
|
||
|
*enc = encoding;
|
||
|
return TRUE;
|
||
|
}
|
||
|
|
||
|
return pl_error(NULL, 0, NULL, ERR_TYPE, t, "encoding");
|
||
|
}
|
||
|
|
||
|
|
||
|
static foreign_t
|
||
|
open_memory_file4(term_t handle, term_t mode, term_t stream, term_t options)
|
||
|
{ memfile *m;
|
||
|
char *x;
|
||
|
atom_t iom;
|
||
|
IOSTREAM *fd;
|
||
|
IOENC encoding;
|
||
|
int free_on_close = FALSE;
|
||
|
|
||
|
if ( !get_memfile(handle, &m) )
|
||
|
return FALSE;
|
||
|
if ( m->stream )
|
||
|
return alreadyOpen(handle, "open");
|
||
|
if ( !PL_get_atom(mode, &iom) )
|
||
|
return pl_error("open_memory_file", 3, NULL, ERR_ARGTYPE, 2,
|
||
|
mode, "io_mode");
|
||
|
encoding = m->encoding;
|
||
|
|
||
|
if ( options )
|
||
|
{ term_t tail = PL_copy_term_ref(options);
|
||
|
term_t head = PL_new_term_ref();
|
||
|
|
||
|
while(PL_get_list(tail, head, tail))
|
||
|
{ int arity;
|
||
|
atom_t name;
|
||
|
|
||
|
if ( PL_get_name_arity(head, &name, &arity) && arity == 1 )
|
||
|
{ term_t arg = PL_new_term_ref();
|
||
|
|
||
|
_PL_get_arg(1, head, arg);
|
||
|
if ( name == ATOM_encoding )
|
||
|
{ if ( !get_encoding(arg, &encoding) )
|
||
|
return FALSE;
|
||
|
} else if ( name == ATOM_free_on_close )
|
||
|
{ if ( !PL_get_bool(arg, &free_on_close) )
|
||
|
return pl_error("open_memory_file", 4, NULL, ERR_TYPE,
|
||
|
arg, "boolean");
|
||
|
}
|
||
|
} else
|
||
|
return pl_error("open_memory_file", 4, NULL, ERR_TYPE, head, "option");
|
||
|
}
|
||
|
if ( !PL_get_nil(tail) )
|
||
|
return pl_error("open_memory_file", 4, NULL, ERR_TYPE, tail, "list");
|
||
|
}
|
||
|
|
||
|
if ( iom == ATOM_write )
|
||
|
{ x = "w";
|
||
|
if ( m->atom )
|
||
|
return pl_error("open_memory_file", 3, NULL, ERR_PERMISSION,
|
||
|
handle, "write", "memory_file");
|
||
|
if ( m->data )
|
||
|
{ Sfree(m->data);
|
||
|
m->data = NULL;
|
||
|
}
|
||
|
m->data_size = 0;
|
||
|
m->size = NOSIZE; /* don't know */
|
||
|
m->encoding = encoding;
|
||
|
} else if ( iom == ATOM_read )
|
||
|
{ x = "r";
|
||
|
m->free_on_close = free_on_close;
|
||
|
} else
|
||
|
{ return pl_error("open_memory_file", 3, NULL, ERR_DOMAIN,
|
||
|
mode, "io_mode");
|
||
|
}
|
||
|
|
||
|
if ( !(fd = Sopenmem(&m->data, &m->data_size, x)) )
|
||
|
return pl_error("open_memory_file", 3, NULL, ERR_ERRNO, errno,
|
||
|
"create", "memory_file", handle);
|
||
|
|
||
|
fd->close_hook = closehook;
|
||
|
fd->closure = m;
|
||
|
fd->encoding = encoding;
|
||
|
m->stream = fd;
|
||
|
|
||
|
return PL_unify_stream(stream, fd);
|
||
|
}
|
||
|
|
||
|
|
||
|
static foreign_t
|
||
|
open_memory_file(term_t handle, term_t mode, term_t stream)
|
||
|
{ return open_memory_file4(handle, mode, stream, 0);
|
||
|
}
|
||
|
|
||
|
|
||
|
|
||
|
static foreign_t
|
||
|
size_memory_file(term_t handle, term_t size)
|
||
|
{ memfile *m;
|
||
|
|
||
|
if ( get_memfile(handle, &m) )
|
||
|
{ if ( m->stream && !m->atom )
|
||
|
return alreadyOpen(handle, "size");
|
||
|
if ( m->data )
|
||
|
{ if ( m->size == NOSIZE )
|
||
|
{ switch( m->encoding )
|
||
|
{ case ENC_ISO_LATIN_1:
|
||
|
case ENC_OCTET:
|
||
|
m->size = m->data_size;
|
||
|
break;
|
||
|
case ENC_WCHAR:
|
||
|
m->size = m->data_size / sizeof(wchar_t);
|
||
|
break;
|
||
|
case ENC_UTF8:
|
||
|
m->size = PL_utf8_strlen(m->data, m->data_size);
|
||
|
break;
|
||
|
default:
|
||
|
assert(0);
|
||
|
return FALSE;
|
||
|
}
|
||
|
}
|
||
|
return PL_unify_integer(size, m->size);
|
||
|
} else
|
||
|
return PL_unify_integer(size, 0);
|
||
|
}
|
||
|
|
||
|
return FALSE;
|
||
|
}
|
||
|
|
||
|
|
||
|
/* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
|
||
|
utf8_position_memory_file(+MF, -Here, -Size)
|
||
|
|
||
|
Given MF is a UTF-8 encoded memory file, unify here with the
|
||
|
byte-position of the read-pointer and Size with the total size of the
|
||
|
memory file in bytes. This is a bit hacky predicate, but the information
|
||
|
is easily available at low cost, while it is very valuable for producing
|
||
|
answers in content-length computation of the HTTP server. See
|
||
|
http_wrapper.pl
|
||
|
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */
|
||
|
|
||
|
static foreign_t
|
||
|
utf8_position(term_t handle, term_t here, term_t size)
|
||
|
{ memfile *m;
|
||
|
|
||
|
if ( !get_memfile(handle, &m) )
|
||
|
return FALSE;
|
||
|
if ( m->encoding != ENC_UTF8 )
|
||
|
return pl_error(NULL, 0, "no UTF-8 encoding",
|
||
|
ERR_PERMISSION, handle, "utf8_position", "memory_file");
|
||
|
if ( !PL_unify_integer(size, m->data_size) )
|
||
|
return FALSE;
|
||
|
if ( m->stream )
|
||
|
{ IOPOS *op = m->stream->position;
|
||
|
long p;
|
||
|
|
||
|
m->stream->position = NULL;
|
||
|
p = Stell(m->stream);
|
||
|
m->stream->position = op;
|
||
|
|
||
|
return PL_unify_integer(here, p);
|
||
|
} else
|
||
|
return PL_unify_integer(here, 0);
|
||
|
}
|
||
|
|
||
|
|
||
|
static foreign_t
|
||
|
atom_to_memory_file(term_t atom, term_t handle)
|
||
|
{ atom_t a;
|
||
|
|
||
|
if ( PL_get_atom(atom, &a) )
|
||
|
{ memfile *m = calloc(1, sizeof(*m));
|
||
|
|
||
|
if ( !m )
|
||
|
return pl_error(NULL, 0, NULL, ERR_ERRNO, errno, "create", "memory_file", handle);
|
||
|
|
||
|
m->atom = a;
|
||
|
PL_register_atom(m->atom);
|
||
|
m->magic = MEMFILE_MAGIC;
|
||
|
|
||
|
if ( (m->data = (char *)PL_atom_nchars(a, &m->size)) )
|
||
|
{ m->encoding = ENC_ISO_LATIN_1;
|
||
|
m->data_size = m->size;
|
||
|
} else if ( (m->data = (char *)PL_atom_wchars(a, &m->size)) )
|
||
|
{ m->encoding = ENC_WCHAR;
|
||
|
m->data_size = m->size * sizeof(wchar_t);
|
||
|
} else if ( PL_blob_data(a, &m->size, NULL) )
|
||
|
{ m->data = PL_blob_data(a, &m->data_size, NULL);
|
||
|
m->encoding = ENC_OCTET;
|
||
|
m->size = m->data_size;
|
||
|
}
|
||
|
|
||
|
if ( unify_memfile(handle, m) )
|
||
|
return TRUE;
|
||
|
else
|
||
|
{ PL_unregister_atom(m->atom);
|
||
|
m->magic = 0;
|
||
|
free(m);
|
||
|
return FALSE;
|
||
|
}
|
||
|
} else
|
||
|
{ return pl_error(NULL, 0, NULL, ERR_ARGTYPE, 1,
|
||
|
atom, "atom");
|
||
|
}
|
||
|
}
|
||
|
|
||
|
|
||
|
static foreign_t
|
||
|
memory_file_to_text(term_t handle, term_t atom, term_t encoding, int flags)
|
||
|
{ memfile *m;
|
||
|
|
||
|
if ( get_memfile(handle, &m) )
|
||
|
{ IOENC enc;
|
||
|
|
||
|
if ( encoding )
|
||
|
{ if ( !get_encoding(encoding, &enc) )
|
||
|
return FALSE;
|
||
|
} else
|
||
|
enc = m->encoding;
|
||
|
|
||
|
if ( m->stream )
|
||
|
return alreadyOpen(handle, "to_atom");
|
||
|
if ( m->data )
|
||
|
{ switch(enc)
|
||
|
{ case ENC_ISO_LATIN_1:
|
||
|
case ENC_OCTET:
|
||
|
return PL_unify_chars(atom, flags, m->data_size, m->data);
|
||
|
case ENC_WCHAR:
|
||
|
return PL_unify_wchars(atom, flags, m->data_size/sizeof(wchar_t), (pl_wchar_t*)m->data);
|
||
|
case ENC_UTF8:
|
||
|
return PL_unify_chars(atom, flags|REP_UTF8, m->data_size, m->data);
|
||
|
default:
|
||
|
assert(0);
|
||
|
}
|
||
|
} else
|
||
|
return PL_unify_chars(atom, flags, 0, "");
|
||
|
}
|
||
|
|
||
|
return FALSE;
|
||
|
}
|
||
|
|
||
|
|
||
|
static foreign_t
|
||
|
memory_file_to_atom2(term_t handle, term_t atom)
|
||
|
{ return memory_file_to_text(handle, atom, 0, PL_ATOM);
|
||
|
}
|
||
|
|
||
|
|
||
|
static foreign_t
|
||
|
memory_file_to_atom3(term_t handle, term_t atom, term_t encoding)
|
||
|
{ return memory_file_to_text(handle, atom, encoding, PL_ATOM);
|
||
|
}
|
||
|
|
||
|
|
||
|
static foreign_t
|
||
|
memory_file_to_codes2(term_t handle, term_t atom)
|
||
|
{ return memory_file_to_text(handle, atom, 0, PL_CODE_LIST);
|
||
|
}
|
||
|
|
||
|
|
||
|
static foreign_t
|
||
|
memory_file_to_codes3(term_t handle, term_t atom, term_t encoding)
|
||
|
{ return memory_file_to_text(handle, atom, encoding, PL_CODE_LIST);
|
||
|
}
|
||
|
|
||
|
|
||
|
#define MKATOM(n) ATOM_ ## n = PL_new_atom(#n);
|
||
|
|
||
|
install_t
|
||
|
install_memfile()
|
||
|
{ if ( PL_query(PL_QUERY_VERSION) <= 50505 )
|
||
|
{ PL_warning("Requires SWI-Prolog version 5.5.6 or later");
|
||
|
return;
|
||
|
}
|
||
|
|
||
|
FUNCTOR_memory_file1 = PL_new_functor(PL_new_atom("$memory_file"), 1);
|
||
|
MKATOM(encoding);
|
||
|
MKATOM(unknown);
|
||
|
MKATOM(octet);
|
||
|
MKATOM(ascii);
|
||
|
MKATOM(iso_latin_1);
|
||
|
MKATOM(text);
|
||
|
MKATOM(utf8);
|
||
|
MKATOM(unicode_be);
|
||
|
MKATOM(unicode_le);
|
||
|
MKATOM(wchar_t);
|
||
|
MKATOM(read);
|
||
|
MKATOM(write);
|
||
|
MKATOM(free_on_close);
|
||
|
|
||
|
PL_register_foreign("new_memory_file", 1, new_memory_file, 0);
|
||
|
PL_register_foreign("free_memory_file", 1, free_memory_file, 0);
|
||
|
PL_register_foreign("size_memory_file", 2, size_memory_file, 0);
|
||
|
PL_register_foreign("open_memory_file", 3, open_memory_file, 0);
|
||
|
PL_register_foreign("open_memory_file", 4, open_memory_file4, 0);
|
||
|
PL_register_foreign("atom_to_memory_file", 2, atom_to_memory_file, 0);
|
||
|
PL_register_foreign("memory_file_to_atom", 2, memory_file_to_atom2, 0);
|
||
|
PL_register_foreign("memory_file_to_codes", 2, memory_file_to_codes2,0);
|
||
|
PL_register_foreign("memory_file_to_atom", 3, memory_file_to_atom3, 0);
|
||
|
PL_register_foreign("memory_file_to_codes", 3, memory_file_to_codes3,0);
|
||
|
PL_register_foreign("utf8_position_memory_file", 3, utf8_position, 0);
|
||
|
}
|