ecl/src/c/serialize.d
2011-07-31 15:24:50 +02:00

549 lines
17 KiB
C

/* -*- mode: c; c-basic-offset: 8 -*- */
/*
serialize.d -- Serialize a bunch of lisp data.
*/
/*
Copyright (c) 2010, Juan Jose Garcia Ripoll.
ECL is free software; you can redistribute it and/or
modify it under the terms of the GNU Library General Public
License as published by the Free Software Foundation; either
version 2 of the License, or (at your option) any later version.
See file '../Copyright' for full details.
*/
#include <ecl/ecl.h>
#include <string.h>
#define ECL_DEFINE_AET_SIZE
#include <ecl/internal.h>
struct fake_package {
HEADER;
cl_object name;
};
struct fake_symbol {
HEADER;
cl_object name;
cl_object pack;
};
#define ROUND_TO_WORD(int) \
((int + sizeof(cl_fixnum) - 1) & ~(sizeof(cl_fixnum) - 1))
#define ROUNDED_SIZE(name) \
ROUND_TO_WORD(sizeof(struct name))
static cl_index object_size[] = {
0, /* t_start */
ROUNDED_SIZE(ecl_cons), /* t_list */
0, /* t_character = 2 */
0, /* t_fixnum = 3 */
ROUNDED_SIZE(ecl_bignum), /* t_bignum = 4 */
ROUNDED_SIZE(ecl_ratio), /* t_ratio */
ROUNDED_SIZE(ecl_singlefloat), /* t_singlefloat */
ROUNDED_SIZE(ecl_doublefloat), /* t_doublefloat */
#ifdef ECL_LONG_FLOAT
ROUNDED_SIZE(ecl_long_float), /* t_longfloat */
#endif
ROUNDED_SIZE(ecl_complex), /* t_complex */
ROUNDED_SIZE(fake_symbol), /* t_symbol */
ROUNDED_SIZE(fake_package), /* t_package */
ROUNDED_SIZE(ecl_hashtable), /* t_hashtable */
ROUNDED_SIZE(ecl_array), /* t_array */
ROUNDED_SIZE(ecl_vector), /* t_vector */
#ifdef ECL_UNICODE
ROUNDED_SIZE(ecl_string), /* t_string */
#endif
ROUNDED_SIZE(ecl_base_string), /* t_base_string */
ROUNDED_SIZE(ecl_vector), /* t_bitvector */
ROUNDED_SIZE(ecl_stream), /* t_stream */
ROUNDED_SIZE(ecl_random), /* t_random */
ROUNDED_SIZE(ecl_readtable), /* t_readtable */
ROUNDED_SIZE(ecl_pathname), /* t_pathname */
ROUNDED_SIZE(ecl_bytecodes), /* t_bytecodes */
ROUNDED_SIZE(ecl_bclosure), /* t_bclosure */
ROUNDED_SIZE(ecl_cfun), /* t_cfun */
ROUNDED_SIZE(ecl_cfunfixed), /* t_cfunfixed */
ROUNDED_SIZE(ecl_cclosure), /* t_cclosure */
#ifdef CLOS
ROUNDED_SIZE(ecl_instance), /* t_instance */
#else
ROUNDED_SIZE(ecl_structure), /* t_structure */
#endif /* CLOS */
#ifdef ECL_THREADS
ROUNDED_SIZE(ecl_process), /* t_process */
ROUNDED_SIZE(ecl_lock), /* t_lock */
ROUNDED_SIZE(ecl_condition_variable), /* t_condition_variable */
# ifdef ECL_SEMAPHORES
ROUNDED_SIZE(ecl_semaphore), /* t_semaphore */
# endif
#endif
ROUNDED_SIZE(ecl_codeblock), /* t_codeblock */
ROUNDED_SIZE(ecl_foreign), /* t_foreign */
ROUNDED_SIZE(ecl_frame), /* t_frame */
ROUNDED_SIZE(ecl_weak_pointer) /* t_weak_pointer */
#ifdef ECL_SSE2
, ROUNDED_SIZE(ecl_sse_pack) /* t_sse_pack */
#endif
};
typedef struct pool {
cl_object data;
cl_object hash;
cl_object queue;
cl_object last;
} *pool_t;
static cl_index
alloc(pool_t pool, cl_index size)
{
cl_index bytes = ROUND_TO_WORD(size);
cl_index fillp = pool->data->vector.fillp;
cl_index next_fillp = fillp + bytes;
if (next_fillp >= pool->data->vector.dim) {
cl_index new_dim = next_fillp + next_fillp / 2;
pool->data = cl_funcall(3, @'adjust-array', pool->data,
MAKE_FIXNUM(new_dim));
}
pool->data->vector.fillp = next_fillp;
return fillp;
}
static cl_object
fix_to_ptr(cl_object ptr)
{
cl_fixnum i = (cl_fixnum)ptr;
return (cl_object)(i & ~IMMEDIATE_TAG);
}
static cl_object
enqueue(pool_t pool, cl_object what)
{
cl_object record, index;
if (FIXNUMP(what) || CHARACTERP(what) || what == OBJNULL) {
return what;
}
#ifdef ECL_SMALL_CONS
if (Null(what))
return what;
#endif
index = ecl_gethash_safe(what, pool->hash, OBJNULL);
if (index == OBJNULL) {
cl_object cons;
index = MAKE_FIXNUM(pool->hash->hash.entries);
ecl_sethash(what, pool->hash, index);
cons = ecl_cons(what, Cnil);
ECL_RPLACD(pool->last, cons);
pool->last = cons;
}
return fix_to_ptr(index);
}
#ifdef ECL_SMALL_CONS
typedef struct {
HEADER;
cl_object car, cdr;
} large_cons;
typedef large_cons *large_cons_ptr;
#endif
static cl_index
serialize_bits(pool_t pool, void *data, cl_index size)
{
cl_index index = alloc(pool, size);
memcpy(pool->data->vector.self.b8 + index, data, size);
return index;
}
static void
serialize_object_ptr(pool_t pool, cl_object *ptr, cl_index dim)
{
cl_index index = serialize_bits(pool, ptr, dim*sizeof(cl_object));
for (; dim; dim--, index += sizeof(cl_object)) {
cl_object *p = (cl_object *)(pool->data->vector.self.b8 + index);
*p = enqueue(pool, *p);
p++;
}
}
static void serialize_vector(pool_t pool, cl_object v);
static void
serialize_displaced_vector(pool_t pool, cl_object v)
{
cl_object disp = v->vector.displaced;
cl_object to = ECL_CONS_CAR(disp);
if (Null(to)) {
v->vector.displaced = Cnil;
serialize_vector(pool, v);
} else {
cl_index index = v->vector.self.b8 - to->vector.self.b8;
v->vector.displaced = enqueue(pool, to);
v->vector.self.b8 = (uint8_t*)index;
}
}
static void
serialize_vector(pool_t pool, cl_object v)
{
if (!Null(v->vector.displaced)) {
serialize_displaced_vector(pool, v);
} else if (v->vector.elttype == aet_object) {
serialize_object_ptr(pool, v->vector.self.t, v->vector.dim);
} else {
serialize_bits(pool, v->vector.self.b8,
v->vector.dim * ecl_aet_size[v->vector.elttype]);
}
}
static void
serialize_array(pool_t pool, cl_object a)
{
serialize_bits(pool, a->array.dims, sizeof(cl_index) * a->array.rank);
serialize_vector(pool, a);
}
static void
serialize_one(pool_t pool, cl_object what)
{
cl_index bytes, index;
cl_object buffer;
#ifdef ECL_SMALL_CONS
if (ECL_LISTP(what)) {
cl_index bytes = ROUND_TO_WORD(sizeof(large_cons));
cl_index index = alloc(pool, bytes);
large_cons_ptr cons =
(large_cons_ptr)(pool->data->vector.self.b8 + index);
memset(cons, 0, bytes);
cons->t = t_list;
cons->car = enqueue(pool, ECL_CONS_CAR(what));
cons->cdr = enqueue(pool, ECL_CONS_CDR(what));
return;
}
#endif
bytes = object_size[what->d.t];
index = alloc(pool, bytes);
buffer = (cl_object)(pool->data->vector.self.b8 + index);
memcpy(buffer, what, bytes);
switch (buffer->d.t) {
case t_singlefloat:
case t_doublefloat:
#ifdef ECL_LONG_FLOAT
case t_longfloat:
#endif
break;
#ifndef ECL_SMALL_CONS
case t_list:
buffer->cons.car = enqueue(pool, buffer->cons.car);
buffer->cons.cdr = enqueue(pool, buffer->cons.car);
break;
#endif
case t_bignum: {
cl_fixnum size = buffer->big.big_size;
cl_index dim = ((size < 0) ? (-size) : size);
cl_index bytes = dim * sizeof(mp_limb_t);
serialize_bits(pool, buffer->big.big_limbs, bytes);
break;
}
case t_ratio: {
buffer->ratio.den = enqueue(pool, buffer->ratio.den);
buffer->ratio.num = enqueue(pool, buffer->ratio.num);
break;
}
case t_complex: {
buffer->complex.real = enqueue(pool, buffer->complex.real);
buffer->complex.imag = enqueue(pool, buffer->complex.imag);
break;
}
#ifdef ECL_UNICODE
case t_string:
#endif
case t_vector:
case t_bitvector:
case t_base_string: {
serialize_vector(pool, buffer);
break;
}
case t_array: {
cl_index bytes = ROUND_TO_WORD(buffer->array.rank *
sizeof(cl_index));
serialize_bits(pool, buffer->array.dims, bytes);
serialize_vector(pool, buffer);
break;
}
case t_package: {
struct fake_package *p = (struct fake_package *)buffer;
p->name = enqueue(pool, what->pack.name);
break;
}
case t_symbol: {
struct fake_symbol *p = (struct fake_symbol *)buffer;
p->name = enqueue(pool, what->symbol.name);
p->pack = enqueue(pool, what->symbol.hpack);
break;
}
case t_pathname:
buffer->pathname.host =
enqueue(pool, buffer->pathname.host);
buffer->pathname.device =
enqueue(pool, buffer->pathname.device);
buffer->pathname.directory =
enqueue(pool, buffer->pathname.directory);
buffer->pathname.name = enqueue(pool, buffer->pathname.name);
buffer->pathname.type = enqueue(pool, buffer->pathname.type);
buffer->pathname.version =
enqueue(pool, buffer->pathname.version);
break;
default:
FEerror("Unable to serialize object ~A", 1, what);
}
}
static void
init_pool(pool_t pool, cl_object root)
{
pool->data = si_make_vector(@'ext::byte8',
MAKE_FIXNUM(1024),
Ct,
MAKE_FIXNUM(2 * sizeof(cl_index)),
Cnil,
MAKE_FIXNUM(0));
pool->hash = cl__make_hash_table(@'eql', MAKE_FIXNUM(256),
cl_core.rehash_size,
cl_core.rehash_threshold);
ecl_sethash(root, pool->hash, MAKE_FIXNUM(0));
pool->queue = ecl_list1(root);
pool->last = pool->queue;
}
static cl_object
close_pool(pool_t pool)
{
pool->data->vector.self.index[0] = pool->data->vector.fillp;
pool->data->vector.self.index[1] = pool->hash->hash.entries;
return pool->data;
}
cl_object
si_serialize(cl_object root)
{
struct pool pool[1];
init_pool(pool, root);
while (!Null(pool->queue)) {
cl_object what = ECL_CONS_CAR(pool->queue);
serialize_one(pool, what);
pool->queue = ECL_CONS_CDR(pool->queue);
}
@(return close_pool(pool));
}
static void *
reconstruct_bits(uint8_t *data, cl_index bytes)
{
void *output = ecl_alloc_atomic(bytes);
memcpy(output, data, bytes);
return output;
}
static void *
reconstruct_object_ptr(uint8_t *data, cl_index bytes)
{
void *output = ecl_alloc(bytes);
memcpy(output, data, bytes);
return output;
}
static uint8_t *
reconstruct_vector(cl_object v, uint8_t *data)
{
if (v->vector.displaced == Cnil) {
cl_type t = v->vector.elttype;
cl_index size = v->vector.dim * ecl_aet_size[t];
cl_index bytes = ROUND_TO_WORD(size);
if (t == aet_object) {
v->vector.self.t = reconstruct_object_ptr(data, bytes);
} else {
v->vector.self.t = reconstruct_bits(data, size);
}
data += bytes;
}
return data;
}
static uint8_t *
reconstruct_array(cl_object a, uint8_t *data)
{
cl_index bytes = ROUND_TO_WORD(a->array.rank * sizeof(cl_index));
a->array.dims = reconstruct_bits(data, bytes);
return reconstruct_vector(a, data + bytes);
}
static uint8_t *
duplicate_object(uint8_t *data, cl_object *output)
{
cl_type t = ((cl_object)data)->d.t;
cl_object o = ecl_alloc_object(t);
cl_index bytes = object_size[t];
memcpy(o, data, bytes);
*output = o;
return data + bytes;
}
static uint8_t *
reconstruct_one(uint8_t *data, cl_object *output)
{
cl_object o = (cl_object)data;
switch (o->d.t) {
#ifdef ECL_SMALL_CONS
case t_list: {
large_cons_ptr c = (large_cons_ptr)data;
*output = ecl_cons(c->car, c->cdr);
data += ROUND_TO_WORD(sizeof(large_cons));
break;
}
#endif
#ifdef ECL_UNICODE
case t_string:
#endif
case t_base_string:
case t_vector:
case t_bitvector:
data = duplicate_object(data, output);
data = reconstruct_vector(*output, data);
break;
case t_array:
data = duplicate_object(data, output);
data = reconstruct_array(*output, data);
break;
case t_package:
*output = (cl_object)data;
data += ROUND_TO_WORD(sizeof(struct fake_package));
break;
case t_symbol:
*output = (cl_object)data;
data += ROUND_TO_WORD(sizeof(struct fake_symbol));
break;
default:
data = duplicate_object(data, output);
}
return data;
}
static cl_object
get_object(cl_object o_or_index, cl_object *o_list)
{
if (IMMEDIATE(o_or_index)) {
return o_or_index;
} else {
cl_index i = (cl_index)o_or_index >> 2;
return o_list[i];
}
}
static void
fixup_vector(cl_object v, cl_object *o_list)
{
if (!IMMEDIATE(v->vector.displaced)) {
cl_object disp = get_object(v->vector.displaced, o_list);
cl_object to = ECL_CONS_CAR(disp);
if (to != Cnil) {
cl_index offset = (cl_index)v->vector.self.b8;
v->vector.displaced = Cnil;
ecl_displace(v, to, MAKE_FIXNUM(offset));
return;
}
}
if (v->vector.elttype == aet_object) {
cl_index i;
cl_object *p = v->vector.self.t;
for (i = v->vector.dim; i; i--, p++) {
*p = get_object(*p, o_list);
}
}
}
static void
fixup(cl_object o, cl_object *o_list)
{
#ifdef ECL_SMALL_CONS
if (ECL_LISTP(o)) {
ECL_RPLACA(o, get_object(ECL_CONS_CAR(o), o_list));
ECL_RPLACD(o, get_object(ECL_CONS_CDR(o), o_list));
return;
}
#endif
switch (o->d.t) {
case t_ratio:
o->ratio.den = get_object(o->ratio.den, o_list);
o->ratio.num = get_object(o->ratio.num, o_list);
break;
case t_complex:
o->complex.real = get_object(o->complex.real, o_list);
o->complex.imag = get_object(o->complex.imag, o_list);
break;
#ifdef ECL_UNICODE
case t_string:
#endif
case t_base_string:
case t_vector:
case t_bitvector:
case t_array:
fixup_vector(o, o_list);
break;
case t_pathname:
o->pathname.host = get_object(o->pathname.host, o_list);
o->pathname.device =
get_object(o->pathname.device, o_list);
o->pathname.directory =
get_object(o->pathname.directory, o_list);
o->pathname.name = get_object(o->pathname.name, o_list);
o->pathname.type = get_object(o->pathname.type, o_list);
o->pathname.version =
get_object(o->pathname.version, o_list);
break;
default:
break;
}
}
cl_object
ecl_deserialize(uint8_t *raw)
{
cl_index *data = (cl_index*)raw;
cl_index i, num_el = data[1];
cl_object *output = ecl_alloc(sizeof(cl_object) * num_el);
raw += 2*sizeof(cl_index);
for (i = 0; i < num_el; i++) {
raw = reconstruct_one(raw, output+i);
}
for (i = 0; i < num_el; i++) {
cl_object package = output[i];
if (!IMMEDIATE(package) && package->d.t == t_package) {
cl_object name = get_object(package->pack.name,
output);
output[i] = ecl_find_package_nolock(name);
}
}
for (i = 0; i < num_el; i++) {
cl_object symbol = output[i];
if (!IMMEDIATE(symbol) && symbol->d.t == t_symbol) {
struct fake_symbol *s = (struct fake_symbol *)symbol;
cl_object name = get_object(s->name, output);
cl_object pack = get_object(s->pack, output);
int flag;
output[i] = ecl_intern(name, pack, &flag);
}
}
for (i = 0; i < num_el; i++) {
fixup(output[i], output);
}
return output[0];
}
cl_object
si_deserialize(cl_object data)
{
@(return ecl_deserialize(data->vector.self.b8))
}