Compare commits

..

2 Commits

Author SHA1 Message Date
Aryadev Chavali
b93042fd27 lisp: INT -> SMI
When we implement big integer support, we should use INT there
instead.  SMI signals intent much better.
2026-03-05 19:41:16 +00:00
Aryadev Chavali
a50ca72b24 lisp: 63 bit -> 56 bit SMI
This massively simplifies the tagging implementation, as all types now
have a 1-byte tag.  However, this does make the need for Big Integers
much greater, as we've lost 7 bits of range (63 -> 56).
2026-03-05 18:36:43 +00:00
6 changed files with 48 additions and 66 deletions

View File

@@ -26,48 +26,35 @@ typedef struct
/// Tagging system /// Tagging system
typedef enum Tag typedef enum Tag
{ {
TAG_NIL = 0b00000000, // Start of atomic types TAG_SMI = 0b00000001, // Atomic types
TAG_INT = 0b00000001, // Special tag so we can encode 63 bit integers TAG_SYM = 0b00000011,
TAG_SYM = 0b00000100, TAG_NIL = 0b00000000, // Container types (0 LSB)
TAG_CONS = 0b00000010, // Start of container types TAG_CONS = 0b00000010,
TAG_VEC = 0b00000110, TAG_VEC = 0b00000100,
NUM_TAGS = 5, NUM_TAGS = 5,
} tag_t; } tag_t;
static_assert(NUM_TAGS == 5, "Expected NUM_TAGS == 5 for enum SHIFT");
enum Shift
{
SHIFT_INT = 1,
SHIFT_SYM = 8,
SHIFT_CONS = 8,
SHIFT_VEC = 8,
};
static_assert(NUM_TAGS == 5, "Expected NUM_TAGS == 5 for enum MASK");
enum Mask
{
MASK_INT = 0b00000001,
MASK_SYM = 0b11111111,
MASK_CONS = 0b11111111,
MASK_VEC = 0b11111111,
};
// Some helper macros for tagging // Some helper macros for tagging
#define TAG(PTR, TYPE) ((lisp_t *)(((PTR) << SHIFT_##TYPE) | TAG_##TYPE)) #define SHIFT_TAG (8)
#define IS_TAG(PTR, TYPE) (((u64)(PTR) & MASK_##TYPE) == TAG_##TYPE) #define MASK_TAG ((1 << SHIFT_TAG) - 1)
#define UNTAG(PTR, TYPE) (((u64)PTR) >> SHIFT_##TYPE)
#define INT_MAX ((((i64)1) << 62) - 1) #define TAG(PTR, TYPE) ((lisp_t *)((((u64)(PTR)) << SHIFT_TAG) | TAG_##TYPE))
#define INT_MIN (-(((i64)1) << 62)) #define UNTAG(PTR) (((u64)PTR) >> SHIFT_TAG)
#define GET_TAG(PTR) ((tag_t)(((u64)(PTR)) & MASK_TAG))
#define IS_TAG(PTR, TYPE) (GET_TAG(PTR) == TAG_##TYPE)
#define INT_BITS ((sizeof(i64) * 8) - SHIFT_TAG)
#define INT_MAX ((((i64)1) << (INT_BITS - 1)) - 1)
#define INT_MIN (-(INT_MAX + 1))
tag_t get_tag(const lisp_t *); tag_t get_tag(const lisp_t *);
lisp_t *tag_int(const i64); lisp_t *tag_smi(const i64);
lisp_t *tag_sym(const char *); lisp_t *tag_sym(const char *);
lisp_t *tag_cons(const cons_t *); lisp_t *tag_cons(const cons_t *);
lisp_t *tag_vec(const vec_t *); lisp_t *tag_vec(const vec_t *);
lisp_t *tag_generic(void *, tag_t); lisp_t *tag_generic(void *, tag_t);
i64 as_int(lisp_t *); i64 as_smi(lisp_t *);
char *as_sym(lisp_t *); char *as_sym(lisp_t *);
cons_t *as_cons(lisp_t *); cons_t *as_cons(lisp_t *);
vec_t *as_vec(lisp_t *); vec_t *as_vec(lisp_t *);

View File

@@ -32,7 +32,7 @@ alloc_node_t *make_node(page_t *page, tag_t type)
size += sizeof(vec_t); size += sizeof(vec_t);
break; break;
case TAG_NIL: case TAG_NIL:
case TAG_INT: case TAG_SMI:
case TAG_SYM: case TAG_SYM:
default: default:
FAIL("Unreachable"); FAIL("Unreachable");
@@ -61,7 +61,7 @@ alloc_node_t *lisp_to_node(lisp_t *lisp)
raw_ptr = as_vec(lisp); raw_ptr = as_vec(lisp);
break; break;
case TAG_NIL: // These shouldn't be allocated case TAG_NIL: // These shouldn't be allocated
case TAG_INT: case TAG_SMI:
case TAG_SYM: case TAG_SYM:
default: default:
FAIL("Unreachable"); FAIL("Unreachable");
@@ -80,7 +80,7 @@ lisp_t *alloc_make(alloc_t *alloc, tag_t type)
case TAG_VEC: case TAG_VEC:
break; break;
case TAG_NIL: // These shouldn't be allocated case TAG_NIL: // These shouldn't be allocated
case TAG_INT: case TAG_SMI:
case TAG_SYM: case TAG_SYM:
default: default:
FAIL("Unreachable"); FAIL("Unreachable");
@@ -181,7 +181,7 @@ void alloc_free(alloc_t *alloc)
vec_free((vec_t *)node->data); vec_free((vec_t *)node->data);
break; break;
case TAG_NIL: case TAG_NIL:
case TAG_INT: case TAG_SMI:
case TAG_SYM: case TAG_SYM:
default: default:
FAIL("Unreachable"); FAIL("Unreachable");

View File

@@ -10,24 +10,24 @@
#include <alisp/lisp.h> #include <alisp/lisp.h>
lisp_t *tag_int(i64 i) lisp_t *tag_smi(i64 i)
{ {
return TAG((u64)i, INT); return TAG(i, SMI);
} }
lisp_t *tag_sym(const char *str) lisp_t *tag_sym(const char *str)
{ {
return TAG((u64)str, SYM); return TAG(str, SYM);
} }
lisp_t *tag_vec(const vec_t *vec) lisp_t *tag_vec(const vec_t *vec)
{ {
return TAG((u64)vec, VEC); return TAG(vec, VEC);
} }
lisp_t *tag_cons(const cons_t *cons) lisp_t *tag_cons(const cons_t *cons)
{ {
return TAG((u64)cons, CONS); return TAG(cons, CONS);
} }
lisp_t *tag_generic(void *ptr, tag_t type) lisp_t *tag_generic(void *ptr, tag_t type)
@@ -35,9 +35,9 @@ lisp_t *tag_generic(void *ptr, tag_t type)
switch (type) switch (type)
{ {
case TAG_NIL: case TAG_NIL:
return NIL; return TAG(ptr, NIL);
case TAG_INT: case TAG_SMI:
return tag_int((i64)ptr); return tag_smi((i64)ptr);
case TAG_SYM: case TAG_SYM:
return tag_sym(ptr); return tag_sym(ptr);
case TAG_CONS: case TAG_CONS:
@@ -53,39 +53,34 @@ lisp_t *tag_generic(void *ptr, tag_t type)
tag_t get_tag(const lisp_t *lisp) tag_t get_tag(const lisp_t *lisp)
{ {
static_assert(NUM_TAGS == 5); static_assert(NUM_TAGS == 5);
if (!lisp) return GET_TAG(lisp);
return TAG_NIL;
else if (IS_TAG(lisp, INT))
return TAG_INT;
return (u64)lisp & 0xFF;
} }
i64 as_int(lisp_t *obj) i64 as_smi(lisp_t *obj)
{ {
assert(IS_TAG(obj, INT)); assert(IS_TAG(obj, SMI));
u64 p_obj = (u64)obj; u64 raw_obj = UNTAG(obj);
return UNTAG(p_obj, INT) | // Delete the tag u64 msb = (NTH_BYTE(raw_obj, 6) & 0x80) >> 7;
(NTH_BYTE(p_obj, 7) & 0x80) << 56 // duplicate the MSB (preserve sign) msb = ((1LU << 8) - msb) << 56;
; return (i64)(raw_obj | msb);
} }
char *as_sym(lisp_t *obj) char *as_sym(lisp_t *obj)
{ {
assert(IS_TAG(obj, SYM)); assert(IS_TAG(obj, SYM));
return (char *)UNTAG(obj, SYM); return (char *)UNTAG(obj);
} }
cons_t *as_cons(lisp_t *obj) cons_t *as_cons(lisp_t *obj)
{ {
assert(IS_TAG(obj, CONS)); assert(IS_TAG(obj, CONS));
return (cons_t *)UNTAG(obj, CONS); return (cons_t *)UNTAG(obj);
} }
vec_t *as_vec(lisp_t *obj) vec_t *as_vec(lisp_t *obj)
{ {
assert(IS_TAG(obj, VEC)); assert(IS_TAG(obj, VEC));
return (vec_t *)UNTAG(obj, VEC); return (vec_t *)UNTAG(obj);
} }
void lisp_print(FILE *fp, lisp_t *lisp) void lisp_print(FILE *fp, lisp_t *lisp)
@@ -97,11 +92,11 @@ void lisp_print(FILE *fp, lisp_t *lisp)
case TAG_NIL: case TAG_NIL:
fprintf(fp, "NIL"); fprintf(fp, "NIL");
break; break;
case TAG_INT: case TAG_SMI:
#if VERBOSE_LOGS == 2 #if VERBOSE_LOGS == 2
fprintf(fp, "INT["); fprintf(fp, "INT[");
#endif #endif
fprintf(fp, "%ld", as_int(lisp)); fprintf(fp, "%ld", as_smi(lisp));
#if VERBOSE_LOGS == 2 #if VERBOSE_LOGS == 2
fprintf(fp, "]"); fprintf(fp, "]");
#endif #endif
@@ -191,7 +186,7 @@ u64 tag_sizeof(tag_t tag)
{ {
case TAG_NIL: case TAG_NIL:
return 0; return 0;
case TAG_INT: case TAG_SMI:
case TAG_SYM: case TAG_SYM:
return sizeof(lisp_t *); return sizeof(lisp_t *);
case TAG_CONS: case TAG_CONS:

View File

@@ -111,7 +111,7 @@ read_err_t read_negative(sys_t *sys, stream_t *stream, lisp_t **ret)
read_err_t err = read_int(sys, stream, ret); read_err_t err = read_int(sys, stream, ret);
if (err) if (err)
return err; return err;
i64 n = as_int(*ret); i64 n = as_smi(*ret);
n *= -1; n *= -1;
*ret = make_int(n); *ret = make_int(n);
return READ_ERR_OK; return READ_ERR_OK;

View File

@@ -46,7 +46,7 @@ void sys_free(sys_t *sys)
lisp_t *make_int(i64 i) lisp_t *make_int(i64 i)
{ {
return tag_int(i); return tag_smi(i);
} }
lisp_t *cons(sys_t *sys, lisp_t *car, lisp_t *cdr) lisp_t *cons(sys_t *sys, lisp_t *car, lisp_t *cdr)
@@ -102,7 +102,7 @@ void lisp_free(lisp_t *item)
break; break;
} }
case TAG_NIL: case TAG_NIL:
case TAG_INT: case TAG_SMI:
case TAG_SYM: case TAG_SYM:
case NUM_TAGS: case NUM_TAGS:
// shouldn't be dealt with (either constant or dealt with elsewhere) // shouldn't be dealt with (either constant or dealt with elsewhere)
@@ -134,7 +134,7 @@ void lisp_free_rec(lisp_t *item)
break; break;
} }
case TAG_NIL: case TAG_NIL:
case TAG_INT: case TAG_SMI:
case TAG_SYM: case TAG_SYM:
case NUM_TAGS: case NUM_TAGS:
// shouldn't be dealt with (either constant or dealt with elsewhere) // shouldn't be dealt with (either constant or dealt with elsewhere)

View File

@@ -23,7 +23,7 @@ void smi_test(void)
{ {
i64 in = ints[i]; i64 in = ints[i];
lisp_t *lisp = make_int(in); lisp_t *lisp = make_int(in);
i64 out = as_int(lisp); i64 out = as_smi(lisp);
TEST(in == out, "%ld == %ld", in, out); TEST(in == out, "%ld == %ld", in, out);
} }
@@ -47,7 +47,7 @@ void smi_oob_test(void)
{ {
i64 in = ints[i]; i64 in = ints[i];
lisp_t *lisp = make_int(in); lisp_t *lisp = make_int(in);
i64 out = as_int(lisp); i64 out = as_smi(lisp);
TEST(in != out, "%ld != %ld", in, out); TEST(in != out, "%ld != %ld", in, out);
} }