Skip to content

Commit

Permalink
symbol can contain non-printable characters
Browse files Browse the repository at this point in the history
  • Loading branch information
matz committed Jun 4, 2012
1 parent 531124f commit b7cc7ff
Show file tree
Hide file tree
Showing 5 changed files with 83 additions and 33 deletions.
3 changes: 3 additions & 0 deletions include/mruby.h
Expand Up @@ -332,7 +332,10 @@ mrb_value mrb_funcall(mrb_state*, mrb_value, const char*, int,...);
mrb_value mrb_funcall_argv(mrb_state*, mrb_value, const char*, int, mrb_value*);
mrb_value mrb_funcall_with_block(mrb_state*, mrb_value, const char*, int, mrb_value*, mrb_value);
/* Symbol interning: map a name to its mrb_sym.
   mrb_intern takes a NUL-terminated C string, mrb_intern2 takes the name
   together with an explicit length, and mrb_intern_str takes a string
   object. */
mrb_sym mrb_intern(mrb_state*,const char*);
mrb_sym mrb_intern2(mrb_state*,const char*,int);
mrb_sym mrb_intern_str(mrb_state*,mrb_value);
/* Reverse lookup: mrb_sym2name_len returns the stored name and writes its
   length through the int* argument. Both functions return NULL when the
   symbol is not found. */
const char *mrb_sym2name(mrb_state*,mrb_sym);
const char *mrb_sym2name_len(mrb_state*,mrb_sym,int*);
mrb_value mrb_str_format(mrb_state *, int, const mrb_value *, mrb_value);

void *mrb_malloc(mrb_state*, size_t);
Expand Down
6 changes: 4 additions & 2 deletions src/dump.c
Expand Up @@ -268,8 +268,10 @@ get_syms_block_size(mrb_state *mrb, mrb_irep *irep, int type)

size += DUMP_SIZE(MRB_DUMP_SIZE_OF_SHORT, type); /* snl(n) */
if (irep->syms[sym_no] != 0) {
name = mrb_sym2name(mrb, irep->syms[sym_no]);
nlen = str_dump_len((char*)name, strlen(name), type);
int len;

name = mrb_sym2name_len(mrb, irep->syms[sym_no], &len);
nlen = str_dump_len((char*)name, len, type);
size += nlen; /* sn(n) */
}
}
Expand Down
2 changes: 1 addition & 1 deletion src/load.c
Expand Up @@ -477,7 +477,7 @@ read_rite_irep_record(mrb_state *mrb, unsigned char *src, mrb_irep *irep, uint32
memcpy(buf, src, snl); //symbol name
src += snl;
buf[snl] = '\0';
irep->syms[i] = mrb_intern(mrb, buf);
irep->syms[i] = mrb_intern2(mrb, buf, snl);
}
}
crc = calc_crc_16_ccitt((unsigned char*)pStart, src - pStart); //Calculate CRC
Expand Down
6 changes: 0 additions & 6 deletions src/string.c
Expand Up @@ -1616,12 +1616,6 @@ mrb_str_init(mrb_state *mrb, mrb_value self)
return self;
}

/* Intern the contents of a string object as a symbol.
   Only the buffer pointer is handed to mrb_intern; the string's own length
   is not passed along.
   NOTE(review): a string holding an embedded NUL would presumably be
   interned only up to that byte -- confirm against mrb_intern. */
mrb_sym
mrb_intern_str(mrb_state *mrb, mrb_value str)
{
return mrb_intern(mrb, RSTRING_PTR(str));
}

/* 15.2.10.5.25 */
/* 15.2.10.5.41 */
/*
Expand Down
99 changes: 75 additions & 24 deletions src/symbol.c
Expand Up @@ -17,67 +17,99 @@
#include <stdio.h>

/* ------------------------------------------------------ */
KHASH_INIT(s2n, mrb_sym, const char*, 1, kh_int_hash_func, kh_int_hash_equal)
KHASH_MAP_INIT_STR(n2s, mrb_sym);
/* Key type of the name-to-symbol table: a symbol name carried as an explicit
   (length, bytes) pair, so its extent does not depend on a NUL terminator. */
typedef struct symbol_name {
/* number of bytes in name */
int len;
/* the name bytes; hashing and comparison look at exactly len of them */
const char *name;
} symbol_name;

/*
 * Hash a symbol name for the n2s table.
 *
 * Folds exactly s.len bytes of s.name into the result (h = h*31 + byte), so
 * bytes that follow an embedded NUL still contribute to the hash.
 *
 * mrb: unused; present only to match the hash-function signature.
 * s:   the (length, bytes) key to hash.
 * Returns the accumulated hash value.
 */
static inline khint_t
sym_hash_func(mrb_state *mrb, const symbol_name s)
{
  khint_t h = 0;
  int i;
  const char *p = s.name;

  (void)mrb;
  /* The index is an int like s.len: comparing a size_t index against a
     negative len would convert len to a huge unsigned bound and run the
     loop far past the end of the buffer. */
  for (i = 0; i < s.len; i++) {
    h = (h << 5) - h + *p++;
  }
  return h;
}
/* Key equality for the n2s table: two names are equal when they have the
   same length and the same len bytes (memcmp, so embedded NULs are compared
   as well). The mrb argument is unused. Arguments are parenthesized so that
   expressions such as *ptr expand correctly; note that a is evaluated more
   than once. */
#define sym_hash_equal(mrb,a, b) ((a).len == (b).len && memcmp((a).name, (b).name, (a).len) == 0)

/* Instantiate the n2s hash table: symbol_name keys mapped to mrb_sym values,
   hashed with sym_hash_func and compared with sym_hash_equal.
   NOTE(review): the literal 1 is presumably khash's "is a map" flag --
   confirm against khash.h. */
KHASH_INIT(n2s, symbol_name, mrb_sym, 1, sym_hash_func, sym_hash_equal)
/* ------------------------------------------------------ */
mrb_sym
mrb_intern(mrb_state *mrb, const char *name)
mrb_intern2(mrb_state *mrb, const char *name, int len)
{
khash_t(n2s) *h = mrb->name2sym;
khash_t(s2n) *rh = mrb->sym2name;
khiter_t k;
size_t len;
char *p;
mrb_sym sym;
symbol_name sname;

k = kh_get(n2s, h, name);
sname.name = name;
sname.len = len;
k = kh_get(n2s, h, sname);
if (k != kh_end(h))
return kh_value(h, k);

sym = ++mrb->symidx;
len = strlen(name);
p = mrb_malloc(mrb, len+1);
memcpy(p, name, len);
p[len] = 0;
k = kh_put(n2s, h, p);
sname.name = p;
k = kh_put(n2s, h, sname);
kh_value(h, k) = sym;

k = kh_put(s2n, rh, sym);
kh_value(rh, k) = p;

return sym;
}

/*
 * Intern a NUL-terminated C string as a symbol.
 *
 * Measures the name with strlen and forwards it to mrb_intern2, so the name
 * ends at the first NUL byte.
 */
mrb_sym
mrb_intern(mrb_state *mrb, const char *name)
{
  size_t name_len = strlen(name);

  return mrb_intern2(mrb, name, name_len);
}

/*
 * Intern the contents of a string object as a symbol.
 *
 * Passes the string's stored length to mrb_intern2 instead of measuring the
 * buffer with strlen, so a string containing an embedded NUL byte is
 * interned in full rather than being cut off at that byte.
 *
 * mrb: interpreter state.
 * str: string object whose bytes name the symbol.
 * Returns the symbol for those bytes.
 */
mrb_sym
mrb_intern_str(mrb_state *mrb, mrb_value str)
{
  return mrb_intern2(mrb, RSTRING_PTR(str), RSTRING_LEN(str));
}

const char*
mrb_sym2name(mrb_state *mrb, mrb_sym sym)
mrb_sym2name_len(mrb_state *mrb, mrb_sym sym, int *lenp)
{
khash_t(s2n) *h = mrb->sym2name;
khash_t(n2s) *h = mrb->name2sym;
khiter_t k;
symbol_name sname;

k = kh_get(s2n, h, sym);
for (k = kh_begin(h); k != kh_end(h); k++) {
if (kh_exist(h, k) && kh_value(h, k) == sym) break;
}
if (k == kh_end(h)) {
*lenp = 0;
return NULL; /* missing */
}
return kh_value(h, k);
sname = kh_key(h, k);
*lenp = sname.len;
return sname.name;
}

void
mrb_free_symtbls(mrb_state *mrb)
{
khash_t(s2n) *h = mrb->sym2name;
khash_t(n2s) *h = mrb->name2sym;
khiter_t k;

for (k = kh_begin(h); k != kh_end(h); ++k)
if (kh_exist(h, k)) mrb_free(mrb, (char*)kh_value(h, k));
kh_destroy(s2n,mrb->sym2name);
for (k = kh_begin(h); k != kh_end(h); k++)
if (kh_exist(h, k)) mrb_free(mrb, (char*)kh_key(h, k).name);
kh_destroy(n2s,mrb->name2sym);
}

void
mrb_init_symtbl(mrb_state *mrb)
{
mrb->name2sym = kh_init(n2s, mrb);
mrb->sym2name = kh_init(s2n, mrb);
}

/**********************************************************************
Expand Down Expand Up @@ -148,8 +180,11 @@ mrb_value
mrb_sym_to_s(mrb_state *mrb, mrb_value sym)
{
mrb_sym id = SYM2ID(sym);
const char *p;
int len;

return mrb_str_new_cstr(mrb, mrb_sym2name(mrb, id));
p = mrb_sym2name_len(mrb, id, &len);
return mrb_str_new(mrb, p, len);
}

/* 15.2.11.3.4 */
Expand Down Expand Up @@ -258,7 +293,7 @@ symname_p(const char *name)
if (*++m == '@') ++m;
break;

case '|': case '^': case '&': case '/': case '%': case '~': case '`':
case '|': case '^': case '&': case '/': case '%': case '~': case '`': case '!':
++m;
break;

Expand Down Expand Up @@ -288,9 +323,10 @@ sym_inspect(mrb_state *mrb, mrb_value sym)
mrb_value str;
const char *name;
mrb_sym id = SYM2ID(sym);
int len;

name = mrb_sym2name(mrb, id); //mrb_id2name(id);
str = mrb_str_new(mrb, 0, strlen(name)+1);
name = mrb_sym2name_len(mrb, id, &len);
str = mrb_str_new(mrb, 0, len+1);
RSTRING(str)->buf[0] = ':';
strcpy(RSTRING(str)->buf+1, name);
if (!symname_p(name)) {
Expand All @@ -300,6 +336,21 @@ sym_inspect(mrb_state *mrb, mrb_value sym)
return str;
}

/*
 * Return a printable name for a symbol.
 *
 * Looks the symbol up with mrb_sym2name_len. Returns NULL when the lookup
 * yields no name. When the stored name passes symname_p and contains no
 * embedded NUL (its strlen equals the stored length), the stored name itself
 * is returned. Otherwise the name is turned into a string object, passed
 * through mrb_str_dump, and that result's buffer is returned.
 *
 * NOTE(review): in the dumped case the returned pointer refers to the buffer
 * of a string object created inside this call -- confirm that its lifetime
 * covers the caller's use.
 */
const char*
mrb_sym2name(mrb_state *mrb, mrb_sym sym)
{
  int name_len;
  const char *name = mrb_sym2name_len(mrb, sym, &name_len);
  mrb_value dumped;

  if (name == NULL) {
    return NULL;
  }
  if (symname_p(name) && strlen(name) == (size_t)name_len) {
    return name;
  }

  dumped = mrb_str_dump(mrb, mrb_str_new(mrb, name, name_len));
  return RSTRING(dumped)->buf;
}

void
mrb_init_symbols(mrb_state *mrb)
Expand Down

0 comments on commit b7cc7ff

Please sign in to comment.