2 ** cdump.c - mruby binary dumper (in C)
4 ** See Copyright Notice in mruby.h
8 #include <mruby/string.h>
9 #include <mruby/dump.h>
10 #include <mruby/irep.h>
11 #include <mruby/debug.h>
12 #include <mruby/internal.h>
19 #include <mruby/endian.h>
20 #define MRB_FLOAT_FMT "%.17g"
24 cdump_pool(mrb_state
*mrb
, const mrb_pool_value
*p
, FILE *fp
)
26 if (p
->tt
& IREP_TT_NFLAG
) { /* number */
30 if (p
->u
.i64
< INT32_MIN
|| INT32_MAX
< p
->u
.i64
) {
31 fprintf(fp
, "{IREP_TT_INT64, {.i64=%" PRId64
"}},\n", p
->u
.i64
);
34 fprintf(fp
, "{IREP_TT_INT32, {.i32=%" PRId32
"}},\n", (int32_t)p
->u
.i64
);
39 fprintf(fp
, "{IREP_TT_INT32, {.i32=%" PRId32
"}},\n", p
->u
.i32
);
43 fprintf(fp
, "{IREP_TT_FLOAT, {.f=" MRB_FLOAT_FMT
"}},\n", p
->u
.f
);
48 const char *s
= p
->u
.str
;
50 fputs("{IREP_TT_BIGINT, {\"", fp
);
51 for (int i
=0; i
<len
; i
++) {
52 fprintf(fp
, "\\x%02x", (int)s
[i
]&0xff);
60 int i
, len
= p
->tt
>>2;
61 const char *s
= p
->u
.str
;
62 fprintf(fp
, "{IREP_TT_STR|(%d<<2), {\"", len
);
63 for (i
=0; i
<len
; i
++) {
64 fprintf(fp
, "\\x%02x", (int)s
[i
]&0xff);
72 sym_name_word_p(const char *name
, mrb_int len
)
74 if (len
== 0) return FALSE
;
75 if (name
[0] != '_' && !ISALPHA(name
[0])) return FALSE
;
76 for (int i
= 1; i
< len
; i
++) {
77 if (name
[i
] != '_' && !ISALNUM(name
[i
])) return FALSE
;
83 sym_name_with_equal_p(const char *name
, mrb_int len
)
85 return len
>= 2 && name
[len
-1] == '=' && sym_name_word_p(name
, len
-1);
89 sym_name_with_question_mark_p(const char *name
, mrb_int len
)
91 return len
>= 2 && name
[len
-1] == '?' && sym_name_word_p(name
, len
-1);
95 sym_name_with_bang_p(const char *name
, mrb_int len
)
97 return len
>= 2 && name
[len
-1] == '!' && sym_name_word_p(name
, len
-1);
101 sym_name_ivar_p(const char *name
, mrb_int len
)
103 return len
>= 2 && name
[0] == '@' && sym_name_word_p(name
+1, len
-1);
107 sym_name_cvar_p(const char *name
, mrb_int len
)
109 return len
>= 3 && name
[0] == '@' && sym_name_ivar_p(name
+1, len
-1);
112 #define OPERATOR_SYMBOL(sym_name, name) {name, sym_name, sizeof(sym_name)-1}
113 struct operator_symbol
{
115 const char *sym_name
;
116 uint16_t sym_name_len
;
118 static const struct operator_symbol operator_table
[] = {
119 OPERATOR_SYMBOL("!", "not"),
120 OPERATOR_SYMBOL("%", "mod"),
121 OPERATOR_SYMBOL("&", "and"),
122 OPERATOR_SYMBOL("*", "mul"),
123 OPERATOR_SYMBOL("+", "add"),
124 OPERATOR_SYMBOL("-", "sub"),
125 OPERATOR_SYMBOL("/", "div"),
126 OPERATOR_SYMBOL("<", "lt"),
127 OPERATOR_SYMBOL(">", "gt"),
128 OPERATOR_SYMBOL("^", "xor"),
129 OPERATOR_SYMBOL("`", "tick"),
130 OPERATOR_SYMBOL("|", "or"),
131 OPERATOR_SYMBOL("~", "neg"),
132 OPERATOR_SYMBOL("!=", "neq"),
133 OPERATOR_SYMBOL("!~", "nmatch"),
134 OPERATOR_SYMBOL("&&", "andand"),
135 OPERATOR_SYMBOL("**", "pow"),
136 OPERATOR_SYMBOL("+@", "plus"),
137 OPERATOR_SYMBOL("-@", "minus"),
138 OPERATOR_SYMBOL("<<", "lshift"),
139 OPERATOR_SYMBOL("<=", "le"),
140 OPERATOR_SYMBOL("==", "eq"),
141 OPERATOR_SYMBOL("=~", "match"),
142 OPERATOR_SYMBOL(">=", "ge"),
143 OPERATOR_SYMBOL(">>", "rshift"),
144 OPERATOR_SYMBOL("[]", "aref"),
145 OPERATOR_SYMBOL("||", "oror"),
146 OPERATOR_SYMBOL("<=>", "cmp"),
147 OPERATOR_SYMBOL("===", "eqq"),
148 OPERATOR_SYMBOL("[]=", "aset"),
152 sym_operator_name(const char *sym_name
, mrb_int len
)
154 mrb_sym table_size
= sizeof(operator_table
)/sizeof(struct operator_symbol
);
155 if (operator_table
[table_size
-1].sym_name_len
< len
) return NULL
;
157 for (mrb_sym start
= 0; table_size
!= 0; table_size
/=2) {
158 mrb_sym idx
= start
+table_size
/2;
159 const struct operator_symbol
*op_sym
= &operator_table
[idx
];
160 int cmp
= (int)len
-(int)op_sym
->sym_name_len
;
162 cmp
= memcmp(sym_name
, op_sym
->sym_name
, len
);
163 if (cmp
== 0) return op_sym
->name
;
174 sym_var_name(mrb_state
*mrb
, const char *initname
, const char *key
, int n
)
177 mrb_value s
= mrb_str_new_cstr(mrb
, initname
);
178 mrb_str_cat_lit(mrb
, s
, "_");
179 mrb_str_cat_cstr(mrb
, s
, key
);
180 mrb_str_cat_lit(mrb
, s
, "_");
181 snprintf(buf
, sizeof(buf
), "%d", n
);
182 mrb_str_cat_cstr(mrb
, s
, buf
);
183 return RSTRING_PTR(s
);
187 cdump_sym(mrb_state
*mrb
, mrb_sym sym
, const char *var_name
, int idx
, mrb_value init_syms_code
, FILE *fp
)
196 const char *name
= mrb_sym_name_len(mrb
, sym
, &len
), *op_name
;
197 if (!name
) return MRB_DUMP_INVALID_ARGUMENT
;
198 if (sym_name_word_p(name
, len
)) {
199 fprintf(fp
, "MRB_SYM(%s)", name
);
201 else if (sym_name_with_equal_p(name
, len
)) {
202 fprintf(fp
, "MRB_SYM_E(%.*s)", (int)(len
-1), name
);
204 else if (sym_name_with_question_mark_p(name
, len
)) {
205 fprintf(fp
, "MRB_SYM_Q(%.*s)", (int)(len
-1), name
);
207 else if (sym_name_with_bang_p(name
, len
)) {
208 fprintf(fp
, "MRB_SYM_B(%.*s)", (int)(len
-1), name
);
210 else if (sym_name_ivar_p(name
, len
)) {
211 fprintf(fp
, "MRB_IVSYM(%s)", name
+1);
213 else if (sym_name_cvar_p(name
, len
)) {
214 fprintf(fp
, "MRB_CVSYM(%s)", name
+2);
216 else if ((op_name
= sym_operator_name(name
, len
))) {
217 fprintf(fp
, "MRB_OPSYM(%s)", op_name
);
221 mrb_value name_obj
= mrb_str_new(mrb
, name
, len
);
222 mrb_str_cat_lit(mrb
, init_syms_code
, " ");
223 mrb_str_cat_cstr(mrb
, init_syms_code
, var_name
);
224 snprintf(buf
, sizeof(buf
), "[%d] = ", idx
);
225 mrb_str_cat_cstr(mrb
, init_syms_code
, buf
);
226 mrb_str_cat_lit(mrb
, init_syms_code
, "mrb_intern_lit(mrb, ");
227 mrb_str_cat_str(mrb
, init_syms_code
, mrb_str_dump(mrb
, name_obj
));
228 mrb_str_cat_lit(mrb
, init_syms_code
, ");\n");
236 cdump_syms(mrb_state
*mrb
, const char *name
, const char *key
, int n
, int syms_len
, const mrb_sym
*syms
, mrb_value init_syms_code
, FILE *fp
)
238 int ai
= mrb_gc_arena_save(mrb
);
239 mrb_int code_len
= RSTRING_LEN(init_syms_code
);
240 const char *var_name
= sym_var_name(mrb
, name
, key
, n
);
242 fprintf(fp
, "mrb_DEFINE_SYMS_VAR(%s, %d, (", var_name
, syms_len
);
243 for (int i
=0; i
<syms_len
; i
++) {
244 cdump_sym(mrb
, syms
[i
], var_name
, i
, init_syms_code
, fp
);
247 if (code_len
== RSTRING_LEN(init_syms_code
)) fputs("const", fp
);
249 mrb_gc_arena_restore(mrb
, ai
);
253 //Handle the simple/common case of debug_info:
254 // - 1 file associated with a single irep
255 // - mrb_debug_line_ary format only
257 simple_debug_info(mrb_irep_debug_info
*info
)
259 if (!info
|| info
->flen
!= 1) {
265 //Adds debug information to c-structs and
266 //adds filenames in init_syms_code block
268 cdump_debug(mrb_state
*mrb
, const char *name
, int n
, mrb_irep_debug_info
*info
,
269 mrb_value init_syms_code
, FILE *fp
)
271 int ai
= mrb_gc_arena_save(mrb
);
273 const char *line_type
= "mrb_debug_line_ary";
275 if (!simple_debug_info(info
))
276 return MRB_DUMP_INVALID_IREP
;
278 int len
= info
->files
[0]->line_entry_count
;
280 const char *filename
= mrb_sym_name_len(mrb
, info
->files
[0]->filename_sym
, NULL
);
281 snprintf(buffer
, sizeof(buffer
), " %s_debug_file_%d.filename_sym = mrb_intern_lit(mrb,", name
, n
);
282 mrb_str_cat_cstr(mrb
, init_syms_code
, buffer
);
283 mrb_str_cat_str(mrb
, init_syms_code
, mrb_str_dump(mrb
, mrb_str_new_cstr(mrb
, filename
)));
284 mrb_str_cat_cstr(mrb
, init_syms_code
, ");\n");
286 switch (info
->files
[0]->line_type
) {
287 case mrb_debug_line_ary
:
288 fprintf(fp
, "static uint16_t %s_debug_lines_%d[%d] = {", name
, n
, len
);
289 for (int i
=0; i
<len
; i
++) {
290 if (i
%10 == 0) fputs("\n", fp
);
291 fprintf(fp
, "0x%04x,", info
->files
[0]->lines
.ary
[i
]);
296 case mrb_debug_line_flat_map
:
297 line_type
= "mrb_debug_line_flat_map";
298 fprintf(fp
, "static struct mrb_irep_debug_info_line %s_debug_lines_%d[%d] = {", name
, n
, len
);
299 for (int i
=0; i
<len
; i
++) {
300 const mrb_irep_debug_info_line
*fmap
= &info
->files
[0]->lines
.flat_map
[i
];
301 fprintf(fp
, "\t{.start_pos=0x%04x,.line=%d},\n", fmap
->start_pos
, fmap
->line
);
306 case mrb_debug_line_packed_map
:
307 line_type
= "mrb_debug_line_packed_map";
308 fprintf(fp
, "static const char %s_debug_lines_%d[] = \"", name
, n
);
309 const uint8_t *pmap
= info
->files
[0]->lines
.packed_map
;
310 for (int i
=0; i
<len
; i
++) {
311 fprintf(fp
, "\\x%02x", pmap
[i
]&0xff);
316 fprintf(fp
, "static mrb_irep_debug_info_file %s_debug_file_%d = {\n", name
, n
);
317 fprintf(fp
, "%d, %d, %d, %s, {%s_debug_lines_%d}};\n",
318 info
->files
[0]->start_pos
,
319 info
->files
[0]->filename_sym
,
320 info
->files
[0]->line_entry_count
,
323 fprintf(fp
, "static mrb_irep_debug_info_file *%s_debug_file_%d_ = &%s_debug_file_%d;\n", name
, n
, name
, n
);
325 fprintf(fp
, "static mrb_irep_debug_info %s_debug_%d = {\n", name
, n
);
326 fprintf(fp
, "%d, %d, &%s_debug_file_%d_};\n", info
->pc_count
, info
->flen
, name
, n
);
328 mrb_gc_arena_restore(mrb
, ai
);
333 cdump_irep_struct(mrb_state
*mrb
, const mrb_irep
*irep
, uint8_t flags
, FILE *fp
, const char *name
, int n
, mrb_value init_syms_code
, int *mp
)
337 int debug_available
= 0;
341 for (i
=0,len
=irep
->rlen
; i
<len
; i
++) {
343 if (cdump_irep_struct(mrb
, irep
->reps
[i
], flags
, fp
, name
, max
+i
, init_syms_code
, mp
) != MRB_DUMP_OK
)
344 return MRB_DUMP_INVALID_ARGUMENT
;
346 fprintf(fp
, "static const mrb_irep *%s_reps_%d[%d] = {\n", name
, n
, len
);
347 for (i
=0,len
=irep
->rlen
; i
<len
; i
++) {
348 fprintf(fp
, " &%s_irep_%d,\n", name
, max
+i
);
355 fprintf(fp
, "static const mrb_pool_value %s_pool_%d[%d] = {\n", name
, n
, len
);
356 for (i
=0; i
<len
; i
++) {
357 if (cdump_pool(mrb
, &irep
->pool
[i
], fp
) != MRB_DUMP_OK
)
358 return MRB_DUMP_INVALID_ARGUMENT
;
364 cdump_syms(mrb
, name
, "syms", n
, irep
->slen
, irep
->syms
, init_syms_code
, fp
);
367 len
=irep
->ilen
+sizeof(struct mrb_irep_catch_handler
)*irep
->clen
;
368 fprintf(fp
, "static const mrb_code %s_iseq_%d[%d] = {", name
, n
, len
);
369 for (i
=0; i
<len
; i
++) {
370 if (i
%20 == 0) fputs("\n", fp
);
371 fprintf(fp
, "0x%02x,", irep
->iseq
[i
]);
376 cdump_syms(mrb
, name
, "lv", n
, irep
->nlocals
-1, irep
->lv
, init_syms_code
, fp
);
379 if (flags
& MRB_DUMP_DEBUG_INFO
) {
380 if (cdump_debug(mrb
, name
, n
, irep
->debug_info
, init_syms_code
, fp
) == MRB_DUMP_OK
) {
387 fprintf(fp
, "static const mrb_irep %s_irep_%d = {\n", name
, n
);
388 fprintf(fp
, " %d,%d,%d,\n", irep
->nlocals
, irep
->nregs
, irep
->clen
);
389 fprintf(fp
, " MRB_IREP_STATIC,%s_iseq_%d,\n", name
, n
);
391 fprintf(fp
, " %s_pool_%d,", name
, n
);
394 fputs( " NULL,", fp
);
397 fprintf(fp
, "%s_syms_%d,", name
, n
);
403 fprintf(fp
, "%s_reps_%d,\n", name
, n
);
406 fputs( "NULL,\n", fp
);
409 fprintf(fp
, " %s_lv_%d,\n", name
, n
);
412 fputs( " NULL,\t\t\t\t\t/* lv */\n", fp
);
414 if (debug_available
) {
415 fprintf(fp
, " &%s_debug_%d,\n", name
, n
);
418 fputs(" NULL,\t\t\t\t\t/* debug_info */\n", fp
);
420 fprintf(fp
, " %d,%d,%d,%d,0\n};\n", irep
->ilen
, irep
->plen
, irep
->slen
, irep
->rlen
);
426 mrb_dump_irep_cstruct(mrb_state
*mrb
, const mrb_irep
*irep
, uint8_t flags
, FILE *fp
, const char *initname
)
428 if (fp
== NULL
|| initname
== NULL
|| initname
[0] == '\0') {
429 return MRB_DUMP_INVALID_ARGUMENT
;
431 if (fprintf(fp
, "#include <mruby.h>\n"
432 "#include <mruby/irep.h>\n"
433 "#include <mruby/debug.h>\n"
434 "#include <mruby/proc.h>\n"
435 "#include <mruby/presym.h>\n"
437 return MRB_DUMP_WRITE_FAULT
;
439 fputs("#define mrb_BRACED(...) {__VA_ARGS__}\n", fp
);
440 fputs("#define mrb_DEFINE_SYMS_VAR(name, len, syms, qualifier) \\\n", fp
);
441 fputs(" static qualifier mrb_sym name[len] = mrb_BRACED syms\n", fp
);
443 mrb_value init_syms_code
= mrb_str_new_capa(mrb
, 0);
445 int n
= cdump_irep_struct(mrb
, irep
, flags
, fp
, initname
, 0, init_syms_code
, &max
);
446 if (n
!= MRB_DUMP_OK
) return n
;
449 "const struct RProc %s[] = {{\n",
450 (flags
& MRB_DUMP_STATIC
) ? "static"
451 : "#ifdef __cplusplus\n"
455 fprintf(fp
, "NULL,NULL,MRB_TT_PROC,MRB_GC_RED,0,{&%s_irep_0},NULL,{NULL},\n}};\n", initname
);
456 fputs("static void\n", fp
);
457 fprintf(fp
, "%s_init_syms(mrb_state *mrb)\n", initname
);
459 fputs(RSTRING_PTR(init_syms_code
), fp
);