parsergen: ensure value returned from parser_run is initialised.

[ocean] / csrc / parsergen.mdc
diff --git a/csrc/parsergen.mdc b/csrc/parsergen.mdc

index b3d1cf638b3d47a4ff84add7b05c89eef59d86de..81121430f9b3e6e7c31c1c99aa656e1e3498c281 100644 (file)
--- a/csrc/parsergen.mdc
+++ b/csrc/parsergen.mdc
@@ -201,18 +201,6 @@ symbol, but its type might be `Unknown`.
         int num_syms;
  
  ###### functions
-       static int text_cmp(struct text a, struct text b)
-       {
-               int len = a.len;
-               if (a.len > b.len)
-                       len = b.len;
-               int cmp = strncmp(a.txt, b.txt, len);
-               if (cmp)
-                       return cmp;
-               else
-                       return a.len - b.len;
-       }
-
         static struct symbol *sym_find(struct grammar *g, struct text s)
         {
                 struct symbol **l = &g->syms;
@@ -552,8 +540,13 @@ where `START` is the first non-terminal given.
         struct production *p = calloc(1,sizeof(*p));
         struct text start = {"$start",6};
         struct text eof = {"$eof",4};
+       struct text code = {"$0 = $<1;", 9};
         p->head = sym_find(g, start);
         p->head->type = Nonterminal;
+       p->head->struct_name = g->current_type;
+       p->head->isref = g->type_isref;
+       if (g->current_type.txt)
+               p->code = code;
         array_add(&p->body, &p->body_size, head);
         array_add(&p->body, &p->body_size, sym_find(g, eof));
         p->head->first_production = g->production_count;
@@ -1814,7 +1807,7 @@ pieces of code provided in the grammar file, so they are generated first.
                 fprintf(f, "\tconfig->known_count = sizeof(known)/sizeof(known[0]);\n");
                 fprintf(f, "\tconfig->ignored |= (1 << TK_line_comment) | (1 << TK_block_comment);\n");
                 fprintf(f, "\ttokens = token_open(code, config);\n");
-               fprintf(f, "\tvoid *rv = parser_run(tokens, states, do_reduce, do_free, trace, non_term, config->known_count);\n");
+               fprintf(f, "\tvoid *rv = parser_run(tokens, states, do_reduce, do_free, trace, non_term, config);\n");
                 fprintf(f, "\ttoken_close(tokens);\n");
                 fprintf(f, "\treturn rv;\n");
                 fprintf(f, "}\n\n");
@@ -1962,6 +1955,11 @@ This code needs to be able to store data somewhere.  Rather than requiring
  `do_reduce` to `malloc` that "somewhere", we pass in a large buffer and have
  `do_reduce` return the size to be saved.
  
+In order for the code to access "global" context, we pass in the
+"config" pointer that was passed to parser function.  If the `struct
+token_config` is embedded in some larger structure, the reducing code
+can access the larger structure using pointer manipulation.
+
  The code fragment requires translation when written out.  Any `$N` needs to
  be converted to a reference either to that buffer (if `$0`) or to the
  structure returned by a previous reduction.  These pointers need to be cast
@@ -2044,7 +2042,7 @@ automatically freed.  This is equivalent to assigning `NULL` to the pointer.
         {
                 int i;
                 fprintf(f, "#line 0 \"gen_reduce\"\n");
-               fprintf(f, "static int do_reduce(int prod, void **body, void *ret)\n");
+               fprintf(f, "static int do_reduce(int prod, void **body, struct token_config *config, void *ret)\n");
                 fprintf(f, "{\n");
                 fprintf(f, "\tint ret_size = 0;\n");
  
@@ -2103,11 +2101,12 @@ appropriate for tokens on any terminal symbol.
                                 continue;
  
                         fprintf(f, "\tcase %d:\n", s->num);
-                       if (s->isref)
+                       if (s->isref) {
                                 fprintf(f, "\t\tfree_%.*s(*(void**)asn);\n",
                                         s->struct_name.len,
                                         s->struct_name.txt);
-                       else
+                               fprintf(f, "\t\tfree(asn);\n");
+                       } else
                                 fprintf(f, "\t\tfree_%.*s(asn);\n",
                                         s->struct_name.len,
                                         s->struct_name.txt);
@@ -2572,14 +2571,15 @@ since the last state which could have been at the start of a line.
  ###### parser_run
         void *parser_run(struct token_state *tokens,
                          const struct state states[],
-                        int (*do_reduce)(int, void**, void*),
+                        int (*do_reduce)(int, void**, struct token_config*, void*),
                          void (*do_free)(short, void*),
-                        FILE *trace, const char *non_term[], int knowns)
+                        FILE *trace, const char *non_term[],
+                        struct token_config *config)
         {
                 struct parser p = { 0 };
                 struct token *tk = NULL;
                 int accepted = 0;
-               void *ret;
+               void *ret = NULL;
  
                 p.next.newline_permitted = states[0].starts_line;
                 while (!accepted) {
@@ -2588,7 +2588,7 @@ since the last state which could have been at the start of a line.
                                 tk = tok_copy(token_next(tokens));
                         p.next.sym = tk->num;
                         if (trace)
-                               parser_trace(trace, &p, tk, states, non_term, knowns);
+                               parser_trace(trace, &p, tk, states, non_term, config->known_count);
  
                         if (p.next.sym == TK_in) {
                                 p.next.starts_indented = 1;
@@ -2638,7 +2638,7 @@ since the last state which could have been at the start of a line.
                                 body = p.asn_stack +
                                         (p.tos - states[p.next.state].reduce_size);
  
-                               bufsize = do_reduce(prod, body, buf);
+                               bufsize = do_reduce(prod, body, config, buf);
  
                                 pop(&p, size, do_free);
                                 shift(&p, memdup(buf, bufsize), states);
@@ -2702,9 +2702,10 @@ since the last state which could have been at the start of a line.
  ###### exported functions
         void *parser_run(struct token_state *tokens,
                          const struct state states[],
-                        int (*do_reduce)(int, void**, void*),
+                        int (*do_reduce)(int, void**, struct token_config*, void*),
                          void (*do_free)(short, void*),
-                        FILE *trace, const char *non_term[], int knowns);
+                        FILE *trace, const char *non_term[],
+                        struct token_config *config);
  
  ### Tracing
  
@@ -2839,6 +2840,12 @@ an error.
                         .word_cont = "",
                 };
                 parse_calc(s->code, &config, argc > 2 ? stderr : NULL);
+               while (s) {
+                       struct section *t = s->next;
+                       code_free(s->code);
+                       free(s);
+                       s = t;
+               }
                 exit(0);
         }