Guido van Rossum | f70e43a | 1991-02-19 12:39:46 +0000 | [diff] [blame] | 1 | |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 2 | /* Computation of FIRST sets */ |
| 3 | |
Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 4 | #include "pgenheaders.h" |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 5 | #include "grammar.h" |
| 6 | #include "token.h" |
| 7 | |
Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 8 | extern int Py_DebugFlag; |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 9 | |
Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 10 | /* Forward */ |
Tim Peters | dbd9ba6 | 2000-07-09 03:09:57 +0000 | [diff] [blame] | 11 | static void calcfirstset(grammar *, dfa *); |
Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 12 | |
| 13 | void |
Thomas Wouters | 23c9e00 | 2000-07-22 19:20:54 +0000 | [diff] [blame] | 14 | addfirstsets(grammar *g) |
Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 15 | { |
| 16 | int i; |
| 17 | dfa *d; |
Guido van Rossum | 25dfe2c | 2001-09-11 16:43:16 +0000 | [diff] [blame] | 18 | |
| 19 | if (Py_DebugFlag) |
| 20 | printf("Adding FIRST sets ...\n"); |
Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 21 | for (i = 0; i < g->g_ndfas; i++) { |
| 22 | d = &g->g_dfa[i]; |
| 23 | if (d->d_first == NULL) |
| 24 | calcfirstset(g, d); |
| 25 | } |
| 26 | } |
| 27 | |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 28 | static void |
Thomas Wouters | 23c9e00 | 2000-07-22 19:20:54 +0000 | [diff] [blame] | 29 | calcfirstset(grammar *g, dfa *d) |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 30 | { |
| 31 | int i, j; |
| 32 | state *s; |
| 33 | arc *a; |
| 34 | int nsyms; |
| 35 | int *sym; |
| 36 | int nbits; |
| 37 | static bitset dummy; |
| 38 | bitset result; |
| 39 | int type; |
| 40 | dfa *d1; |
| 41 | label *l0; |
| 42 | |
Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 43 | if (Py_DebugFlag) |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 44 | printf("Calculate FIRST set for '%s'\n", d->d_name); |
| 45 | |
| 46 | if (dummy == NULL) |
| 47 | dummy = newbitset(1); |
| 48 | if (d->d_first == dummy) { |
| 49 | fprintf(stderr, "Left-recursion for '%s'\n", d->d_name); |
| 50 | return; |
| 51 | } |
| 52 | if (d->d_first != NULL) { |
| 53 | fprintf(stderr, "Re-calculating FIRST set for '%s' ???\n", |
| 54 | d->d_name); |
| 55 | } |
| 56 | d->d_first = dummy; |
| 57 | |
| 58 | l0 = g->g_ll.ll_label; |
| 59 | nbits = g->g_ll.ll_nlabels; |
| 60 | result = newbitset(nbits); |
| 61 | |
Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 62 | sym = PyMem_NEW(int, 1); |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 63 | if (sym == NULL) |
Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 64 | Py_FatalError("no mem for new sym in calcfirstset"); |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 65 | nsyms = 1; |
| 66 | sym[0] = findlabel(&g->g_ll, d->d_type, (char *)NULL); |
| 67 | |
| 68 | s = &d->d_state[d->d_initial]; |
| 69 | for (i = 0; i < s->s_narcs; i++) { |
| 70 | a = &s->s_arc[i]; |
| 71 | for (j = 0; j < nsyms; j++) { |
| 72 | if (sym[j] == a->a_lbl) |
| 73 | break; |
| 74 | } |
| 75 | if (j >= nsyms) { /* New label */ |
Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 76 | PyMem_RESIZE(sym, int, nsyms + 1); |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 77 | if (sym == NULL) |
Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 78 | Py_FatalError( |
| 79 | "no mem to resize sym in calcfirstset"); |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 80 | sym[nsyms++] = a->a_lbl; |
| 81 | type = l0[a->a_lbl].lb_type; |
| 82 | if (ISNONTERMINAL(type)) { |
Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 83 | d1 = PyGrammar_FindDFA(g, type); |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 84 | if (d1->d_first == dummy) { |
| 85 | fprintf(stderr, |
| 86 | "Left-recursion below '%s'\n", |
| 87 | d->d_name); |
| 88 | } |
| 89 | else { |
| 90 | if (d1->d_first == NULL) |
| 91 | calcfirstset(g, d1); |
Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 92 | mergebitset(result, |
| 93 | d1->d_first, nbits); |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 94 | } |
| 95 | } |
| 96 | else if (ISTERMINAL(type)) { |
| 97 | addbit(result, a->a_lbl); |
| 98 | } |
| 99 | } |
| 100 | } |
| 101 | d->d_first = result; |
Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 102 | if (Py_DebugFlag) { |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 103 | printf("FIRST set for '%s': {", d->d_name); |
| 104 | for (i = 0; i < nbits; i++) { |
| 105 | if (testbit(result, i)) |
Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 106 | printf(" %s", PyGrammar_LabelRepr(&l0[i])); |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 107 | } |
| 108 | printf(" }\n"); |
| 109 | } |
| 110 | } |