drh | f2bc013 | 2004-10-04 13:19:23 +0000 | [diff] [blame] | 1 | #!/usr/bin/awk -f |
| 2 | # |
drh | 722e95a | 2004-10-25 20:33:44 +0000 | [diff] [blame] | 3 | # Generate the file opcodes.h. |
| 4 | # |
# This AWK script scans a concatenation of the parse.h output file from the
# parser and the vdbe.c source file in order to generate the opcode numbers
# for all opcodes.
| 8 | # |
| 9 | # The lines of the vdbe.c that we are interested in are of the form: |
| 10 | # |
| 11 | # case OP_aaaa: /* same as TK_bbbbb */ |
| 12 | # |
| 13 | # The TK_ comment is optional. If it is present, then the value assigned to |
| 14 | # the OP_ is the same as the TK_ value. If missing, the OP_ value is assigned |
| 15 | # a small integer that is different from every other OP_ value. |
| 16 | # |
drh | 0ed4fcd | 2006-01-26 14:29:58 +0000 | [diff] [blame] | 17 | # We go to the trouble of making some OP_ values the same as TK_ values |
drh | 722e95a | 2004-10-25 20:33:44 +0000 | [diff] [blame] | 18 | # as an optimization. During parsing, things like expression operators |
| 19 | # are coded with TK_ values such as TK_ADD, TK_DIVIDE, and so forth. Later |
| 20 | # during code generation, we need to generate corresponding opcodes like |
| 21 | # OP_Add and OP_Divide. By making TK_ADD==OP_Add and TK_DIVIDE==OP_Divide, |
drh | 0ed4fcd | 2006-01-26 14:29:58 +0000 | [diff] [blame] | 22 | # code to translate from one to the other is avoided. This makes the |
drh | 722e95a | 2004-10-25 20:33:44 +0000 | [diff] [blame] | 23 | # code generator run (infinitesimally) faster and more importantly it makes |
drh | 0ed4fcd | 2006-01-26 14:29:58 +0000 | [diff] [blame] | 24 | # the library footprint smaller. |
drh | 722e95a | 2004-10-25 20:33:44 +0000 | [diff] [blame] | 25 | # |
drh | fa3b19e | 2005-11-24 22:22:29 +0000 | [diff] [blame] | 26 | # This script also scans for lines of the form: |
| 27 | # |
#       case OP_aaaa:      /* jump, in1, in2, in3, out2-prerelease, out2, out3 */
drh | fa3b19e | 2005-11-24 22:22:29 +0000 | [diff] [blame] | 29 | # |
drh | b24a200 | 2009-11-02 18:14:50 +0000 | [diff] [blame] | 30 | # When such comments are found on an opcode, it means that certain |
| 31 | # properties apply to that opcode. Set corresponding flags using the |
| 32 | # OPFLG_INITIALIZER macro. |
drh | fa3b19e | 2005-11-24 22:22:29 +0000 | [diff] [blame] | 33 | # |
drh | f2bc013 | 2004-10-04 13:19:23 +0000 | [diff] [blame] | 34 | |
danielk1977 | bc04f85 | 2005-03-29 08:26:13 +0000 | [diff] [blame] | 35 | |
# Record the token codes from the parse.h file.  Every "#define TK_xxx N"
# line stores N, coerced to a number, under tk["TK_xxx"].
/^#define TK_/ {
  tk[$2] = $3 + 0
}
| 40 | |
# Scan for "case OP_aaaa:" lines in the vdbe.c file.
#
# Each matching line registers one opcode:
#   op[name]    -1 until a number is assigned, or the TK_ value named by a
#               "same as TK_xxx" comment on the line
#   jump[], out2_prerelease[], in1[], in2[], in3[], out2[], out3[]
#               1 if the corresponding keyword appears on the line, else 0
#   order[]     opcode names in the order the lines were seen
#
# For an opcode tied to a TK_ value, used[], sameas[] and def[] are also
# filled in, indexed by that value.
/^case OP_/ {
  name = $2
  sub(/:/,"",name)
  sub("\r","",name)        # strip a carriage return (CRLF input)
  op[name] = -1            # op[x] holds the numeric value for OP symbol x
  jump[name] = 0
  out2_prerelease[name] = 0
  in1[name] = 0
  in2[name] = 0
  in3[name] = 0
  out2[name] = 0
  out3[name] = 0

  # Walk the words that follow the opcode name.  The loop stops before the
  # last field.
  for(i=3; i<NF; i++){
    if($i=="same" && $(i+1)=="as"){
      sym = $(i+2)
      sub(/,/,"",sym)
      if( !(sym in tk) ){
        # An unknown symbol would otherwise store an empty value in op[name]
        # and index used[], sameas[] and def[] by the empty string.  Report
        # the problem on stderr and stop with a failing exit status instead.
        printf("mkopcodeh: %s is marked \"same as %s\" but no \"#define %s\" line has been seen\n", name, sym, sym) | "cat 1>&2"
        exit 1
      }
      val = tk[sym]
      op[name] = val
      used[val] = 1
      sameas[val] = sym
      def[val] = name
    }

    # Property keywords are comma separated; drop the comma before comparing.
    x = $i
    sub(",","",x)
    if(x=="jump"){
      jump[name] = 1
    }else if(x=="out2-prerelease"){
      out2_prerelease[name] = 1
    }else if(x=="in1"){
      in1[name] = 1
    }else if(x=="in2"){
      in2[name] = 1
    }else if(x=="in3"){
      in3[name] = 1
    }else if(x=="out2"){
      out2[name] = 1
    }else if(x=="out3"){
      out3[name] = 1
    }
  }
  order[n_op++] = name;
}
| 84 | |
# Assign numbers to all opcodes and output the result.
#
# The output consists of:
#   * a "#define" line for every value from 1 through the largest opcode
#     value, using the name OP_NotUsed_<n> for values no opcode occupies
#   * the OPFLG_xxx property-bit definitions
#   * OPFLG_INITIALIZER, holding one property byte for every value from 0
#     through the largest opcode value
END {
  cnt = 0
  print "/* Automatically generated. Do not edit */"
  print "/* See the mkopcodeh.awk script for details */"

  # OP_Noop and OP_Explain are always appended to the opcode list.
  op["OP_Noop"] = -1;
  order[n_op++] = "OP_Noop";
  op["OP_Explain"] = -1;
  order[n_op++] = "OP_Explain";

  # Assign small values to opcodes that are processed by resolveP2Values()
  # to make code generation for the switch() statement smaller and faster.
  for(i=0; i<n_op; i++){
    name = order[i];
    if( op[name]>=0 ) continue;
    if( name=="OP_Function" \
     || name=="OP_AggStep" \
     || name=="OP_Transaction" \
     || name=="OP_AutoCommit" \
     || name=="OP_Savepoint" \
     || name=="OP_Checkpoint" \
     || name=="OP_Vacuum" \
     || name=="OP_JournalMode" \
     || name=="OP_VUpdate" \
     || name=="OP_VFilter" \
     || name=="OP_Next" \
     || name=="OP_SorterNext" \
     || name=="OP_Prev" \
    ){
      cnt++
      while( used[cnt] ) cnt++    # skip values already taken
      op[name] = cnt
      used[cnt] = 1
      def[cnt] = name
    }
  }

  # Generate the numeric values for the remaining opcodes
  for(i=0; i<n_op; i++){
    name = order[i];
    if( op[name]<0 ){
      cnt++
      while( used[cnt] ) cnt++    # skip values already taken
      op[name] = cnt
      used[cnt] = 1
      def[cnt] = name
    }
  }

  # The largest opcode value is not necessarily cnt: an opcode tied to a
  # TK_ value keeps that value, which may exceed the last number handed out
  # above.  Take the maximum over every opcode so that none is left out of
  # the #define list or the OPFLG_INITIALIZER table.
  max = cnt
  for(i=0; i<n_op; i++){
    if( op[order[i]]+0>max ) max = op[order[i]]+0
  }

  for(i=1; i<=max; i++){
    if( !used[i] ){
      def[i] = "OP_NotUsed_" i
    }
    printf "#define %-25s %15d", def[i], i
    if( sameas[i] ){
      printf " /* same as %-12s*/", sameas[i]
    }
    printf "\n"
  }

  # Generate the bitvectors.  bv[i] is the property mask for opcode value i:
  #
  #  bit 0 (0x01):  jump
  #  bit 1 (0x02):  out2-prerelease
  #  bit 2 (0x04):  in1
  #  bit 3 (0x08):  in2
  #  bit 4 (0x10):  in3
  #  bit 5 (0x20):  out2
  #  bit 6 (0x40):  out3
  #
  for(i=0; i<=max; i++){
    name = def[i]
    flags = 0
    if( jump[name] ) flags += 1
    if( out2_prerelease[name] ) flags += 2
    if( in1[name] ) flags += 4
    if( in2[name] ) flags += 8
    if( in3[name] ) flags += 16
    if( out2[name] ) flags += 32
    if( out3[name] ) flags += 64
    bv[i] = flags
  }

  print "\n"
  print "/* Properties such as \"out2\" or \"jump\" that are specified in"
  print "** comments following the \"case\" for each opcode in the vdbe.c"
  print "** are encoded into bitvectors as follows:"
  print "*/"
  print "#define OPFLG_JUMP 0x0001 /* jump: P2 holds jmp target */"
  print "#define OPFLG_OUT2_PRERELEASE 0x0002 /* out2-prerelease: */"
  print "#define OPFLG_IN1 0x0004 /* in1: P1 is an input */"
  print "#define OPFLG_IN2 0x0008 /* in2: P2 is an input */"
  print "#define OPFLG_IN3 0x0010 /* in3: P3 is an input */"
  print "#define OPFLG_OUT2 0x0020 /* out2: P2 is an output */"
  print "#define OPFLG_OUT3 0x0040 /* out3: P3 is an output */"
  print "#define OPFLG_INITIALIZER {\\"
  # Eight entries per output line, each line ending in a backslash so the
  # macro body continues onto the next line.
  for(i=0; i<=max; i++){
    if( i%8==0 ) printf("/* %3d */",i)
    printf " 0x%02x,", bv[i]
    if( i%8==7 ) printf("\\\n");
  }
  print "}"
}