blob: 407f40821d7660dfa9965a8666722104fc67c237 [file] [log] [blame]
drhf2bc0132004-10-04 13:19:23 +00001#!/usr/bin/awk -f
2#
drh722e95a2004-10-25 20:33:44 +00003# Generate the file opcodes.h.
4#
# This AWK script scans a concatenation of the parse.h output file from the
# parser and the vdbe.c source file in order to generate the opcode numbers
# for all opcodes.
8#
9# The lines of the vdbe.c that we are interested in are of the form:
10#
11# case OP_aaaa: /* same as TK_bbbbb */
12#
13# The TK_ comment is optional. If it is present, then the value assigned to
14# the OP_ is the same as the TK_ value. If missing, the OP_ value is assigned
15# a small integer that is different from every other OP_ value.
16#
drh0ed4fcd2006-01-26 14:29:58 +000017# We go to the trouble of making some OP_ values the same as TK_ values
drh722e95a2004-10-25 20:33:44 +000018# as an optimization. During parsing, things like expression operators
19# are coded with TK_ values such as TK_ADD, TK_DIVIDE, and so forth. Later
20# during code generation, we need to generate corresponding opcodes like
21# OP_Add and OP_Divide. By making TK_ADD==OP_Add and TK_DIVIDE==OP_Divide,
drh0ed4fcd2006-01-26 14:29:58 +000022# code to translate from one to the other is avoided. This makes the
drh722e95a2004-10-25 20:33:44 +000023# code generator run (infinitesimally) faster and more importantly it makes
drh0ed4fcd2006-01-26 14:29:58 +000024# the library footprint smaller.
drh722e95a2004-10-25 20:33:44 +000025#
drhfa3b19e2005-11-24 22:22:29 +000026# This script also scans for lines of the form:
27#
28# case OP_aaaa: /* no-push */
29#
30# When the no-push comment is found on an opcode, it means that that
drh0ed4fcd2006-01-26 14:29:58 +000031# opcode does not leave a result on the stack. By identifying which
drhfa3b19e2005-11-24 22:22:29 +000032# opcodes leave results on the stack it is possible to determine a
33# much smaller upper bound on the size of the stack. This allows
34# a smaller stack to be allocated, which is important to embedded
35# systems with limited memory space. This script generates a series
36# of "NOPUSH_MASK" defines that contain bitmaps of opcodes that leave
37# results on the stack. The NOPUSH_MASK defines are used in vdbeaux.c
38# to help determine the maximum stack size.
39#
drhf2bc0132004-10-04 13:19:23 +000040
danielk1977bc04f852005-03-29 08:26:13 +000041
# Record the value of every TK_ token defined in parse.h.
#
# For a line "#define TK_xxx nnn", field 2 is the token name and field 3
# is its value.  Adding zero forces the value to be stored as a number.
/^#define TK_/ {
  tk[$2] = $3 + 0
}
46
# Scan for "case OP_aaaa:" lines in the vdbe.c file.
#
# Field 2 is the opcode name (with a trailing ":" and possibly a carriage
# return, both of which are stripped).  Fields 3 up to, but not including,
# the last field are examined for property keywords and for a
# "same as TK_xxx" phrase.
/^case OP_/ {
  name = $2
  sub(/:/, "", name)
  sub("\r", "", name)

  # Reset: no opcode number assigned yet and every property cleared.
  op[name] = -1
  out1[name] = out2[name] = out3[name] = 0
  jump[name] = 0
  in1[name] = in2[name] = in3[name] = 0
  nopush[name] = 0

  for(k=3; k<NF; k++){
    # "same as TK_xxx": reuse the token value as the opcode number and
    # mark that number as taken.
    if( $k=="same" && $(k+1)=="as" ){
      tkname = $(k+2)
      sub(/,/, "", tkname)
      op[name] = tk[tkname]
      used[op[name]] = 1
      sameas[op[name]] = tkname
    }

    # Property keywords may be followed by a comma; drop the first one.
    word = $k
    sub(",", "", word)
    if( word=="no-push" ){
      nopush[name] = 1
    }else if( word=="out1" ){
      out1[name] = 1
    }else if( word=="out2" ){
      out2[name] = 2
    }else if( word=="out3" ){
      out3[name] = 3
    }else if( word=="in1" ){
      in1[name] = 1
    }else if( word=="in2" ){
      in2[name] = 1
    }else if( word=="in3" ){
      in3[name] = 1
    }else if( word=="jump" ){
      jump[name] = 1
    }
  }
}
90
# Assign numbers to all opcodes and output the result.
#
# Opcodes that were tied to a TK_ value by a "same as" comment keep that
# value.  Every other opcode (op[name]<0) receives the next small integer
# that is not already marked in used[].  After the opcode #defines, a
# placeholder OP_NotUsed_N define is printed for each unused value below
# the maximum, followed by the OPFLG_* masks and the OPFLG_INITIALIZER
# table, which holds one property byte per opcode number from 0 to max.
END {
  cnt = 0
  max = 0
  print "/* Automatically generated. Do not edit */"
  print "/* See the mkopcodeh.awk script for details */"
  for(name in op){
    if( op[name]<0 ){
      # Pick the next integer not already claimed by another opcode.
      cnt++
      while( used[cnt] ) cnt++
      op[name] = cnt
    }
    used[op[name]] = 1;
    if( op[name]>max ) max = op[name]
    printf "#define %-25s %15d", name, op[name]
    if( sameas[op[name]] ) {
      printf " /* same as %-12s*/", sameas[op[name]]
    }
    printf "\n"

  }

  # Emit placeholder names for the values below max that no opcode uses.
  seenUnused = 0;
  for(i=1; i<max; i++){
    if( !used[i] ){
      if( !seenUnused ){
        printf "\n/* The following opcode values are never used */\n"
        seenUnused = 1
      }
      printf "#define %-25s %15d\n", sprintf( "OP_NotUsed_%-3d", i ), i
    }
  }

  # Generate the bitvectors:
  #
  # bit 0: jump
  # bit 1: output on P1
  # bit 2: output on P2
  # bit 3: output on P3
  # bit 4: input on P1
  # bit 5: input on P2
  # bit 6: input on P3
  # bit 7: pushes a result onto stack
  #
  # Bit 7 is set for every opcode that lacks the no-push comment.
  for(i=0; i<=max; i++) bv[i] = 0;
  for(name in op){
    x = op[name]
    a0 = a1 = a2 = a3 = a4 = a5 = a6 = a7 = 0
    if( jump[name] ) a0 = 1;
    if( out1[name] ) a1 = 2;
    if( out2[name] ) a2 = 4;
    if( out3[name] ) a3 = 8;
    if( in1[name] ) a4 = 16;
    if( in2[name] ) a5 = 32;
    if( in3[name] ) a6 = 64;
    if( nopush[name]==0 ) a7 = 128;
    bv[x] = a0+a1+a2+a3+a4+a5+a6+a7;
  }
  print "\n"
  print "/* Properties such as \"out2\" or \"jump\" that are specified in"
  # The quotes around "case" must be escaped; unescaped, the word is parsed
  # as an identifier (a reserved word in gawk) instead of string text.
  print "** comments following the \"case\" for each opcode in the vdbe.c"
  print "** are encoded into bitvectors as follows:"
  print "*/"
  print "#define OPFLG_JUMP 0x01 /* jump: P2 holds a jump target */"
  print "#define OPFLG_OUT1 0x02 /* out1: P1 specifies output reg */"
  print "#define OPFLG_OUT2 0x04 /* out2: P2 specifies output reg */"
  print "#define OPFLG_OUT3 0x08 /* out3: P3 specifies output reg */"
  print "#define OPFLG_IN1 0x10 /* in1: P1 is an input reg */"
  print "#define OPFLG_IN2 0x20 /* in2: P2 is an input reg */"
  print "#define OPFLG_IN3 0x40 /* in3: P3 is an input reg */"
  print "#define OPFLG_PUSH 0x80 /* omits no-push: Does not push */"
  print "#define OPFLG_INITIALIZER {\\"
  for(i=0; i<=max; i++){
    printf " 0x%02x,", bv[i]
    # Ten entries per line; each line ends with a backslash continuation.
    if( i%10==9 ) printf("\\\n");
  }
  print "}"
}