xref: /sqlite-3.40.0/tool/mkopcodeh.tcl (revision 17adf4e5)
1#!/usr/bin/tclsh
2#
3# Generate the file opcodes.h.
4#
5# This TCL script scans a concatenation of the parse.h output file from the
6# parser and the vdbe.c source file in order to generate the opcodes numbers
7# for all opcodes.
8#
9# The lines of the vdbe.c that we are interested in are of the form:
10#
11#       case OP_aaaa:      /* same as TK_bbbbb */
12#
13# The TK_ comment is optional.  If it is present, then the value assigned to
14# the OP_ is the same as the TK_ value.  If missing, the OP_ value is assigned
15# a small integer that is different from every other OP_ value.
16#
17# We go to the trouble of making some OP_ values the same as TK_ values
18# as an optimization.  During parsing, things like expression operators
19# are coded with TK_ values such as TK_ADD, TK_DIVIDE, and so forth.  Later
20# during code generation, we need to generate corresponding opcodes like
21# OP_Add and OP_Divide.  By making TK_ADD==OP_Add and TK_DIVIDE==OP_Divide,
22# code to translate from one to the other is avoided.  This makes the
23# code generator smaller and faster.
24#
25# This script also scans for lines of the form:
26#
27#       case OP_aaaa:       /* jump, in1, in2, in3, out2, out3 */
28#
29# When such comments are found on an opcode, it means that certain
30# properties apply to that opcode.  Set corresponding flags using the
31# OPFLG_INITIALIZER macro.
32#
33
34set in stdin
35set currentOp {}
36set prevName {}
37set nOp 0
38set nGroup 0
39while {![eof $in]} {
40  set line [gets $in]
41
42  # Remember the TK_ values from the parse.h file.
43  # NB:  The "TK_" prefix stands for "ToKen", not the graphical Tk toolkit
44  # commonly associated with TCL.
45  #
46  if {[regexp {^#define TK_} $line]} {
47    set tk([lindex $line 1]) [lindex $line 2]
48    continue
49  }
50
51  # Find "/* Opcode: " lines in the vdbe.c file.  Each one introduces
52  # a new opcode.  Remember which parameters are used.
53  #
54  if {[regexp {^.. Opcode: } $line]} {
55    set currentOp OP_[lindex $line 2]
56    set m 0
57    foreach term $line {
58      switch $term {
59        P1 {incr m 1}
60        P2 {incr m 2}
61        P3 {incr m 4}
62        P4 {incr m 8}
63        P5 {incr m 16}
64      }
65    }
66    set paramused($currentOp) $m
67  }
68
69  # Find "** Synopsis: " lines that follow Opcode:
70  #
71  if {[regexp {^.. Synopsis: (.*)} $line all x] && $currentOp!=""} {
72    set synopsis($currentOp) [string trim $x]
73  }
74
75  # Scan for "case OP_aaaa:" lines in the vdbe.c file
76  #
77  if {[regexp {^case OP_} $line]} {
78    set line [split $line]
79    set name [string trim [lindex $line 1] :]
80    if {$name=="OP_Abortable"} continue;  # put OP_Abortable last
81    set op($name) -1
82    set group($name) 0
83    set jump($name) 0
84    set in1($name) 0
85    set in2($name) 0
86    set in3($name) 0
87    set out2($name) 0
88    set out3($name) 0
89    for {set i 3} {$i<[llength $line]-1} {incr i} {
90       switch [string trim [lindex $line $i] ,] {
91         same {
92           incr i
93           if {[lindex $line $i]=="as"} {
94             incr i
95             set sym [string trim [lindex $line $i] ,]
96             set val $tk($sym)
97             set op($name) $val
98             set used($val) 1
99             set sameas($val) $sym
100             set def($val) $name
101           }
102         }
103         group {set group($name) 1}
104         jump  {set jump($name) 1}
105         in1   {set in1($name) 1}
106         in2   {set in2($name) 1}
107         in3   {set in3($name) 1}
108         out2  {set out2($name) 1}
109         out3  {set out3($name) 1}
110       }
111    }
112    if {$group($name)} {
113      set newGroup 0
114      if {[info exists groups($nGroup)]} {
115        if {$prevName=="" || !$group($prevName)} {
116          set newGroup 1
117        }
118      }
119      lappend groups($nGroup) $name
120      if {$newGroup} {incr nGroup}
121    } else {
122      if {$prevName!="" && $group($prevName)} {
123        incr nGroup
124      }
125    }
126    set order($nOp) $name
127    set prevName $name
128    incr nOp
129  }
130}
131
132# Assign numbers to all opcodes and output the result.
133#
134puts "/* Automatically generated.  Do not edit */"
135puts "/* See the tool/mkopcodeh.tcl script for details */"
136foreach name {OP_Noop OP_Explain OP_Abortable} {
137  set jump($name) 0
138  set in1($name) 0
139  set in2($name) 0
140  set in3($name) 0
141  set out2($name) 0
142  set out3($name) 0
143  set op($name) -1
144  set order($nOp) $name
145  incr nOp
146}
147
148# The following are the opcodes that receive special processing in the
149# resolveP2Values() routine.  Update this list whenever new cases are
150# added to the pOp->opcode switch within resolveP2Values().
151#
152set rp2v_ops {
153  OP_Transaction
154  OP_AutoCommit
155  OP_Savepoint
156  OP_Checkpoint
157  OP_Vacuum
158  OP_JournalMode
159  OP_VUpdate
160  OP_VFilter
161  OP_Next
162  OP_SorterNext
163  OP_Prev
164}
165
166# Assign the smallest values to opcodes that are processed by resolveP2Values()
167# to make code generation for the switch() statement smaller and faster.
168#
169set cnt -1
170for {set i 0} {$i<$nOp} {incr i} {
171  set name $order($i)
172  if {[lsearch $rp2v_ops $name]>=0} {
173    incr cnt
174    while {[info exists used($cnt)]} {incr cnt}
175    set op($name) $cnt
176    set used($cnt) 1
177    set def($cnt) $name
178  }
179}
180set mxCase1 $cnt
181
182# Assign the next group of values to JUMP opcodes
183#
184for {set i 0} {$i<$nOp} {incr i} {
185  set name $order($i)
186  if {$op($name)>=0} continue
187  if {!$jump($name)} continue
188  incr cnt
189  while {[info exists used($cnt)]} {incr cnt}
190  set op($name) $cnt
191  set used($cnt) 1
192  set def($cnt) $name
193}
194
195# Find the numeric value for the largest JUMP opcode
196#
197set mxJump -1
198for {set i 0} {$i<$nOp} {incr i} {
199  set name $order($i)
200  if {$jump($name) && $op($name)>$mxJump} {set mxJump $op($name)}
201}
202
203
204# Generate the numeric values for all remaining opcodes, while
205# preserving any groupings of opcodes (i.e. those that must be
206# together).
207#
208for {set g 0} {$g<$nGroup} {incr g} {
209  set gLen [llength $groups($g)]
210  set ok 0; set start -1
211  set seek $cnt
212  while {!$ok} {
213    incr seek
214    while {[info exists used($seek)]} {incr seek}
215    set ok 1; set start $seek
216    for {set j 0} {$j<$gLen} {incr j} {
217      incr seek
218      if {[info exists used($seek)]} {
219        set ok 0; break
220      }
221    }
222  }
223  if {$ok} {
224    set next $start
225    for {set j 0} {$j<$gLen} {incr j} {
226      set name [lindex $groups($g) $j]
227      if {$op($name)>=0} continue
228      set op($name) $next
229      set used($next) 1
230      set def($next) $name
231      incr next
232    }
233  } else {
234    error "cannot find opcodes for group: $groups($g)"
235  }
236}
237
238for {set i 0} {$i<$nOp} {incr i} {
239  set name $order($i)
240  if {$op($name)<0} {
241    incr cnt
242    while {[info exists used($cnt)]} {incr cnt}
243    set op($name) $cnt
244    set used($cnt) 1
245    set def($cnt) $name
246  }
247}
248
249set max [lindex [lsort -decr -integer [array names used]] 0]
250for {set i 0} {$i<=$max} {incr i} {
251  if {![info exists used($i)]} {
252    set def($i) "OP_NotUsed_$i"
253  }
254  if {$i>$max} {set max $i}
255  set name $def($i)
256  puts -nonewline [format {#define %-16s %3d} $name $i]
257  set com {}
258  if {[info exists jump($name)] && $jump($name)} {
259    lappend com "jump"
260  }
261  if {[info exists sameas($i)]} {
262    lappend com "same as $sameas($i)"
263  }
264  if {[info exists synopsis($name)]} {
265    lappend com "synopsis: $synopsis($name)"
266  }
267  if {[llength $com]} {
268    puts -nonewline [format " /* %-42s */" [join $com {, }]]
269  }
270  puts ""
271}
272
273if {$max>255} {
274  error "More than 255 opcodes - VdbeOp.opcode is of type u8!"
275}
276
277# Generate the bitvectors:
278#
279set bv(0) 0
280for {set i 0} {$i<=$max} {incr i} {
281  set x 0
282  set name $def($i)
283  if {[string match OP_NotUsed* $name]==0} {
284    if {$jump($name)}  {incr x 1}
285    if {$in1($name)}   {incr x 2}
286    if {$in2($name)}   {incr x 4}
287    if {$in3($name)}   {incr x 8}
288    if {$out2($name)}  {incr x 16}
289    if {$out3($name)}  {incr x 32}
290  }
291  set bv($i) $x
292}
293puts ""
294puts "/* Properties such as \"out2\" or \"jump\" that are specified in"
295puts "** comments following the \"case\" for each opcode in the vdbe.c"
296puts "** are encoded into bitvectors as follows:"
297puts "*/"
298puts "#define OPFLG_JUMP        0x01  /* jump:  P2 holds jmp target */"
299puts "#define OPFLG_IN1         0x02  /* in1:   P1 is an input */"
300puts "#define OPFLG_IN2         0x04  /* in2:   P2 is an input */"
301puts "#define OPFLG_IN3         0x08  /* in3:   P3 is an input */"
302puts "#define OPFLG_OUT2        0x10  /* out2:  P2 is an output */"
303puts "#define OPFLG_OUT3        0x20  /* out3:  P3 is an output */"
304puts "#define OPFLG_INITIALIZER \173\\"
305for {set i 0} {$i<=$max} {incr i} {
306  if {$i%8==0} {
307    puts -nonewline [format "/* %3d */" $i]
308  }
309  puts -nonewline [format " 0x%02x," $bv($i)]
310  if {$i%8==7} {
311    puts "\\"
312  }
313}
314puts "\175"
315puts ""
316puts "/* The resolve3P2Values() routine is able to run faster if it knows"
317puts "** the value of the largest JUMP opcode.  The smaller the maximum"
318puts "** JUMP opcode the better, so the mkopcodeh.tcl script that"
319puts "** generated this include file strives to group all JUMP opcodes"
320puts "** together near the beginning of the list."
321puts "*/"
322puts "#define SQLITE_MX_JUMP_OPCODE  $mxJump  /* Maximum JUMP opcode */"
323