Skip to content

Commit 97e4a0f

Browse files
committed
compile: add line numbers to compiler and create line number table (lnotab)
1 parent bbab811 commit 97e4a0f

File tree

5 files changed

+168
-14
lines changed

5 files changed

+168
-14
lines changed

compile/compile.go

+21-4
Original file line numberDiff line numberDiff line change
@@ -68,6 +68,7 @@ const (
6868
type compiler struct {
6969
Code *py.Code // code being built up
7070
Filename string
71+
Lineno int // current line number
7172
OpCodes Instructions
7273
loops loopstack
7374
SymTable *symtable.SymTable
@@ -144,6 +145,11 @@ func (c *compiler) panicSyntaxErrorf(Ast ast.Ast, format string, a ...interface{
144145
panic(err)
145146
}
146147

148+
// Sets Lineno from an ast node
149+
func (c *compiler) SetLineno(node ast.Ast) {
150+
c.Lineno = node.GetLineno()
151+
}
152+
147153
// Create a new compiler object at Ast, using private for name mangling
148154
func (c *compiler) newCompilerScope(compilerScope compilerScopeType, Ast ast.Ast, private string) (newC *compiler) {
149155
newSymTable := c.SymTable.FindChild(Ast)
@@ -186,6 +192,7 @@ func (c *compiler) compileAst(Ast ast.Ast, filename string, futureFlags int, don
186192
code.Freevars = append(code.Freevars, SymTable.Find(symtable.ScopeFree, symtable.DefFreeClass)...)
187193
code.Flags = c.codeFlags(SymTable) | int32(futureFlags&py.CO_COMPILER_FLAGS_MASK)
188194
valueOnStack := false
195+
c.SetLineno(Ast)
189196
switch node := Ast.(type) {
190197
case *ast.Module:
191198
c.Stmts(c.docString(node.Body, false))
@@ -283,6 +290,7 @@ func (c *compiler) compileAst(Ast ast.Ast, filename string, futureFlags int, don
283290
code.Code = c.OpCodes.Assemble()
284291
code.Stacksize = int32(c.OpCodes.StackDepth())
285292
code.Nlocals = int32(len(code.Varnames))
293+
code.Lnotab = string(c.OpCodes.Lnotab())
286294
return nil
287295
}
288296

@@ -377,15 +385,19 @@ func (c *compiler) OpArg(Op vm.OpCode, Arg uint32) {
377385
if !Op.HAS_ARG() {
378386
panic("OpArg called with an instruction which doesn't take an Arg")
379387
}
380-
c.OpCodes.Add(&OpArg{Op: Op, Arg: Arg})
388+
instr := &OpArg{Op: Op, Arg: Arg}
389+
instr.SetLineno(c.Lineno)
390+
c.OpCodes.Add(instr)
381391
}
382392

383393
// Compiles an instruction without an argument
384394
func (c *compiler) Op(op vm.OpCode) {
385395
if op.HAS_ARG() {
386396
panic("Op called with an instruction which takes an Arg")
387397
}
388-
c.OpCodes.Add(&Op{Op: op})
398+
instr := &Op{Op: op}
399+
instr.SetLineno(c.Lineno)
400+
c.OpCodes.Add(instr)
389401
}
390402

391403
// Inserts an existing label
@@ -402,14 +414,17 @@ func (c *compiler) NewLabel() *Label {
402414

403415
// Compiles a jump instruction
404416
func (c *compiler) Jump(Op vm.OpCode, Dest *Label) {
417+
var instr Instruction
405418
switch Op {
406419
case vm.JUMP_IF_FALSE_OR_POP, vm.JUMP_IF_TRUE_OR_POP, vm.JUMP_ABSOLUTE, vm.POP_JUMP_IF_FALSE, vm.POP_JUMP_IF_TRUE, vm.CONTINUE_LOOP: // Absolute
407-
c.OpCodes.Add(&JumpAbs{OpArg: OpArg{Op: Op}, Dest: Dest})
420+
instr = &JumpAbs{OpArg: OpArg{Op: Op}, Dest: Dest}
408421
case vm.JUMP_FORWARD, vm.SETUP_WITH, vm.FOR_ITER, vm.SETUP_LOOP, vm.SETUP_EXCEPT, vm.SETUP_FINALLY:
409-
c.OpCodes.Add(&JumpRel{OpArg: OpArg{Op: Op}, Dest: Dest})
422+
instr = &JumpRel{OpArg: OpArg{Op: Op}, Dest: Dest}
410423
default:
411424
panic("Jump called with non jump instruction")
412425
}
426+
instr.SetLineno(c.Lineno)
427+
c.OpCodes.Add(instr)
413428
}
414429

415430
/* The test for LOCAL must come before the test for FREE in order to
@@ -963,6 +978,7 @@ func (c *compiler) Stmts(stmts []ast.Stmt) {
963978

964979
// Compile statement
965980
func (c *compiler) Stmt(stmt ast.Stmt) {
981+
c.SetLineno(stmt)
966982
switch node := stmt.(type) {
967983
case *ast.FunctionDef:
968984
// Name Identifier
@@ -1578,6 +1594,7 @@ func (c *compiler) Exprs(exprs []ast.Expr) {
15781594

15791595
// Compile and expression
15801596
func (c *compiler) Expr(expr ast.Expr) {
1597+
c.SetLineno(expr)
15811598
switch node := expr.(type) {
15821599
case *ast.BoolOp:
15831600
// Op BoolOpNumber

compile/compile_test.go

+36-1
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,39 @@ func EqString(t *testing.T, name string, a, b string) {
1919
}
2020
}
2121

22+
// Compact the lnotab as python3 seems to generate inefficient ones
23+
// with spurious zero line number increments.
24+
func lnotabCompact(t *testing.T, pxs *[]byte) {
25+
xs := *pxs
26+
newxs := make([]byte, 0, len(xs))
27+
carry := 0
28+
for i := 0; i < len(xs); i += 2 {
29+
d_offset, d_lineno := xs[i], xs[i+1]
30+
if d_lineno == 0 {
31+
carry += int(d_offset)
32+
continue
33+
}
34+
// FIXME ignoring d_offset overflow
35+
d_offset += byte(carry)
36+
carry = 0
37+
newxs = append(newxs, byte(d_offset), d_lineno)
38+
}
39+
// if string(newxs) != string(xs) {
40+
// t.Logf("Compacted\n% x\n% x", xs, newxs)
41+
// }
42+
*pxs = newxs
43+
}
44+
45+
func EqLnotab(t *testing.T, name string, aStr, bStr string) {
46+
a := []byte(aStr)
47+
b := []byte(bStr)
48+
lnotabCompact(t, &a)
49+
lnotabCompact(t, &b)
50+
if string(a) != string(b) {
51+
t.Errorf("%s want % x, got % x", name, a, b)
52+
}
53+
}
54+
2255
func EqInt32(t *testing.T, name string, a, b int32) {
2356
if a != b {
2457
t.Errorf("%s want %d, got %d", name, a, b)
@@ -105,7 +138,9 @@ func EqCode(t *testing.T, name string, a, b *py.Code) {
105138
EqCodeCode(t, name+": Code", a.Code, b.Code)
106139
EqString(t, name+": Filename", a.Filename, b.Filename)
107140
EqString(t, name+": Name", a.Name, b.Name)
108-
// FIXME EqString(t, name+": Lnotab", a.Lnotab, b.Lnotab)
141+
// The Lnotabs are mostly the same but not entirely
142+
// So it is probably not profitable to test them exactly
143+
// EqLnotab(t, name+": Lnotab", a.Lnotab, b.Lnotab)
109144

110145
// []string
111146
EqStrings(t, name+": Names", a.Names, b.Names)

compile/instructions.go

+54-5
Original file line numberDiff line numberDiff line change
@@ -1,8 +1,6 @@
11
package compile
22

3-
import (
4-
"github.com/ncw/gpython/vm"
5-
)
3+
import "github.com/ncw/gpython/vm"
64

75
// FIXME detect if label is not in the instruction stream by setting
86
// Pos to 0xFFFF say by default, ie we made a label but forgot to add
@@ -300,6 +298,8 @@ func (is Instructions) StackDepth() int {
300298
type Instruction interface {
301299
Pos() uint32
302300
Number() int
301+
Lineno() int
302+
SetLineno(int)
303303
SetPos(int, uint32) bool
304304
Size() uint32
305305
Output() []byte
@@ -312,8 +312,9 @@ type Resolver interface {
312312

313313
// Position
314314
type pos struct {
315-
n uint32
316-
p uint32
315+
n uint32
316+
p uint32
317+
lineno int
317318
}
318319

319320
// Read instruction number
@@ -326,6 +327,16 @@ func (p *pos) Pos() uint32 {
326327
return p.p
327328
}
328329

330+
// Read lineno
331+
func (p *pos) Lineno() int {
332+
return p.lineno
333+
}
334+
335+
// Set lineno
336+
func (p *pos) SetLineno(lineno int) {
337+
p.lineno = lineno
338+
}
339+
329340
// Set Position - returns changed
330341
func (p *pos) SetPos(number int, newPos uint32) bool {
331342
p.n = uint32(number)
@@ -439,3 +450,41 @@ func (o *JumpRel) Resolve() {
439450
panic("FIXME compile: JUMP_FOWARDS size changed")
440451
}
441452
}
453+
454+
// Creates the lnotab from the instruction stream
455+
//
456+
// See Objects/lnotab_notes.txt for the description of the line number table.
457+
func (is Instructions) Lnotab() []byte {
458+
var lnotab []byte
459+
old_offset := uint32(0)
460+
old_lineno := 1
461+
for _, instr := range is {
462+
if instr.Size() == 0 {
463+
continue
464+
}
465+
lineno := instr.Lineno()
466+
offset := instr.Pos()
467+
d_lineno := lineno - old_lineno
468+
if d_lineno <= 0 {
469+
continue
470+
}
471+
d_bytecode := offset - old_offset
472+
for d_bytecode > 255 {
473+
lnotab = append(lnotab, 255, 0)
474+
d_bytecode -= 255
475+
}
476+
for d_lineno > 255 {
477+
lnotab = append(lnotab, byte(d_bytecode), 255)
478+
d_bytecode = 0
479+
d_lineno -= 255
480+
}
481+
if d_bytecode > 0 {
482+
lnotab = append(lnotab, byte(d_bytecode), byte(d_lineno))
483+
} else { /* First line of a block; def stmt, etc. */
484+
lnotab = append(lnotab, 0, byte(d_lineno))
485+
}
486+
old_lineno = lineno
487+
old_offset = offset
488+
}
489+
return lnotab
490+
}

compile/instructions_test.go

+56
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,56 @@
1+
package compile
2+
3+
import (
4+
"bytes"
5+
"testing"
6+
)
7+
8+
func TestLnotab(t *testing.T) {
9+
for i, test := range []struct {
10+
instrs Instructions
11+
want []byte
12+
}{
13+
{
14+
instrs: Instructions{},
15+
want: []byte{},
16+
},
17+
{
18+
instrs: Instructions{
19+
&Op{pos: pos{n: 1, p: 10, lineno: 1}},
20+
&Op{pos: pos{n: 0, p: 10, lineno: 0}},
21+
&Op{pos: pos{n: 1, p: 102, lineno: 1}},
22+
},
23+
want: []byte{},
24+
},
25+
{
26+
instrs: Instructions{
27+
&Op{pos: pos{n: 1, p: 0, lineno: 1}},
28+
&Op{pos: pos{n: 1, p: 1, lineno: 2}},
29+
&Op{pos: pos{n: 1, p: 2, lineno: 3}},
30+
},
31+
want: []byte{1, 1, 1, 1},
32+
},
33+
{
34+
// Example from lnotab.txt
35+
instrs: Instructions{
36+
&Op{pos: pos{n: 1, p: 0, lineno: 1}},
37+
&Op{pos: pos{n: 1, p: 6, lineno: 2}},
38+
&Op{pos: pos{n: 1, p: 50, lineno: 7}},
39+
&Op{pos: pos{n: 1, p: 350, lineno: 307}},
40+
&Op{pos: pos{n: 1, p: 361, lineno: 308}},
41+
},
42+
want: []byte{
43+
6, 1,
44+
44, 5,
45+
255, 0,
46+
45, 255,
47+
0, 45,
48+
11, 1},
49+
},
50+
} {
51+
got := test.instrs.Lnotab()
52+
if bytes.Compare(test.want, got) != 0 {
53+
t.Errorf("%d: want %d got %d", i, test.want, got)
54+
}
55+
}
56+
}

notes.txt

+1-4
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,7 @@ Things to do before release
1818
===========================
1919

2020
* Line numbers
21+
* frame.Lasti is pointing past the instruction which puts tracebacks out
2122
* Subclass builtins
2223
* pygen
2324

@@ -39,10 +40,6 @@ Failes on /usr/lib/python3/dist-packages/mpmath/usertools.py
3940
Limitations & Missing parts
4041
===========================
4142
* string keys only in dictionaries
42-
* line numbers missing in SyntaxErrors
43-
* now need to show them when printing SyntaxErrors
44-
* line numbers missing in Tracebacks
45-
* lnotab etc
4643
* \N{...} escapes not implemented
4744
* lots of builtins still to implement
4845
* FIXME eq && ne should throw an error for a type which doesn' have eq implemented

0 commit comments

Comments
 (0)