Commit 99e22328 authored by Richard Musiol's avatar Richard Musiol Committed by Richard Musiol

cmd/link/internal/wasm: optimize data section in wasm binary

This change optimizes the data section in the wasm binary by
omitting blocks of zeroes and instead emitting data segments
with offsets skipping the zeroes.

This optimization is inspired by the memory-packing pass of the
wasm-opt tool and reduces the wasm binary size of "hello world" by 14%.

Change-Id: Iba3043df05bf6aab4745c5f8015c0337fc218aff
Reviewed-on: https://go-review.googlesource.com/c/go/+/167801
Run-TryBot: Brad Fitzpatrick <bradfitz@golang.org>
TryBot-Result: Gobot Gobot <gobot@golang.org>
Reviewed-by: default avatarCherry Zhang <cherryyz@google.com>
parent 4dad64f5
...@@ -32,6 +32,7 @@ ...@@ -32,6 +32,7 @@
package ld package ld
import ( import (
"bufio"
"bytes" "bytes"
"cmd/internal/gcprog" "cmd/internal/gcprog"
"cmd/internal/objabi" "cmd/internal/objabi"
...@@ -684,7 +685,7 @@ func CodeblkPad(ctxt *Link, addr int64, size int64, pad []byte) { ...@@ -684,7 +685,7 @@ func CodeblkPad(ctxt *Link, addr int64, size int64, pad []byte) {
ctxt.Logf("codeblk [%#x,%#x) at offset %#x\n", addr, addr+size, ctxt.Out.Offset()) ctxt.Logf("codeblk [%#x,%#x) at offset %#x\n", addr, addr+size, ctxt.Out.Offset())
} }
blk(ctxt, ctxt.Textp, addr, size, pad) blk(ctxt.Out, ctxt.Textp, addr, size, pad)
/* again for printing */ /* again for printing */
if !*flagA { if !*flagA {
...@@ -742,7 +743,7 @@ func CodeblkPad(ctxt *Link, addr int64, size int64, pad []byte) { ...@@ -742,7 +743,7 @@ func CodeblkPad(ctxt *Link, addr int64, size int64, pad []byte) {
} }
} }
func blk(ctxt *Link, syms []*sym.Symbol, addr, size int64, pad []byte) { func blk(out *OutBuf, syms []*sym.Symbol, addr, size int64, pad []byte) {
for i, s := range syms { for i, s := range syms {
if !s.Attr.SubSymbol() && s.Value >= addr { if !s.Attr.SubSymbol() && s.Value >= addr {
syms = syms[i:] syms = syms[i:]
...@@ -767,13 +768,13 @@ func blk(ctxt *Link, syms []*sym.Symbol, addr, size int64, pad []byte) { ...@@ -767,13 +768,13 @@ func blk(ctxt *Link, syms []*sym.Symbol, addr, size int64, pad []byte) {
errorexit() errorexit()
} }
if addr < s.Value { if addr < s.Value {
ctxt.Out.WriteStringPad("", int(s.Value-addr), pad) out.WriteStringPad("", int(s.Value-addr), pad)
addr = s.Value addr = s.Value
} }
ctxt.Out.Write(s.P) out.Write(s.P)
addr += int64(len(s.P)) addr += int64(len(s.P))
if addr < s.Value+s.Size { if addr < s.Value+s.Size {
ctxt.Out.WriteStringPad("", int(s.Value+s.Size-addr), pad) out.WriteStringPad("", int(s.Value+s.Size-addr), pad)
addr = s.Value + s.Size addr = s.Value + s.Size
} }
if addr != s.Value+s.Size { if addr != s.Value+s.Size {
...@@ -786,17 +787,29 @@ func blk(ctxt *Link, syms []*sym.Symbol, addr, size int64, pad []byte) { ...@@ -786,17 +787,29 @@ func blk(ctxt *Link, syms []*sym.Symbol, addr, size int64, pad []byte) {
} }
if addr < eaddr { if addr < eaddr {
ctxt.Out.WriteStringPad("", int(eaddr-addr), pad) out.WriteStringPad("", int(eaddr-addr), pad)
} }
ctxt.Out.Flush() out.Flush()
} }
func Datblk(ctxt *Link, addr int64, size int64) { func Datblk(ctxt *Link, addr int64, size int64) {
writeDatblkToOutBuf(ctxt, ctxt.Out, addr, size)
}
func DatblkBytes(ctxt *Link, addr int64, size int64) []byte {
buf := bytes.NewBuffer(make([]byte, 0, size))
out := &OutBuf{w: bufio.NewWriter(buf)}
writeDatblkToOutBuf(ctxt, out, addr, size)
out.Flush()
return buf.Bytes()
}
func writeDatblkToOutBuf(ctxt *Link, out *OutBuf, addr int64, size int64) {
if *flagA { if *flagA {
ctxt.Logf("datblk [%#x,%#x) at offset %#x\n", addr, addr+size, ctxt.Out.Offset()) ctxt.Logf("datblk [%#x,%#x) at offset %#x\n", addr, addr+size, ctxt.Out.Offset())
} }
blk(ctxt, datap, addr, size, zeros[:]) blk(out, datap, addr, size, zeros[:])
/* again for printing */ /* again for printing */
if !*flagA { if !*flagA {
...@@ -870,7 +883,7 @@ func Dwarfblk(ctxt *Link, addr int64, size int64) { ...@@ -870,7 +883,7 @@ func Dwarfblk(ctxt *Link, addr int64, size int64) {
ctxt.Logf("dwarfblk [%#x,%#x) at offset %#x\n", addr, addr+size, ctxt.Out.Offset()) ctxt.Logf("dwarfblk [%#x,%#x) at offset %#x\n", addr, addr+size, ctxt.Out.Offset())
} }
blk(ctxt, dwarfp, addr, size, zeros[:]) blk(ctxt.Out, dwarfp, addr, size, zeros[:])
} }
var zeros [512]byte var zeros [512]byte
......
...@@ -417,14 +417,63 @@ func writeDataSec(ctxt *ld.Link) { ...@@ -417,14 +417,63 @@ func writeDataSec(ctxt *ld.Link) {
ctxt.Syms.Lookup("runtime.data", 0).Sect, ctxt.Syms.Lookup("runtime.data", 0).Sect,
} }
writeUleb128(ctxt.Out, uint64(len(sections))) // number of data entries type dataSegment struct {
offset int32
data []byte
}
// Omit blocks of zeroes and instead emit data segments with offsets skipping the zeroes.
// This reduces the size of the WebAssembly binary. We use 8 bytes as an estimate for the
// overhead of adding a new segment (same as wasm-opt's memory-packing optimization uses).
const segmentOverhead = 8
var segments []*dataSegment
for _, sec := range sections { for _, sec := range sections {
data := ld.DatblkBytes(ctxt, int64(sec.Vaddr), int64(sec.Length))
offset := int32(sec.Vaddr)
// skip leading zeroes
for len(data) > 0 && data[0] == 0 {
data = data[1:]
offset++
}
for len(data) > 0 {
dataLen := int32(len(data))
var segmentEnd, zeroEnd int32
for {
// look for beginning of zeroes
for segmentEnd < dataLen && data[segmentEnd] != 0 {
segmentEnd++
}
// look for end of zeroes
zeroEnd = segmentEnd
for zeroEnd < dataLen && data[zeroEnd] == 0 {
zeroEnd++
}
// emit segment if omitting zeroes reduces the output size
if zeroEnd-segmentEnd >= segmentOverhead || zeroEnd == dataLen {
break
}
segmentEnd = zeroEnd
}
segments = append(segments, &dataSegment{
offset: offset,
data: data[:segmentEnd],
})
data = data[zeroEnd:]
offset += zeroEnd
}
}
writeUleb128(ctxt.Out, uint64(len(segments))) // number of data entries
for _, seg := range segments {
writeUleb128(ctxt.Out, 0) // memidx writeUleb128(ctxt.Out, 0) // memidx
writeI32Const(ctxt.Out, int32(sec.Vaddr)) writeI32Const(ctxt.Out, seg.offset)
ctxt.Out.WriteByte(0x0b) // end ctxt.Out.WriteByte(0x0b) // end
writeUleb128(ctxt.Out, uint64(sec.Length)) writeUleb128(ctxt.Out, uint64(len(seg.data)))
ld.Datblk(ctxt, int64(sec.Vaddr), int64(sec.Length)) ctxt.Out.Write(seg.data)
} }
writeSecSize(ctxt, sizeOffset) writeSecSize(ctxt, sizeOffset)
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment