// Copyright 2015 syzkaller project authors. All rights reserved.
// Use of this source code is governed by Apache 2 LICENSE that can be found in the LICENSE file.
// This file does serialization of programs for executor binary.
// The format aims at simple parsing: binary and irreversible.
// Exec format is an sequence of uint64's which encodes a sequence of calls.
// The sequence is terminated by a speciall call execInstrEOF.
// Each call is (call ID, copyout index, number of arguments, arguments...).
// Each argument is (type, size, value).
// There are 4 types of arguments:
// - execArgConst: value is const value
// - execArgResult: value is copyout index we want to reference
// - execArgData: value is a binary blob (represented as ]size/8[ uint64's)
// - execArgCsum: runtime checksum calculation
// There are 2 other special calls:
// - execInstrCopyin: copies its second argument into address specified by first argument
// - execInstrCopyout: reads value at address specified by first argument (result can be referenced by execArgResult)
package prog
import (
"fmt"
"sort"
)
const (
execInstrEOF = ^uint64(iota)
execInstrCopyin
execInstrCopyout
)
const (
execArgConst = uint64(iota)
execArgResult
execArgData
execArgCsum
)
const (
ExecArgCsumInet = uint64(iota)
)
const (
ExecArgCsumChunkData = uint64(iota)
ExecArgCsumChunkConst
)
const (
ExecBufferSize = 2 << 20
ExecNoCopyout = ^uint64(0)
)
// SerializeForExec serializes program p for execution by process pid into the provided buffer.
// Returns number of bytes written to the buffer.
// If the provided buffer is too small for the program an error is returned.
func (p *Prog) SerializeForExec(buffer []byte) (int, error) {
p.debugValidate()
w := &execContext{
target: p.Target,
buf: buffer,
eof: false,
args: make(map[Arg]argInfo),
}
for _, c := range p.Calls {
w.csumMap, w.csumUses = calcChecksumsCall(c)
w.serializeCall(c)
}
w.write(execInstrEOF)
if w.eof {
return 0, fmt.Errorf("provided buffer is too small")
}
return len(buffer) - len(w.buf), nil
}
func (w *execContext) serializeCall(c *Call) {
// Calculate arg offsets within structs.
// Generate copyin instructions that fill in data into pointer arguments.
w.writeCopyin(c)
// Generate checksum calculation instructions starting from the last one,
// since checksum values can depend on values of the latter ones
w.writeChecksums()
// Generate the call itself.
w.write(uint64(c.Meta.ID))
if c.Ret != nil && len(c.Ret.uses) != 0 {
if _, ok := w.args[c.Ret]; ok {
panic("argInfo is already created for return value")
}
w.args[c.Ret] = argInfo{Idx: w.copyoutSeq, Ret: true}
w.write(w.copyoutSeq)
w.copyoutSeq++
} else {
w.write(ExecNoCopyout)
}
w.write(uint64(len(c.Args)))
for _, arg := range c.Args {
w.writeArg(arg)
}
// Generate copyout instructions that persist interesting return values.
w.writeCopyout(c)
}
func (target *Target) PhysicalAddr(arg *PointerArg) uint64 {
if arg.IsNull() {
return 0
}
return target.DataOffset + arg.Address
}
type execContext struct {
target *Target
buf []byte
eof bool
args map[Arg]argInfo
copyoutSeq uint64
// Per-call state cached here to not pass it through all functions.
csumMap map[Arg]CsumInfo
csumUses map[Arg]struct{}
}
type argInfo struct {
Addr uint64 // physical addr
Idx uint64 // copyout instruction index
Ret bool
}
func (w *execContext) writeCopyin(c *Call) {
ForeachArg(c, func(arg Arg, ctx *ArgCtx) {
if ctx.Base == nil {
return
}
addr := w.target.PhysicalAddr(ctx.Base) + ctx.Offset
if w.willBeUsed(arg) {
w.args[arg] = argInfo{Addr: addr}
}
switch arg.(type) {
case *GroupArg, *UnionArg:
return
}
typ := arg.Type()
if typ.Dir() == DirOut || IsPad(typ) || arg.Size() == 0 {
return
}
w.write(execInstrCopyin)
w.write(addr)
w.writeArg(arg)
})
}
func (w *execContext) willBeUsed(arg Arg) bool {
if res, ok := arg.(*ResultArg); ok && len(res.uses) != 0 {
return true
}
_, ok1 := w.csumMap[arg]
_, ok2 := w.csumUses[arg]
return ok1 || ok2
}
func (w *execContext) writeChecksums() {
if len(w.csumMap) == 0 {
return
}
csumArgs := make([]Arg, 0, len(w.csumMap))
for arg := range w.csumMap {
csumArgs = append(csumArgs, arg)
}
sort.Slice(csumArgs, func(i, j int) bool {
return w.args[csumArgs[i]].Addr < w.args[csumArgs[j]].Addr
})
for i := len(csumArgs) - 1; i >= 0; i-- {
arg := csumArgs[i]
info := w.csumMap[arg]
if _, ok := arg.Type().(*CsumType); !ok {
panic("csum arg is not csum type")
}
w.write(execInstrCopyin)
w.write(w.args[arg].Addr)
w.write(execArgCsum)
w.write(arg.Size())
switch info.Kind {
case CsumInet:
w.write(ExecArgCsumInet)
w.write(uint64(len(info.Chunks)))
for _, chunk := range info.Chunks {
switch chunk.Kind {
case CsumChunkArg:
w.write(ExecArgCsumChunkData)
w.write(w.args[chunk.Arg].Addr)
w.write(chunk.Arg.Size())
case CsumChunkConst:
w.write(ExecArgCsumChunkConst)
w.write(chunk.Value)
w.write(chunk.Size)
default:
panic(fmt.Sprintf("csum chunk has unknown kind %v", chunk.Kind))
}
}
default:
panic(fmt.Sprintf("csum arg has unknown kind %v", info.Kind))
}
}
}
func (w *execContext) writeCopyout(c *Call) {
ForeachArg(c, func(arg Arg, _ *ArgCtx) {
if res, ok := arg.(*ResultArg); ok && len(res.uses) != 0 {
// Create a separate copyout instruction that has own Idx.
info := w.args[arg]
if info.Ret {
return // Idx is already assigned above.
}
info.Idx = w.copyoutSeq
w.copyoutSeq++
w.args[arg] = info
w.write(execInstrCopyout)
w.write(info.Idx)
w.write(info.Addr)
w.write(arg.Size())
}
})
}
func (w *execContext) write(v uint64) {
if len(w.buf) < 8 {
w.eof = true
return
}
w.buf[0] = byte(v >> 0)
w.buf[1] = byte(v >> 8)
w.buf[2] = byte(v >> 16)
w.buf[3] = byte(v >> 24)
w.buf[4] = byte(v >> 32)
w.buf[5] = byte(v >> 40)
w.buf[6] = byte(v >> 48)
w.buf[7] = byte(v >> 56)
w.buf = w.buf[8:]
}
func (w *execContext) writeArg(arg Arg) {
switch a := arg.(type) {
case *ConstArg:
val, pidStride := a.Value()
typ := a.Type()
w.writeConstArg(a.Size(), val, typ.BitfieldOffset(), typ.BitfieldLength(), pidStride, typ.Format())
case *ResultArg:
if a.Res == nil {
w.writeConstArg(a.Size(), a.Val, 0, 0, 0, a.Type().Format())
} else {
info, ok := w.args[a.Res]
if !ok {
panic("no copyout index")
}
w.write(execArgResult)
meta := a.Size() | uint64(a.Type().Format())<<8
w.write(meta)
w.write(info.Idx)
w.write(a.OpDiv)
w.write(a.OpAdd)
w.write(a.Type().(*ResourceType).Default())
}
case *PointerArg:
w.writeConstArg(a.Size(), w.target.PhysicalAddr(a), 0, 0, 0, FormatNative)
case *DataArg:
data := a.Data()
w.write(execArgData)
w.write(uint64(len(data)))
padded := len(data)
if pad := 8 - len(data)%8; pad != 8 {
padded += pad
}
if len(w.buf) < padded {
w.eof = true
} else {
copy(w.buf, data)
w.buf = w.buf[padded:]
}
case *UnionArg:
w.writeArg(a.Option)
default:
panic("unknown arg type")
}
}
func (w *execContext) writeConstArg(size, val, bfOffset, bfLength, pidStride uint64, bf BinaryFormat) {
w.write(execArgConst)
meta := size | uint64(bf)<<8 | bfOffset<<16 | bfLength<<24 | pidStride<<32
w.write(meta)
w.write(val)
}