blob: 4752dc75cfc6dd28d8674f0a18eee540017d6265 [file] [log] [blame]
// Copyright 2015 syzkaller project authors. All rights reserved.
// Use of this source code is governed by Apache 2 LICENSE that can be found in the LICENSE file.
package ipc
import (
"fmt"
"io"
"io/ioutil"
"os"
"os/exec"
"path/filepath"
"strings"
"sync/atomic"
"time"
"unsafe"
"github.com/google/syzkaller/pkg/osutil"
"github.com/google/syzkaller/prog"
)
// EnvFlags is a bit set of configuration flags stored in Config.Flags.
// Every constant below occupies its own bit (1 << iota), so flags can be or-ed together.
// The value is passed to the executor verbatim in handshakeReq.flags and executeReq.envFlags.
type EnvFlags uint64

const (
	FlagDebug            EnvFlags = 1 << iota // debug output from executor
	FlagSignal                                // collect feedback signals (coverage)
	FlagSandboxSetuid                         // impersonate nobody user
	FlagSandboxNamespace                      // use namespaces for sandboxing
	FlagEnableTun                             // initialize and use tun in executor
	FlagEnableNetDev                          // setup a bunch of various network devices for testing
	FlagEnableFault                           // enable fault injection support
	// Executor does not know about these:
	FlagUseShmem      // use shared memory instead of pipes for communication
	FlagUseForkServer // use extended protocol with handshake
)
// ExecFlags is a bit set of per-execution flags stored in ExecOpts.Flags.
// Every constant below occupies its own bit (1 << iota).
// The value is passed to the executor in executeReq.execFlags.
type ExecFlags uint64

const (
	FlagCollectCover ExecFlags = 1 << iota // collect coverage
	FlagDedupCover                         // deduplicate coverage in executor
	FlagInjectFault                        // inject a fault in this execution (see ExecOpts)
	FlagCollectComps                       // collect KCOV comparisons
	FlagThreaded                           // use multiple threads to mitigate blocked syscalls
	FlagCollide                            // collide syscalls to provoke data races
)
// ExecOpts holds the options of a single program execution (see Env.Exec).
// FaultCall and FaultNth are forwarded to the executor in every request;
// per the FlagInjectFault comment they describe the fault to inject.
type ExecOpts struct {
	Flags     ExecFlags
	FaultCall int // call index for fault injection (0-based)
	FaultNth  int // fault n-th operation in the call (0-based)
}
// ExecutorFailure is the error type reported by MakeEnv or env.Exec when the executor
// terminates by calling its fail function. Such a termination is treated as a logical
// error (a failed assert). The string value is the complete error message.
type ExecutorFailure string

// Error implements the error interface and yields the stored message unchanged.
func (f ExecutorFailure) Error() string {
	msg := string(f)
	return msg
}
// Config is the configuration for Env.
type Config struct {
	// Path to executor binary.
	// MakeEnv splits this string on single spaces: the first element is the binary,
	// the remaining elements are passed to it as arguments.
	Executor string
	// Flags are configuration flags, defined above.
	Flags EnvFlags
	// Timeout is the execution timeout for a single program.
	// A zero value selects a default (see sanitizeTimeout).
	Timeout time.Duration
}
// CallFlags is a bit set describing the outcome of a single call (see CallInfo.Flags).
// parseOutput fills it directly from the flags word of the executor's call reply.
type CallFlags uint32

const (
	CallExecuted      CallFlags = 1 << iota // was started at all
	CallFinished                            // finished executing (rather than blocked forever)
	CallBlocked                             // finished but blocked during execution
	CallFaultInjected                       // fault was injected into this call
)
// CallInfo is the per-call result of a program execution; Env.Exec returns one entry
// per call of the executed program, indexed by the call's position in the program.
type CallInfo struct {
	Flags CallFlags
	// Signal is the feedback signal, filled if FlagSignal is set.
	// When FlagSignal is not set, Exec fills it with fallback signal instead (see addFallbackSignal).
	Signal []uint32
	// Cover is per-call coverage, filled if FlagSignal is set and coverage collection
	// was requested (presumably via FlagCollectCover -- confirm against executor).
	// Without deduplication (presumably FlagDedupCover) it effectively contains a trace,
	// otherwise duplicates are removed.
	Cover []uint32
	Comps prog.CompMap // per-call comparison operands
	Errno int          // call errno (0 if the call was successful)
}
// Env is an execution environment: it owns the input/output buffers and the
// (lazily started, possibly long-lived) executor process used by Exec.
// Create it with MakeEnv and release it with Close.
type Env struct {
	in  []byte // buffer the program is serialized into (mmapped when FlagUseShmem is set)
	out []byte // buffer the execution results are parsed from (mmapped when FlagUseShmem is set)

	cmd       *command // current executor process; nil until the first Exec and after a restart/failure
	inFile    *os.File // file backing in; nil unless FlagUseShmem is set
	outFile   *os.File // file backing out; nil unless FlagUseShmem is set
	bin       []string // executor command line: bin[0] is the binary, the rest are arguments
	linkedBin string   // path of the per-pid hard link to the executor created by MakeEnv ("" if none); removed in Close
	pid       int      // id of this environment, forwarded to the executor
	config    *Config

	// Counters updated atomically by Exec.
	StatExecs    uint64 // number of program executions started
	StatRestarts uint64 // number of times a new executor process was created
}
const (
	// outputSize is the size in bytes of the output buffer allocated by MakeEnv.
	outputSize = 16 << 20

	// Magic exit/completion status values returned by executor (see command.exec):
	// statusFail is reported as ExecutorFailure, statusError as a detected kernel bug,
	// statusRetry makes the caller silently restart the executor.
	statusFail  = 67
	statusError = 68
	statusRetry = 69

	// Comparison types masks taken from KCOV headers.
	compSizeMask  = 6 // bits of the comparison type that encode the operand size
	compSize8     = 6 // value of the size bits that readComps treats as 64-bit operands
	compConstMask = 1 // bit that is set when one of the operands was a constant
)
// MakeEnv creates an execution environment for the executor described by config.
//
// config.Executor is split on single spaces into the binary path and its arguments.
// If FlagUseShmem is set, the input and output buffers are backed by memory-mapped
// files (which are later handed to the executor); otherwise they are plain slices.
// pid identifies the environment; it is forwarded to the executor and appended to
// the name of a hard link to the executor binary (best effort).
//
// It returns an error if the executor path is empty or if the memory-mapped files
// cannot be created. The returned Env must be released with Close.
func MakeEnv(config *Config, pid int) (*Env, error) {
	// strings.Split never returns an empty slice for a non-empty separator, so an
	// empty (or space-prefixed) executor string shows up as an empty first element.
	bin := strings.Split(config.Executor, " ")
	if bin[0] == "" {
		return nil, fmt.Errorf("binary is empty string")
	}
	var inf, outf *os.File
	var inmem, outmem []byte
	if config.Flags&FlagUseShmem != 0 {
		var err error
		inf, inmem, err = osutil.CreateMemMappedFile(prog.ExecBufferSize)
		if err != nil {
			return nil, err
		}
		// The deferred cleanups below fire only on error returns:
		// on success inf/outf are reset to nil right before returning.
		defer func() {
			if inf != nil {
				osutil.CloseMemMappedFile(inf, inmem)
			}
		}()
		outf, outmem, err = osutil.CreateMemMappedFile(outputSize)
		if err != nil {
			return nil, err
		}
		defer func() {
			if outf != nil {
				osutil.CloseMemMappedFile(outf, outmem)
			}
		}()
	} else {
		inmem = make([]byte, prog.ExecBufferSize)
		outmem = make([]byte, outputSize)
	}
	env := &Env{
		in:      inmem,
		out:     outmem,
		inFile:  inf,
		outFile: outf,
		bin:     bin,
		pid:     pid,
		config:  config,
	}
	env.bin[0] = osutil.Abs(env.bin[0]) // we are going to chdir
	// Append pid to binary name.
	// E.g. if binary is 'syz-executor' and pid=15,
	// we create a link from 'syz-executor15' to 'syz-executor' and use 'syz-executor15' as binary.
	// This allows to easily identify program that lead to a crash in the log.
	// Log contains pid in "executing program 15" and crashes usually contain "Comm: syz-executor15".
	base := filepath.Base(env.bin[0])
	pidStr := fmt.Sprint(pid)
	// TASK_COMM_LEN is currently set to 16, so base+pidStr must fit into 15 characters.
	if keep := 15 - len(pidStr); len(base) > keep {
		if keep < 0 {
			// pidStr alone is too long; never slice with a negative bound.
			keep = 0
		}
		base = base[:keep]
	}
	binCopy := filepath.Join(filepath.Dir(env.bin[0]), base+pidStr)
	// Linking is best effort: on failure the original binary is used as is.
	if err := os.Link(env.bin[0], binCopy); err == nil {
		env.bin[0] = binCopy
		env.linkedBin = binCopy
	}
	// Success: ownership of the mapped files moves to env, disarm the deferred cleanups.
	inf = nil
	outf = nil
	return env, nil
}
// Close releases everything the environment owns: it stops the executor process
// (if one is running), removes the per-pid link to the executor binary and closes
// the memory-mapped input/output files. Both files are always closed; the error of
// the input file takes precedence over the error of the output file.
func (env *Env) Close() error {
	if running := env.cmd; running != nil {
		running.close()
	}
	if link := env.linkedBin; link != "" {
		os.Remove(link)
	}
	var inErr, outErr error
	if env.inFile != nil {
		inErr = osutil.CloseMemMappedFile(env.inFile, env.in)
	}
	if env.outFile != nil {
		outErr = osutil.CloseMemMappedFile(env.outFile, env.out)
	}
	if inErr != nil {
		return inErr
	}
	return outErr
}
// rateLimit ticks once per second. Exec waits for a tick before starting a new
// executor process when the target OS is akaros, which throttles process creation there.
var rateLimit = time.NewTicker(1 * time.Second)
// Exec starts executor binary to execute program p and returns information about the execution:
// output: process output
// info: per-call info
// failed: true if executor has detected a kernel bug
// hanged: program hanged and was killed
// err0: failed to start process, or executor has detected a logical error
//
// The executor process is created lazily on the first call and is reused by subsequent
// calls until an execution fails or requests a restart. StatExecs and StatRestarts are
// updated atomically along the way.
func (env *Env) Exec(opts *ExecOpts, p *prog.Prog) (output []byte, info []CallInfo, failed, hanged bool, err0 error) {
	// Copy-in serialized program.
	progSize, err := p.SerializeForExec(env.in)
	if err != nil {
		err0 = fmt.Errorf("failed to serialize: %v", err)
		return
	}
	// Without shared memory the program is sent over the control pipe;
	// with shared memory progData stays nil and nothing extra is written to the pipe.
	var progData []byte
	if env.config.Flags&FlagUseShmem == 0 {
		progData = env.in[:progSize]
	}
	// Zero out the first 4 bytes of the output buffer (the number of calls that
	// parseOutput reads first), so that we don't have garbage there
	// if executor crashes before writing non-garbage there.
	for i := 0; i < 4; i++ {
		env.out[i] = 0
	}
	atomic.AddUint64(&env.StatExecs, 1)
	if env.cmd == nil {
		if p.Target.OS == "akaros" {
			// On akaros executor is actually ssh,
			// starting them too frequently leads to timeouts.
			<-rateLimit.C
		}
		atomic.AddUint64(&env.StatRestarts, 1)
		env.cmd, err0 = makeCommand(env.pid, env.bin, env.config, env.inFile, env.outFile, env.out)
		if err0 != nil {
			return
		}
	}
	var restart bool
	output, failed, hanged, restart, err0 = env.cmd.exec(opts, progData)
	if err0 != nil {
		// The executor is in an unknown state: drop it, the next Exec starts a fresh one.
		env.cmd.close()
		env.cmd = nil
		return
	}
	info, err0 = env.parseOutput(p)
	// No real coverage signal was requested: synthesize fallback signal instead.
	if info != nil && env.config.Flags&FlagSignal == 0 {
		addFallbackSignal(p, info)
	}
	if restart {
		env.cmd.close()
		env.cmd = nil
	}
	return
}
// addFallbackSignal fills info[i].Signal with a simple substitute signal for the
// case when no real coverage signal is available.
// The signal is derived from the syscall number or-ed with the returned errno value,
// which at least distinguishes all combinations of syscall+errno.
// The per-call flags and errno are translated into prog.CallInfo, the computation
// itself is delegated to p.FallbackSignal, and the results are copied back.
func addFallbackSignal(p *prog.Prog, info []CallInfo) {
	converted := make([]prog.CallInfo, len(info))
	for idx := range info {
		src, dst := &info[idx], &converted[idx]
		if src.Flags&CallExecuted != 0 {
			dst.Flags |= prog.CallExecuted
		}
		if src.Flags&CallFinished != 0 {
			dst.Flags |= prog.CallFinished
		}
		if src.Flags&CallBlocked != 0 {
			dst.Flags |= prog.CallBlocked
		}
		dst.Errno = src.Errno
	}
	p.FallbackSignal(converted)
	for idx := range converted {
		info[idx].Signal = converted[idx].Signal
	}
}
// parseOutput decodes the executor's results for program p from env.out.
// The buffer starts with the number of call replies; each reply is a callReply
// header followed by its signal, cover and comparison data.
// The result has one entry per call of p, indexed by call position; calls without
// a reply keep the zero CallInfo.
// An error is returned for truncated data, an out-of-range call index, a syscall
// number that does not match the program, or a duplicate reply for the same call.
func (env *Env) parseOutput(p *prog.Prog) ([]CallInfo, error) {
	const replySize = int(unsafe.Sizeof(callReply{}))
	buf := env.out
	ncmd, ok := readUint32(&buf)
	if !ok {
		return nil, fmt.Errorf("failed to read number of calls")
	}
	infos := make([]CallInfo, len(p.Calls))
	for i := uint32(0); i < ncmd; i++ {
		if len(buf) < replySize {
			return nil, fmt.Errorf("failed to read call %v reply", i)
		}
		// Copy the fixed-size header out of the buffer and step over it.
		reply := *(*callReply)(unsafe.Pointer(&buf[0]))
		buf = buf[replySize:]
		if int(reply.index) >= len(infos) {
			return nil, fmt.Errorf("bad call %v index %v/%v", i, reply.index, len(infos))
		}
		// Cross-check the syscall number against the program.
		want := p.Calls[reply.index].Meta.ID
		if int(reply.num) != want {
			return nil, fmt.Errorf("wrong call %v num %v/%v", i, reply.num, want)
		}
		ci := &infos[reply.index]
		if ci.Flags != 0 || ci.Signal != nil {
			return nil, fmt.Errorf("duplicate reply for call %v/%v/%v", i, reply.index, reply.num)
		}
		ci.Errno = int(reply.errno)
		ci.Flags = CallFlags(reply.flags)
		var fits bool
		ci.Signal, fits = readUint32Array(&buf, reply.signalSize)
		if !fits {
			return nil, fmt.Errorf("call %v/%v/%v: signal overflow: %v/%v",
				i, reply.index, reply.num, reply.signalSize, len(buf))
		}
		ci.Cover, fits = readUint32Array(&buf, reply.coverSize)
		if !fits {
			return nil, fmt.Errorf("call %v/%v/%v: cover overflow: %v/%v",
				i, reply.index, reply.num, reply.coverSize, len(buf))
		}
		comps, err := readComps(&buf, reply.compsSize)
		if err != nil {
			return nil, err
		}
		ci.Comps = comps
	}
	return infos, nil
}
// readComps decodes compsSize comparison records from *outp, advancing *outp past
// the consumed bytes. Every record is a 32-bit type followed by two operands, which
// are 64-bit wide when the size bits of the type equal compSize8 and 32-bit wide otherwise.
// It returns nil when compsSize is 0 and an error for truncated data or an unknown type.
func readComps(outp *[]byte, compsSize uint32) (prog.CompMap, error) {
	if compsSize == 0 {
		return nil, nil
	}
	comps := make(prog.CompMap)
	for idx := uint32(0); idx < compsSize; idx++ {
		kind, ok := readUint32(outp)
		if !ok {
			return nil, fmt.Errorf("failed to read comp %v", idx)
		}
		if kind > compConstMask|compSizeMask {
			return nil, fmt.Errorf("bad comp %v type %v", idx, kind)
		}
		var first, second uint64
		var gotFirst, gotSecond bool
		switch kind & compSizeMask {
		case compSize8:
			first, gotFirst = readUint64(outp)
			second, gotSecond = readUint64(outp)
		default:
			var narrow1, narrow2 uint32
			narrow1, gotFirst = readUint32(outp)
			narrow2, gotSecond = readUint32(outp)
			first, second = uint64(narrow1), uint64(narrow2)
		}
		if !(gotFirst && gotSecond) {
			return nil, fmt.Errorf("failed to read comp %v op", idx)
		}
		if first == second {
			// Comparisons of equal values carry no useful information.
			continue
		}
		comps.AddComp(second, first)
		// A const operand is always placed first by the instrumented callbacks.
		// It can't be an argument of our syscalls (otherwise it wouldn't be const),
		// so the reverse direction is recorded only for non-const comparisons.
		if kind&compConstMask == 0 {
			comps.AddComp(first, second)
		}
	}
	return comps, nil
}
// readUint32 consumes a 32-bit value in native byte order from the front of *outp.
// On success *outp is advanced by 4 bytes and the second result is true;
// if fewer than 4 bytes are available, *outp is left untouched and (0, false) is returned.
func readUint32(outp *[]byte) (uint32, bool) {
	const width = 4
	buf := *outp
	if len(buf) >= width {
		*outp = buf[width:]
		return *(*uint32)(unsafe.Pointer(&buf[0])), true
	}
	return 0, false
}
// readUint64 consumes a 64-bit value in native byte order from the front of *outp.
// On success *outp is advanced by 8 bytes and the second result is true;
// if fewer than 8 bytes are available, *outp is left untouched and (0, false) is returned.
func readUint64(outp *[]byte) (uint64, bool) {
	const width = 8
	buf := *outp
	if len(buf) >= width {
		*outp = buf[width:]
		return *(*uint64)(unsafe.Pointer(&buf[0])), true
	}
	return 0, false
}
// readUint32Array consumes size 32-bit values from the front of *outp and returns
// them as a slice that aliases the buffer memory (no copy is made).
// On success *outp is advanced by size*4 bytes and the second result is true.
// If the buffer holds fewer than size*4 bytes, *outp is left untouched and
// (nil, false) is returned.
// For size 0 the result is an empty non-nil slice, even if the buffer is empty:
// callers use a non-nil slice to tell "array was read" from "nothing was read".
func readUint32Array(outp *[]byte, size uint32) ([]uint32, bool) {
	// maxElems is the length of the array type used to view the buffer below.
	const maxElems = 1 << 28
	if size == 0 {
		// Nothing to map; in particular don't touch out[0] of a possibly empty buffer.
		return []uint32{}, true
	}
	out := *outp
	// Compute the byte length in 64 bits so that it can't wrap around.
	byteLen := uint64(size) * 4
	if size > maxElems || byteLen > uint64(len(out)) {
		return nil, false
	}
	arr := (*[maxElems]uint32)(unsafe.Pointer(&out[0]))
	// The capacity is capped so that appending to the result can't overwrite the buffer.
	res := arr[:size:size]
	*outp = out[byteLen:]
	return res, true
}
// command is a running executor process together with the pipes and temporary
// directory it uses. It is created by makeCommand and destroyed by close.
type command struct {
	pid      int           // environment id, sent to the executor and used in error messages
	config   *Config       // configuration the process was started with
	timeout  time.Duration // per-program timeout after which exec kills the process (see sanitizeTimeout)
	cmd      *exec.Cmd     // the process; set only after it has been started successfully
	dir      string        // temporary working directory of the process, removed in close
	readDone chan []byte   // delivers the captured stderr output once the process stops writing; closed right away when output is not captured
	exited   chan struct{} // closed by wait once the process has been waited for
	inrp     *os.File      // read end of the executor->ipc pipe (executor's stdout)
	outwp    *os.File      // write end of the ipc->executor pipe (executor's stdin)
	outmem   []byte        // output buffer; exec stores call replies received over the pipe here
}
// Magic numbers used to validate messages exchanged with the executor.
const (
	inMagic  = uint64(0xbadc0ffeebadface) // first word of every request sent to the executor
	outMagic = uint32(0xbadf00d)          // first word of every reply expected from the executor
)
// handshakeReq is the first message sent to the executor when the fork server is used.
// It is written to the control pipe as the raw in-memory bytes of the struct.
type handshakeReq struct {
	magic uint64 // always inMagic
	flags uint64 // env flags
	pid   uint64 // id of the environment
}
// handshakeReply is the executor's answer to handshakeReq.
// It is read from the pipe as the raw in-memory bytes of the struct.
type handshakeReply struct {
	magic uint32 // must be outMagic
}
// executeReq asks the executor to run one program.
// It is written to the control pipe as the raw in-memory bytes of the struct.
type executeReq struct {
	magic     uint64 // always inMagic
	envFlags  uint64 // env flags
	execFlags uint64 // exec flags
	pid       uint64 // id of the environment
	faultCall uint64 // ExecOpts.FaultCall
	faultNth  uint64 // ExecOpts.FaultNth
	progSize  uint64 // number of program bytes that follow on the pipe (0 if the program is in shmem)
	// prog follows on pipe or in shmem
}
// executeReply is a message received from the executor while a program is executing.
// It is read from the pipe as the raw in-memory bytes of the struct.
type executeReply struct {
	magic uint32 // must be outMagic
	// If done is 0, then this is call completion message followed by callReply.
	// If done is 1, then program execution is finished and status is set.
	done   uint32
	status uint32
}
// callReply is the fixed-size header that describes the result of a single call.
// It appears both in the output buffer (see parseOutput) and, after an executeReply
// with done == 0, on the pipe (see command.exec).
type callReply struct {
	index      uint32 // call index in the program
	num        uint32 // syscall number (for cross-checking)
	errno      uint32
	flags      uint32 // see CallFlags
	signalSize uint32 // number of 32-bit signal values that follow
	coverSize  uint32 // number of 32-bit cover values that follow
	compsSize  uint32 // number of comparison records that follow
	// signal/cover/comps follow
}
// makeCommand starts the executor binary bin[0] with arguments bin[1:] in a fresh
// temporary directory and wires up its communication channels:
//   - stdin:  ipc->executor command pipe (requests are written via c.outwp),
//   - stdout: executor->ipc command pipe (replies are read via c.inrp),
//   - stderr: os.Stdout in debug mode; a capture pipe drained by a background
//     goroutine when the fork server is used; not captured otherwise,
//   - extra files: inFile and outFile (shared memory), if both are non-nil.
//
// If the fork server is used, the handshake is performed before returning.
// On any error everything created so far (process, pipes, directory) is released.
func makeCommand(pid int, bin []string, config *Config, inFile, outFile *os.File, outmem []byte) (
	*command, error) {
	dir, err := ioutil.TempDir("./", "syzkaller-testdir")
	if err != nil {
		return nil, fmt.Errorf("failed to create temp dir: %v", err)
	}
	dir = osutil.Abs(dir)
	c := &command{
		pid:     pid,
		config:  config,
		timeout: sanitizeTimeout(config),
		dir:     dir,
		outmem:  outmem,
	}
	// Tear down the partially constructed command on every error return.
	defer func() {
		if c != nil {
			c.close()
		}
	}()
	if config.Flags&(FlagSandboxSetuid|FlagSandboxNamespace) != 0 {
		// The sandboxed executor runs as a different user and needs access to the dir.
		if err := os.Chmod(dir, 0777); err != nil {
			return nil, fmt.Errorf("failed to chmod temp dir: %v", err)
		}
	}
	// Output capture pipe.
	rp, wp, err := os.Pipe()
	if err != nil {
		return nil, fmt.Errorf("failed to create pipe: %v", err)
	}
	defer wp.Close()
	// The read end belongs to this function until it is handed over to the reader
	// goroutine below. If that never happens (debug mode, no fork server, or an
	// early error), it must be closed here, otherwise the descriptor leaks.
	ownRP := true
	defer func() {
		if ownRP {
			rp.Close()
		}
	}()
	// executor->ipc command pipe.
	inrp, inwp, err := os.Pipe()
	if err != nil {
		return nil, fmt.Errorf("failed to create pipe: %v", err)
	}
	defer inwp.Close()
	c.inrp = inrp
	// ipc->executor command pipe.
	outrp, outwp, err := os.Pipe()
	if err != nil {
		return nil, fmt.Errorf("failed to create pipe: %v", err)
	}
	defer outrp.Close()
	c.outwp = outwp
	// Buffered so that the reader goroutine never blocks on delivering the output.
	c.readDone = make(chan []byte, 1)
	c.exited = make(chan struct{})
	cmd := osutil.Command(bin[0], bin[1:]...)
	if inFile != nil && outFile != nil {
		cmd.ExtraFiles = []*os.File{inFile, outFile}
	}
	cmd.Env = []string{}
	cmd.Dir = dir
	cmd.Stdin = outrp
	cmd.Stdout = inwp
	if config.Flags&FlagDebug != 0 {
		// Output goes straight to our stdout; receivers of readDone get nil immediately.
		close(c.readDone)
		cmd.Stderr = os.Stdout
	} else if config.Flags&FlagUseForkServer == 0 {
		close(c.readDone)
		// TODO: read out output after execution failure.
	} else {
		cmd.Stderr = wp
		ownRP = false // the goroutine below closes rp when it is done
		go func(c *command) {
			// Read out output in case executor constantly prints something.
			// Only the tail is kept: once the buffer is 3/4 full,
			// the most recent half is moved to the front.
			const bufSize = 128 << 10
			output := make([]byte, bufSize)
			var size uint64
			for {
				n, err := rp.Read(output[size:])
				if n > 0 {
					size += uint64(n)
					if size >= bufSize*3/4 {
						copy(output, output[size-bufSize/2:size])
						size = bufSize / 2
					}
				}
				if err != nil {
					rp.Close()
					c.readDone <- output[:size]
					close(c.readDone)
					return
				}
			}
		}(c)
	}
	if err := cmd.Start(); err != nil {
		return nil, fmt.Errorf("failed to start executor binary: %v", err)
	}
	c.cmd = cmd
	// Close our copies of the write ends, so that reads observe EOF when the process exits.
	wp.Close()
	inwp.Close()
	if c.config.Flags&FlagUseForkServer != 0 {
		if err := c.handshake(); err != nil {
			return nil, err
		}
	}
	tmp := c
	c = nil // disable defer above
	return tmp, nil
}
// close tears the command down: it kills and reaps the process (if it was started),
// removes the temporary directory and closes our ends of the command pipes.
func (c *command) close() {
	if started := c.cmd != nil; started {
		c.cmd.Process.Kill()
		c.wait()
	}
	osutil.RemoveAll(c.dir)
	for _, pipeEnd := range []*os.File{c.inrp, c.outwp} {
		if pipeEnd != nil {
			pipeEnd.Close()
		}
	}
}
// handshake writes a handshakeReq to the executor and waits up to one minute for a
// valid handshakeReply (sandbox setup can take significant time).
// Any failure -- a write error, a read error, a wrong reply magic or the timeout --
// is reported through handshakeError, which also kills the process.
func (c *command) handshake() error {
	req := handshakeReq{
		magic: inMagic,
		flags: uint64(c.config.Flags),
		pid:   uint64(c.pid),
	}
	// The request goes on the wire as the raw bytes of the struct.
	reqBytes := (*[unsafe.Sizeof(req)]byte)(unsafe.Pointer(&req))[:]
	if _, err := c.outwp.Write(reqBytes); err != nil {
		return c.handshakeError(fmt.Errorf("failed to write control pipe: %v", err))
	}
	// The blocking read runs in its own goroutine so that it can be timed out;
	// the channel is buffered so that the goroutine can always finish.
	replied := make(chan error, 1)
	go func() {
		var reply handshakeReply
		replyBytes := (*[unsafe.Sizeof(reply)]byte)(unsafe.Pointer(&reply))[:]
		_, err := io.ReadFull(c.inrp, replyBytes)
		if err == nil && reply.magic != outMagic {
			err = fmt.Errorf("bad handshake reply magic 0x%x", reply.magic)
		}
		replied <- err
	}()
	deadline := time.NewTimer(time.Minute)
	select {
	case <-deadline.C:
		return c.handshakeError(fmt.Errorf("not serving"))
	case err := <-replied:
		deadline.Stop()
		if err == nil {
			return nil
		}
		return c.handshakeError(err)
	}
}
// handshakeError kills the executor, collects its captured output and wraps err
// into an error that carries the environment id and that output.
// If the process terminated with the statusFail exit status, the result is
// an ExecutorFailure with the same message.
func (c *command) handshakeError(err error) error {
	c.cmd.Process.Kill()
	captured := <-c.readDone
	wrapped := fmt.Errorf("executor %v: %v\n%s", c.pid, err, captured)
	c.wait()
	state := c.cmd.ProcessState
	if state == nil || osutil.ProcessExitStatus(state) != statusFail {
		return wrapped
	}
	// Magic value returned by executor.
	return ExecutorFailure(wrapped.Error())
}
// wait reaps the process and returns the result of cmd.Wait.
// It also makes sure c.exited is closed, exactly once, no matter how many times
// wait is called.
func (c *command) wait() error {
	waitErr := c.cmd.Wait()
	select {
	case <-c.exited:
		// Already closed by an earlier call to wait.
		return waitErr
	default:
	}
	close(c.exited)
	return waitErr
}
// exec asks the executor to run one program and waits for the outcome.
//
// It writes an executeReq to the control pipe, followed by progData if it is non-nil
// (a nil progData means that the program was passed via shared memory).
// Then it reads executeReply messages until the executor reports completion or the
// pipe fails, storing call replies that arrive over the pipe into c.outmem.
// If the program does not complete within c.timeout, the process is killed.
//
// Results:
//   - output:  captured executor output; set only when execution did not finish cleanly
//   - failed:  executor has detected a kernel bug (statusError)
//   - hanged:  the timeout fired and the process was killed
//   - restart: the process must not be reused (no fork server, or statusRetry)
//   - err0:    logical executor failure, detected kernel bug or unexpected exit status
func (c *command) exec(opts *ExecOpts, progData []byte) (output []byte, failed, hanged,
	restart bool, err0 error) {
	req := &executeReq{
		magic:     inMagic,
		envFlags:  uint64(c.config.Flags),
		execFlags: uint64(opts.Flags),
		pid:       uint64(c.pid),
		faultCall: uint64(opts.FaultCall),
		faultNth:  uint64(opts.FaultNth),
		progSize:  uint64(len(progData)),
	}
	// The request goes on the wire as the raw bytes of the struct.
	reqData := (*[unsafe.Sizeof(*req)]byte)(unsafe.Pointer(req))[:]
	if _, err := c.outwp.Write(reqData); err != nil {
		output = <-c.readDone
		err0 = fmt.Errorf("executor %v: failed to write control pipe: %v", c.pid, err)
		return
	}
	if progData != nil {
		if _, err := c.outwp.Write(progData); err != nil {
			output = <-c.readDone
			err0 = fmt.Errorf("executor %v: failed to write control pipe: %v", c.pid, err)
			return
		}
	}
	// At this point program is executing.
	// The watchdog goroutine kills the process on timeout. It always sends exactly
	// one value on hang, which every path below receives exactly once.
	done := make(chan bool)
	hang := make(chan bool)
	go func() {
		t := time.NewTimer(c.timeout)
		select {
		case <-t.C:
			c.cmd.Process.Kill()
			hang <- true
		case <-done:
			t.Stop()
			hang <- false
		}
	}()
	restart = c.config.Flags&FlagUseForkServer == 0
	exitStatus := -1
	// The first word of the output buffer counts completed calls,
	// call replies received over the pipe are appended right after it.
	completedCalls := (*uint32)(unsafe.Pointer(&c.outmem[0]))
	outmem := c.outmem[4:]
	for {
		reply := &executeReply{}
		replyData := (*[unsafe.Sizeof(*reply)]byte)(unsafe.Pointer(reply))[:]
		if _, err := io.ReadFull(c.inrp, replyData); err != nil {
			// The pipe is broken or closed; the exit status is determined below.
			break
		}
		if reply.magic != outMagic {
			fmt.Fprintf(os.Stderr, "executor %v: got bad reply magic 0x%x\n", c.pid, reply.magic)
			os.Exit(1)
		}
		if reply.done != 0 {
			exitStatus = int(reply.status)
			break
		}
		callReply := &callReply{}
		callReplyData := (*[unsafe.Sizeof(*callReply)]byte)(unsafe.Pointer(callReply))[:]
		if _, err := io.ReadFull(c.inrp, callReplyData); err != nil {
			break
		}
		if callReply.signalSize != 0 || callReply.coverSize != 0 || callReply.compsSize != 0 {
			// This is unsupported yet.
			fmt.Fprintf(os.Stderr, "executor %v: got call reply with coverage\n", c.pid)
			os.Exit(1)
		}
		copy(outmem, callReplyData)
		outmem = outmem[len(callReplyData):]
		*completedCalls++
	}
	close(done)
	if exitStatus == 0 {
		// Program was OK.
		<-hang
		return
	}
	c.cmd.Process.Kill()
	output = <-c.readDone
	if err := c.wait(); <-hang {
		hanged = true
		// The process may have exited cleanly right when the timer fired,
		// in which case there is no wait error to report.
		if err != nil {
			output = append(output, []byte(err.Error())...)
			output = append(output, '\n')
		}
		return
	}
	if exitStatus == -1 {
		// No completion message was received, fall back to the process exit status.
		exitStatus = osutil.ProcessExitStatus(c.cmd.ProcessState)
		if exitStatus == 0 {
			exitStatus = statusRetry // fuchsia always returns wrong exit status 0
		}
	}
	// Handle magic values returned by executor.
	switch exitStatus {
	case statusFail:
		err0 = ExecutorFailure(fmt.Sprintf("executor %v: failed: %s", c.pid, output))
	case statusError:
		err0 = fmt.Errorf("executor %v: detected kernel bug", c.pid)
		failed = true
	case statusRetry:
		// This is a temporal error (ENOMEM) or an unfortunate
		// program that messes with testing setup (e.g. kills executor
		// loop process). Pretend that nothing happened.
		// It's better than a false crash report.
		err0 = nil
		hanged = false
		restart = true
	default:
		err0 = fmt.Errorf("executor %v: exit status %d", c.pid, exitStatus)
	}
	return
}
// sanitizeTimeout returns the effective per-program timeout for config.
// A zero config.Timeout selects a default: one minute with the fork server,
// 5 seconds without it. With the fork server the result is never smaller
// than 7 seconds (the executor's timeout plus a 2 second margin).
func sanitizeTimeout(config *Config) time.Duration {
	const (
		executorTimeout = 5 * time.Second
		minTimeout      = executorTimeout + 2*time.Second
	)
	forkServer := config.Flags&FlagUseForkServer != 0
	timeout := config.Timeout
	switch {
	case timeout != 0:
		// An explicit timeout is used as is (subject to the lower bound below).
	case forkServer:
		// Executor protects against most hangs, so we use quite large timeout here.
		// Executor can be slow due to global locks in namespaces and other things,
		// so let's better wait than report false misleading crashes.
		timeout = time.Minute
	default:
		// If there is no fork server, executor does not have internal timeout.
		timeout = executorTimeout
	}
	// IPC timeout must be larger than executor timeout.
	// Otherwise IPC will kill parent executor but leave child executor alive.
	if forkServer && timeout < minTimeout {
		timeout = minTimeout
	}
	return timeout
}