grace/grace.go

221 lines
5.1 KiB
Go
Raw Normal View History

2012-06-05 06:21:10 +08:00
// Package grace allows for gracefully waiting for a listener to
// finish serving its active requests.
package grace
import (
"errors"
"fmt"
"net"
"os"
"os/exec"
"os/signal"
"strconv"
"strings"
"sync"
"syscall"
"time"
2012-06-05 06:21:10 +08:00
)
var (
	// ErrNotInheriting is returned by Inherit when we're not inheriting any
	// fds.
	ErrNotInheriting = errors.New("no inherited listeners")

	// ErrAlreadyClosed is returned by the wrapped listener's Accept when
	// Close is in progress.
	ErrAlreadyClosed = errors.New("already closed")

	// timeInPast is a fixed time in the past, used as a deadline to make a
	// pending Accept return immediately.
	timeInPast = time.Date(1983, time.November, 6, 0, 0, 0, 0, time.UTC)
)
const (
	// envCountKey is the environment variable used to indicate a graceful
	// restart in the new process. Restart sets it to the number of listeners
	// handed over and Inherit reads it back.
	envCountKey = "LISTEN_FDS"

	// errClosed is the error text returned by the standard library when the
	// socket is closed. Accept matches it as a suffix of the error message.
	errClosed = "use of closed network connection"
)
// Listener is a net.Listener that provides a graceful Close process and can
// be sent across processes using the underlying file descriptor.
type Listener interface {
	net.Listener

	// File returns the underlying file representing this Listener.
	File() (f *os.File, err error)
}
2012-06-05 06:21:10 +08:00
type listener struct {
Listener
closed bool
closedMutex sync.RWMutex
wg sync.WaitGroup
2012-06-05 06:21:10 +08:00
}
// conn wraps a net.Conn and allows for us to notice when the connection is
// closed: its Close signals the WaitGroup it points to.
type conn struct {
	net.Conn
	wg *sync.WaitGroup
}
func (c conn) Close() error {
err := c.Conn.Close()
c.wg.Done()
return err
2012-06-05 06:21:10 +08:00
}
2012-06-05 12:56:51 +08:00
// Wraps an existing File listener to provide a graceful Close() process.
func NewListener(l Listener) Listener {
return &listener{Listener: l}
2012-06-05 06:21:10 +08:00
}
func (l *listener) Close() error {
l.closedMutex.Lock()
l.closed = true
l.closedMutex.Unlock()
var err error
// Init provided sockets dont actually close so we trigger Accept to return
// by setting the deadline.
if os.Getppid() == 1 {
if ld, ok := l.Listener.(interface {
SetDeadline(t time.Time) error
}); ok {
ld.SetDeadline(timeInPast)
} else {
fmt.Fprintln(os.Stderr, "init activated server did not have SetDeadline")
}
} else {
err = l.Listener.Close()
}
l.wg.Wait()
return err
2012-06-05 06:21:10 +08:00
}
func (l *listener) Accept() (net.Conn, error) {
l.closedMutex.RLock()
if l.closed {
l.closedMutex.RUnlock()
return nil, ErrAlreadyClosed
}
l.closedMutex.RUnlock()
c, err := l.Listener.Accept()
if err != nil {
if strings.HasSuffix(err.Error(), errClosed) {
return nil, ErrAlreadyClosed
}
// We use SetDeadline above to trigger Accept to return when we're trying
// to handoff to a child as part of our restart process. In this scenario
2013-08-21 07:48:43 +08:00
// we want to treat the timeout the same as a Close.
if nerr, ok := err.(net.Error); ok && nerr.Timeout() {
l.closedMutex.RLock()
if l.closed {
l.closedMutex.RUnlock()
return nil, ErrAlreadyClosed
}
l.closedMutex.RUnlock()
}
return nil, err
}
l.wg.Add(1)
return conn{Conn: c, wg: &l.wg}, nil
2012-06-05 06:21:10 +08:00
}
2012-06-05 12:56:51 +08:00
// Wait for signals to gracefully terminate or restart the process.
2012-06-05 06:21:10 +08:00
func Wait(listeners []Listener) (err error) {
ch := make(chan os.Signal, 2)
signal.Notify(ch, syscall.SIGTERM, syscall.SIGUSR2)
for {
sig := <-ch
switch sig {
case syscall.SIGTERM:
var wg sync.WaitGroup
wg.Add(len(listeners))
for _, l := range listeners {
go func(l Listener) {
cErr := l.Close()
if cErr != nil {
err = cErr
2012-06-05 06:21:10 +08:00
}
wg.Done()
}(l)
}
wg.Wait()
return
case syscall.SIGUSR2:
rErr := Restart(listeners)
if rErr != nil {
return rErr
}
}
}
panic("not reached")
}
2012-06-05 12:56:51 +08:00
// Try to inherit listeners from the parent process.
2012-06-05 06:21:10 +08:00
func Inherit() (listeners []Listener, err error) {
countStr := os.Getenv(envCountKey)
if countStr == "" {
return nil, ErrNotInheriting
}
count, err := strconv.Atoi(countStr)
if err != nil {
return nil, err
}
// If we are inheriting, the listeners will begin at fd 3
for i := 3; i < 3+count; i++ {
file := os.NewFile(uintptr(i), "listener")
tmp, err := net.FileListener(file)
file.Close()
if err != nil {
return nil, err
}
l := tmp.(*net.TCPListener)
listeners = append(listeners, NewListener(l))
}
return
}
2012-06-05 12:56:51 +08:00
// CloseParent starts the Close process in the parent. This does not wait for
// the parent to close and simply sends it the TERM signal.
//
// When the parent is pid 1 no signal is sent and nil is returned. Otherwise
// the result of the kill call is returned.
func CloseParent() error {
	ppid := os.Getppid()
	if ppid == 1 { // init provided sockets, for example systemd
		return nil
	}
	return syscall.Kill(ppid, syscall.SIGTERM)
}
2012-06-05 12:56:51 +08:00
// Restart the process passing the given listeners to the new process.
2012-06-05 06:21:10 +08:00
func Restart(listeners []Listener) (err error) {
if len(listeners) == 0 {
return errors.New("restart must be given listeners.")
}
files := make([]*os.File, len(listeners))
for i, l := range listeners {
files[i], err = l.File()
if err != nil {
return err
}
defer files[i].Close()
syscall.CloseOnExec(int(files[i].Fd()))
}
argv0, err := exec.LookPath(os.Args[0])
if err != nil {
return err
}
wd, err := os.Getwd()
if err != nil {
return err
}
allFiles := append([]*os.File{os.Stdin, os.Stdout, os.Stderr}, files...)
allFiles = append(allFiles, nil)
_, err = os.StartProcess(argv0, os.Args, &os.ProcAttr{
Dir: wd,
Env: append(os.Environ(), fmt.Sprintf("%s=%d", envCountKey, len(files))),
Files: allFiles,
})
return err
}