Use database page size in read replication

This commit is contained in:
Ben Johnson
2022-04-02 11:43:49 -06:00
parent 00bad4308d
commit 8d10881278
4 changed files with 140 additions and 115 deletions

264
http/server.go Normal file
View File

@@ -0,0 +1,264 @@
package http
import (
"fmt"
"io"
"log"
"net"
"net/http"
httppprof "net/http/pprof"
"os"
"strconv"
"strings"
"github.com/benbjohnson/litestream"
"github.com/prometheus/client_golang/prometheus/promhttp"
"golang.org/x/sync/errgroup"
)
// Server represents an HTTP API server for Litestream.
type Server struct {
ln net.Listener
closed bool
httpServer *http.Server
promHandler http.Handler
addr string
server *litestream.Server
g errgroup.Group
Logger *log.Logger
}
func NewServer(server *litestream.Server, addr string) *Server {
s := &Server{
addr: addr,
server: server,
Logger: log.New(os.Stderr, "http: ", litestream.LogFlags),
}
s.promHandler = promhttp.Handler()
s.httpServer = &http.Server{
Handler: http.HandlerFunc(s.serveHTTP),
}
return s
}
func (s *Server) Open() (err error) {
if s.ln, err = net.Listen("tcp", s.addr); err != nil {
return err
}
s.g.Go(func() error {
if err := s.httpServer.Serve(s.ln); err != nil && !s.closed {
return err
}
return nil
})
return nil
}
func (s *Server) Close() (err error) {
s.closed = true
if s.ln != nil {
if e := s.ln.Close(); e != nil && err == nil {
err = e
}
}
if e := s.g.Wait(); e != nil && err == nil {
err = e
}
return err
}
// Port returns the port the listener is running on.
func (s *Server) Port() int {
if s.ln == nil {
return 0
}
return s.ln.Addr().(*net.TCPAddr).Port
}
// URL returns the full base URL for the running server.
func (s *Server) URL() string {
host, _, _ := net.SplitHostPort(s.addr)
if host == "" {
host = "localhost"
}
return fmt.Sprintf("http://%s", net.JoinHostPort(host, fmt.Sprint(s.Port())))
}
func (s *Server) serveHTTP(w http.ResponseWriter, r *http.Request) {
if strings.HasPrefix(r.URL.Path, "/debug/pprof") {
switch r.URL.Path {
case "/debug/pprof/cmdline":
httppprof.Cmdline(w, r)
case "/debug/pprof/profile":
httppprof.Profile(w, r)
case "/debug/pprof/symbol":
httppprof.Symbol(w, r)
case "/debug/pprof/trace":
httppprof.Trace(w, r)
default:
httppprof.Index(w, r)
}
return
}
switch r.URL.Path {
case "/metrics":
s.promHandler.ServeHTTP(w, r)
case "/stream":
switch r.Method {
case http.MethodGet:
s.handleGetStream(w, r)
default:
http.Error(w, "Method not allowed", http.StatusMethodNotAllowed)
}
default:
http.NotFound(w, r)
}
}
func (s *Server) handleGetStream(w http.ResponseWriter, r *http.Request) {
q := r.URL.Query()
// TODO: Listen for all databases matching query criteria.
path := q.Get("path")
if path == "" {
http.Error(w, "Database name required", http.StatusBadRequest)
return
}
db := s.server.DB(path)
if db == nil {
http.Error(w, "Database not found", http.StatusNotFound)
return
}
// Set the page size in the header.
w.Header().Set("Litestream-page-size", strconv.Itoa(db.PageSize()))
// TODO: Restart stream from a previous position, if specified.
// Determine starting position.
pos := db.Pos()
if pos.Generation == "" {
http.Error(w, "No generation available", http.StatusServiceUnavailable)
return
}
pos.Offset = 0
s.Logger.Printf("stream connected @ %s", pos)
defer s.Logger.Printf("stream disconnected")
// Obtain iterator before snapshot so we don't miss any WAL segments.
itr, err := db.WALSegments(r.Context(), pos.Generation)
if err != nil {
http.Error(w, fmt.Sprintf("Cannot obtain WAL iterator: %s", err), http.StatusInternalServerError)
return
}
defer itr.Close()
// Write snapshot to response body.
if err := db.WithFile(func(f *os.File) error {
fi, err := f.Stat()
if err != nil {
return err
}
// Write snapshot header with current position & size.
hdr := litestream.StreamRecordHeader{
Type: litestream.StreamRecordTypeSnapshot,
Generation: pos.Generation,
Index: pos.Index,
Size: fi.Size(),
}
if buf, err := hdr.MarshalBinary(); err != nil {
return fmt.Errorf("marshal snapshot stream record header: %w", err)
} else if _, err := w.Write(buf); err != nil {
return fmt.Errorf("write snapshot stream record header: %w", err)
}
if _, err := io.CopyN(w, f, fi.Size()); err != nil {
return fmt.Errorf("copy snapshot: %w", err)
}
return nil
}); err != nil {
http.Error(w, err.Error(), http.StatusInternalServerError)
return
}
// Flush after snapshot has been written.
w.(http.Flusher).Flush()
for {
// Wait for notification of new entries.
select {
case <-r.Context().Done():
return
case <-itr.NotifyCh():
}
for itr.Next() {
info := itr.WALSegment()
// Skip any segments before our initial position.
if cmp, err := litestream.ComparePos(info.Pos(), pos); err != nil {
s.Logger.Printf("pos compare: %s", err)
return
} else if cmp == -1 {
continue
}
hdr := litestream.StreamRecordHeader{
Type: litestream.StreamRecordTypeWALSegment,
Flags: 0,
Generation: info.Generation,
Index: info.Index,
Offset: info.Offset,
Size: info.Size,
}
// Write record header.
data, err := hdr.MarshalBinary()
if err != nil {
s.Logger.Printf("marshal WAL segment stream record header: %s", err)
return
} else if _, err := w.Write(data); err != nil {
s.Logger.Printf("write WAL segment stream record header: %s", err)
return
}
// Copy WAL segment data to writer.
if err := func() error {
rd, err := db.WALSegmentReader(r.Context(), info.Pos())
if err != nil {
return fmt.Errorf("cannot fetch wal segment reader: %w", err)
}
defer rd.Close()
if _, err := io.CopyN(w, rd, hdr.Size); err != nil {
return fmt.Errorf("cannot copy wal segment: %w", err)
}
return nil
}(); err != nil {
log.Print(err)
return
}
// Flush after WAL segment has been written.
w.(http.Flusher).Flush()
}
if itr.Err() != nil {
s.Logger.Printf("wal iterator error: %s", err)
return
}
}
}