From 8f7934d025aeb9d15a3f3267262ed487065b497f Mon Sep 17 00:00:00 2001 From: Alin Sinpalean Date: Fri, 1 Sep 2017 09:45:54 +0200 Subject: [PATCH] Take the fdatasync() syscall out from under mutex lock to (mostly) avoid scrape and eval from blocking on disk I/O. --- wal.go | 33 ++++++++++++++++++++++++++------- 1 file changed, 26 insertions(+), 7 deletions(-) diff --git a/wal.go b/wal.go index 7df01ca8b..773bf51ee 100644 --- a/wal.go +++ b/wal.go @@ -298,22 +298,41 @@ func (w *SegmentWAL) tail() *os.File { // Sync flushes the changes to disk. func (w *SegmentWAL) Sync() error { - w.mtx.Lock() - defer w.mtx.Unlock() + var tail *os.File + var err error + + // Flush the writer and retrieve the reference to the tail segment under mutex lock + func() { + w.mtx.Lock() + defer w.mtx.Unlock() + if err = w.flush(); err != nil { + return + } + tail = w.tail() + } () + + if err != nil { + return err + } - return w.sync() + // But only fsync the tail segment after releasing the mutex as it will block on disk I/O + return fileutil.Fdatasync(tail) } func (w *SegmentWAL) sync() error { - if w.cur == nil { - return nil - } - if err := w.cur.Flush(); err != nil { + if err := w.flush(); err != nil { return err } return fileutil.Fdatasync(w.tail()) } +func (w *SegmentWAL) flush() error { + if w.cur == nil { + return nil + } + return w.cur.Flush() +} + func (w *SegmentWAL) run(interval time.Duration) { var tick <-chan time.Time