From 3cf3b73ffc6881d5428a735736a347f6e143b366 Mon Sep 17 00:00:00 2001
From: Boris Kolpackov <boris@codesynthesis.com>
Date: Mon, 29 Feb 2016 10:57:40 +0200
Subject: Implement auxiliary dependency database (.d files), use in
 cxx.compile

This is part of the "High Fidelity Build" work.
---
 build2/depdb.cxx | 196 +++++++++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 196 insertions(+)
 create mode 100644 build2/depdb.cxx

(limited to 'build2/depdb.cxx')

diff --git a/build2/depdb.cxx b/build2/depdb.cxx
new file mode 100644
index 0000000..5623405
--- /dev/null
+++ b/build2/depdb.cxx
@@ -0,0 +1,196 @@
+// file      : build2/depdb.cxx -*- C++ -*-
+// copyright : Copyright (c) 2014-2016 Code Synthesis Ltd
+// license   : MIT; see accompanying LICENSE file
+
+#include <build2/depdb>
+
+#include <butl/filesystem> // file_mtime()
+
+using namespace std;
+using namespace butl;
+
+namespace build2
+{
+  depdb::
+  depdb (const path& f)
+      : mtime_ (file_mtime (f)), touch_ (false)
+  {
+    fs_.exceptions (fstream::failbit | fstream::badbit);
+
+    if (mtime_ != timestamp_nonexistent)
+    {
+      // Open an existing file for both reading and (over)writing.
+      //
+      fs_.open (f.string (), fstream::in | fstream::out | fstream::binary);
+      state_ = state::read;
+      fs_.exceptions (fstream::badbit); // read_() checks failbit itself.
+
+      // Read the database format version and (re)write it unless it is "1".
+      //
+      string* l (read ());
+      if (l == nullptr || *l != "1")
+        write ('1');
+    }
+    else
+    {
+      fs_.open (f.string (), fstream::out | fstream::binary); // Create new.
+
+      state_ = state::write;
+      mtime_ = timestamp_unknown;
+
+      write ('1'); // Format version.
+    }
+  }
+
+  void depdb::
+  change (bool flush)
+  {
+    assert (state_ != state::write); // Must not already be writing.
+
+    fs_.clear (); // Reset any eof/fail state left by reading.
+    fs_.exceptions (fstream::failbit | fstream::badbit);
+
+    // Consider this scenario: we are overwriting an old line (so it ends with
+    // a newline and the "end marker") but the operation failed half way
+    // through. Now we have the prefix from the new line, the suffix from the
+    // old, and everything looks valid. So what we need is to somehow
+    // invalidate the old content so that it can never combine with (partial)
+    // new content to form a valid line. One way would be to truncate the file
+    // but that is not straightforward (see note in close()). Alternatively,
+    // we can replace everything with the "end markers".
+    //
+    fs_.seekg (0, fstream::end);
+    fstream::pos_type end (fs_.tellg ()); // End-of-file position.
+
+    if (end != pos_)
+    {
+      fs_.seekp (pos_);
+
+      for (auto i (end - pos_); i != 0; --i)
+        fs_.put ('\0'); // Overwrite old content with "end markers".
+
+      if (flush)
+        fs_.flush ();
+    }
+
+    fs_.seekp (pos_); // Must be done when changing from read to write.
+
+    state_ = state::write;
+    mtime_ = timestamp_unknown;
+  }
+
+  string* depdb::
+  read_ ()
+  {
+    // Save the start position of this line so that we can overwrite it.
+    //
+    pos_ = fs_.tellg ();
+
+    // Note that we intentionally check for eof after updating the write
+    // position.
+    //
+    if (state_ == state::read_eof)
+      return nullptr; // The "end marker" was already seen.
+
+    getline (fs_, line_); // Calls line_.erase().
+
+    // The line should always end with a newline. If it doesn't, then this
+    // line (and the rest of the database) is assumed corrupted. Also peek at
+    // the character after the newline. We should either have the next line or
+    // '\0', which is our "end marker", that is, it indicates the database
+    // was properly closed.
+    //
+    fstream::int_type c;
+    if (fs_.fail () || // Nothing got extracted.
+        fs_.eof ()  || // Eof reached before delimiter.
+        (c = fs_.peek ()) == fstream::traits_type::eof ())
+    {
+      // Preemptively switch to writing. While we could have delayed this
+      // until the user called write(), if the user calls read() again (for
+      // whatever misguided reason) we will mess up the overwrite position.
+      //
+      change ();
+      return nullptr;
+    }
+
+    // Handle the "end marker". Note that the caller can still switch to the
+    // write mode on this line. And, after calling read() again, write to the
+    // next line (i.e., start from the "end marker").
+    //
+    if (c == '\0')
+      state_ = state::read_eof;
+
+    return &line_;
+  }
+
+  void depdb::
+  write (const char* s, size_t n)
+  {
+    // Switch to writing if we are still reading.
+    //
+    if (state_ != state::write)
+      change ();
+
+    fs_.write (s, static_cast<streamsize> (n));
+    fs_.put ('\n'); // Every line must end with a newline (see read_()).
+  }
+
+  void depdb::
+  write (char c)
+  {
+    // Switch to writing if we are still reading.
+    //
+    if (state_ != state::write)
+      change ();
+
+    fs_.put (c);
+    fs_.put ('\n'); // Every line must end with a newline (see read_()).
+  }
+
+  void depdb::
+  close ()
+  {
+    // If we are at eof, then it means all lines are good, there is the "end
+    // marker" at the end, and we don't need to do anything, except, maybe
+    // touch the file. Otherwise, we need to add the "end marker" and, ideally,
+    // truncate the rest (which we currently don't do; see the note below).
+    //
+    if (state_ == state::read_eof)
+    {
+      // While there are utime(2)/utimensat(2) (and probably something similar
+      // for Windows), for now we just overwrite the "end marker". Hopefully
+      // no implementation will be smart enough to recognize this is a no-op
+      // and skip updating mtime (which would probably be incorrect).
+      //
+      // It would be interesting to one day write an implementation that uses
+      // POSIX file I/O, futimens(), and ftruncate() and see how much better it
+      // performs.
+      //
+      if (touch_)
+      {
+        fs_.clear ();
+        fs_.exceptions (fstream::failbit | fstream::badbit);
+        fs_.seekp (0, fstream::cur); // Required to switch from read to write.
+        fs_.put ('\0'); // Rewrite the "end marker" in place.
+      }
+    }
+    else
+    {
+      if (state_ != state::write)
+      {
+        pos_ = fs_.tellg (); // The last line is accepted.
+        change (false); // Don't flush.
+      }
+
+      fs_.put ('\0'); // The "end marker".
+
+      // Truncating an fstream is actually a non-portable pain in the butt.
+      // What if we leave the junk after the "end marker"? These files are
+      // pretty small and chances are they will occupy the filesystem's block
+      // size (usually 4KB) whether they are truncated or not. So it might
+      // actually be faster not to truncate.
+    }
+
+    fs_.close ();
+  }
+}
-- 
cgit v1.1