1 files changed, 1394 insertions, 1165 deletions
diff --git a/libbuild2/cc/compile-rule.cxx b/libbuild2/cc/compile-rule.cxx
index 93f05f1..fa46332 100644
--- a/libbuild2/cc/compile-rule.cxx
+++ b/libbuild2/cc/compile-rule.cxx
@@ -3,6 +3,7 @@
 
 #include <libbuild2/cc/compile-rule.hxx>
 
+#include <cerrno>
 #include <cstdlib>  // exit()
 #include <cstring>  // strlen(), strchr(), strncmp()
 
@@ -16,6 +17,7 @@
 #include <libbuild2/algorithm.hxx>
 #include <libbuild2/filesystem.hxx>  // mtime()
 #include <libbuild2/diagnostics.hxx>
+#include <libbuild2/make-parser.hxx>
 
 #include <libbuild2/bin/target.hxx>
 
@@ -174,7 +176,7 @@ namespace build2
       if (s == "includes") return preprocessed::includes;
       if (s == "modules")  return preprocessed::modules;
       if (s == "all")      return preprocessed::all;
-      throw invalid_argument ("invalid preprocessed value '" + s + "'");
+      throw invalid_argument ("invalid preprocessed value '" + s + '\'');
     }
 
     // Return true if the compiler supports -isystem (GCC class) or
@@ -228,11 +230,17 @@ namespace build2
       return nullopt;
     }
 
+    // Note that we don't really need this for clean (where we only need
+    // unrefined unit type) so we could make this update-only. But let's keep
+    // it simple for now. Note that now we do need the source prerequisite
+    // type in clean to deal with Objective-X.
+    //
     struct compile_rule::match_data
     {
-      explicit
-      match_data (unit_type t, const prerequisite_member& s)
-          : type (t), src (s) {}
+      match_data (const compile_rule& r,
+                  unit_type t,
+                  const prerequisite_member& s)
+          : type (t), src (s), rule (r) {}
 
       unit_type type;
       preprocessed pp = preprocessed::none;
@@ -245,39 +253,67 @@ namespace build2
       path dd;                              // Dependency database path.
       size_t header_units = 0;              // Number of imported header units.
       module_positions modules = {0, 0, 0}; // Positions of imported modules.
+
+      const compile_rule& rule;
+
+      target_state
+      operator() (action a, const target& t)
+      {
+        return rule.perform_update (a, t, *this);
+      }
     };
 
     compile_rule::
-    compile_rule (data&& d)
+    compile_rule (data&& d, const scope& rs)
         : common (move (d)),
-          rule_id (string (x) += ".compile 5")
+          rule_id (string (x) += ".compile 6")
     {
-      static_assert (sizeof (match_data) <= target::data_size,
-                     "insufficient space");
+      // Locate the header cache (see enter_header() for details).
+      //
+      {
+        string mn (string (x) + ".config");
+
+        header_cache_ = rs.find_module<config_module> (mn); // Must be there.
+
+        const scope* ws (rs.weak_scope ());
+        if (ws != &rs)
+        {
+          const scope* s (&rs);
+          do
+          {
+            s = s->parent_scope ()->root_scope ();
+
+            if (const auto* m = s->find_module<config_module> (mn))
+              header_cache_ = m;
+
+          } while (s != ws);
+        }
+      }
     }
 
     template <typename T>
     void compile_rule::
     append_sys_hdr_options (T& args) const
     {
-      assert (sys_hdr_dirs_extra <= sys_hdr_dirs.size ());
+      assert (sys_hdr_dirs_mode + sys_hdr_dirs_extra <= sys_hdr_dirs.size ());
 
       // Note that the mode options are added as part of cmode.
       //
       auto b (sys_hdr_dirs.begin () + sys_hdr_dirs_mode);
-      auto m (sys_hdr_dirs.begin () + sys_hdr_dirs_extra);
-      auto e (sys_hdr_dirs.end ());
+      auto x (b + sys_hdr_dirs_extra);
 
+      // Add extras.
+      //
       // Note: starting from 16.10, MSVC gained /external:I option though it
       // doesn't seem to affect the order, only "system-ness".
       //
       append_option_values (
         args,
-        cclass == compiler_class::gcc  ? "-idirafter" :
+        cclass == compiler_class::gcc  ? "-isystem" :
         cclass == compiler_class::msvc ? (isystem (*this)
                                           ? "/external:I"
                                           : "/I") : "-I",
-        m, e,
+        b, x,
         [] (const dir_path& d) {return d.string ().c_str ();});
 
       // For MSVC if we have no INCLUDE environment variable set, then we
@@ -293,7 +329,7 @@ namespace build2
         {
           append_option_values (
             args, "/I",
-            b, m,
+            x, sys_hdr_dirs.end (),
             [] (const dir_path& d) {return d.string ().c_str ();});
         }
       }
@@ -336,10 +372,18 @@ namespace build2
           case unit_type::module_impl:
             {
               o1 = "-x";
-              switch (x_lang)
+
+              if (x_assembler_cpp (md.src))
+                o2 = "assembler-with-cpp";
+              else
               {
-              case lang::c:   o2 = "c";   break;
-              case lang::cxx: o2 = "c++"; break;
+                bool obj (x_objective (md.src));
+
+                switch (x_lang)
+                {
+                case lang::c:   o2 = obj ? "objective-c"   : "c";   break;
+                case lang::cxx: o2 = obj ? "objective-c++" : "c++"; break;
+                }
               }
               break;
             }
@@ -406,7 +450,7 @@ namespace build2
     }
 
     bool compile_rule::
-    match (action a, target& t, const string&) const
+    match (action a, target& t) const
     {
       tracer trace (x, "compile_rule::match");
 
@@ -441,11 +485,13 @@ namespace build2
         //
         if (ut == unit_type::module_header ? p.is_a (**x_hdr) || p.is_a<h> () :
             ut == unit_type::module_intf   ? p.is_a (*x_mod)                  :
-            p.is_a (x_src))
+            p.is_a (x_src)                        ||
+            (x_asp != nullptr && p.is_a (*x_asp)) ||
+            (x_obj != nullptr && p.is_a (*x_obj)))
         {
           // Save in the target's auxiliary storage.
           //
-          t.data (match_data (ut, p));
+          t.data (a, match_data (*this, ut, p));
           return true;
         }
       }
@@ -456,13 +502,16 @@ namespace build2
 
     // Append or hash library options from a pair of *.export.* variables
     // (first is x.* then cc.*) recursively, prerequisite libraries first.
+    // If common is true, then only append common options from the lib{}
+    // groups.
     //
     template <typename T>
     void compile_rule::
     append_library_options (appended_libraries& ls, T& args,
                             const scope& bs,
                             const scope* is, // Internal scope.
-                            action a, const file& l, bool la, linfo li,
+                            action a, const file& l, bool la,
+                            linfo li, bool common,
                             library_cache* lib_cache) const
     {
       struct data
@@ -476,7 +525,7 @@ namespace build2
       //
       auto imp = [] (const target& l, bool la) {return la && l.is_a<libux> ();};
 
-      auto opt = [&d, this] (const target& lt,
+      auto opt = [&d, this] (const target& l, // Note: could be lib{}
                              const string& t, bool com, bool exp)
       {
         // Note that in our model *.export.poptions are always "interface",
@@ -485,8 +534,6 @@ namespace build2
         if (!exp) // Ignore libux.
           return true;
 
-        const file& l (lt.as<file> ());
-
         // Suppress duplicates.
         //
         // Compilation is the simple case: we can add the options on the first
@@ -496,6 +543,8 @@ namespace build2
         if (find (d.ls.begin (), d.ls.end (), &l) != d.ls.end ())
           return false;
 
+        // Note: go straight for the public variable pool.
+        //
         const variable& var (
           com
           ? c_export_poptions
@@ -645,16 +694,24 @@ namespace build2
 
       process_libraries (a, bs, li, sys_lib_dirs,
                          l, la, 0, // lflags unused.
-                         imp, nullptr, opt, false /* self */, lib_cache);
+                         imp, nullptr, opt,
+                         false /* self */,
+                         common /* proc_opt_group */,
+                         lib_cache);
     }
 
     void compile_rule::
     append_library_options (appended_libraries& ls, strings& args,
                             const scope& bs,
-                            action a, const file& l, bool la, linfo li) const
+                            action a, const file& l, bool la,
+                            linfo li,
+                            bool common,
+                            bool original) const
     {
-      const scope* is (isystem (*this) ? effective_iscope (bs) : nullptr);
-      append_library_options (ls, args, bs, is, a, l, la, li, nullptr);
+      const scope* is (!original && isystem (*this)
+                       ? effective_iscope (bs)
+                       : nullptr);
+      append_library_options (ls, args, bs, is, a, l, la, li, common, nullptr);
     }
 
     template <typename T>
@@ -695,7 +752,9 @@ namespace build2
             append_library_options (ls,
                                     args,
                                     bs, iscope (),
-                                    a, *f, la, li,
+                                    a, *f, la,
+                                    li,
+                                    false /* common */,
                                     &lc);
           }
         }
@@ -708,7 +767,7 @@ namespace build2
     void compile_rule::
     append_library_prefixes (appended_libraries& ls, prefix_map& pm,
                              const scope& bs,
-                             action a, target& t, linfo li) const
+                             action a, const target& t, linfo li) const
     {
       struct data
       {
@@ -731,14 +790,23 @@ namespace build2
         if (find (d.ls.begin (), d.ls.end (), &l) != d.ls.end ())
           return false;
 
-        const variable& var (
-          com
-          ? c_export_poptions
-          : (t == x
-             ? x_export_poptions
-             : l.ctx.var_pool[t + ".export.poptions"]));
-
-        append_prefixes (d.pm, l, var);
+        // If this target does not belong to any project (e.g, an "imported as
+        // installed" library), then it can't possibly generate any headers
+        // for us.
+        //
+        if (const scope* rs = l.base_scope ().root_scope ())
+        {
+          // Note: go straight for the public variable pool.
+          //
+          const variable& var (
+            com
+            ? c_export_poptions
+            : (t == x
+               ? x_export_poptions
+               : l.ctx.var_pool[t + ".export.poptions"]));
+
+          append_prefixes (d.pm, *rs, l, var);
+        }
 
         if (com)
           d.ls.push_back (&l);
@@ -770,75 +838,14 @@ namespace build2
 
           process_libraries (a, bs, li, sys_lib_dirs,
                              pt->as<file> (), la, 0, // lflags unused.
-                             impf, nullptr, optf, false /* self */,
+                             impf, nullptr, optf,
+                             false /* self */,
+                             false /* proc_opt_group */,
                              &lib_cache);
         }
       }
     }
 
-    // Update the target during the match phase. Return true if it has changed
-    // or if the passed timestamp is not timestamp_unknown and is older than
-    // the target.
-    //
-    // This function is used to make sure header dependencies are up to date.
-    //
-    // There would normally be a lot of headers for every source file (think
-    // all the system headers) and just calling execute_direct() on all of
-    // them can get expensive. At the same time, most of these headers are
-    // existing files that we will never be updating (again, system headers,
-    // for example) and the rule that will match them is the fallback
-    // file_rule. That rule has an optimization: it returns noop_recipe (which
-    // causes the target state to be automatically set to unchanged) if the
-    // file is known to be up to date. So we do the update "smartly".
-    //
-    static bool
-    update (tracer& trace, action a, const target& t, timestamp ts)
-    {
-      const path_target* pt (t.is_a<path_target> ());
-
-      if (pt == nullptr)
-        ts = timestamp_unknown;
-
-      target_state os (t.matched_state (a));
-
-      if (os == target_state::unchanged)
-      {
-        if (ts == timestamp_unknown)
-          return false;
-        else
-        {
-          // We expect the timestamp to be known (i.e., existing file).
-          //
-          timestamp mt (pt->mtime ());
-          assert (mt != timestamp_unknown);
-          return mt > ts;
-        }
-      }
-      else
-      {
-        // We only want to return true if our call to execute() actually
-        // caused an update. In particular, the target could already have been
-        // in target_state::changed because of a dependency extraction run for
-        // some other source file.
-        //
-        // @@ MT perf: so we are going to switch the phase and execute for
-        //    any generated header.
-        //
-        phase_switch ps (t.ctx, run_phase::execute);
-        target_state ns (execute_direct (a, t));
-
-        if (ns != os && ns != target_state::unchanged)
-        {
-          l6 ([&]{trace << "updated " << t
-                        << "; old state " << os
-                        << "; new state " << ns;});
-          return true;
-        }
-        else
-          return ts != timestamp_unknown ? pt->newer (ts, ns) : false;
-      }
-    }
-
     recipe compile_rule::
     apply (action a, target& xt) const
     {
@@ -846,7 +853,7 @@ namespace build2
 
       file& t (xt.as<file> ()); // Either obj*{} or bmi*{}.
 
-      match_data& md (t.data<match_data> ());
+      match_data& md (t.data<match_data> (a));
 
       context& ctx (t.ctx);
 
@@ -1000,6 +1007,12 @@ namespace build2
             // to match it if we may need its modules or importable headers
             // (see search_modules(), make_header_sidebuild() for details).
             //
+            // Well, that was the case until we've added support for immediate
+            // importation of libraries, which happens during the load phase
+            // and natually leaves the library unmatched. While we could have
+            // returned from search_library() an indication of whether the
+            // library has been matched, this doesn't seem worth the trouble.
+            //
             if (p.proj ())
             {
               pt = search_library (a,
@@ -1007,8 +1020,10 @@ namespace build2
                                    usr_lib_dirs,
                                    p.prerequisite);
 
+#if 0
               if (pt != nullptr && !modules)
                 continue;
+#endif
             }
 
             if (pt == nullptr)
@@ -1063,8 +1078,13 @@ namespace build2
         // match in link::apply() it will be safe unless someone is building
         // an obj?{} target directly.
         //
+        // @@ If for some reason unmatch fails, this messes up the for_install
+        //    logic because we will update this library during match. Perhaps
+        //    we should postpone updating them until execute if we failed to
+        //    unmatch. See how we do this in ad hoc rule.
+        //
         pair<bool, target_state> mr (
-          build2::match (
+          match_complete (
             a,
             *pt,
             pt->is_a<liba> () || pt->is_a<libs> () || pt->is_a<libux> ()
@@ -1098,6 +1118,8 @@ namespace build2
           md.symexport = l ? cast<bool> (l) : symexport;
         }
 
+        // NOTE: see similar code in adhoc_buildscript_rule::apply().
+
         // Make sure the output directory exists.
         //
         // Is this the right thing to do? It does smell a bit, but then we do
@@ -1198,15 +1220,6 @@ namespace build2
 
           append_options (cs, t, c_coptions);
           append_options (cs, t, x_coptions);
-
-          if (ot == otype::s)
-          {
-            // On Darwin, Win32 -fPIC is the default.
-            //
-            if (tclass == "linux" || tclass == "bsd")
-              cs.append ("-fPIC");
-          }
-
           append_options (cs, cmode);
 
           if (md.pp != preprocessed::all)
@@ -1300,7 +1313,7 @@ namespace build2
           //
           l5 ([&]{trace << "extracting headers from " << src;});
           auto& is (tu.module_info.imports);
-          psrc = extract_headers (a, bs, t, li, src, md, dd, u, mt, is);
+          extract_headers (a, bs, t, li, src, md, dd, u, mt, is, psrc);
           is.clear (); // No longer needed.
         }
 
@@ -1475,10 +1488,10 @@ namespace build2
         // to keep re-validating the file on every subsequent dry-run as well
         // on the real run).
         //
-        if (u && dd.reading () && !ctx.dry_run)
-          dd.touch = true;
+        if (u && dd.reading () && !ctx.dry_run_option)
+          dd.touch = timestamp_unknown;
 
-        dd.close ();
+        dd.close (false /* mtime_check */);
         md.dd = move (dd.path);
 
         // If the preprocessed output is suitable for compilation, then pass
@@ -1536,67 +1549,25 @@ namespace build2
 
       switch (a)
       {
-      case perform_update_id: return [this] (action a, const target& t)
-        {
-          return perform_update (a, t);
-        };
-      case perform_clean_id: return [this] (action a, const target& t)
+      case perform_update_id: return move (md);
+      case perform_clean_id:
         {
-          return perform_clean (a, t);
-        };
+          return [this, srct = &md.src.type ()] (action a, const target& t)
+          {
+            return perform_clean (a, t, *srct);
+          };
+        }
       default: return noop_recipe; // Configure update.
       }
     }
 
-    // Reverse-lookup target type(s) from extension.
-    //
-    small_vector<const target_type*, 2> compile_rule::
-    map_extension (const scope& s, const string& n, const string& e) const
-    {
-      // We will just have to try all of the possible ones, in the "most
-      // likely to match" order.
-      //
-      auto test = [&s, &n, &e] (const target_type& tt) -> bool
-      {
-        // Call the extension derivation function. Here we know that it will
-        // only use the target type and name from the target key so we can
-        // pass bogus values for the rest.
-        //
-        target_key tk {&tt, nullptr, nullptr, &n, nullopt};
-
-        // This is like prerequisite search.
-        //
-        optional<string> de (tt.default_extension (tk, s, nullptr, true));
-
-        return de && *de == e;
-      };
-
-      small_vector<const target_type*, 2> r;
-
-      for (const target_type* const* p (x_inc); *p != nullptr; ++p)
-        if (test (**p))
-          r.push_back (*p);
-
-      return r;
-    }
-
     void compile_rule::
-    append_prefixes (prefix_map& m, const target& t, const variable& var) const
+    append_prefixes (prefix_map& m,
+                     const scope& rs, const target& t,
+                     const variable& var) const
     {
       tracer trace (x, "compile_rule::append_prefixes");
 
-      // If this target does not belong to any project (e.g, an "imported as
-      // installed" library), then it can't possibly generate any headers for
-      // us.
-      //
-      const scope& bs (t.base_scope ());
-      const scope* rs (bs.root_scope ());
-      if (rs == nullptr)
-        return;
-
-      const dir_path& out_base (t.dir);
-      const dir_path& out_root (rs->out_path ());
-
       if (auto l = t[var])
       {
         const auto& v (cast<strings> (l));
@@ -1654,113 +1625,8 @@ namespace build2
 
           // If we are not inside our project root, then ignore.
           //
-          if (!d.sub (out_root))
-            continue;
-
-          // If the target directory is a sub-directory of the include
-          // directory, then the prefix is the difference between the
-          // two. Otherwise, leave it empty.
-          //
-          // The idea here is to make this "canonical" setup work auto-
-          // magically:
-          //
-          // 1. We include all files with a prefix, e.g., <foo/bar>.
-          // 2. The library target is in the foo/ sub-directory, e.g.,
-          //    /tmp/foo/.
-          // 3. The poptions variable contains -I/tmp.
-          //
-          dir_path p (out_base.sub (d) ? out_base.leaf (d) : dir_path ());
-
-          // We use the target's directory as out_base but that doesn't work
-          // well for targets that are stashed in subdirectories. So as a
-          // heuristics we are going to also enter the outer directories of
-          // the original prefix. It is, however, possible, that another -I
-          // option after this one will produce one of these outer prefixes as
-          // its original prefix in which case we should override it.
-          //
-          // So we are going to assign the original prefix priority value 0
-          // (highest) and then increment it for each outer prefix.
-          //
-          auto enter = [&trace, &m] (dir_path p, dir_path d, size_t prio)
-          {
-            auto j (m.find (p));
-
-            if (j != m.end ())
-            {
-              prefix_value& v (j->second);
-
-              // We used to reject duplicates but it seems this can be
-              // reasonably expected to work according to the order of the
-              // -I options.
-              //
-              // Seeing that we normally have more "specific" -I paths first,
-              // (so that we don't pick up installed headers, etc), we ignore
-              // it.
-              //
-              if (v.directory == d)
-              {
-                if (v.priority > prio)
-                  v.priority = prio;
-              }
-              else if (v.priority <= prio)
-              {
-                if (verb >= 4)
-                  trace << "ignoring mapping for prefix '" << p << "'\n"
-                        << "  existing mapping to " << v.directory
-                        << " priority " << v.priority << '\n'
-                        << "  another mapping to  " << d
-                        << " priority " << prio;
-              }
-              else
-              {
-                if (verb >= 4)
-                  trace << "overriding mapping for prefix '" << p << "'\n"
-                        << "  existing mapping to " << v.directory
-                        << " priority " << v.priority << '\n'
-                        << "  new mapping to      " << d
-                        << " priority " << prio;
-
-                v.directory = move (d);
-                v.priority = prio;
-              }
-            }
-            else
-            {
-              l6 ([&]{trace << "'" << p << "' -> " << d << " priority "
-                            << prio;});
-              m.emplace (move (p), prefix_value {move (d), prio});
-            }
-          };
-
-#if 1
-          // Enter all outer prefixes, including prefixless.
-          //
-          // The prefixless part is fuzzy but seems to be doing the right
-          // thing ignoring/overriding-wise, at least in cases where one of
-          // the competing -I paths is a subdirectory of another. But the
-          // proper solution will be to keep all the prefixless entries (by
-          // changing prefix_map to a multimap) since for them we have an
-          // extra check (target must be explicitly spelled out in a
-          // buildfile).
-          //
-          for (size_t prio (0);; ++prio)
-          {
-            bool e (p.empty ());
-            enter ((e ? move (p) : p), (e ? move (d) : d), prio);
-            if (e)
-              break;
-            p = p.directory ();
-          }
-#else
-          size_t prio (0);
-          for (bool e (false); !e; ++prio)
-          {
-            dir_path n (p.directory ());
-            e = n.empty ();
-            enter ((e ? move (p) : p), (e ? move (d) : d), prio);
-            p = move (n);
-          }
-#endif
+          if (d.sub (rs.out_path ()))
+            append_prefix (trace, m, t, move (d));
         }
       }
     }
@@ -1768,15 +1634,16 @@ namespace build2
     auto compile_rule::
     build_prefix_map (const scope& bs,
                       action a,
-                      target& t,
+                      const target& t,
                       linfo li) const -> prefix_map
     {
       prefix_map pm;
 
       // First process our own.
       //
-      append_prefixes (pm, t, x_poptions);
-      append_prefixes (pm, t, c_poptions);
+      const scope& rs (*bs.root_scope ());
+      append_prefixes (pm, rs, t, x_poptions);
+      append_prefixes (pm, rs, t, c_poptions);
 
       // Then process the include directories from prerequisite libraries.
       //
@@ -1786,68 +1653,6 @@ namespace build2
       return pm;
     }
 
-    // Return the next make prerequisite starting from the specified
-    // position and update position to point to the start of the
-    // following prerequisite or l.size() if there are none left.
-    //
-    static string
-    next_make (const string& l, size_t& p)
-    {
-      size_t n (l.size ());
-
-      // Skip leading spaces.
-      //
-      for (; p != n && l[p] == ' '; p++) ;
-
-      // Lines containing multiple prerequisites are 80 characters max.
-      //
-      string r;
-      r.reserve (n);
-
-      // Scan the next prerequisite while watching out for escape sequences.
-      //
-      for (; p != n && l[p] != ' '; p++)
-      {
-        char c (l[p]);
-
-        if (p + 1 != n)
-        {
-          if (c == '$')
-          {
-            // Got to be another (escaped) '$'.
-            //
-            if (l[p + 1] == '$')
-              ++p;
-          }
-          else if (c == '\\')
-          {
-            // This may or may not be an escape sequence depending on whether
-            // what follows is "escapable".
-            //
-            switch (c = l[++p])
-            {
-            case '\\': break;
-            case ' ': break;
-            default: c = '\\'; --p; // Restore.
-            }
-          }
-        }
-
-        r += c;
-      }
-
-      // Skip trailing spaces.
-      //
-      for (; p != n && l[p] == ' '; p++) ;
-
-      // Skip final '\'.
-      //
-      if (p == n - 1 && l[p] == '\\')
-        p++;
-
-      return r;
-    }
-
     // VC /showIncludes output. The first line is the file being compiled
     // (unless clang-cl; handled by our caller). Then we have the list of
     // headers, one per line, in this form (text can presumably be
@@ -2043,7 +1848,7 @@ namespace build2
     // Any unhandled io_error is handled by the caller as a generic module
     // mapper io error. Returning false terminates the communication.
     //
-    struct compile_rule::module_mapper_state //@@ gcc_module_mapper_state
+    struct compile_rule::gcc_module_mapper_state
     {
       size_t skip;              // Number of depdb entries to skip.
       size_t header_units = 0;  // Number of header units imported.
@@ -2054,15 +1859,20 @@ namespace build2
       optional<const build2::cc::translatable_headers*> translatable_headers;
 
       small_vector<string, 2> batch; // Reuse buffers.
+      size_t                  batch_n = 0;
 
-      module_mapper_state (size_t s, module_imports& i)
+      gcc_module_mapper_state (size_t s, module_imports& i)
           : skip (s), imports (i) {}
     };
 
-    bool compile_rule::
-    gcc_module_mapper (module_mapper_state& st,
+    // The module mapper is called on one line of input at a time. It should
+    // return nullopt if another line is expected (batch), false if the mapper
+    // interaction should be terminated, and true if it should be continued.
+    //
+    optional<bool> compile_rule::
+    gcc_module_mapper (gcc_module_mapper_state& st,
                        action a, const scope& bs, file& t, linfo li,
-                       ifdstream& is,
+                       const string& l,
                        ofdstream& os,
                        depdb& dd, bool& update, bool& bad_error,
                        optional<prefix_map>& pfx_map, srcout_map& so_map) const
@@ -2078,35 +1888,40 @@ namespace build2
 
       // Read in the entire batch trying hard to reuse the buffers.
       //
-      auto& batch (st.batch);
-      size_t batch_n (0);
+      small_vector<string, 2>& batch (st.batch);
+      size_t& batch_n (st.batch_n);
 
-      for (;;)
+      // Add the next line.
+      //
       {
         if (batch.size () == batch_n)
-          batch.push_back (string ());
-
-        string& r (batch[batch_n]);
-
-        if (eof (getline (is, r)))
-          break;
+          batch.push_back (l);
+        else
+          batch[batch_n] = l;
 
         batch_n++;
+      }
 
-        if (r.back () != ';')
-          break;
+      // Check if more is expected in this batch.
+      //
+      {
+        string& r (batch[batch_n - 1]);
 
-        // Strip the trailing `;` word.
-        //
-        r.pop_back ();
-        r.pop_back ();
-      }
+        if (r.back () == ';')
+        {
+          // Strip the trailing `;` word.
+          //
+          r.pop_back ();
+          r.pop_back ();
 
-      if (batch_n == 0) // EOF
-        return false;
+          return nullopt;
+        }
+      }
 
       if (verb >= 3)
       {
+        // It doesn't feel like buffering this would be useful.
+        //
         // Note that we show `;` in requests/responses so that the result
         // could be replayed.
         //
@@ -2128,23 +1943,211 @@ namespace build2
       for (size_t i (0); i != batch_n; ++i)
       {
         string& r (batch[i]);
+        size_t rn (r.size ());
+
+        // The protocol uses a peculiar quoting/escaping scheme that can be
+        // summarized as follows (see the libcody documentation for details):
+        //
+        // - Words are seperated with spaces and/or tabs.
+        //
+        // - Words need not be quoted if they only containing characters from
+        //   the [-+_/%.A-Za-z0-9] set.
+        //
+        // - Otherwise words need to be single-quoted.
+        //
+        // - Inside single-quoted words, the \n \t \' and \\ escape sequences
+        //   are recognized.
+        //
+        // Note that we currently don't treat abutted quotes (as in a' 'b) as
+        // a single word (it doesn't seem plausible that we will ever receive
+        // something like this).
+        //
+        size_t b (0), e (0), n; bool q; // Next word.
+
+        auto next = [&r, rn, &b, &e, &n, &q] () -> size_t
+        {
+          if (b != e)
+            b = e;
+
+          // Skip leading whitespaces.
+          //
+          for (; b != rn && (r[b] == ' ' || r[b] == '\t'); ++b) ;
+
+          if (b != rn)
+          {
+            q = (r[b] == '\'');
+
+            // Find first trailing whitespace or closing quote.
+            //
+            for (e = b + 1; e != rn; ++e)
+            {
+              // Note that we deal with invalid quoting/escaping in unquote().
+              //
+              switch (r[e])
+              {
+              case ' ':
+              case '\t':
+                if (q)
+                  continue;
+                else
+                  break;
+              case '\'':
+                if (q)
+                {
+                  ++e; // Include closing quote (hopefully).
+                  break;
+                }
+                else
+                {
+                  assert (false); // Abutted quote.
+                  break;
+                }
+              case '\\':
+                if (++e != rn) // Skip next character (hopefully).
+                  continue;
+                else
+                  break;
+              default:
+                continue;
+              }
+
+              break;
+            }
+
+            n = e - b;
+          }
+          else
+          {
+            q = false;
+            e = rn;
+            n = 0;
+          }
+
+          return n;
+        };
+
+        // Unquote into tmp the current word returning false if malformed.
+        //
+        auto unquote = [&r, &b, &n, &q, &tmp] (bool clear = true) -> bool
+        {
+          if (q && n > 1)
+          {
+            size_t e (b + n - 1);
+
+            if (r[b] == '\'' && r[e] == '\'')
+            {
+              if (clear)
+                tmp.clear ();
+
+              size_t i (b + 1);
+              for (; i != e; ++i)
+              {
+                char c (r[i]);
+                if (c == '\\')
+                {
+                  if (++i == e)
+                  {
+                    i = 0;
+                    break;
+                  }
+
+                  c = r[i];
+                  if      (c == 'n') c = '\n';
+                  else if (c == 't') c = '\t';
+                }
+                tmp += c;
+              }
+
+              if (i == e)
+                return true;
+            }
+          }
 
-        // @@ TODO: quoting and escaping.
+          return false;
+        };
+
+#if 0
+#define UNQUOTE(x, y)                     \
+        r = x; rn = r.size (); b = e = 0; \
+        assert (next () && unquote () && tmp == y)
+
+        UNQUOTE ("'foo bar'", "foo bar");
+        UNQUOTE (" 'foo bar' ", "foo bar");
+        UNQUOTE ("'foo\\\\bar'", "foo\\bar");
+        UNQUOTE ("'\\'foo bar'", "'foo bar");
+        UNQUOTE ("'foo bar\\''", "foo bar'");
+        UNQUOTE ("'\\'foo\\\\bar\\''", "'foo\\bar'");
+
+        fail << "all good";
+#endif
+
+        // Escape if necessary the specified string and append to r.
         //
-        size_t b (0), e (0), n; // Next word.
+        auto escape = [&r] (const string& s)
+        {
+          size_t b (0), e, n (s.size ());
+          while (b != n && (e = s.find_first_of ("\\'\n\t", b)) != string::npos)
+          {
+            r.append (s, b, e - b); // Preceding chunk.
+
+            char c (s[e]);
+            r += '\\';
+            r += (c == '\n' ? 'n' : c == '\t' ? 't' : c);
+            b = e + 1;
+          }
+
+          if (b != n)
+            r.append (s, b, e); // Final chunk.
+        };
 
-        auto next = [&r, &b, &e, &n] () -> size_t
+        // Quote and escape if necessary the specified string and append to r.
+        //
+        auto quote = [&r, &escape] (const string& s)
         {
-          return (n = next_word (r, b, e, ' ', '\t'));
+          if (find_if (s.begin (), s.end (),
+                       [] (char c)
+                       {
+                         return !((c >= 'a' && c <= 'z') ||
+                                  (c >= '0' && c <= '9') ||
+                                  (c >= 'A' && c <= 'Z') ||
+                                  c == '-' || c == '_' || c == '/' ||
+                                  c == '.' || c == '+' || c == '%');
+                       }) == s.end ())
+          {
+            r += s;
+          }
+          else
+          {
+            r += '\'';
+            escape (s);
+            r += '\'';
+          }
         };
 
+#if 0
+#define QUOTE(x, y)            \
+        r.clear (); quote (x); \
+        assert (r == y)
+
+        QUOTE ("foo/Bar-7.h", "foo/Bar-7.h");
+
+        QUOTE ("foo bar", "'foo bar'");
+        QUOTE ("foo\\bar", "'foo\\\\bar'");
+        QUOTE ("'foo bar", "'\\'foo bar'");
+        QUOTE ("foo bar'", "'foo bar\\''");
+        QUOTE ("'foo\\bar'", "'\\'foo\\\\bar\\''");
+
+        fail << "all good";
+#endif
+
         next (); // Request name.
 
-        auto name = [&r, b, n] (const char* c) -> bool
+        auto name = [&r, b, n, q] (const char* c) -> bool
         {
           // We can reasonably assume a command will never be quoted.
           //
-          return (r.compare (b, n, c) == 0 &&
+          return (!q                       &&
+                  r.compare (b, n, c) == 0 &&
                   (r[n] == ' '  || r[n] == '\t' || r[n] == '\0'));
         };
 
@@ -2193,7 +2196,17 @@ namespace build2
 
           if (next ())
           {
-            path f (r, b, n);
+            path f;
+            if (!q)
+              f = path (r, b, n);
+            else if (unquote ())
+              f = path (tmp);
+            else
+            {
+              r = "ERROR 'malformed quoting/escaping in request'";
+              continue;
+            }
+
             bool exists (true);
 
             // The TU path we pass to the compiler is always absolute so any
@@ -2204,8 +2217,9 @@ namespace build2
             //
             if (exists && f.relative ())
             {
-              tmp.assign (r, b, n);
-              r = "ERROR relative header path '"; r += tmp; r += '\'';
+              r = "ERROR 'relative header path ";
+              escape (f.string ());
+              r += '\'';
               continue;
             }
 
@@ -2242,16 +2256,17 @@ namespace build2
             try
             {
               pair<const file*, bool> er (
-                enter_header (a, bs, t, li,
-                              move (f), false /* cache */, false /* norm */,
-                              pfx_map, so_map));
+                enter_header (
+                  a, bs, t, li,
+                  move (f), false /* cache */, false /* normalized */,
+                  pfx_map, so_map));
 
               ht = er.first;
               remapped = er.second;
 
               if (remapped)
               {
-                r = "ERROR remapping of headers not supported";
+                r = "ERROR 'remapping of headers not supported'";
                 continue;
               }
 
@@ -2261,14 +2276,14 @@ namespace build2
               // diagnostics won't really add anything to the compiler's. So
               // let's only print it at -V or higher.
               //
-              if (ht == nullptr)
+              if (ht == nullptr) // f is still valid.
               {
                 assert (!exists); // Sanity check.
 
                 if (verb > 2)
                 {
                   diag_record dr;
-                  dr << error << "header '" << f << "' not found and no "
+                  dr << error << "header " << f << " not found and no "
                      << "rule to generate it";
 
                   if (verb < 4)
@@ -2309,8 +2324,10 @@ namespace build2
               // messy, let's keep both (it would have been nicer to print
               // ours after the compiler's but that isn't easy).
               //
-              r = "ERROR unable to update header '";
-              r += (ht != nullptr ? ht->path () : f).string ();
+              // Note: if ht is NULL, f is still valid.
+              //
+              r = "ERROR 'unable to update header ";
+              escape ((ht != nullptr ? ht->path () : f).string ());
               r += '\'';
               continue;
             }
@@ -2445,17 +2462,27 @@ namespace build2
                   // original (which we may need to normalize when we read
                   // this mapping in extract_headers()).
                   //
-                  tmp = "@ "; tmp.append (r, b, n); tmp += ' '; tmp += bp;
+                  // @@ This still breaks if the header path contains spaces.
+                  //    GCC bug 110153.
+                  //
+                  tmp = "@ ";
+                  if (!q) tmp.append (r, b, n);
+                  else    unquote (false /* clear */); // Can't fail.
+                  tmp += ' ';
+                  tmp += bp;
+
                   dd.expect (tmp);
                   st.header_units++;
                 }
 
-                r = "PATHNAME "; r += bp;
+                r = "PATHNAME ";
+                quote (bp);
               }
               catch (const failed&)
               {
                 r = "ERROR 'unable to update header unit for ";
-                r += hs; r += '\'';
+                escape (hs);
+                r += '\'';
                 continue;
               }
             }
@@ -2481,7 +2508,7 @@ namespace build2
         // Truncate the response batch and terminate the communication (see
         // also libcody issue #22).
         //
-        tmp.assign (r, b, n);
+        tmp.assign (r, b, n); // Request name (unquoted).
         r = "ERROR '"; r += w; r += ' '; r += tmp; r += '\'';
         batch_n = i + 1;
         term = true;
@@ -2497,6 +2524,9 @@ namespace build2
 
       // Write the response batch.
       //
+      // @@ It's theoretically possible that we get blocked writing the
+      //    response while the compiler gets blocked writing the diagnostics.
+      //
       for (size_t i (0);; )
       {
         string& r (batch[i]);
@@ -2517,6 +2547,8 @@ namespace build2
 
       os.flush ();
 
+      batch_n = 0; // Start a new batch.
+
       return !term;
     }
 
@@ -2770,9 +2802,10 @@ namespace build2
             if (exists)
             {
               pair<const file*, bool> r (
-                enter_header (a, bs, t, li,
-                              move (f), false /* cache */, false /* norm */,
-                              pfx_map, so_map));
+                enter_header (
+                  a, bs, t, li,
+                  move (f), false /* cache */, false /* normalized */,
+                  pfx_map, so_map));
 
               if (!r.second) // Shouldn't be remapped.
                 ht = r.first;
@@ -2780,7 +2813,7 @@ namespace build2
 
             if (ht != pts.back ())
             {
-              ht = static_cast<const file*> (pts.back ().target);
+              ht = &pts.back ().target->as<file> ();
               rs = "ERROR expected header '" + ht->path ().string () +
                 "' to be found instead";
               bad_error = true; // We expect an error from the compiler.
@@ -2797,9 +2830,10 @@ namespace build2
             try
             {
               pair<const file*, bool> er (
-                enter_header (a, bs, t, li,
-                              move (f), false /* cache */, false /* norm */,
-                              pfx_map, so_map));
+                enter_header (
+                  a, bs, t, li,
+                  move (f), false /* cache */, false /* normalized */,
+                  pfx_map, so_map));
 
               ht = er.first;
               remapped = er.second;
@@ -2817,7 +2851,7 @@ namespace build2
               // diagnostics won't really add anything to the compiler's. So
               // let's only print it at -V or higher.
               //
-              if (ht == nullptr)
+              if (ht == nullptr) // f is still valid.
               {
                 assert (!exists); // Sanity check.
 
@@ -2864,10 +2898,12 @@ namespace build2
               // messy, let's keep both (it would have been nicer to print
               // ours after the compiler's but that isn't easy).
               //
+              // Note: if ht is NULL, f is still valid.
+              //
               rs = !exists
                 ? string ("INCLUDE")
                 : ("ERROR unable to update header '" +
-                   (ht != nullptr ? ht->path () : f).string () + "'");
+                   (ht != nullptr ? ht->path () : f).string () + '\'');
 
               bad_error = true;
               break;
@@ -2945,7 +2981,7 @@ namespace build2
             }
             catch (const failed&)
             {
-              rs = "ERROR unable to update header unit '" + hp + "'";
+              rs = "ERROR unable to update header unit '" + hp + '\'';
               bad_error = true;
               break;
             }
@@ -2987,351 +3023,204 @@ namespace build2
     }
 #endif
 
-    // Enter as a target a header file. Depending on the cache flag, the file
-    // is assumed to either have come from the depdb cache or from the
-    // compiler run.
-    //
-    // Return the header target and an indication of whether it was remapped
-    // or NULL if the header does not exist and cannot be generated. In the
-    // latter case the passed header path is guaranteed to be still valid but
-    // might have been adjusted (e.g., normalized, etc).
+    //atomic_count cache_hit {0};
+    //atomic_count cache_mis {0};
+    //atomic_count cache_cls {0};
+
+    // The fp path is only moved from on success.
     //
     // Note: this used to be a lambda inside extract_headers() so refer to the
     // body of that function for the overall picture.
     //
     pair<const file*, bool> compile_rule::
     enter_header (action a, const scope& bs, file& t, linfo li,
-                  path&& f, bool cache, bool norm,
-                  optional<prefix_map>& pfx_map, srcout_map& so_map) const
+                  path&& fp, bool cache, bool norm,
+                  optional<prefix_map>& pfx_map,
+                  const srcout_map& so_map) const
     {
       tracer trace (x, "compile_rule::enter_header");
 
-      // Find or maybe insert the target. The directory is only moved from if
-      // insert is true. Note that it must be normalized.
-      //
-      auto find = [&trace, &t, this] (dir_path&& d,
-                                      path&& f,
-                                      bool insert) -> const file*
+      // It's reasonable to expect the same header to be included by multiple
+      // translation units, which means we will be re-doing this work over and
+      // over again. And it's not exactly cheap, taking up to 50% of an
+      // up-to-date check time on some projects. So we are going to cache the
+      // header path to target mapping.
+      //
+      // While we pass quite a bit of specific "context" (target, base scope)
+      // to enter_file(), here is the analysis why the result will not depend
+      // on this context for the non-absent header (fp is absolute):
+      //
+      // 1. Let's start with the base scope (bs). Firstly, the base scope
+      //    passed to map_extension() is the scope of the header (i.e., it is
+      //    the scope of fp.directory()). Other than that, the target base
+      //    scope is only passed to build_prefix_map() which is only called
+      //    for the absent header (linfo is also only used here).
+      //
+      // 2. Next is the target (t). It is passed to build_prefix_map() but
+      //    that doesn't matter for the same reason as in (1). Other than
+      //    that, it is only passed to build2::search() which in turn passes
+      //    it to target type-specific prerequisite search callback (see
+      //    target_type::search) if one is not NULL. The target type in
+      //    question here is one of the headers and we know all of them use
+      //    the standard file_search() which ignores the passed target.
+      //
+      // 3. Finally, so_map could be used for an absolute fp. While we could
+      //    simply not cache the result if it was used (second half of the
+      //    result pair is true), there doesn't seem to be any harm in caching
+      //    the remapped path->target mapping. In fact, if to think about it,
+      //    there is no harm in caching the generated file mapping since it
+      //    will be immediately generated and any subsequent inclusions we
+      //    will "see" with an absolute path, which we can resolve from the
+      //    cache.
+      //
+      // To put it another way, all we need to do is make sure that if we were
+      // to not return an existing cache entry, the call to enter_file() would
+      // have returned exactly the same path/target.
+      //
+      // @@ Could it be that the header is re-mapped in one config but not the
+      //    other (e.g., when we do both in src and in out builds and we pick
+      //    the generated header in src)? If so, that would lead to a
+      //    divergence. I.e., we would cache the no-remap case first and then
+      //    return it even though the re-map is necessary? Why can't we just
+      //    check for re-mapping ourselves? A: the remapping logic in
+      //    enter_file() is not exactly trivial.
+      //
+      //    But on the other hand, I think we can assume that different
+      //    configurations will end up with different caches. In other words,
+      //    we can assume that for the same "cc amalgamation" we use only a
+      //    single "version" of a header. Seems reasonable.
+      //
+      // Note also that while it would have been nice to have a unified cc
+      // cache, the map_extension() call is passed x_inc which is module-
+      // specific. In other words, we may end up mapping the same header to
+      // two different targets depending on whether it is included from, say,
+      // C or C++ translation unit. We could have used a unified cache for
+      // headers that were mapped using the fallback target type, which would
+      // cover the installed headers. Maybe, one day (it's also possible that
+      // separate caches reduce contention).
+      //
+      // Another related question is where we want to keep the cache: project,
+      // strong amalgamation, or weak amalgamation (like module sidebuilds).
+      // Some experimentation showed that weak has the best performance (which
+      // suggest that a unified cache will probably be a win).
+      //
+      // Note also that we don't need to clear this cache since we never clear
+      // the targets set. In other words, the only time targets are
+      // invalidated is when we destroy the build context, which also destroys
+      // the cache.
+      //
+      const config_module& hc (*header_cache_);
+
+      // First check the cache.
+      //
+      config_module::header_key hk;
+
+      bool e (fp.absolute ());
+      if (e)
       {
-        // Split the file into its name part and extension. Here we can assume
-        // the name part is a valid filesystem name.
-        //
-        // Note that if the file has no extension, we record an empty
-        // extension rather than NULL (which would signify that the default
-        // extension should be added).
-        //
-        string e (f.extension ());
-        string n (move (f).string ());
-
-        if (!e.empty ())
-          n.resize (n.size () - e.size () - 1); // One for the dot.
-
-        // See if this directory is part of any project and if so determine
-        // the target type.
-        //
-        // While at it also determine if this target is from the src or out
-        // tree of said project.
-        //
-        dir_path out;
-
-        // It's possible the extension-to-target type mapping is ambiguous
-        // (usually because both C and X-language headers use the same .h
-        // extension). In this case we will first try to find one that matches
-        // an explicit target (similar logic to when insert is false).
-        //
-        small_vector<const target_type*, 2> tts;
-
-        // Note that the path can be in out or src directory and the latter
-        // can be associated with multiple scopes. So strictly speaking we
-        // need to pick one that is "associated" with us. But that is still a
-        // TODO (see scope_map::find() for details) and so for now we just
-        // pick the first one (it's highly unlikely the source file extension
-        // mapping will differ based on the configuration).
-        //
-        {
-          const scope& bs (**t.ctx.scopes.find (d).first);
-          if (const scope* rs = bs.root_scope ())
-          {
-            tts = map_extension (bs, n, e);
-
-            if (!bs.out_eq_src () && d.sub (bs.src_path ()))
-              out = out_src (d, *rs);
-          }
-        }
-
-        // If it is outside any project, or the project doesn't have such an
-        // extension, assume it is a plain old C header.
-        //
-        if (tts.empty ())
+        if (!norm)
         {
-          // If the project doesn't "know" this extension then we can't
-          // possibly find an explicit target of this type.
-          //
-          if (!insert)
-            return nullptr;
-
-          tts.push_back (&h::static_type);
+          normalize_external (fp, "header");
+          norm = true;
         }
 
-        // Find or insert target.
-        //
-        // Note that in case of the target type ambiguity we first try to find
-        // an explicit target that resolves this ambiguity.
-        //
-        const target* r (nullptr);
+        hk.file = move (fp);
+        hk.hash = hash<path> () (hk.file);
 
-        if (!insert || tts.size () > 1)
+        slock l (hc.header_map_mutex);
+        auto i (hc.header_map.find (hk));
+        if (i != hc.header_map.end ())
         {
-          // Note that we skip any target type-specific searches (like for an
-          // existing file) and go straight for the target object since we
-          // need to find the target explicitly spelled out.
-          //
-          // Also, it doesn't feel like we should be able to resolve an
-          // absolute path with a spelled-out extension to multiple targets.
-          //
-          for (const target_type* tt: tts)
-            if ((r = t.ctx.targets.find (*tt, d, out, n, e, trace)) != nullptr)
-              break;
-
-          // Note: we can't do this because of the in-source builds where
-          // there won't be explicit targets for non-generated headers.
-          //
-          // This should be harmless, however, since in our world generated
-          // headers are normally spelled-out as explicit targets. And if not,
-          // we will still get an error, just a bit less specific.
-          //
-#if 0
-          if (r == nullptr && insert)
-          {
-            f = d / n;
-            if (!e.empty ())
-            {
-              f += '.';
-              f += e;
-            }
-
-            diag_record dr (fail);
-            dr << "mapping of header " << f << " to target type is ambiguous";
-            for (const target_type* tt: tts)
-              dr << info << "could be " << tt->name << "{}";
-            dr << info << "spell-out its target to resolve this ambiguity";
-          }
-#endif
+          //cache_hit.fetch_add (1, memory_order_relaxed);
+          return make_pair (i->second, false);
         }
 
-        // @@ OPT: move d, out, n
-        //
-        if (r == nullptr && insert)
-          r = &search (t, *tts[0], d, out, n, &e, nullptr);
+        fp = move (hk.file);
 
-        return static_cast<const file*> (r);
-      };
+        //cache_mis.fetch_add (1, memory_order_relaxed);
+      }
 
-      // If it's not absolute then it either does not (yet) exist or is a
-      // relative ""-include (see init_args() for details). Reduce the second
-      // case to absolute.
-      //
-      // Note: we now always use absolute path to the translation unit so this
-      // no longer applies. But let's keep it for posterity.
-      //
-#if 0
-      if (f.relative () && rels.relative ())
+      struct data
       {
-        // If the relative source path has a directory component, make sure
-        // it matches since ""-include will always start with that (none of
-        // the compilers we support try to normalize this path). Failed that
-        // we may end up searching for a generated header in a random
-        // (working) directory.
-        //
-        const string& fs (f.string ());
-        const string& ss (rels.string ());
-
-        size_t p (path::traits::rfind_separator (ss));
-
-        if (p == string::npos || // No directory.
-            (fs.size () > p + 1 &&
-             path::traits::compare (fs.c_str (), p, ss.c_str (), p) == 0))
-        {
-          path t (work / f); // The rels path is relative to work.
-
-          if (exists (t))
-            f = move (t);
-        }
-      }
-#endif
+        linfo li;
+        optional<prefix_map>& pfx_map;
+      } d {li, pfx_map};
+
+      // If it is outside any project, or the project doesn't have such an
+      // extension, assume it is a plain old C header.
+      //
+      auto r (enter_file (
+                trace, "header",
+                a, bs, t,
+                fp, cache, norm,
+                [this] (const scope& bs, const string& n, const string& e)
+                {
+                  return map_extension (bs, n, e, x_inc);
+                },
+                h::static_type,
+                [this, &d] (action a, const scope& bs, const target& t)
+                  -> const prefix_map&
+                {
+                  if (!d.pfx_map)
+                    d.pfx_map = build_prefix_map (bs, a, t, d.li);
 
-      const file* pt (nullptr);
-      bool remapped (false);
+                  return *d.pfx_map;
+                },
+                so_map));
 
-      // If still relative then it does not exist.
+      // Cache.
       //
-      if (f.relative ())
+      if (r.first != nullptr)
       {
-        // This is probably as often an error as an auto-generated file, so
-        // trace at level 4.
-        //
-        l4 ([&]{trace << "non-existent header '" << f << "'";});
-
-        f.normalize ();
-
-        // The relative path might still contain '..' (e.g., ../foo.hxx;
-        // presumably ""-include'ed). We don't attempt to support auto-
-        // generated headers with such inclusion styles.
-        //
-        if (f.normalized ())
-        {
-          if (!pfx_map)
-            pfx_map = build_prefix_map (bs, a, t, li);
-
-          // First try the whole file. Then just the directory.
-          //
-          // @@ Has to be a separate map since the prefix can be the same as
-          //    the file name.
-          //
-          // auto i (pfx_map->find (f));
-
-          // Find the most qualified prefix of which we are a sub-path.
-          //
-          if (!pfx_map->empty ())
-          {
-            dir_path d (f.directory ());
-            auto i (pfx_map->find_sup (d));
+        hk.file = move (fp);
 
-            if (i != pfx_map->end ())
-            {
-              // Note: value in pfx_map is not necessarily canonical.
-              //
-              dir_path pd (i->second.directory);
-              pd.canonicalize ();
-
-              l4 ([&]{trace << "prefix '" << d << "' mapped to " << pd;});
-
-              // If this is a prefixless mapping, then only use it if we can
-              // resolve it to an existing target (i.e., it is explicitly
-              // spelled out in a buildfile).
-              //
-              // Note that at some point we will probably have a list of
-              // directories.
-              //
-              pt = find (pd / d, f.leaf (), !i->first.empty ());
-              if (pt != nullptr)
-              {
-                f = pd / f;
-                l4 ([&]{trace << "mapped as auto-generated " << f;});
-              }
-              else
-                l4 ([&]{trace << "no explicit target in " << pd;});
-            }
-            else
-              l4 ([&]{trace << "no prefix map entry for '" << d << "'";});
-          }
-          else
-            l4 ([&]{trace << "prefix map is empty";});
-        }
-      }
-      else
-      {
-        // Normalize the path unless it comes from the depdb, in which case
-        // we've already done that (normally). This is also where we handle
-        // src-out remap (again, not needed if cached).
+        // Calculate the hash if we haven't yet and re-calculate it if the
+        // path has changed (header has been remapped).
         //
-        if (!cache || norm)
-          normalize_header (f);
+        if (!e || r.second)
+          hk.hash = hash<path> () (hk.file);
 
-        if (!cache)
+        const file* f;
         {
-          if (!so_map.empty ())
-          {
-            // Find the most qualified prefix of which we are a sub-path.
-            //
-            auto i (so_map.find_sup (f));
-            if (i != so_map.end ())
-            {
-              // Ok, there is an out tree for this headers. Remap to a path
-              // from the out tree and see if there is a target for it. Note
-              // that the value in so_map is not necessarily canonical.
-              //
-              dir_path d (i->second);
-              d /= f.leaf (i->first).directory ();
-              d.canonicalize ();
-
-              pt = find (move (d), f.leaf (), false); // d is not moved from.
-
-              if (pt != nullptr)
-              {
-                path p (d / f.leaf ());
-                l4 ([&]{trace << "remapping " << f << " to " << p;});
-                f = move (p);
-                remapped = true;
-              }
-            }
-          }
+          ulock l (hc.header_map_mutex);
+          auto p (hc.header_map.emplace (move (hk), r.first));
+          f = p.second ? nullptr : p.first->second;
         }
 
-        if (pt == nullptr)
+        if (f != nullptr)
         {
-          l6 ([&]{trace << "entering " << f;});
-          pt = find (f.directory (), f.leaf (), true);
+          //cache_cls.fetch_add (1, memory_order_relaxed);
+          assert (r.first == f);
         }
       }
 
-      return make_pair (pt, remapped);
+      return r;
     }
 
-    // Update and add to the list of prerequisite targets a header or header
-    // unit target.
-    //
-    // Return the indication of whether it has changed or, if the passed
-    // timestamp is not timestamp_unknown, is older than the target. If the
-    // header does not exists nor can be generated (no rule), then issue
-    // diagnostics and fail if the fail argument is true and return nullopt
-    // otherwise.
-    //
     // Note: this used to be a lambda inside extract_headers() so refer to the
     // body of that function for the overall picture.
     //
     optional<bool> compile_rule::
     inject_header (action a, file& t,
-                   const file& pt, timestamp mt, bool f /* fail */) const
+                   const file& pt, timestamp mt, bool fail) const
     {
       tracer trace (x, "compile_rule::inject_header");
 
-      // Even if failing we still use try_match() in order to issue consistent
-      // (with extract_headers() below) diagnostics (rather than the generic
-      // "not rule to update ...").
-      //
-      if (!try_match (a, pt).first)
-      {
-        if (!f)
-          return nullopt;
-
-        diag_record dr;
-        dr << fail << "header " << pt << " not found and no rule to "
-           << "generate it";
-
-        if (verb < 4)
-          dr << info << "re-run with --verbose=4 for more information";
-      }
-
-      bool r (update (trace, a, pt, mt));
-
-      // Add to our prerequisite target list.
-      //
-      t.prerequisite_targets[a].push_back (&pt);
-
-      return r;
+      return inject_file (trace, "header", a, t, pt, mt, fail);
     }
 
-    // Extract and inject header dependencies. Return the preprocessed source
-    // file as well as an indication if it is usable for compilation (see
-    // below for details).
+    // Extract and inject header dependencies. Return (in result) the
+    // preprocessed source file as well as an indication if it is usable for
+    // compilation (see below for details). Note that result is expected to
+    // be initialized to {entry (), false}. Not using return type due to
+    // GCC bug #107555.
     //
     // This is also the place where we handle header units which are a lot
     // more like auto-generated headers than modules. In particular, if a
     // header unit BMI is out-of-date, then we have to re-preprocess this
     // translation unit.
     //
-    pair<file_cache::entry, bool> compile_rule::
+    void compile_rule::
     extract_headers (action a,
                      const scope& bs,
                      file& t,
@@ -3341,7 +3230,8 @@ namespace build2
                      depdb& dd,
                      bool& update,
                      timestamp mt,
-                     module_imports& imports) const
+                     module_imports& imports,
+                     pair<file_cache::entry, bool>& result) const
     {
       tracer trace (x, "compile_rule::extract_headers");
 
@@ -3354,19 +3244,16 @@ namespace build2
       file_cache::entry psrc;
       bool puse (true);
 
-      // If things go wrong (and they often do in this area), give the user a
-      // bit extra context.
+      // Preprocessed file extension.
       //
-      auto df = make_diag_frame (
-        [&src](const diag_record& dr)
-        {
-          if (verb != 0)
-            dr << info << "while extracting header dependencies from " << src;
-        });
+      const char* pext (x_assembler_cpp (src) ? ".Si"      :
+                        x_objective (src)     ? x_obj_pext :
+                        x_pext);
 
       // Preprocesor mode that preserves as much information as possible while
       // still performing inclusions. Also serves as a flag indicating whether
-      // this compiler uses the separate preprocess and compile setup.
+      // this (non-MSVC) compiler uses the separate preprocess and compile
+      // setup.
       //
       const char* pp (nullptr);
 
@@ -3377,7 +3264,16 @@ namespace build2
           // -fdirectives-only is available since GCC 4.3.0.
           //
           if (cmaj > 4 || (cmaj == 4 && cmin >= 3))
-            pp = "-fdirectives-only";
+          {
+            // Note that for assembler-with-cpp GCC currently forces full
+            // preprocessing in (what appears to be) an attempt to paper over
+            // a deeper issue (see GCC bug 109534). If/when that bug gets
+            // fixed, we can enable this on our side. Note also that Clang's
+            // -frewrite-includes appear to work correctly on such files.
+            //
+            if (!x_assembler_cpp (src))
+              pp = "-fdirectives-only";
+          }
 
           break;
         }
@@ -3467,7 +3363,7 @@ namespace build2
       //
       // GCC's -fdirective-only, on the other hand, processes all the
       // directives so they are gone from the preprocessed source. Here is
-      // what we are going to do to work around this: we will detect if any
+      // what we are going to do to work around this: we will sense if any
       // diagnostics has been written to stderr on the -E run. If that's the
       // case (but the compiler indicated success) then we assume they are
       // warnings and disable the use of the preprocessed output for
@@ -3496,6 +3392,8 @@ namespace build2
       //
       // So seeing that it is hard to trigger a legitimate VC preprocessor
       // warning, for now, we will just treat them as errors by adding /WX.
+      // BTW, another example of a plausible preprocessor warnings are C4819
+      // and C4828 (character unrepresentable in source charset).
       //
       // Finally, if we are using the module mapper, then all this mess falls
       // away: we only run the compiler once, we let the diagnostics through,
@@ -3503,7 +3401,9 @@ namespace build2
       // not found, and there is no problem with outdated generated headers
       // since we update/remap them before the compiler has a chance to read
       // them. Overall, this "dependency mapper" approach is how it should
-      // have been done from the beginning.
+      // have been done from the beginning. Note: that's the ideal world,
+      // the reality is that the required mapper extensions are not (yet)
+      // in libcody/GCC.
 
       // Note: diagnostics sensing is currently only supported if dependency
       // info is written to a file (see above).
@@ -3513,15 +3413,15 @@ namespace build2
       // And here is another problem: if we have an already generated header
       // in src and the one in out does not yet exist, then the compiler will
       // pick the one in src and we won't even notice. Note that this is not
-      // only an issue with mixing in- and out-of-tree builds (which does feel
+      // only an issue with mixing in and out of source builds (which does feel
       // wrong but is oh so convenient): this is also a problem with
       // pre-generated headers, a technique we use to make installing the
       // generator by end-users optional by shipping pre-generated headers.
       //
       // This is a nasty problem that doesn't seem to have a perfect solution
-      // (except, perhaps, C++ modules). So what we are going to do is try to
-      // rectify the situation by detecting and automatically remapping such
-      // mis-inclusions. It works as follows.
+      // (except, perhaps, C++ modules and/or module mapper). So what we are
+      // going to do is try to rectify the situation by detecting and
+      // automatically remapping such mis-inclusions. It works as follows.
       //
       // First we will build a map of src/out pairs that were specified with
       // -I. Here, for performance and simplicity, we will assume that they
@@ -3534,10 +3434,7 @@ namespace build2
       // case, then we calculate a corresponding header in the out tree and,
       // (this is the most important part), check if there is a target for
       // this header in the out tree. This should be fairly accurate and not
-      // require anything explicit from the user except perhaps for a case
-      // where the header is generated out of nothing (so there is no need to
-      // explicitly mention its target in the buildfile). But this probably
-      // won't be very common.
+      // require anything explicit from the user.
       //
       // One tricky area in this setup are target groups: if the generated
       // sources are mentioned in the buildfile as a group, then there might
@@ -3547,10 +3444,7 @@ namespace build2
       // generated depending on the options (e.g., inline files might be
       // suppressed), headers are usually non-optional.
       //
-      // Note that we use path_map instead of dir_path_map to allow searching
-      // using path (file path).
-      //
-      srcout_map so_map; // path_map<dir_path>
+      srcout_map so_map;
 
       // Dynamic module mapper.
       //
@@ -3558,13 +3452,13 @@ namespace build2
 
       // The gen argument to init_args() is in/out. The caller signals whether
       // to force the generated header support and on return it signals
-      // whether this support is enabled. The first call to init_args is
-      // expected to have gen false.
+      // whether this support is enabled. If gen is false, then stderr is
+      // expected to be either discarded or merged with sdtout.
       //
       // Return NULL if the dependency information goes to stdout and a
       // pointer to the temporary file path otherwise.
       //
-      auto init_args = [a, &t, ot, li, reprocess,
+      auto init_args = [a, &t, ot, li, reprocess, pext,
                         &src, &md, &psrc, &sense_diag, &mod_mapper, &bs,
                         pp, &env, &args, &args_gen, &args_i, &out, &drm,
                         &so_map, this]
@@ -3630,17 +3524,13 @@ namespace build2
           // Populate the src-out with the -I$out_base -I$src_base pairs.
           //
           {
+            srcout_builder builder (ctx, so_map);
+
             // Try to be fast and efficient by reusing buffers as much as
             // possible.
             //
             string ds;
 
-            // Previous -I innermost scope if out_base plus the difference
-            // between the scope path and the -I path (normally empty).
-            //
-            const scope* s (nullptr);
-            dir_path p;
-
             for (auto i (args.begin ()), e (args.end ()); i != e; ++i)
             {
               const char* o (*i);
@@ -3665,7 +3555,7 @@ namespace build2
 
                 if (p == 0)
                 {
-                  s = nullptr;
+                  builder.skip ();
                   continue;
                 }
 
@@ -3698,68 +3588,14 @@ namespace build2
                 //
                 if (!d.empty ())
                 {
-                  // Ignore any paths containing '.', '..' components. Allow
-                  // any directory separators though (think -I$src_root/foo
-                  // on Windows).
-                  //
-                  if (d.absolute () && d.normalized (false))
-                  {
-                    // If we have a candidate out_base, see if this is its
-                    // src_base.
-                    //
-                    if (s != nullptr)
-                    {
-                      const dir_path& bp (s->src_path ());
-
-                      if (d.sub (bp))
-                      {
-                        if (p.empty () || d.leaf (bp) == p)
-                        {
-                          // We've got a pair.
-                          //
-                          so_map.emplace (move (d), s->out_path () / p);
-                          s = nullptr; // Taken.
-                          continue;
-                        }
-                      }
-
-                      // Not a pair. Fall through to consider as out_base.
-                      //
-                      s = nullptr;
-                    }
-
-                    // See if this path is inside a project with an out-of-
-                    // tree build and is in the out directory tree.
-                    //
-                    const scope& bs (ctx.scopes.find_out (d));
-                    if (bs.root_scope () != nullptr)
-                    {
-                      if (!bs.out_eq_src ())
-                      {
-                        const dir_path& bp (bs.out_path ());
-
-                        bool e;
-                        if ((e = (d == bp)) || d.sub (bp))
-                        {
-                          s = &bs;
-                          if (e)
-                            p.clear ();
-                          else
-                            p = d.leaf (bp);
-                        }
-                      }
-                    }
-                  }
-                  else
-                    s = nullptr;
-
-                  ds = move (d).string (); // Move the buffer out.
+                  if (!builder.next (move (d)))
+                    ds = move (d).string (); // Move the buffer back out.
                 }
                 else
-                  s = nullptr;
+                  builder.skip ();
               }
               else
-                s = nullptr;
+                builder.skip ();
             }
           }
 
@@ -3806,19 +3642,41 @@ namespace build2
               append_options (args, cmode);
               append_sys_hdr_options (args); // Extra system header dirs (last).
 
-              // See perform_update() for details on /external:W0, /EHsc, /MD.
+              // Note that for MSVC stderr is merged with stdout and is then
+              // parsed, so no append_diag_color_options() call.
+
+              // See perform_update() for details on the choice of options.
               //
+              {
+                bool sc (find_option_prefixes (
+                           {"/source-charset:", "-source-charset:"}, args));
+                bool ec (find_option_prefixes (
+                           {"/execution-charset:", "-execution-charset:"}, args));
+
+                if (!sc && !ec)
+                  args.push_back ("/utf-8");
+                else
+                {
+                  if (!sc)
+                    args.push_back ("/source-charset:UTF-8");
+
+                  if (!ec)
+                    args.push_back ("/execution-charset:UTF-8");
+                }
+              }
+
               if (cvariant != "clang" && isystem (*this))
               {
-                if (find_option_prefix ("/external:I", args) &&
-                    !find_option_prefix ("/external:W", args))
+                if (find_option_prefixes ({"/external:I", "-external:I"}, args) &&
+                    !find_option_prefixes ({"/external:W", "-external:W"}, args))
                   args.push_back ("/external:W0");
               }
 
-              if (x_lang == lang::cxx && !find_option_prefix ("/EH", args))
+              if (x_lang == lang::cxx &&
+                  !find_option_prefixes ({"/EH", "-EH"}, args))
                 args.push_back ("/EHsc");
 
-              if (!find_option_prefixes ({"/MD", "/MT"}, args))
+              if (!find_option_prefixes ({"/MD", "/MT", "-MD", "-MT"}, args))
                 args.push_back ("/MD");
 
               args.push_back ("/P");            // Preprocess to file.
@@ -3829,7 +3687,7 @@ namespace build2
 
               msvc_sanitize_cl (args);
 
-              psrc = ctx.fcache.create (t.path () + x_pext, !modules);
+              psrc = ctx.fcache->create (t.path () + pext, !modules);
 
               if (fc)
               {
@@ -3848,8 +3706,20 @@ namespace build2
             }
           case compiler_class::gcc:
             {
+              append_options (args, cmode,
+                              cmode.size () - (modules && clang ? 1 : 0));
+              append_sys_hdr_options (args); // Extra system header dirs (last).
+
+              // If not gen, then stderr is discarded.
+              //
+              if (gen)
+                append_diag_color_options (args);
+
               // See perform_update() for details on the choice of options.
               //
+              if (!find_option_prefix ("-finput-charset=", args))
+                args.push_back ("-finput-charset=UTF-8");
+
               if (ot == otype::s)
               {
                 if (tclass == "linux" || tclass == "bsd")
@@ -3878,10 +3748,6 @@ namespace build2
                 }
               }
 
-              append_options (args, cmode,
-                              cmode.size () - (modules && clang ? 1 : 0));
-              append_sys_hdr_options (args); // Extra system header dirs (last).
-
               // Setup the dynamic module mapper if needed.
               //
               // Note that it's plausible in the future we will use it even if
@@ -3973,7 +3839,7 @@ namespace build2
 
                 // Preprocessor output.
                 //
-                psrc = ctx.fcache.create (t.path () + x_pext, !modules);
+                psrc = ctx.fcache->create (t.path () + pext, !modules);
                 args.push_back ("-o");
                 args.push_back (psrc.path ().string ().c_str ());
               }
@@ -4099,15 +3965,12 @@ namespace build2
         // to be inconvenient: some users like to re-run a failed build with
         // -s not to get "swamped" with errors.
         //
-        bool df (!ctx.match_only && !ctx.dry_run_option);
-
-        const file* ht (enter_header (a, bs, t, li,
-                                      move (hp), cache, false /* norm */,
-                                      pfx_map, so_map).first);
-        if (ht == nullptr)
+        auto fail = [&ctx] (const auto& h) -> optional<bool>
         {
+          bool df (!ctx.match_only && !ctx.dry_run_option);
+
           diag_record dr;
-          dr << error << "header '" << hp << "' not found and no rule to "
+          dr << error << "header " << h << " not found and no rule to "
              << "generate it";
 
           if (df)
@@ -4116,41 +3979,44 @@ namespace build2
           if (verb < 4)
             dr << info << "re-run with --verbose=4 for more information";
 
-          if (df) return nullopt; else dr << endf;
-        }
+          if (df)
+            return nullopt;
+          else
+            dr << endf;
+        };
 
-        // If we are reading the cache, then it is possible the file has since
-        // been removed (think of a header in /usr/local/include that has been
-        // uninstalled and now we need to use one from /usr/include). This
-        // will lead to the match failure which we translate to a restart.
-        //
-        if (optional<bool> u = inject_header (a, t, *ht, mt, false /* fail */))
+        if (const file* ht = enter_header (
+              a, bs, t, li,
+              move (hp), cache, cache /* normalized */,
+              pfx_map, so_map).first)
         {
-          // Verify/add it to the dependency database.
+          // If we are reading the cache, then it is possible the file has
+          // since been removed (think of a header in /usr/local/include that
+          // has been uninstalled and now we need to use one from
+          // /usr/include). This will lead to the match failure which we
+          // translate to a restart. And, yes, this case will trip up
+          // inject_header(), not enter_header().
           //
-          if (!cache)
-            dd.expect (ht->path ());
-
-          skip_count++;
-          return *u;
-        }
-        else if (!cache)
-        {
-          diag_record dr;
-          dr << error << "header " << *ht << " not found and no rule to "
-             << "generate it";
-
-          if (df)
-            dr << info << "failure deferred to compiler diagnostics";
-
-          if (verb < 4)
-            dr << info << "re-run with --verbose=4 for more information";
+          if (optional<bool> u = inject_header (a, t, *ht, mt, false /*fail*/))
+          {
+            // Verify/add it to the dependency database.
+            //
+            if (!cache)
+              dd.expect (ht->path ());
 
-          if (df) return nullopt; else dr << endf;
+            skip_count++;
+            return *u;
+          }
+          else if (cache)
+          {
+            dd.write (); // Invalidate this line.
+            return true;
+          }
+          else
+            return fail (*ht);
         }
-
-        dd.write (); // Invalidate this line.
-        return true;
+        else
+          return fail (hp); // hp is still valid.
       };
 
       // As above but for a header unit. Note that currently it is only used
@@ -4167,13 +4033,13 @@ namespace build2
 
         const file* ht (
           enter_header (a, bs, t, li,
-                        move (hp), true /* cache */, true /* norm */,
+                        move (hp), true /* cache */, false /* normalized */,
                         pfx_map, so_map).first);
 
-        if (ht == nullptr)
+        if (ht == nullptr) // hp is still valid.
         {
           diag_record dr;
-          dr << error << "header '" << hp << "' not found and no rule to "
+          dr << error << "header " << hp << " not found and no rule to "
              << "generate it";
 
           if (df)
@@ -4219,6 +4085,16 @@ namespace build2
 
       const path* drmp (nullptr); // Points to drm.path () if active.
 
+      // If things go wrong (and they often do in this area), give the user a
+      // bit extra context.
+      //
+      auto df = make_diag_frame (
+        [&src](const diag_record& dr)
+        {
+          if (verb != 0)
+            dr << info << "while extracting header dependencies from " << src;
+        });
+
       // If nothing so far has invalidated the dependency database, then try
       // the cached data before running the compiler.
       //
@@ -4255,11 +4131,14 @@ namespace build2
               //
               // See apply() for details on the extra MSVC check.
               //
-              return modules && (ctype != compiler_type::msvc ||
-                                 md.type != unit_type::module_intf)
-                ? make_pair (ctx.fcache.create_existing (t.path () + x_pext),
-                             true)
-                : make_pair (file_cache::entry (), false);
+              if (modules && (ctype != compiler_type::msvc ||
+                              md.type != unit_type::module_intf))
+              {
+                result.first = ctx.fcache->create_existing (t.path () + pext);
+                result.second = true;
+              }
+
+              return;
             }
 
             // This can be a header or a header unit (mapping).
@@ -4312,7 +4191,7 @@ namespace build2
 
               // Bail out early if we have deferred a failure.
               //
-              return make_pair (file_cache::entry (), false);
+              return;
             }
           }
         }
@@ -4338,6 +4217,12 @@ namespace build2
 
             process pr;
 
+            // We use the fdstream_mode::skip mode on stdout (cannot be used
+            // on both) and so dbuf must be destroyed (closed) first.
+            //
+            ifdstream is (ifdstream::badbit);
+            diag_buffer dbuf (ctx);
+
             try
             {
               // Assume the preprocessed output (if produced) is usable
@@ -4358,217 +4243,229 @@ namespace build2
               //
               bool good_error (false), bad_error (false);
 
-              // If we have no generated header support, then suppress all
-              // diagnostics (if things go badly we will restart with this
-              // support).
-              //
-              if (drmp == nullptr) // Dependency info goes to stdout.
+              if (mod_mapper) // Dependency info is implied by mapper requests.
               {
-                assert (!sense_diag); // Note: could support with fdselect().
+                assert (gen && !sense_diag); // Not used in this mode.
 
-                // For VC with /P the dependency info and diagnostics all go
-                // to stderr so redirect it to stdout.
+                // Note that here we use the skip mode on the diagnostics
+                // stream which means we have to use own instance of stdout
+                // stream for the correct destruction order (see below).
                 //
-                pr = process (
-                  cpath,
-                  args.data (),
-                  0,
-                  -1,
-                  cclass == compiler_class::msvc ? 1 : gen ? 2 : -2,
-                  nullptr, // CWD
-                  env.empty () ? nullptr : env.data ());
-              }
-              else // Dependency info goes to a temporary file.
-              {
                 pr = process (cpath,
-                              args.data (),
-                              mod_mapper ? -1 : 0,
-                              mod_mapper ? -1 : 2, // Send stdout to stderr.
-                              gen ? 2 : sense_diag ? -1 : -2,
+                              args,
+                              -1,
+                              -1,
+                              diag_buffer::pipe (ctx),
                               nullptr, // CWD
                               env.empty () ? nullptr : env.data ());
 
-                // Monitor for module mapper requests and/or diagnostics. If
-                // diagnostics is detected, mark the preprocessed output as
-                // unusable for compilation.
-                //
-                if (mod_mapper || sense_diag)
+                dbuf.open (args[0],
+                           move (pr.in_efd),
+                           fdstream_mode::non_blocking |
+                           fdstream_mode::skip);
+                try
                 {
-                  module_mapper_state mm_state (skip_count, imports);
+                  gcc_module_mapper_state mm_state (skip_count, imports);
+
+                  // Note that while we read both streams until eof in normal
+                  // circumstances, we cannot use fdstream_mode::skip for the
+                  // exception case on both of them: we may end up being
+                  // blocked trying to read one stream while the process may
+                  // be blocked writing to the other. So in case of an
+                  // exception we only skip the diagnostics and close the
+                  // mapper stream hard. The latter (together with closing of
+                  // the stdin stream) should happen first so the order of
+                  // the following variable is important.
+                  //
+                  // Note also that we open the stdin stream in the blocking
+                  // mode.
+                  //
+                  ifdstream is (move (pr.in_ofd),
+                                fdstream_mode::non_blocking,
+                                ifdstream::badbit); // stdout
+                  ofdstream os (move (pr.out_fd));  // stdin (badbit|failbit)
 
-                  const char* w (nullptr);
-                  try
+                  // Read until we reach EOF on all streams.
+                  //
+                  // Note that if dbuf is not opened, then we automatically
+                  // get an inactive nullfd entry.
+                  //
+                  fdselect_set fds {is.fd (), dbuf.is.fd ()};
+                  fdselect_state& ist (fds[0]);
+                  fdselect_state& dst (fds[1]);
+
+                  bool more (false);
+                  for (string l; ist.fd != nullfd || dst.fd != nullfd; )
                   {
-                    // For now we don't need to do both so let's use a simpler
-                    // blocking implementation. Note that the module mapper
-                    // also needs to be adjusted when switching to the
-                    // non-blocking version.
+                    // @@ Currently we will accept a (potentially truncated)
+                    //    line that ends with EOF rather than newline.
                     //
-#if 1
-                    assert (mod_mapper != sense_diag);
-
-                    if (mod_mapper)
+                    if (ist.fd != nullfd && getline_non_blocking (is, l))
                     {
-                      w = "module mapper request";
-
-                      // Note: the order is important (see the non-blocking
-                      // verison for details).
-                      //
-                      ifdstream is (move (pr.in_ofd),
-                                    fdstream_mode::skip,
-                                    ifdstream::badbit);
-                      ofdstream os (move (pr.out_fd));
-
-                      do
+                      if (eof (is))
                       {
-                        if (!gcc_module_mapper (mm_state,
-                                                a, bs, t, li,
-                                                is, os,
-                                                dd, update, bad_error,
-                                                pfx_map, so_map))
-                          break;
+                        os.close ();
+                        is.close ();
 
-                      } while (!is.eof ());
+                        if (more)
+                          throw_generic_ios_failure (EIO, "unexpected EOF");
 
-                      os.close ();
-                      is.close ();
-                    }
-
-                    if (sense_diag)
-                    {
-                      w = "diagnostics";
-                      ifdstream is (move (pr.in_efd), fdstream_mode::skip);
-                      puse = puse && (is.peek () == ifdstream::traits_type::eof ());
-                      is.close ();
-                    }
-#else
-                    fdselect_set fds;
-                    auto add = [&fds] (const auto_fd& afd) -> fdselect_state*
-                    {
-                      int fd (afd.get ());
-                      fdmode (fd, fdstream_mode::non_blocking);
-                      fds.push_back (fd);
-                      return &fds.back ();
-                    };
-
-                    // Note that while we read both streams until eof in
-                    // normal circumstances, we cannot use fdstream_mode::skip
-                    // for the exception case on both of them: we may end up
-                    // being blocked trying to read one stream while the
-                    // process may be blocked writing to the other. So in case
-                    // of an exception we only skip the diagnostics and close
-                    // the mapper stream hard. The latter should happen first
-                    // so the order of the following variable is important.
-                    //
-                    ifdstream es;
-                    ofdstream os;
-                    ifdstream is;
-
-                    fdselect_state* ds (nullptr);
-                    if (sense_diag)
-                    {
-                      w = "diagnostics";
-                      ds = add (pr.in_efd);
-                      es.open (move (pr.in_efd), fdstream_mode::skip);
-                    }
-
-                    fdselect_state* ms (nullptr);
-                    if (mod_mapper)
-                    {
-                      w = "module mapper request";
-                      ms = add (pr.in_ofd);
-                      is.open (move (pr.in_ofd));
-                      os.open (move (pr.out_fd)); // Note: blocking.
-                    }
-
-                    // Set each state pointer to NULL when the respective
-                    // stream reaches eof.
-                    //
-                    while (ds != nullptr || ms != nullptr)
-                    {
-                      w = "output";
-                      ifdselect (fds);
-
-                      // First read out the diagnostics in case the mapper
-                      // interaction produces more. To make sure we don't get
-                      // blocked by full stderr, the mapper should only handle
-                      // one request at a time.
-                      //
-                      if (ds != nullptr && ds->ready)
+                        ist.fd = nullfd;
+                      }
+                      else
                       {
-                        w = "diagnostics";
-
-                        for (char buf[4096];;)
-                        {
-                          streamsize c (sizeof (buf));
-                          streamsize n (es.readsome (buf, c));
+                        optional<bool> r (
+                          gcc_module_mapper (mm_state,
+                                             a, bs, t, li,
+                                             l, os,
+                                             dd, update, bad_error,
+                                             pfx_map, so_map));
 
-                          if (puse && n > 0)
-                            puse = false;
+                        more = !r.has_value ();
 
-                          if (n < c)
-                            break;
-                        }
-
-                        if (es.eof ())
-                        {
-                          es.close ();
-                          ds->fd = nullfd;
-                          ds = nullptr;
-                        }
-                      }
-
-                      if (ms != nullptr && ms->ready)
-                      {
-                        w = "module mapper request";
-
-                        gcc_module_mapper (mm_state,
-                                           a, bs, t, li,
-                                           is, os,
-                                           dd, update, bad_error,
-                                           pfx_map, so_map);
-                        if (is.eof ())
+                        if (more || *r)
+                          l.clear ();
+                        else
                         {
                           os.close ();
                           is.close ();
-                          ms->fd = nullfd;
-                          ms = nullptr;
+                          ist.fd = nullfd;
                         }
                       }
+
+                      continue;
                     }
-#endif
-                  }
-                  catch (const io_error& e)
-                  {
-                    if (pr.wait ())
-                      fail << "io error handling " << x_lang << " compiler "
-                           << w << ": " << e;
 
-                    // Fall through.
+                    ifdselect (fds);
+
+                    if (dst.ready)
+                    {
+                      if (!dbuf.read ())
+                        dst.fd = nullfd;
+                    }
                   }
 
-                  if (mod_mapper)
-                    md.header_units += mm_state.header_units;
+                  md.header_units += mm_state.header_units;
+                }
+                catch (const io_error& e)
+                {
+                  // Note that diag_buffer handles its own io errors so this
+                  // is about mapper stdin/stdout.
+                  //
+                  if (pr.wait ())
+                    fail << "io error handling " << x_lang << " compiler "
+                         << "module mapper request: " << e;
+
+                  // Fall through.
                 }
 
                 // The idea is to reduce this to the stdout case.
                 //
-                pr.wait ();
-
-                // With -MG we want to read dependency info even if there is
-                // an error (in case an outdated header file caused it). But
-                // with the GCC module mapper an error is non-negotiable, so
-                // to speak, and so we want to skip all of that. In fact, we
-                // now write directly to depdb without generating and then
+                // We now write directly to depdb without generating and then
                 // parsing an intermadiate dependency makefile.
                 //
-                pr.in_ofd = (ctype == compiler_type::gcc && mod_mapper)
-                  ? auto_fd (nullfd)
-                  : fdopen (*drmp, fdopen_mode::in);
+                pr.wait ();
+                pr.in_ofd = nullfd;
               }
+              else
+              {
+                // If we have no generated header support, then suppress all
+                // diagnostics (if things go badly we will restart with this
+                // support).
+                //
+                if (drmp == nullptr) // Dependency info goes to stdout.
+                {
+                  assert (!sense_diag); // Note: could support if necessary.
 
+                  // For VC with /P the dependency info and diagnostics all go
+                  // to stderr so redirect it to stdout.
+                  //
+                  int err (
+                    cclass == compiler_class::msvc ?  1 : // stdout
+                    !gen                           ? -2 : // /dev/null
+                    diag_buffer::pipe (ctx, sense_diag /* force */));
+
+                  pr = process (
+                    cpath,
+                    args,
+                    0,
+                    -1,
+                    err,
+                    nullptr, // CWD
+                    env.empty () ? nullptr : env.data ());
+
+                  if (cclass != compiler_class::msvc && gen)
+                  {
+                    dbuf.open (args[0],
+                               move (pr.in_efd),
+                               fdstream_mode::non_blocking); // Skip on stdout.
+                  }
+                }
+                else // Dependency info goes to temporary file.
+                {
+                  // Since we only need to read from one stream (dbuf) let's
+                  // use the simpler blocking setup.
+                  //
+                  int err (
+                    !gen && !sense_diag ? -2 : // /dev/null
+                    diag_buffer::pipe (ctx, sense_diag /* force */));
+
+                  pr = process (cpath,
+                                args,
+                                0,
+                                2, // Send stdout to stderr.
+                                err,
+                                nullptr, // CWD
+                                env.empty () ? nullptr : env.data ());
+
+                  if (gen || sense_diag)
+                  {
+                    dbuf.open (args[0], move (pr.in_efd));
+                    dbuf.read (sense_diag /* force */);
+                  }
+
+                  if (sense_diag)
+                  {
+                    if (!dbuf.buf.empty ())
+                    {
+                      puse = false;
+                      dbuf.buf.clear (); // Discard.
+                    }
+                  }
+
+                  // The idea is to reduce this to the stdout case.
+                  //
+                  // Note that with -MG we want to read dependency info even
+                  // if there is an error (in case an outdated header file
+                  // caused it).
+                  //
+                  pr.wait ();
+                  pr.in_ofd = fdopen (*drmp, fdopen_mode::in);
+                }
+              }
+
+              // Read and process dependency information, if any.
+              //
               if (pr.in_ofd != nullfd)
               {
+                // We have two cases here: reading from stdout and potentially
+                // stderr (dbuf) or reading from file (see the process startup
+                // code above for details). If we have to read from two
+                // streams, then we have to use the non-blocking setup. But we
+                // cannot use the non-blocking setup uniformly because on
+                // Windows it's only suppored for pipes. So things are going
+                // to get a bit hairy.
+                //
+                // And there is another twist to this: for MSVC we redirect
+                // stderr to stdout since the header dependency information is
+                // part of the diagnostics. If, however, there is some real
+                // diagnostics, we need to pass it through, potentially with
+                // buffering. The way we achieve this is by later opening dbuf
+                // in the EOF state and using it to buffer or stream the
+                // diagnostics.
+                //
+                bool nb (dbuf.is.is_open ());
+
                 // We may not read all the output (e.g., due to a restart).
                 // Before we used to just close the file descriptor to signal
                 // to the other end that we are not interested in the rest.
@@ -4576,20 +4473,69 @@ namespace build2
                 // impolite and complains, loudly (broken pipe). So now we are
                 // going to skip until the end.
                 //
-                ifdstream is (move (pr.in_ofd),
-                              fdstream_mode::text | fdstream_mode::skip,
-                              ifdstream::badbit);
+                // Note that this means we are not using skip on dbuf (see
+                // above for the destruction order details).
+                //
+                {
+                  fdstream_mode m (fdstream_mode::text |
+                                   fdstream_mode::skip);
+
+                  if (nb)
+                    m |= fdstream_mode::non_blocking;
+
+                  is.open (move (pr.in_ofd), m);
+                }
+
+                fdselect_set fds;
+                if (nb)
+                  fds = {is.fd (), dbuf.is.fd ()};
 
                 size_t skip (skip_count);
                 string l, l2; // Reuse.
                 for (bool first (true), second (false); !restart; )
                 {
-                  if (eof (getline (is, l)))
+                  if (nb)
                   {
-                    if (bad_error && !l2.empty ())
-                      text << l2;
+                    fdselect_state& ist (fds[0]);
+                    fdselect_state& dst (fds[1]);
 
-                    break;
+                    // We read until we reach EOF on both streams.
+                    //
+                    if (ist.fd == nullfd && dst.fd == nullfd)
+                      break;
+
+                    if (ist.fd != nullfd && getline_non_blocking (is, l))
+                    {
+                      if (eof (is))
+                      {
+                        ist.fd = nullfd;
+                        continue;
+                      }
+
+                      // Fall through to parse (and clear) the line.
+                    }
+                    else
+                    {
+                      ifdselect (fds);
+
+                      if (dst.ready)
+                      {
+                        if (!dbuf.read ())
+                          dst.fd = nullfd;
+                      }
+
+                      continue;
+                    }
+                  }
+                  else
+                  {
+                    if (eof (getline (is, l)))
+                    {
+                      if (bad_error && !l2.empty ()) // MSVC only (see below).
+                        dbuf.write (l2, true /* newline */);
+
+                      break;
+                    }
                   }
 
                   l6 ([&]{trace << "header dependency line '" << l << "'";});
@@ -4640,9 +4586,15 @@ namespace build2
                             else
                             {
                               l2 = l;
-                              bad_error = true;
+
+                              if (!bad_error)
+                              {
+                                dbuf.open_eof (args[0]);
+                                bad_error = true;
+                              }
                             }
 
+                            l.clear ();
                             continue;
                           }
 
@@ -4652,6 +4604,7 @@ namespace build2
                         }
 
                         first = false;
+                        l.clear ();
                         continue;
                       }
 
@@ -4659,8 +4612,13 @@ namespace build2
 
                       if (f.empty ()) // Some other diagnostics.
                       {
-                        text << l;
-                        bad_error = true;
+                        if (!bad_error)
+                        {
+                          dbuf.open_eof (args[0]);
+                          bad_error = true;
+                        }
+
+                        dbuf.write (l, true /* newline */);
                         break;
                       }
 
@@ -4754,12 +4712,9 @@ namespace build2
                         if (l.empty ()  ||
                             l[0] != '^' || l[1] != ':' || l[2] != ' ')
                         {
-                          // @@ Hm, we don't seem to redirect stderr to stdout
-                          //    for this class of compilers so I wonder why
-                          //    we are doing this?
-                          //
                           if (!l.empty ())
-                            text << l;
+                            l5 ([&]{trace << "invalid header dependency line '"
+                                          << l << "'";});
 
                           bad_error = true;
                           break;
@@ -4774,22 +4729,37 @@ namespace build2
                         // "^: \".
                         //
                         if (l.size () == 4 && l[3] == '\\')
+                        {
+                          l.clear ();
                           continue;
+                        }
                         else
                           pos = 3; // Skip "^: ".
 
                         // Fall through to the 'second' block.
                       }
 
-                      if (second)
-                      {
-                        second = false;
-                        next_make (l, pos); // Skip the source file.
-                      }
-
                       while (pos != l.size ())
                       {
-                        string f (next_make (l, pos));
+                        string f (
+                          make_parser::next (
+                            l, pos, make_parser::type::prereq).first);
+
+                        if (pos != l.size () && l[pos] == ':')
+                        {
+                          l5 ([&]{trace << "invalid header dependency line '"
+                                        << l << "'";});
+                          bad_error = true;
+                          break;
+                        }
+
+                        // Skip the source file.
+                        //
+                        if (second)
+                        {
+                          second = false;
+                          continue;
+                        }
 
                         // Skip until where we left off.
                         //
@@ -4833,19 +4803,56 @@ namespace build2
                   }
 
                   if (bad_error || md.deferred_failure)
+                  {
+                    // Note that it may be tempting to finish reading out the
+                    // diagnostics before bailing out. But that may end up in
+                    // a deadlock if the process gets blocked trying to write
+                    // to stdout.
+                    //
                     break;
+                  }
+
+                  l.clear ();
+                }
+
+                // We may bail out early from the above loop in case of a
+                // restart or error. Which means the stderr stream (dbuf) may
+                // still be open and we need to close it before closing the
+                // stdout stream (which may try to skip).
+                //
+                // In this case we may also end up with incomplete diagnostics
+                // so discard it.
+                //
+                // Generally, it may be tempting to start thinking if we
+                // should discard buffered diagnostics in other cases, such as
+                // restart. But remember that during serial execution it will
+                // go straight to stderr so for consistency (and simplicity)
+                // we should just print it unless there are good reasons not
+                // to (also remember that in the restartable modes we normally
+                // redirect stderr to /dev/null; see the process startup code
+                // for details).
+                //
+                if (dbuf.is.is_open ())
+                {
+                  dbuf.is.close ();
+                  dbuf.buf.clear ();
                 }
 
                 // Bail out early if we have deferred a failure.
                 //
+                // Let's ignore any buffered diagnostics in this case since
+                // it would appear after the deferred failure note.
+                //
                 if (md.deferred_failure)
                 {
                   is.close ();
-                  return make_pair (file_cache::entry (), false);
+                  return;
                 }
 
-                // In case of VC, we are parsing stderr and if things go
-                // south, we need to copy the diagnostics for the user to see.
+                // In case of VC, we are parsing redirected stderr and if
+                // things go south, we need to copy the diagnostics for the
+                // user to see. Note that we should have already opened dbuf
+                // at EOF above.
                 //
                 if (bad_error && cclass == compiler_class::msvc)
                 {
@@ -4860,7 +4867,7 @@ namespace build2
                         l.compare (p.first, 4, "1083") != 0 &&
                         msvc_header_c1083 (l, p))
                     {
-                      diag_stream_lock () << l << endl;
+                      dbuf.write (l, true /* newline */);
                     }
                   }
                 }
@@ -4883,27 +4890,42 @@ namespace build2
 
               if (pr.wait ())
               {
-                if (!bad_error) // Ignore expected successes (we are done).
                 {
-                  if (!restart && psrc)
-                    psrcw.close ();
+                  diag_record dr;
 
-                  continue;
+                  if (bad_error)
+                    dr << fail << "expected error exit status from "
+                       << x_lang << " compiler";
+
+                  if (dbuf.is_open ())
+                    dbuf.close (move (dr)); // Throws if error.
                 }
 
-                fail << "expected error exit status from " << x_lang
-                     << " compiler";
+                // Ignore expected successes (we are done).
+                //
+                if (!restart && psrc)
+                  psrcw.close ();
+
+                continue;
               }
               else if (pr.exit->normal ())
               {
                 if (good_error) // Ignore expected errors (restart).
+                {
+                  if (dbuf.is_open ())
+                    dbuf.close ();
+
                   continue;
+                }
               }
 
               // Fall through.
             }
             catch (const io_error& e)
             {
+              // Ignore buffered diagnostics (since reading it could be the
+              // cause of this failure).
+              //
               if (pr.wait ())
                 fail << "unable to read " << x_lang << " compiler header "
                      << "dependency output: " << e;
@@ -4912,18 +4934,23 @@ namespace build2
             }
 
             assert (pr.exit && !*pr.exit);
-            const process_exit& e (*pr.exit);
+            const process_exit& pe (*pr.exit);
 
             // For normal exit we assume the child process issued some
             // diagnostics.
             //
-            if (e.normal ())
+            if (pe.normal ())
             {
-              // If this run was with the generated header support then we
-              // have issued diagnostics and it's time to give up.
+              // If this run was with the generated header support then it's
+              // time to give up.
               //
               if (gen)
+              {
+                if (dbuf.is_open ())
+                  dbuf.close (args, pe, 2 /* verbosity */);
+
                 throw failed ();
+              }
 
               // Just to recap, being here means something is wrong with the
               // source: it can be a missing generated header, it can be an
@@ -4941,7 +4968,12 @@ namespace build2
               // or will issue diagnostics.
               //
               if (restart)
+              {
+                if (dbuf.is_open ())
+                  dbuf.close ();
+
                 l6 ([&]{trace << "trying again without generated headers";});
+              }
               else
               {
                 // In some pathological situations we may end up switching
@@ -4966,19 +4998,24 @@ namespace build2
                 // example, because we have removed all the partially
                 // preprocessed source files).
                 //
-                if (force_gen_skip && *force_gen_skip == skip_count)
                 {
-                  diag_record dr (fail);
+                  diag_record dr;
+                  if (force_gen_skip && *force_gen_skip == skip_count)
+                  {
+                    dr <<
+                      fail << "inconsistent " << x_lang << " compiler behavior" <<
+                      info << "run the following two commands to investigate";
 
-                  dr << "inconsistent " << x_lang << " compiler behavior" <<
-                    info << "run the following two commands to investigate";
+                    dr << info;
+                    print_process (dr, args.data ()); // No pipes.
 
-                  dr << info;
-                  print_process (dr, args.data ()); // No pipes.
+                    init_args ((gen = true));
+                    dr << info << "";
+                    print_process (dr, args.data ()); // No pipes.
+                  }
 
-                  init_args ((gen = true));
-                  dr << info << "";
-                  print_process (dr, args.data ()); // No pipes.
+                  if (dbuf.is_open ())
+                    dbuf.close (move (dr)); // Throws if error.
                 }
 
                 restart = true;
@@ -4989,7 +5026,15 @@ namespace build2
               continue;
             }
             else
-              run_finish (args, pr); // Throws.
+            {
+              if (dbuf.is_open ())
+              {
+                dbuf.close (args, pe, 2 /* verbosity */);
+                throw failed ();
+              }
+              else
+                run_finish (args, pr, 2 /* verbosity */);
+            }
           }
           catch (const process_error& e)
           {
@@ -5015,7 +5060,9 @@ namespace build2
       dd.expect ("");
 
       puse = puse && !reprocess && psrc;
-      return make_pair (move (psrc), puse);
+
+      result.first = move (psrc);
+      result.second = puse;
     }
 
     // Return the translation unit information (last argument) and its
@@ -5128,19 +5175,41 @@ namespace build2
               append_options (args, cmode);
               append_sys_hdr_options (args);
 
-              // See perform_update() for details on /external:W0, /EHsc, /MD.
+              // Note: no append_diag_color_options() call since the
+              // diagnostics is discarded.
+
+              // See perform_update() for details on the choice of options.
               //
+              {
+                bool sc (find_option_prefixes (
+                           {"/source-charset:", "-source-charset:"}, args));
+                bool ec (find_option_prefixes (
+                           {"/execution-charset:", "-execution-charset:"}, args));
+
+                if (!sc && !ec)
+                  args.push_back ("/utf-8");
+                else
+                {
+                  if (!sc)
+                    args.push_back ("/source-charset:UTF-8");
+
+                  if (!ec)
+                    args.push_back ("/execution-charset:UTF-8");
+                }
+              }
+
               if (cvariant != "clang" && isystem (*this))
               {
-                if (find_option_prefix ("/external:I", args) &&
-                    !find_option_prefix ("/external:W", args))
+                if (find_option_prefixes ({"/external:I", "-external:I"}, args) &&
+                    !find_option_prefixes ({"/external:W", "-external:W"}, args))
                   args.push_back ("/external:W0");
               }
 
-              if (x_lang == lang::cxx && !find_option_prefix ("/EH", args))
+              if (x_lang == lang::cxx &&
+                  !find_option_prefixes ({"/EH", "-EH"}, args))
                 args.push_back ("/EHsc");
 
-              if (!find_option_prefixes ({"/MD", "/MT"}, args))
+              if (!find_option_prefixes ({"/MD", "/MT", "-MD", "-MT"}, args))
                 args.push_back ("/MD");
 
               args.push_back ("/E");
@@ -5154,6 +5223,18 @@ namespace build2
             }
           case compiler_class::gcc:
             {
+              append_options (args, cmode,
+                              cmode.size () - (modules && clang ? 1 : 0));
+              append_sys_hdr_options (args);
+
+              // Note: no append_diag_color_options() call since the
+              // diagnostics is discarded.
+
+              // See perform_update() for details on the choice of options.
+              //
+              if (!find_option_prefix ("-finput-charset=", args))
+                args.push_back ("-finput-charset=UTF-8");
+
               if (ot == otype::s)
               {
                 if (tclass == "linux" || tclass == "bsd")
@@ -5182,10 +5263,6 @@ namespace build2
                 }
               }
 
-              append_options (args, cmode,
-                              cmode.size () - (modules && clang ? 1 : 0));
-              append_sys_hdr_options (args);
-
               args.push_back ("-E");
               append_lang_options (args, md);
 
@@ -5194,12 +5271,36 @@ namespace build2
               //
               if (ps)
               {
-                if (ctype == compiler_type::gcc)
+                switch (ctype)
                 {
-                  // Note that only these two *plus* -x do the trick.
-                  //
-                  args.push_back ("-fpreprocessed");
-                  args.push_back ("-fdirectives-only");
+                case compiler_type::gcc:
+                  {
+                    // Note that only these two *plus* -x do the trick.
+                    //
+                    args.push_back ("-fpreprocessed");
+                    args.push_back ("-fdirectives-only");
+                    break;
+                  }
+                case compiler_type::clang:
+                  {
+                    // See below for details.
+                    //
+                    if (ctype == compiler_type::clang &&
+                        cmaj >= (cvariant != "apple" ? 15 : 16))
+                    {
+                      if (find_options ({"-pedantic",  "-pedantic-errors",
+                                         "-Wpedantic", "-Werror=pedantic"},
+                                        args))
+                      {
+                        args.push_back ("-Wno-gnu-line-marker");
+                      }
+                    }
+
+                    break;
+                  }
+                case compiler_type::msvc:
+                case compiler_type::icc:
+                  assert (false);
                 }
               }
 
@@ -5253,10 +5354,10 @@ namespace build2
               print_process (args);
 
             // We don't want to see warnings multiple times so ignore all
-            // diagnostics.
+            // diagnostics (thus no need for diag_buffer).
             //
             pr = process (cpath,
-                          args.data (),
+                          args,
                           0, -1, -2,
                           nullptr, // CWD
                           env.empty () ? nullptr : env.data ());
@@ -5326,7 +5427,15 @@ namespace build2
             // accurate (parts of the translation unit could have been
             // #ifdef'ed out; see __build2_preprocess).
             //
-            return reprocess ? string () : move (p.checksum);
+            // Also, don't use the checksum for header units since it ignores
+            // preprocessor directives and may therefore cause us to ignore a
+            // change to an exported macro. @@ TODO: maybe we should add a
+            // flag to the parser not to waste time calculating the checksum
+            // in these cases.
+            //
+            return reprocess || ut == unit_type::module_header
+              ? string ()
+              : move (p.checksum);
           }
 
           // Fall through.
@@ -5357,7 +5466,7 @@ namespace build2
             info << "then run failing command to display compiler diagnostics";
         }
         else
-          run_finish (args, pr); // Throws.
+          run_finish (args, pr, 2 /* verbosity */); // Throws.
       }
       catch (const process_error& e)
       {
@@ -5770,10 +5879,11 @@ namespace build2
       // 1. There is no good place in prerequisite_targets to store the
       //    exported flag (no, using the marking facility across match/execute
       //    is a bad idea). So what we are going to do is put re-exported
-      //    bmi{}s at the back and store (in the target's data pad) the start
-      //    position. One bad aspect about this part is that we assume those
-      //    bmi{}s have been matched by the same rule. But let's not kid
-      //    ourselves, there will be no other rule that matches bmi{}s.
+      //    bmi{}s at the back and store (in the target's auxiliary data
+      //    storage) the start position. One bad aspect about this part is
+      //    that we assume those bmi{}s have been matched by the same
+      //    rule. But let's not kid ourselves, there will be no other rule
+      //    that matches bmi{}s.
       //
       //    @@ I think now we could use prerequisite_targets::data for this?
       //
@@ -6160,11 +6270,11 @@ namespace build2
 
         // Hash (we know it's a file).
         //
-        cs.append (static_cast<const file&> (*bt).path ().string ());
+        cs.append (bt->as<file> ().path ().string ());
 
         // Copy over bmi{}s from our prerequisites weeding out duplicates.
         //
-        if (size_t j = bt->data<match_data> ().modules.start)
+        if (size_t j = bt->data<match_data> (a).modules.start)
         {
           // Hard to say whether we should reserve or not. We will probably
           // get quite a bit of duplications.
@@ -6186,7 +6296,7 @@ namespace build2
                          }) == imports.end ())
             {
               pts.push_back (et);
-              cs.append (static_cast<const file&> (*et).path ().string ());
+              cs.append (et->as<file> ().path ().string ());
 
               // Add to the list of imports for further duplicate suppression.
               // We could have stored reference to the name (e.g., in score)
@@ -6226,6 +6336,9 @@ namespace build2
       // cc.config module and that is within our amalgmantion seems like a
       // good place.
       //
+      // @@ TODO: maybe we should cache this in compile_rule ctor like we
+      //          do for the header cache?
+      //
       const scope* as (&rs);
       {
         const scope* ws (as->weak_scope ());
@@ -6241,7 +6354,7 @@ namespace build2
             // This is also the module that registers the scope operation
             // callback that cleans up the subproject.
             //
-            if (cast_false<bool> ((*s)["cc.core.vars.loaded"]))
+            if (cast_false<bool> (s->vars["cc.core.vars.loaded"]))
               as = s;
 
           } while (s != ws);
@@ -6377,7 +6490,10 @@ namespace build2
       ps.push_back (prerequisite (lt));
       for (prerequisite_member p: group_prerequisite_members (a, lt))
       {
-        if (include (a, lt, p) != include_type::normal) // Excluded/ad hoc.
+        // Ignore update=match.
+        //
+        lookup l;
+        if (include (a, lt, p, &l) != include_type::normal) // Excluded/ad hoc.
           continue;
 
         if (p.is_a<libx> () ||
@@ -6394,8 +6510,9 @@ namespace build2
                 move (mf),
                 nullopt,     // Use default extension.
                 target_decl::implied,
-                trace));
-      file& bt (static_cast<file&> (p.first));
+                trace,
+                true /* skip_find */));
+      file& bt (p.first.as<file> ());
 
       // Note that this is racy and someone might have created this target
       // while we were preparing the prerequisite list.
@@ -6526,7 +6643,9 @@ namespace build2
               //
               process_libraries (a, bs, nullopt, sys_lib_dirs,
                                  *f, la, 0, // lflags unused.
-                                 imp, lib, nullptr, true /* self */,
+                                 imp, lib, nullptr,
+                                 true /* self */,
+                                 false /* proc_opt_group */,
                                  &lib_cache);
 
               if (lt != nullptr)
@@ -6611,7 +6730,10 @@ namespace build2
         //
         for (prerequisite_member p: group_prerequisite_members (a, t))
         {
-          if (include (a, t, p) != include_type::normal) // Excluded/ad hoc.
+          // Ignore update=match.
+          //
+          lookup l;
+          if (include (a, t, p, &l) != include_type::normal) // Excluded/ad hoc.
             continue;
 
           if (p.is_a<libx> () ||
@@ -6629,8 +6751,9 @@ namespace build2
                 move (mf),
                 nullopt,     // Use default extension.
                 target_decl::implied,
-                trace));
-      file& bt (static_cast<file&> (p.first));
+                trace,
+                true /* skip_find */));
+      file& bt (p.first.as<file> ());
 
       // Note that this is racy and someone might have created this target
       // while we were preparing the prerequisite list.
@@ -6668,7 +6791,7 @@ namespace build2
     // Filter cl.exe noise (msvc.cxx).
     //
     void
-    msvc_filter_cl (ifdstream&, const path& src);
+    msvc_filter_cl (diag_buffer&, const path& src);
 
     // Append header unit-related options.
     //
@@ -6898,12 +7021,11 @@ namespace build2
     }
 
     target_state compile_rule::
-    perform_update (action a, const target& xt) const
+    perform_update (action a, const target& xt, match_data& md) const
     {
       const file& t (xt.as<file> ());
       const path& tp (t.path ());
 
-      match_data md (move (t.data<match_data> ()));
       unit_type ut (md.type);
 
       context& ctx (t.ctx);
@@ -6926,9 +7048,6 @@ namespace build2
           },
           md.modules.copied)); // See search_modules() for details.
 
-      const file& s (pr.second);
-      const path* sp (&s.path ());
-
       // Force recompilation in case of a deferred failure even if nothing
       // changed.
       //
@@ -6945,11 +7064,14 @@ namespace build2
         return *pr.first;
       }
 
+      const file& s (pr.second);
+      const path* sp (&s.path ());
+
       // Make sure depdb is no older than any of our prerequisites (see md.mt
       // logic description above for details). Also save the sequence start
       // time if doing mtime checks (see the depdb::check_mtime() call below).
       //
-      timestamp start (depdb::mtime_check ()
+      timestamp start (!ctx.dry_run && depdb::mtime_check ()
                        ? system_clock::now ()
                        : timestamp_unknown);
 
@@ -7016,7 +7138,6 @@ namespace build2
       small_vector<string, 2> module_args; // Module options storage.
 
       size_t out_i (0);  // Index of the -o option.
-      size_t lang_n (0); // Number of lang options.
 
       switch (cclass)
       {
@@ -7037,13 +7158,40 @@ namespace build2
           if (md.pp != preprocessed::all)
             append_sys_hdr_options (args); // Extra system header dirs (last).
 
+          // Note: could be overridden in mode.
+          //
+          append_diag_color_options (args);
+
+          // Set source/execution charsets to UTF-8 unless a custom charset
+          // is specified.
+          //
+          // Note that clang-cl supports /utf-8 and /*-charset.
+          //
+          {
+            bool sc (find_option_prefixes (
+                       {"/source-charset:", "-source-charset:"}, args));
+            bool ec (find_option_prefixes (
+                       {"/execution-charset:", "-execution-charset:"}, args));
+
+            if (!sc && !ec)
+              args.push_back ("/utf-8");
+            else
+            {
+              if (!sc)
+                args.push_back ("/source-charset:UTF-8");
+
+              if (!ec)
+                args.push_back ("/execution-charset:UTF-8");
+            }
+          }
+
           // If we have any /external:I options but no /external:Wn, then add
           // /external:W0 to emulate the -isystem semantics.
           //
           if (cvariant != "clang" && isystem (*this))
           {
-            if (find_option_prefix ("/external:I", args) &&
-                !find_option_prefix ("/external:W", args))
+            if (find_option_prefixes ({"/external:I", "-external:I"}, args) &&
+                !find_option_prefixes ({"/external:W", "-external:W"}, args))
               args.push_back ("/external:W0");
           }
 
@@ -7057,7 +7205,9 @@ namespace build2
           // For C looks like no /EH* (exceptions supported but no C++ objects
           // destroyed) is a reasonable default.
           //
-          if (x_lang == lang::cxx && !find_option_prefix ("/EH", args))
+
+          if (x_lang == lang::cxx &&
+              !find_option_prefixes ({"/EH", "-EH"}, args))
             args.push_back ("/EHsc");
 
           // The runtime is a bit more interesting. At first it may seem like
@@ -7079,7 +7229,7 @@ namespace build2
           // unreasonable thing to do). So by default we will always use the
           // release runtime.
           //
-          if (!find_option_prefixes ({"/MD", "/MT"}, args))
+          if (!find_option_prefixes ({"/MD", "/MT", "-MD", "-MT"}, args))
             args.push_back ("/MD");
 
           msvc_sanitize_cl (args);
@@ -7104,7 +7254,7 @@ namespace build2
           //
           // @@ MOD: TODO deal with absent relo.
           //
-          if (find_options ({"/Zi", "/ZI"}, args))
+          if (find_options ({"/Zi", "/ZI", "-Zi", "-ZI"}, args))
           {
             if (fc)
               args.push_back ("/Fd:");
@@ -7150,6 +7300,65 @@ namespace build2
         }
       case compiler_class::gcc:
         {
+          append_options (args, cmode);
+
+          // Clang 15 introduced the unqualified-std-cast-call warning which
+          // warns about unqualified calls to std::move() and std::forward()
+          // (because they can be "hijacked" via ADL). Surprisingly, this
+          // warning is enabled by default, as opposed to with -Wextra or at
+          // least -Wall. It has also proven to be quite disruptive, causing a
+          // large number of warnings in a large number of packages. So we are
+          // going to "remap" it to -Wextra for now and in the future may
+          // "relax" it to -Wall and potentially to being enabled by default.
+          // See GitHub issue #259 for background and details.
+          //
+          if (x_lang == lang::cxx           &&
+              ctype == compiler_type::clang &&
+              cmaj >= 15)
+          {
+            bool w (false);       // Seen -W[no-]unqualified-std-cast-call
+            optional<bool> extra; // Seen -W[no-]extra
+
+            for (const char* s: reverse_iterate (args))
+            {
+              if (s != nullptr)
+              {
+                if (strcmp (s, "-Wunqualified-std-cast-call") == 0 ||
+                    strcmp (s, "-Wno-unqualified-std-cast-call") == 0)
+                {
+                  w = true;
+                  break;
+                }
+
+                if (!extra) // Last seen option wins.
+                {
+                  if      (strcmp (s, "-Wextra") == 0) extra = true;
+                  else if (strcmp (s, "-Wno-extra") == 0) extra = false;
+                }
+              }
+            }
+
+            if (!w && (!extra || !*extra))
+              args.push_back ("-Wno-unqualified-std-cast-call");
+          }
+
+          if (md.pp != preprocessed::all)
+            append_sys_hdr_options (args); // Extra system header dirs (last).
+
+          // Note: could be overridden in mode.
+          //
+          append_diag_color_options (args);
+
+          // Set the input charset to UTF-8 unless a custom one is specified.
+          //
+          // Note that the execution charset (-fexec-charset) is UTF-8 by
+          // default.
+          //
+          // Note that early versions of Clang only recognize uppercase UTF-8.
+          //
+          if (!find_option_prefix ("-finput-charset=", args))
+            args.push_back ("-finput-charset=UTF-8");
+
           if (ot == otype::s)
           {
             // On Darwin, Win32 -fPIC is the default.
@@ -7253,11 +7462,6 @@ namespace build2
             }
           }
 
-          append_options (args, cmode);
-
-          if (md.pp != preprocessed::all)
-            append_sys_hdr_options (args); // Extra system header dirs (last).
-
           append_header_options (env, args, header_args, a, t, md, md.dd);
           append_module_options (env, args, module_args, a, t, md, md.dd);
 
@@ -7332,7 +7536,7 @@ namespace build2
             args.push_back ("-c");
           }
 
-          lang_n = append_lang_options (args, md);
+          append_lang_options (args, md);
 
           if (md.pp == preprocessed::all)
           {
@@ -7381,19 +7585,32 @@ namespace build2
       // the source file, not its preprocessed version (so that it's easy to
       // copy and re-run, etc). Only at level 3 and above print the real deal.
       //
+      // @@ TODO: why don't we print env (here and/or below)? Also link rule.
+      //
       if (verb == 1)
-        text << x_name << ' ' << s;
+      {
+        const char* name (x_assembler_cpp (s) ? "as-cpp"   :
+                          x_objective (s)     ? x_obj_name :
+                          x_name);
+
+        print_diag (name, s, t);
+      }
       else if (verb == 2)
         print_process (args);
 
       // If we have the (partially) preprocessed output, switch to that.
       //
-      bool psrc (md.psrc);
+      // But we remember the original source/position to restore later.
+      //
+      bool psrc (md.psrc); // Note: false if cc.reprocess.
       bool ptmp (psrc && md.psrc.temporary);
+      pair<size_t, const char*> osrc;
       if (psrc)
       {
         args.pop_back (); // nullptr
+        osrc.second = args.back ();
         args.pop_back (); // sp
+        osrc.first = args.size ();
 
         sp = &md.psrc.path ();
 
@@ -7403,25 +7620,40 @@ namespace build2
         {
         case compiler_type::gcc:
           {
-            // The -fpreprocessed is implied by .i/.ii. But not when compiling
-            // a header unit (there is no .hi/.hii).
+            // -fpreprocessed is implied by .i/.ii unless compiling a header
+            // unit (there is no .hi/.hii). Also, we would need to pop -x
+            // since it takes precedence over the extension, which would mess
+            // up our osrc logic. So in the end it feels like always passing
+            // explicit -fpreprocessed is the way to go.
             //
-            if (ut == unit_type::module_header)
-              args.push_back ("-fpreprocessed");
-            else
-              // Pop -x since it takes precedence over the extension.
-              //
-              // @@ I wonder why bother and not just add -fpreprocessed? Are
-              //    we trying to save an option or does something break?
-              //
-              for (; lang_n != 0; --lang_n)
-                args.pop_back ();
-
+            // Also note that similarly there is no .Si for .S files.
+            //
+            args.push_back ("-fpreprocessed");
             args.push_back ("-fdirectives-only");
             break;
           }
         case compiler_type::clang:
           {
+            // Clang 15 and later with -pedantic warns about GNU-style line
+            // markers that it wrote itself in the -frewrite-includes output
+            // (llvm-project issue 63284). So we suppress this warning unless
+            // compiling from source.
+            //
+            // In Apple Clang this warning/option are absent in 14.0.3 (which
+            // is said to be based on vanilla Clang 15.0.5) for some reason
+            // (let's hope it's because they patched it out rather than due to
+            // a misleading __LIBCPP_VERSION value).
+            //
+            if (ctype == compiler_type::clang &&
+                cmaj >= (cvariant != "apple" ? 15 : 16))
+            {
+              if (find_options ({"-pedantic",  "-pedantic-errors",
+                                 "-Wpedantic", "-Werror=pedantic"}, args))
+              {
+                args.push_back ("-Wno-gnu-line-marker");
+              }
+            }
+
             // Note that without -x Clang will treat .i/.ii as fully
             // preprocessed.
             //
@@ -7470,45 +7702,38 @@ namespace build2
           file_cache::read psrcr (psrc ? md.psrc.open () : file_cache::read ());
 
           // VC cl.exe sends diagnostics to stdout. It also prints the file
-          // name being compiled as the first line. So for cl.exe we redirect
-          // stdout to a pipe, filter that noise out, and send the rest to
-          // stderr.
+          // name being compiled as the first line. So for cl.exe we filter
+          // that noise out.
           //
-          // For other compilers redirect stdout to stderr, in case any of
-          // them tries to pull off something similar. For sane compilers this
-          // should be harmless.
+          // For other compilers also redirect stdout to stderr, in case any
+          // of them tries to pull off something similar. For sane compilers
+          // this should be harmless.
           //
           bool filter (ctype == compiler_type::msvc);
 
           process pr (cpath,
-                      args.data (),
-                      0, (filter ? -1 : 2), 2,
+                      args,
+                      0, 2, diag_buffer::pipe (ctx, filter /* force */),
                       nullptr, // CWD
                       env.empty () ? nullptr : env.data ());
 
-          if (filter)
-          {
-            try
-            {
-              ifdstream is (
-                move (pr.in_ofd), fdstream_mode::text, ifdstream::badbit);
+          diag_buffer dbuf (ctx, args[0], pr);
 
-              msvc_filter_cl (is, *sp);
+          if (filter)
+            msvc_filter_cl (dbuf, *sp);
 
-              // If anything remains in the stream, send it all to stderr.
-              // Note that the eof check is important: if the stream is at
-              // eof, this and all subsequent writes to the diagnostics stream
-              // will fail (and you won't see a thing).
-              //
-              if (is.peek () != ifdstream::traits_type::eof ())
-                diag_stream_lock () << is.rdbuf ();
+          dbuf.read ();
 
-              is.close ();
-            }
-            catch (const io_error&) {} // Assume exits with error.
+          // Restore the original source if we switched to preprocessed.
+          //
+          if (psrc)
+          {
+            args.resize (osrc.first);
+            args.push_back (osrc.second);
+            args.push_back (nullptr);
           }
 
-          run_finish (args, pr);
+          run_finish (dbuf, args, pr, 1 /* verbosity */);
         }
         catch (const process_error& e)
         {
@@ -7559,12 +7784,14 @@ namespace build2
           try
           {
             process pr (cpath,
-                        args.data (),
-                        0, 2, 2,
+                        args,
+                        0, 2, diag_buffer::pipe (ctx),
                         nullptr, // CWD
                         env.empty () ? nullptr : env.data ());
 
-            run_finish (args, pr);
+            diag_buffer dbuf (ctx, args[0], pr);
+            dbuf.read ();
+            run_finish (dbuf, args, pr, 1 /* verbosity */);
           }
           catch (const process_error& e)
           {
@@ -7595,25 +7822,27 @@ namespace build2
     }
 
     target_state compile_rule::
-    perform_clean (action a, const target& xt) const
+    perform_clean (action a, const target& xt, const target_type& srct) const
     {
       const file& t (xt.as<file> ());
 
+      // Preprocessed file extension.
+      //
+      const char* pext (x_assembler_cpp (srct) ? ".Si"      :
+                        x_objective (srct)     ? x_obj_pext :
+                        x_pext);
+
       // Compressed preprocessed file extension.
       //
-      auto cpext = [this, &t, s = string ()] () mutable -> const char*
-      {
-        return (s = t.ctx.fcache.compressed_extension (x_pext)).c_str ();
-      };
+      string cpext (t.ctx.fcache->compressed_extension (pext));
 
       clean_extras extras;
-
       switch (ctype)
       {
-      case compiler_type::gcc:   extras = {".d", x_pext, cpext (), ".t"};          break;
-      case compiler_type::clang: extras = {".d", x_pext, cpext ()};                break;
-      case compiler_type::msvc:  extras = {".d", x_pext, cpext (), ".idb", ".pdb"};break;
-      case compiler_type::icc:   extras = {".d"};                                  break;
+      case compiler_type::gcc:   extras = {".d", pext, cpext.c_str (), ".t"};           break;
+      case compiler_type::clang: extras = {".d", pext, cpext.c_str ()};                 break;
+      case compiler_type::msvc:  extras = {".d", pext, cpext.c_str (), ".idb", ".pdb"}; break;
+      case compiler_type::icc:   extras = {".d"};                                       break;
       }
 
       return perform_clean_extra (a, t, extras);