src/parse.rs - platform/external/n2 - Git at Google

 //! Parser for .ninja files.
 //!
 //! See design notes on parsing in doc/design_notes.md.
 //!
 //! To avoid allocations parsing frequently uses references into the input
 //! text, marked with the lifetime `'text`.

 use crate::{
     eval::{EvalPart, EvalString},
     graph::{self, Build, BuildIns, BuildOuts, FileLoc},
     load::{Scope, ScopePosition},
     scanner::{ParseResult, Scanner},
     smallmap::SmallMap,
 };
 use std::{
     cell::UnsafeCell,
     path::PathBuf,
     sync::{atomic::AtomicBool, Arc, Mutex},
 };

 /// The parsed representation of a `rule` statement
 #[derive(Debug)]
 pub struct Rule {
     /// The variables that are local to the rule
     pub vars: SmallMap<String, EvalString<String>>,
     /// The scope position of the rule
     pub scope_position: ScopePosition,
 }

 /// The parsed representation of a `pool` statement
 #[derive(Debug, PartialEq)]
 pub struct Pool<'text> {
     /// The name of the pool
     pub name: &'text str,
     /// The depth of the pool (number of commands that can run in it)
     pub depth: usize,
 }

 /// The parsed representation of a single variable assignment
 #[derive(Debug)]
 pub struct VariableAssignment {
     unevaluated: EvalString<&'static str>,
     /// The position of the variable assignment in the Scope, used for
     /// determining the order of assignments to the same variable.
     pub scope_position: ScopePosition,
     evaluated: UnsafeCell<String>,
     is_evaluated: AtomicBool,
     lock: Mutex<()>,
 }

 // SAFETY: Sync is not automatically implemented because of the UnsafeCell,
 // but our usage of the UnsafeCell is guarded behind a Mutex.
 unsafe impl Sync for VariableAssignment {}

 impl VariableAssignment {
     fn new(unevaluated: EvalString<&'static str>) -> Self {
         Self {
             unevaluated,
             scope_position: ScopePosition(0),
             evaluated: UnsafeCell::new(String::new()),
             is_evaluated: AtomicBool::new(false),
             lock: Mutex::new(()),
         }
     }

     /// Evaluates the variable assignment and pushes the result onto the given
     /// result string.
     pub fn evaluate(&self, result: &mut String, scope: &Scope) {
         self.pre_evaluate(scope);
         unsafe {
             result.push_str(&(*self.evaluated.get()));
         }
     }

     /// This is the same as evaluate, but doesn't give any results back.
     /// Used to evalutate all the variables before 'text is over, as unevaluated
     /// should really have a 'text lifetime.
     pub fn pre_evaluate(&self, scope: &Scope) {
         if self.is_evaluated.load(std::sync::atomic::Ordering::Relaxed) {
             return;
         }
         let guard = self.lock.lock().unwrap();
         if self.is_evaluated.load(std::sync::atomic::Ordering::Relaxed) {
             return;
         }

         unsafe {
             self.unevaluated.evaluate_inner(
                 &mut *self.evaluated.get(),
                 &[],
                 scope,
                 self.scope_position,
             );
         }
         self.is_evaluated
             .store(true, std::sync::atomic::Ordering::Relaxed);
         drop(guard);
     }
 }

 /// The parsed representation of the `default` statement in the ninja file
 #[derive(Debug)]
 pub struct DefaultStmt<'text> {
     /// The files that are built by default
     pub files: Vec<EvalString<&'text str>>,
     /// Same as files, but evaluated into graph::File objects
     pub evaluated: Vec<Arc<graph::File>>,
     /// The position of the statement in the ninja file
     pub scope_position: ScopePosition,
 }

 /// Either an include or a subninja statement
 #[derive(Debug, PartialEq)]
 pub struct IncludeOrSubninja<'text> {
     /// The file that's being included
     pub file: EvalString<&'text str>,
     /// The position of the statement in the ninja file
     pub scope_position: ScopePosition,
 }

 /// Statement represents a parsed statement from the ninja file.
 #[derive(Debug)]
 pub enum Statement<'text> {
     /// A `rule` statement
     Rule((String, Rule)),
     /// A `build` statement
     Build(Box<Build>),
     /// A `default` statement
     Default(DefaultStmt<'text>),
     /// An `include` statement
     Include(IncludeOrSubninja<'text>),
     /// A `subninja` statement
     Subninja(IncludeOrSubninja<'text>),
     /// A `pool` statement
     Pool(Pool<'text>),
     /// A variable assignment
     VariableAssignment((String, VariableAssignment)),
 }

 /// Grouping the parse results into clumps allows us to do fewer vector
 /// concatenations when merging results of different chunks or different files
 /// together.
 #[derive(Default, Debug)]
 pub struct Clump<'text> {
     /// Variable assignments
     pub assignments: Vec<(String, VariableAssignment)>,
     /// Rules
     pub rules: Vec<(String, Rule)>,
     /// Pools
     pub pools: Vec<Pool<'text>>,
     /// Default statements
     pub defaults: Vec<DefaultStmt<'text>>,
     /// Builds
     pub builds: Vec<Box<Build>>,
     /// Subninjas
     pub subninjas: Vec<IncludeOrSubninja<'text>>,
     /// The number of scope positions used by this clump
     pub used_scope_positions: usize,
     /// The scope position that this clump starts at
     pub base_position: ScopePosition,
 }

 impl<'text> Clump<'text> {
     /// Returns `true` if the clump has no statements in it
     pub fn is_empty(&self) -> bool {
         self.assignments.is_empty()
             && self.rules.is_empty()
             && self.pools.is_empty()
             && self.defaults.is_empty()
             && self.builds.is_empty()
             && self.subninjas.is_empty()
     }
 }

 /// Either a clump of statements or an include statement. Includes have to
 /// be processed in serial with other statements in the file, so they are
 /// handled specially.
 #[derive(Debug)]
 pub enum ClumpOrInclude<'text> {
     /// A clump of statements
     Clump(Clump<'text>),
     /// A single include statement
     Include(EvalString<&'text str>),
 }

 /// A ninja file parser that will parse the raw ninja file text into a list of
 /// statements.
 pub struct Parser<'text> {
     filename: Arc<PathBuf>,
     scanner: Scanner<'text>,
     buf_len: usize,
 }

 impl<'text> Parser<'text> {
     /// Creates a new parser that parses the given buffer. The filename and
     /// chunk_index are used to track locations in the file for errors.
     pub fn new(buf: &'text [u8], filename: Arc<PathBuf>, chunk_index: usize) -> Parser<'text> {
         Parser {
             filename,
             scanner: Scanner::new(buf, chunk_index),
             buf_len: buf.len(),
         }
     }

     /// Reads the whole buffer, and returns all the statements in it in clumps.
     /// The clumps are separated by include statements, as includes must be
     /// processed inline with the rest of the statements in this file.
     pub fn read_clumps(&mut self) -> ParseResult<Vec<ClumpOrInclude<'text>>> {
         let mut result = Vec::new();
         let mut clump = Clump::default();
         let mut position = ScopePosition(0);
         while let Some(stmt) = self.read()? {
             match stmt {
                 Statement::Rule(mut r) => {
                     r.1.scope_position = position;
                     position.0 += 1;
                     clump.rules.push(r);
                 }
                 Statement::Build(mut b) => {
                     b.scope_position = position;
                     position.0 += 1;
                     clump.builds.push(b);
                 }
                 Statement::Default(mut d) => {
                     d.scope_position = position;
                     position.0 += 1;
                     clump.defaults.push(d);
                 }
                 Statement::Include(i) => {
                     if !clump.is_empty() {
                         clump.used_scope_positions = position.0;
                         result.push(ClumpOrInclude::Clump(clump));
                         clump = Clump::default();
                         position = ScopePosition(0);
                     }
                     result.push(ClumpOrInclude::Include(i.file));
                 }
                 Statement::Subninja(mut s) => {
                     s.scope_position = position;
                     position.0 += 1;
                     clump.subninjas.push(s);
                 }
                 Statement::Pool(p) => {
                     clump.pools.push(p);
                 }
                 Statement::VariableAssignment(mut v) => {
                     v.1.scope_position = position;
                     position.0 += 1;
                     clump.assignments.push(v);
                 }
             }
         }
         if !clump.is_empty() {
             clump.used_scope_positions = position.0;
             result.push(ClumpOrInclude::Clump(clump));
         }
         Ok(result)
     }

     /// Reads one statement out of the buffer.
     pub fn read(&mut self) -> ParseResult<Option<Statement<'text>>> {
         loop {
             match self.scanner.peek() {
                 '\0' => return Ok(None),
                 '\n' | '\r' => self.scanner.next(),
                 '#' => self.skip_comment()?,
                 ' ' | '\t' => return self.scanner.parse_error("unexpected whitespace"),
                 _ => {
                     if self.scanner.ofs >= self.buf_len {
                         // The parsing code expects there to be a null byte at the end of the file,
                         // to allow the parsing to be more performant and exclude most checks for
                         // EOF. However, when parsing an individual "chunk" of the manifest, there
                         // won't be a null byte at the end, the scanner will do an out-of-bounds
                         // read past the end of the chunk and into the next chunk. When we split
                         // the file into chunks, we made sure to end all the chunks just before
                         // identifiers at the start of a new line, so that we can easily detect
                         // that here.
                         assert!(self.scanner.ofs == self.buf_len);
                         return Ok(None);
                     }
                     let ident = self.read_ident()?;
                     self.skip_spaces();
                     match ident {
                         "rule" => return Ok(Some(Statement::Rule(self.read_rule()?))),
                         "build" => return Ok(Some(Statement::Build(Box::new(self.read_build()?)))),
                         "default" => return Ok(Some(Statement::Default(self.read_default()?))),
                         "include" => {
                             let result = IncludeOrSubninja {
                                 file: self.read_eval(false)?,
                                 scope_position: ScopePosition(0),
                             };
                             return Ok(Some(Statement::Include(result)));
                         }
                         "subninja" => {
                             let result = IncludeOrSubninja {
                                 file: self.read_eval(false)?,
                                 scope_position: ScopePosition(0),
                             };
                             return Ok(Some(Statement::Subninja(result)));
                         }
                         "pool" => return Ok(Some(Statement::Pool(self.read_pool()?))),
                         ident => {
                             let x = self.read_vardef()?;
                             // SAFETY: We need to make sure we call evaluate
                             // or pre_evaluate on all VariableAssignments before
                             // the lifetime of 'text is over. After evaluating,
                             // the VariableAssignments will cache their owned
                             // Strings.
                             let x = unsafe {
                                 std::mem::transmute::<
                                     EvalString<&'text str>,
                                     EvalString<&'static str>,
                                 >(x)
                             };
                             let result = VariableAssignment::new(x);
                             return Ok(Some(Statement::VariableAssignment((
                                 ident.to_owned(),
                                 result,
                             ))));
                         }
                     }
                 }
             }
         }
     }

     /// Read the `= ...` part of a variable definition.
     fn read_vardef(&mut self) -> ParseResult<EvalString<&'text str>> {
         self.skip_spaces();
         self.scanner.expect('=')?;
         self.skip_spaces();
         // read_eval will error out if there's nothing to read
         if self.scanner.peek_newline() {
             self.scanner.skip('\r');
             self.scanner.expect('\n')?;
             return Ok(EvalString::new(""));
         }
         let result = self.read_eval(false);
         self.scanner.skip('\r');
         self.scanner.expect('\n')?;
         result
     }

     /// Read a collection of `  foo = bar` variables, with leading indent.
     fn read_scoped_vars(
         &mut self,
         variable_name_validator: fn(var: &str) -> bool,
     ) -> ParseResult<SmallMap<String, EvalString<String>>> {
         let mut vars = SmallMap::default();
         while self.scanner.peek() == ' ' {
             self.scanner.skip_spaces();
             let name = self.read_ident()?;
             if !variable_name_validator(name) {
                 self.scanner
                     .parse_error(format!("unexpected variable {:?}", name))?;
             }
             self.skip_spaces();
             let val = self.read_vardef()?.into_owned();
             vars.insert(name.to_owned(), val);
         }
         Ok(vars)
     }

     fn read_rule(&mut self) -> ParseResult<(String, Rule)> {
         let name = self.read_ident()?;
         self.scanner.skip('\r');
         self.scanner.expect('\n')?;
         let vars = self.read_scoped_vars(|var| {
             matches!(
                 var,
                 "command"
                     | "depfile"
                     | "dyndep"
                     | "description"
                     | "deps"
                     | "generator"
                     | "pool"
                     | "restat"
                     | "rspfile"
                     | "rspfile_content"
                     | "msvc_deps_prefix"
             )
         })?;
         Ok((
             name.to_owned(),
             Rule {
                 vars,
                 scope_position: ScopePosition(0),
             },
         ))
     }

     fn read_pool(&mut self) -> ParseResult<Pool<'text>> {
         let name = self.read_ident()?;
         self.scanner.skip('\r');
         self.scanner.expect('\n')?;
         let vars = self.read_scoped_vars(|var| matches!(var, "depth"))?;
         let mut depth = 0;
         if let Some((_, val)) = vars.into_iter().next() {
             match val.maybe_literal() {
                 Some(x) => match x.parse::<usize>() {
                     Ok(d) => depth = d,
                     Err(err) => return self.scanner.parse_error(format!("pool depth: {}", err)),
                 },
                 None => {
                     return self.scanner.parse_error(format!(
                         "pool depth must be a literal string, got: {:?}",
                         val
                     ))
                 }
             }
         }
         Ok(Pool { name, depth })
     }

     fn read_unevaluated_paths_to(
         &mut self,
         v: &mut Vec<EvalString<&'text str>>,
     ) -> ParseResult<()> {
         self.skip_spaces();
         while !matches!(self.scanner.peek(), ':' | '|') && !self.scanner.peek_newline() {
             v.push(self.read_eval(true)?);
             self.skip_spaces();
         }
         Ok(())
     }

     fn read_build(&mut self) -> ParseResult<Build> {
         let line = self.scanner.line;
         let mut outs_and_ins = Vec::new();
         self.read_unevaluated_paths_to(&mut outs_and_ins)?;
         let explicit_outs = outs_and_ins.len();

         if self.scanner.peek() == '|' {
             self.scanner.next();
             self.read_unevaluated_paths_to(&mut outs_and_ins)?;
         }
         let implicit_outs = outs_and_ins.len() - explicit_outs;

         self.scanner.expect(':')?;
         self.skip_spaces();
         let rule = self.read_ident()?;

         self.read_unevaluated_paths_to(&mut outs_and_ins)?;
         let explicit_ins = outs_and_ins.len() - implicit_outs - explicit_outs;

         if self.scanner.peek() == '|' {
             self.scanner.next();
             let peek = self.scanner.peek();
             if peek == '|' || peek == '@' {
                 self.scanner.back();
             } else {
                 self.read_unevaluated_paths_to(&mut outs_and_ins)?;
             }
         }
         let implicit_ins = outs_and_ins.len() - explicit_ins - implicit_outs - explicit_outs;

         if self.scanner.peek() == '|' {
             self.scanner.next();
             if self.scanner.peek() == '@' {
                 self.scanner.back();
             } else {
                 self.scanner.expect('|')?;
                 self.read_unevaluated_paths_to(&mut outs_and_ins)?;
             }
         }
         let order_only_ins =
             outs_and_ins.len() - implicit_ins - explicit_ins - implicit_outs - explicit_outs;

         if self.scanner.peek() == '|' {
             self.scanner.next();
             self.scanner.expect('@')?;
             self.read_unevaluated_paths_to(&mut outs_and_ins)?;
         }

         self.scanner.skip('\r');
         self.scanner.expect('\n')?;
         let vars: SmallMap<String, EvalString<String>> = self.read_scoped_vars(|_| true)?;
         let phony_output = match vars.get("phony_output").map(|x| x.maybe_literal()) {
             Some(Some("false")) => false,
             Some(Some("true")) => true,
             Some(_) => return self.scanner.parse_error("invalid value for phony_output"),
             None => false,
         };

         // SAFETY: We will evaluate the ins/outs into owned strings before 'text
         // is over, and we don't want to attach the 'text lifetime to Build. So
         // instead, unsafely cast the lifetime to 'static.
         let outs_and_ins = unsafe {
             std::mem::transmute::<Vec<EvalString<&'text str>>, Vec<EvalString<&'static str>>>(
                 outs_and_ins,
             )
         };

         Ok(Build::new(
             rule.to_owned(),
             vars,
             FileLoc {
                 filename: self.filename.clone(),
                 line,
             },
             BuildIns {
                 ids: Vec::new(),
                 explicit: explicit_ins,
                 implicit: implicit_ins,
                 order_only: order_only_ins,
             },
             BuildOuts {
                 ids: Vec::new(),
                 explicit: explicit_outs,
                 implicit: implicit_outs,
             },
             outs_and_ins,
             phony_output,
         ))
     }

     fn read_default(&mut self) -> ParseResult<DefaultStmt<'text>> {
         let mut files = Vec::new();
         self.read_unevaluated_paths_to(&mut files)?;
         if files.is_empty() {
             return self.scanner.parse_error("expected path");
         }
         self.scanner.skip('\r');
         self.scanner.expect('\n')?;
         Ok(DefaultStmt {
             files,
             evaluated: Vec::new(),
             scope_position: ScopePosition(0),
         })
     }

     fn skip_comment(&mut self) -> ParseResult<()> {
         loop {
             match self.scanner.read() {
                 '\0' => {
                     self.scanner.back();
                     return Ok(());
                 }
                 '\n' => return Ok(()),
                 _ => {}
             }
         }
     }

     /// Read an identifier -- rule name, pool name, variable name, etc.
     fn read_ident(&mut self) -> ParseResult<&'text str> {
         let start = self.scanner.ofs;
         while matches!(
             self.scanner.read(),
             'a'..='z' | 'A'..='Z' | '0'..='9' | '_' | '-' | '.'
         ) {}
         self.scanner.back();
         let end = self.scanner.ofs;
         if end == start {
             return self.scanner.parse_error("failed to scan ident");
         }
         Ok(self.scanner.slice(start, end))
     }

     /// Reads an EvalString. Stops at either a newline, or ' ', ':', '|' if
     /// stop_at_path_separators is set, without consuming the character that
     /// caused it to stop.
     fn read_eval(&mut self, stop_at_path_separators: bool) -> ParseResult<EvalString<&'text str>> {
         let start = self.scanner.ofs;
         let mut ofs = self.scanner.ofs;
         let mut found_content = false;
         // This match block is copied twice, with the only difference being the check for
         // spaces, colons, and pipes in the stop_at_path_separators version. We could remove the
         // duplication by adding a match branch like `' ' | ':' | '|' if stop_at_path_separators =>`
         // or even moving the `if stop_at_path_separators` inside of the match body, but both of
         // those options are ~10% slower on a benchmark test of running the loader on llvm-cmake
         // ninja files.
         let end = if stop_at_path_separators {
             loop {
                 match self.scanner.read() {
                     '\0' => return self.scanner.parse_error("unexpected EOF"),
                     ' ' | ':' | '|' | '\n' => {
                         self.scanner.back();
                         break self.scanner.ofs;
                     }
                     '\r' if self.scanner.peek() == '\n' => {
                         self.scanner.back();
                         break self.scanner.ofs;
                     }
                     '$' => {
                         self.read_escape()?;
                         found_content = true;
                         ofs = self.scanner.ofs;
                     }
                     _ => {}
                 }
             }
         } else {
             loop {
                 match self.scanner.read() {
                     '\0' => return self.scanner.parse_error("unexpected EOF"),
                     '\n' => {
                         self.scanner.back();
                         break self.scanner.ofs;
                     }
                     '\r' if self.scanner.peek() == '\n' => {
                         self.scanner.back();
                         break self.scanner.ofs;
                     }
                     '$' => {
                         self.read_escape()?;
                         found_content = true;
                         ofs = self.scanner.ofs;
                     }
                     _ => {}
                 }
             }
         };
         if end > ofs {
             found_content = true;
         }
         if !found_content {
             return self.scanner.parse_error(format!("Expected a string"));
         }
         Ok(EvalString::new(self.scanner.slice(start, end)))
     }

     /// Read a variable name as found after a '$' in an eval.
     /// Ninja calls this a "simple" varname and it is the same as read_ident without
     /// period allowed(!), I guess because we expect things like
     ///   foo = $bar.d
     /// to parse as a reference to $bar.
     fn read_simple_varname(&mut self) -> ParseResult<()> {
         let start = self.scanner.ofs;
         while matches!(self.scanner.read(), 'a'..='z' | 'A'..='Z' | '0'..='9' | '_' | '-') {}
         self.scanner.back();
         let end = self.scanner.ofs;
         if end == start {
             return self.scanner.parse_error("failed to scan variable name");
         }
         Ok(())
     }

     /// Read and interpret the text following a '$' escape character.
     fn read_escape(&mut self) -> ParseResult<()> {
         Ok(match self.scanner.read() {
             '\n' | '\r' => {
                 self.scanner.skip_spaces();
             }
             ' ' | '$' | ':' => (),
             '{' => loop {
                 match self.scanner.read() {
                     '\0' => return self.scanner.parse_error("unexpected EOF"),
                     '}' => break,
                     _ => {}
                 }
             },
             _ => {
                 // '$' followed by some other text.
                 self.scanner.back();
                 self.read_simple_varname()?;
             }
         })
     }

     fn skip_spaces(&mut self) {
         loop {
             match self.scanner.read() {
                 ' ' => {}
                 '$' => {
                     if self.scanner.peek() != '\n' {
                         self.scanner.back();
                         return;
                     }
                     self.scanner.next();
                 }
                 _ => {
                     self.scanner.back();
                     return;
                 }
             }
         }
     }
 }

 /// Given a buffer of an entire ninja file and a number of threads to process
 /// the file in, return that number of chunks of the file. The chunks will be
 /// split at points that are easy to start/stop parsing at, namely it won't
 /// split the file in the middle of a ninja directive (build/rule/pool/variable)
 pub fn split_manifest_into_chunks(buf: &[u8], num_threads: usize) -> Vec<&[u8]> {
     let min_chunk_size = 1024 * 1024;
     let chunk_count = num_threads * 2;
     let chunk_size = std::cmp::max(min_chunk_size, buf.len() / chunk_count + 1);
     let mut result = Vec::with_capacity(chunk_count);
     let mut start = 0;
     while start < buf.len() {
         let next = std::cmp::min(start + chunk_size, buf.len());
         let next = find_start_of_next_manifest_chunk(buf, next);
         result.push(&buf[start..next]);
         start = next;
     }
     result
 }

 fn find_start_of_next_manifest_chunk(buf: &[u8], prospective_start: usize) -> usize {
     let mut idx = prospective_start;
     loop {
         // TODO: Replace the search with something that uses SIMD instructions like the memchr crate
         let Some(nl_index) = &buf[idx..].iter().position(|&b| b == b'\n') else {
             return buf.len();
         };
         idx += nl_index + 1;

         // This newline was escaped, try again. It's possible that this check is too conservative,
         // for example, you could have:
         //  - a comment that ends with a "$": "# $\n"
         //  - an escaped-dollar: "X=$$\n"
         if idx >= 2 && buf[idx - 2] == b'$'
             || idx >= 3 && buf[idx - 2] == b'\r' && buf[idx - 3] == b'$'
         {
             continue;
         }

         // We want chunk boundaries to be at an easy/predictable place for the scanner to stop
         // at. So only stop at an identifier after a newline.
         if idx == buf.len()
             || matches!(
                 buf[idx],
                 b'a'..=b'z' | b'A'..=b'Z' | b'0'..=b'9' | b'_' | b'-' | b'.'
             )
         {
             return idx;
         }
     }
 }

 /// An iterator over the EvalParts in the given string. Note that the
 /// string must be a valid EvalString, or undefined behavior will occur.
 pub struct EvalParser<'a> {
     buf: &'a [u8],
     offset: usize,
 }

 impl<'a> EvalParser<'a> {
     /// Returns a new EvalParser that parses the given buffer.
     pub fn new(buf: &'a [u8]) -> Self {
         Self { buf, offset: 0 }
     }

     fn peek(&self) -> u8 {
         unsafe { *self.buf.get_unchecked(self.offset) }
     }

     fn read(&mut self) -> u8 {
         let c = self.peek();
         self.offset += 1;
         c
     }

     fn slice(&self, start: usize, end: usize) -> &'a str {
         unsafe { std::str::from_utf8_unchecked(self.buf.get_unchecked(start..end)) }
     }
 }

 impl<'a> Iterator for EvalParser<'a> {
     type Item = EvalPart<&'a str>;

     fn next(&mut self) -> Option<Self::Item> {
         let mut start = self.offset;
         while self.offset < self.buf.len() {
             match self.peek() {
                 b'$' => {
                     if self.offset > start {
                         return Some(EvalPart::Literal(self.slice(start, self.offset)));
                     }
                     self.offset += 1;
                     match self.peek() {
                         b'\n' | b'\r' => {
                             self.offset += 1;
                             while self.offset < self.buf.len() && self.peek() == b' ' {
                                 self.offset += 1;
                             }
                             start = self.offset;
                         }
                         b' ' | b'$' | b':' => {
                             start = self.offset;
                             self.offset += 1;
                         }
                         b'{' => {
                             self.offset += 1;
                             start = self.offset;
                             while self.read() != b'}' {}
                             let end = self.offset - 1;
                             return Some(EvalPart::VarRef(self.slice(start, end)));
                         }
                         _ => {
                             // '$' followed by some other text.
                             start = self.offset;
                             while self.offset < self.buf.len()
                                 && matches!(self.peek(), b'a'..=b'z' | b'A'..=b'Z' | b'0'..=b'9' | b'_' | b'-')
                             {
                                 self.offset += 1;
                             }
                             return Some(EvalPart::VarRef(self.slice(start, self.offset)));
                         }
                     }
                 }
                 _ => self.offset += 1,
             }
         }
         if self.offset > start {
             return Some(EvalPart::Literal(self.slice(start, self.offset)));
         }
         None
     }
 }

 #[cfg(test)]
 mod tests {
     use super::*;

     fn test_case_buffer(test_case: &str) -> Vec<u8> {
         let mut buf = test_case.as_bytes().to_vec();
         buf.push(0);
         buf
     }

     fn test_for_line_endings(input: &[&str], test: fn(&str)) {
         let test_case_lf = input.join("\n");
         let test_case_crlf = input.join("\r\n");
         for test_case in [test_case_lf, test_case_crlf] {
             test(&test_case);
         }
     }

     #[test]
     fn parse_defaults() {
         test_for_line_endings(&["var = 3", "default a b$var c", ""], |test_case| {
             let mut buf = test_case_buffer(test_case);
             let mut parser = Parser::new(&mut buf, Arc::new(PathBuf::from("build.ninja")), 0);
             match parser.read().unwrap().unwrap() {
                 Statement::VariableAssignment(_) => {}
                 stmt => panic!("expected variable assignment, got {:?}", stmt),
             };
             let default = match parser.read().unwrap().unwrap() {
                 Statement::Default(d) => d.files,
                 stmt => panic!("expected default, got {:?}", stmt),
             };
             assert_eq!(
                 default
                     .iter()
                     .map(|x| x.parse().collect::<Vec<_>>())
                     .collect::<Vec<_>>(),
                 vec![
                     vec![EvalPart::Literal("a")],
                     vec![EvalPart::Literal("b"), EvalPart::VarRef("var")],
                     vec![EvalPart::Literal("c")],
                 ]
             );
         });
     }

     #[test]
     fn parse_dot_in_eval() {
         let mut buf = test_case_buffer("x = $y.z\n");
         let mut parser = Parser::new(&mut buf, Arc::new(PathBuf::from("build.ninja")), 0);
         let Ok(Some(Statement::VariableAssignment((name, x)))) = parser.read() else {
             panic!("Fail");
         };
         assert_eq!(name, "x");
         assert_eq!(
             x.unevaluated.parse().collect::<Vec<_>>(),
             vec![EvalPart::VarRef("y"), EvalPart::Literal(".z")]
         );
     }

     #[test]
     fn parse_dot_in_rule() {
         let mut buf = test_case_buffer("rule x.y\n  command = x\n");
         let mut parser = Parser::new(&mut buf, Arc::new(PathBuf::from("build.ninja")), 0);
         let Ok(Some(Statement::Rule((name, stmt)))) = parser.read() else {
             panic!("Fail");
         };
         assert_eq!(name, "x.y");
         assert_eq!(stmt.vars.len(), 1);
         assert_eq!(
             stmt.vars.get("command"),
             Some(&EvalString::new("x".to_owned()))
         );
     }

     #[test]
     fn parse_trailing_newline() {
         let mut buf = test_case_buffer("build$\n foo$\n : $\n  touch $\n\n");
         let mut parser = Parser::new(&mut buf, Arc::new(PathBuf::from("build.ninja")), 0);
         let stmt = parser.read().unwrap().unwrap();
         let Statement::Build(stmt) = stmt else {
             panic!("Wasn't a build");
         };
         assert_eq!(stmt.rule, "touch");
     }
 }