lix/src/libexpr/lexer.l

/* Scanner configuration (see the flex manual for each option).
   reentrant, bison-bridge and bison-locations: the scanner keeps its
   state in a yyscanner handle and receives yylval and yylloc from the
   parser; the macros and actions below use all three.
   stack: enables yy_push_state() and yy_pop_state().
   nodefault: no implicit default rule is generated, which is why every
   start condition below ends with its own catch-all rule. */
%option reentrant bison-bridge bison-locations
%option noyywrap
%option never-interactive
%option stack
%option nodefault
%option nounput noyy_top_state


/* Exclusive start conditions: STRING is pushed by the double-quote rule
   and IND_STRING by the two-single-quotes rule further down. */
%x STRING
%x IND_STRING


%{
#include "nixexpr.hh"
#include "parser-tab.hh"

using namespace nix;

namespace nix {


/* Reset `loc` so that both its start and its end point at line 1,
   column 1. */
static void initLoc(YYLTYPE * loc)
{
    loc->last_line = 1;
    loc->first_line = 1;
    loc->last_column = 1;
    loc->first_column = 1;
}


/* Advance the location `loc` over the `len` bytes of token text at `s`.

   The previous end position becomes the new start position, and the end
   position is then moved forward over the text.  A line feed, a lone
   carriage return and a CR/LF pair each count as exactly one line break
   (next line, column 1); every other byte advances the column by one.

   Only the `len` bytes starting at `s` are inspected. */
static void adjustLoc(YYLTYPE * loc, const char * s, size_t len)
{
    loc->first_line = loc->last_line;
    loc->first_column = loc->last_column;

    while (len--) {
        switch (*s++) {
        case '\r':
            /* A CR/LF pair is a single line break.  The LF belongs to
               the token too, so it must be deducted from the remaining
               length; otherwise the loop would read one byte past the
               end of the token for every CR/LF pair and miscount the
               position.  The `len` check keeps the look-ahead inside
               the token. */
            if (len && *s == '\n') {
                s++;
                len--;
            }
            /* fall through */
        case '\n':
            ++loc->last_line;
            loc->last_column = 1;
            break;
        default:
            ++loc->last_column;
        }
    }
}


/* Turn the raw text `s` of a string token into a string expression.

   Backslash escapes are resolved: \n, \r and \t become newline, carriage
   return and tab, and any other escaped character stands for itself.
   An unescaped CR or CR/LF in the text is normalised to a single LF.
   The resulting text is registered in `symbols` and wrapped in a newly
   allocated ExprString.

   A backslash must always be followed by another character (asserted). */
static Expr * unescapeStr(SymbolTable & symbols, const char * s)
{
    string text;
    const char * p = s;

    while (*p) {
        const char ch = *p++;

        if (ch == '\\') {
            assert(*p);
            const char escaped = *p++;
            switch (escaped) {
            case 'n': text += '\n'; break;
            case 'r': text += '\r'; break;
            case 't': text += '\t'; break;
            default:  text += escaped;
            }
            continue;
        }

        if (ch == '\r') {
            /* Line-ending normalisation: CR and CR/LF both become LF. */
            text += '\n';
            if (*p == '\n') ++p;
            continue;
        }

        text += ch;
    }

    return new ExprString(symbols.create(text));
}


}

/* Location tracking hooks.  Per the flex manual, YY_USER_INIT is run
   once before the first scan and YY_USER_ACTION before the action of
   every matched rule; here they reset the location and then advance it
   over each matched text. */
#define YY_USER_INIT initLoc(yylloc)
#define YY_USER_ACTION adjustLoc(yylloc, yytext, yyleng);

/* Shorthands for pushing and popping a start condition on this
   scanner's start-condition stack. */
#define PUSH_STATE(state) yy_push_state(state, yyscanner)
#define POP_STATE() yy_pop_state(yyscanner)

%}


/* Identifier: a letter or underscore, followed by any number of letters,
   digits, underscores, apostrophes or dashes. */
ID          [a-zA-Z\_][a-zA-Z0-9\_\'\-]*
/* Integer literal: one or more decimal digits (no sign). */
INT         [0-9]+
/* Path literal: an optional leading component followed by one or more
   slash-prefixed components, so a path always contains a slash. */
PATH        [a-zA-Z0-9\.\_\-\+]*(\/[a-zA-Z0-9\.\_\-\+]+)+
/* Path whose leading component is a tilde, followed by one or more
   slash-prefixed components. */
HPATH       \~(\/[a-zA-Z0-9\.\_\-\+]+)+
/* Path in angle brackets: one or more slash-separated components, e.g.
   <nixpkgs/pkgs/lib>. */
SPATH       \<[a-zA-Z0-9\.\_\-\+]+(\/[a-zA-Z0-9\.\_\-\+]+)*\>
/* URI literal: a scheme (a letter, then letters, digits, plus, minus or
   dot), a colon, and at least one character from the set below. */
URI         [a-zA-Z][a-zA-Z0-9\+\-\.]*\:[a-zA-Z0-9\%\/\?\:\@\&\=\+\$\,\-\_\.\!\~\*\']+


%%


if          { return IF; }
    /* Reserved words.  They are listed before the ID rule: when two
       patterns match text of the same length flex picks the earlier
       rule, so these exact words are never returned as identifiers,
       while longer names that merely start with one still match ID. */
then        { return THEN; }
else        { return ELSE; }
assert      { return ASSERT; }
with        { return WITH; }
let         { return LET; }
in          { return IN; }
rec         { return REC; }
inherit     { return INHERIT; }
or          { return OR_KW; }
\.\.\.      { return ELLIPSIS; }

    /* Multi-character operators.  Single-character operators have no
       rule of their own; they are returned as their character code by
       the catch-all rule at the end of this section. */
\=\=        { return EQ; }
\!\=        { return NEQ; }
\<\=        { return LEQ; }
\>\=        { return GEQ; }
\&\&        { return AND; }
\|\|        { return OR; }
\-\>        { return IMPL; }
\/\/        { return UPDATE; }
\+\+        { return CONCAT; }

{ID}        { yylval->id = strdup(yytext); return ID; }
    /* The identifier rule above hands the parser a strdup() copy of the
       matched text, since yytext is only valid until the next match. */
{INT}       { errno = 0;
              /* errno was cleared above so that a non-zero value after
                 strtol() can only stem from this conversion, e.g. a
                 literal that does not fit into a long. */
              yylval->n = strtol(yytext, 0, 10);
              if (errno != 0)
                  throw ParseError(format("invalid integer ‘%1%’") % yytext);
              return INT;
            }

\$\{        { PUSH_STATE(INITIAL); return DOLLAR_CURLY; }
    /* Every opening brace (plain or dollar-prefixed) pushes INITIAL, so
       the closing-brace rule can pop back to whatever start condition
       was active before the brace, e.g. a string that contains an
       interpolation.
       NOTE(review): the closing-brace rule pops unconditionally; an
       unmatched closing brace would pop an empty start-condition stack
       (see issue #751).  Confirm how flex reports that. */
\{          { PUSH_STATE(INITIAL); return '{'; }
\}          { POP_STATE(); return '}'; }

\"          { PUSH_STATE(STRING); return '"'; }
<STRING>([^\$\"\\]|\$[^\{\"\\]|\\.|\$\\.)*\$/\" |
<STRING>([^\$\"\\]|\$[^\{\"\\]|\\.|\$\\.)+ {
              /* A literal chunk of a double-quoted string: ordinary
                 characters, backslash escapes, and dollar signs that do
                 not start an interpolation.  The first alternative also
                 accepts a chunk whose last character is a dollar sign
                 directly followed by the closing quote. */
              /* It is impossible to match strings ending with '$' with one
                 regex because trailing contexts are only valid at the end
                 of a rule. (A sane but undocumented limitation.) */
              yylval->e = unescapeStr(data->symbols, yytext);
              return STR;
            }
    /* An interpolation switches back to INITIAL until its closing brace
       pops the state again; the closing quote pops STRING itself. */
<STRING>\$\{  { PUSH_STATE(INITIAL); return DOLLAR_CURLY; }
<STRING>\"  { POP_STATE(); return '"'; }
<STRING>.   return yytext[0]; /* just in case: shouldn't be reached */

\'\'(\ *\n)?     { PUSH_STATE(IND_STRING); return IND_STRING_OPEN; }
    /* The opening rule above also consumes spaces and one newline that
       directly follow the two single quotes. */
<IND_STRING>([^\$\']|\$[^\{\']|\'[^\'\$])+ {
                   /* Literal chunk: the text is passed on unmodified;
                      no backslash processing happens here. */
                   yylval->e = new ExprIndStr(yytext);
                   return IND_STR;
                 }
<IND_STRING>\'\'\$ {
                   /* Two single quotes plus a dollar sign yield a
                      literal dollar sign. */
                   yylval->e = new ExprIndStr("$");
                   return IND_STR;
                 }
<IND_STRING>\'\'\' {
                   /* Three single quotes yield two literal single
                      quotes. */
                   yylval->e = new ExprIndStr("''");
                   return IND_STR;
                 }
<IND_STRING>\'\'\\. {
                   /* Two single quotes plus a backslash escape: skip the
                      quotes and let unescapeStr() resolve the escape. */
                   yylval->e = unescapeStr(data->symbols, yytext + 2);
                   return IND_STR;
                 }
<IND_STRING>\$\{ { PUSH_STATE(INITIAL); return DOLLAR_CURLY; }
<IND_STRING>\'\' { POP_STATE(); return IND_STRING_CLOSE; }
<IND_STRING>\'   {
                   /* A single quote that is not part of any sequence
                      above is ordinary text. */
                   yylval->e = new ExprIndStr("'");
                   return IND_STR;
                 }
<IND_STRING>.    return yytext[0]; /* just in case: shouldn't be reached */

{PATH}      { yylval->path = strdup(yytext); return PATH; }
    /* Like the rule above, the remaining path forms and the URI rule
       pass a strdup() copy of the matched text to the parser. */
{HPATH}     { yylval->path = strdup(yytext); return HPATH; }
{SPATH}     { yylval->path = strdup(yytext); return SPATH; }
{URI}       { yylval->uri = strdup(yytext); return URI; }

[ \t\r\n]+    /* eat up whitespace */
\#[^\r\n]*    /* single-line comments */
    /* Long comments run up to the first star-slash.  The body consists
       of non-star characters, or runs of stars followed by a character
       that is neither a star nor a slash; the terminator accepts any
       number of stars before the slash.  This way a comment that is
       closed with several stars in a row ends where it should, instead
       of the extra star swallowing the terminator. */
\/\*([^*]|\*+[^*\/])*\*+\/  /* long comments */

.           return yytext[0];


%%
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
+								%option reentrant bison-bridge bison-locations
 								%option noyywrap
 								%option never-interactive
-												Fix the hack that resets the scanner state.

											
										
										
											2015-07-02 16:39:02 +00:00
+								%option stack
 								%option nodefault
 								%option nounput noyy_top_state
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
-												* String interpolation.  Expressions like

    "--with-freetype2-library=" + freetype + "/lib"

  can now be written as

    "--with-freetype2-library=${freetype}/lib"

  An arbitrary expression can be enclosed within ${...}, not just
  identifiers.

* Escaping in string literals: \n, \r, \t interpreted as in C, any
  other character following \ is interpreted as-is.
  
* Newlines are now allowed in string literals.


											
										
										
											2006-05-01 14:01:47 +00:00
+								%x STRING
-												* Added a new kind of multi-line string literal delimited by two
  single quotes.  Example (from NixOS):

    job = ''
      start on network-interfaces

      start script

        rm -f /var/run/opengl-driver
        ${if videoDriver == "nvidia"        
          then "ln -sf ${nvidiaDrivers} /var/run/opengl-driver"
          else if cfg.driSupport
          then "ln -sf ${mesa} /var/run/opengl-driver"
          else ""
        }

        rm -f /var/log/slim.log

      end script
    '';

  This style has two big advantages:

  - \, ' and " aren't special, only '' and ${.  So you get a lot less
    escaping in shell scripts / configuration files in Nixpkgs/NixOS.
    The delimiter '' is rare in scripts (and can usually be written as
    "").  ${ is also fairly rare.

    Other delimiters such as <<...>>, {{...}} and <|...|> were also
    considered but this one appears to have the fewest drawbacks
    (thanks Martin).

  - Indentation is intelligently stripped so that multi-line strings
    can follow the nesting structure of the containing Nix
    expression.  E.g. in the example above 6 spaces are stripped from
    the start of each line.  This prevents unnecessary indentation in
    generated files (which sometimes even breaks things).

  See tests/lang/eval-okay-ind-string.nix for some examples.



											
										
										
											2007-11-30 16:48:45 +00:00
+								%x IND_STRING
-												* String interpolation.  Expressions like

    "--with-freetype2-library=" + freetype + "/lib"

  can now be written as

    "--with-freetype2-library=${freetype}/lib"

  An arbitrary expression can be enclosed within ${...}, not just
  identifiers.

* Escaping in string literals: \n, \r, \t interpreted as in C, any
  other character following \ is interpreted as-is.
  
* Newlines are now allowed in string literals.


											
										
										
											2006-05-01 14:01:47 +00:00
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
+								%{
-												* Compile the lexer as C++ code.  Remove all the redundant C/C++
  marshalling code.


											
										
										
											2006-09-04 21:36:15 +00:00
+								#include "nixexpr.hh"
-												* Use a proper namespace.
* Optimise header file usage a bit.
* Compile the parser as C++.


											
										
										
											2006-09-04 21:06:23 +00:00
+								#include "parser-tab.hh"
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
-												* Compile the lexer as C++ code.  Remove all the redundant C/C++
  marshalling code.


											
										
										
											2006-09-04 21:36:15 +00:00
+								using namespace nix;
 								namespace nix {
-												Fix whitespace

											
										
										
											2013-09-02 14:29:15 +00:00
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
+								static void initLoc(YYLTYPE * loc)
 								{
-												* Store attribute positions in the AST and report duplicate attribute
  errors with position info.
* For all positions, use the position of the first character of the
  first token, rather than the last character of the first token plus
  one.


											
										
										
											2010-05-06 16:46:48 +00:00
+								    loc->first_line = loc->last_line = 1;
 								    loc->first_column = loc->last_column = 1;
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
+								}
-												Fix whitespace

											
										
										
											2013-09-02 14:29:15 +00:00
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
+								static void adjustLoc(YYLTYPE * loc, const char * s, size_t len)
 								{
-												* Store attribute positions in the AST and report duplicate attribute
  errors with position info.
* For all positions, use the position of the first character of the
  first token, rather than the last character of the first token plus
  one.


											
										
										
											2010-05-06 16:46:48 +00:00
+								    loc->first_line = loc->last_line;
 								    loc->first_column = loc->last_column;
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
+								    while (len--) {
 								       switch (*s++) {
-												* Handle carriage returns.  Fixes NIX-53.


											
										
										
											2006-08-16 10:28:44 +00:00
+								       case '\r':
 								           if (*s == '\n') /* cr/lf */
 								               s++;
 								           /* fall through */
-												Fix whitespace

											
										
										
											2013-09-02 14:29:15 +00:00
+								       case '\n':
-												* Store attribute positions in the AST and report duplicate attribute
  errors with position info.
* For all positions, use the position of the first character of the
  first token, rather than the last character of the first token plus
  one.


											
										
										
											2010-05-06 16:46:48 +00:00
+								           ++loc->last_line;
 								           loc->last_column = 1;
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
+								           break;
 								       default:
-												* Store attribute positions in the AST and report duplicate attribute
  errors with position info.
* For all positions, use the position of the first character of the
  first token, rather than the last character of the first token plus
  one.


											
										
										
											2010-05-06 16:46:48 +00:00
+								           ++loc->last_column;
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
+								       }
 								    }
 								}
-												* Compile the lexer as C++ code.  Remove all the redundant C/C++
  marshalling code.


											
										
										
											2006-09-04 21:36:15 +00:00
-												* Optimise string constants by putting them in the symbol table.


											
										
										
											2010-10-23 21:11:59 +00:00
+								static Expr * unescapeStr(SymbolTable & symbols, const char * s)
-												* Use a proper namespace.
* Optimise header file usage a bit.
* Compile the parser as C++.


											
										
										
											2006-09-04 21:06:23 +00:00
+								{
-												* Compile the lexer as C++ code.  Remove all the redundant C/C++
  marshalling code.


											
										
										
											2006-09-04 21:36:15 +00:00
+								    string t;
 								    char c;
 								    while ((c = *s++)) {
 								        if (c == '\\') {
 								            assert(*s);
 								            c = *s++;
 								            if (c == 'n') t += '\n';
 								            else if (c == 'r') t += '\r';
 								            else if (c == 't') t += '\t';
 								            else t += c;
 								        }
 								        else if (c == '\r') {
 								            /* Normalise CR and CR/LF into LF. */
 								            t += '\n';
 								            if (*s == '\n') s++; /* cr/lf */
 								        }
 								        else t += c;
 								    }
-												* Optimise string constants by putting them in the symbol table.


											
										
										
											2010-10-23 21:11:59 +00:00
+								    return new ExprString(symbols.create(t));
-												* Use a proper namespace.
* Optimise header file usage a bit.
* Compile the parser as C++.


											
										
										
											2006-09-04 21:06:23 +00:00
+								}
-												Fix whitespace

											
										
										
											2013-09-02 14:29:15 +00:00
-												* Compile the lexer as C++ code.  Remove all the redundant C/C++
  marshalling code.


											
										
										
											2006-09-04 21:36:15 +00:00
+								}
-												* String interpolation.  Expressions like

    "--with-freetype2-library=" + freetype + "/lib"

  can now be written as

    "--with-freetype2-library=${freetype}/lib"

  An arbitrary expression can be enclosed within ${...}, not just
  identifiers.

* Escaping in string literals: \n, \r, \t interpreted as in C, any
  other character following \ is interpreted as-is.
  
* Newlines are now allowed in string literals.


											
										
										
											2006-05-01 14:01:47 +00:00
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
+								#define YY_USER_INIT initLoc(yylloc)
 								#define YY_USER_ACTION adjustLoc(yylloc, yytext, yyleng);
-												Fix the hack that resets the scanner state.

											
										
										
											2015-07-02 16:39:02 +00:00
+								#define PUSH_STATE(state) yy_push_state(state, yyscanner)
 								#define POP_STATE() yy_pop_state(yyscanner)
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
+								%}
-												Allow dashes in identifiers

In Nixpkgs, the attribute in all-packages.nix corresponding to a
package is usually equal to the package name.  However, this doesn't
work if the package contains a dash, which is fairly common.  The
convention is to replace the dash with an underscore (e.g. "dbus-glib"
becomes "dbus_glib"), but that's annoying.  So now dashes are valid in
variable / attribute names, allowing you to write:

  dbus-glib = callPackage ../development/libraries/dbus-glib { };

and

  buildInputs = [ dbus-glib ];

Since we don't have a negation or subtraction operation in Nix, this
is unambiguous.

											
										
										
											2012-09-27 19:43:08 +00:00
+								ID          [a-zA-Z\_][a-zA-Z0-9\_\'\-]*
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
+								INT         [0-9]+
 								PATH        [a-zA-Z0-9\.\_\-\+]*(\/[a-zA-Z0-9\.\_\-\+]+)+
-												Allow the leading component of a path to be a ~

											
										
										
											2015-02-19 13:05:16 +00:00
+								HPATH       \~(\/[a-zA-Z0-9\.\_\-\+]+)+
-												* Add a Nix expression search path feature.  Paths between angle
  brackets, e.g.

    import <nixpkgs/pkgs/lib>

  are resolved by looking them up relative to the elements listed in
  the search path.  This allows us to get rid of hacks like

    import "${builtins.getEnv "NIXPKGS_ALL"}/pkgs/lib"

  The search path can be specified through the ‘-I’ command-line flag
  and through the colon-separated ‘NIX_PATH’ environment variable,
  e.g.,

    $ nix-build -I /etc/nixos ...

  If a file is not found in the search path, an error message is
  lazily thrown.


											
										
										
											2011-08-06 16:05:24 +00:00
+								SPATH       \<[a-zA-Z0-9\.\_\-\+]+(\/[a-zA-Z0-9\.\_\-\+]+)*\>
-												* Added plain lambdas, e.g., `let { id = x: x; const = x: y: x; }'.
  `bla:' is now no longer parsed as a URL.

* Re-enabled support for the `args' attribute in derivations to
  specify command line arguments to the builder, e.g.,

    ...
    builder = /usr/bin/python;
    args = ["-c" ./builder.py];
    ...


											
										
										
											2004-03-28 20:34:22 +00:00
+								URI         [a-zA-Z][a-zA-Z0-9\+\-\.]*\:[a-zA-Z0-9\%\/\?\:\@\&\=\+\$\,\-\_\.\!\~\*\']+
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
 								%%
 								if          { return IF; }
 								then        { return THEN; }
 								else        { return ELSE; }
 								assert      { return ASSERT; }
-												* New language feature: with expressions.

  The expression `with E1; E2' evaluates to E2 with all bindings in
  the attribute set E1 substituted.  E.g.,

    with {x = 123;}; x

  evaluates to 123.  That is, the attribute set E1 is in scope in E2.

  This is particularly useful when importing files containing lots
  of definitions.  E.g., instead of

    let {
      inherit (import ./foo.nix) a b c d e f;

      body = ... a ... f ...;
    }

  we can now say

    with import ./foo.nix;

    ... a ... f ...

  I.e., we don't have to say what variables should be brought into scope.


											
										
										
											2004-10-25 16:54:56 +00:00
+								with        { return WITH; }
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
+								let         { return LET; }
-												* Finally, a real "let" syntax: `let x = ...; ... z = ...; in ...'.


											
										
										
											2006-10-02 15:52:44 +00:00
+								in          { return IN; }
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
+								rec         { return REC; }
-												* Added syntactic sugar to the construction of attribute sets to
  `inherit' variables from the surrounding lexical scope.

  E.g.,

    {stdenv, libfoo}: derivation {
      builder = ./bla;
      inherit stdenv libfoo;
      xyzzy = 1;
    }

  is equivalent to

    {stdenv, libfoo}: derivation {
      builder = ./bla;
      stdenv = stdenv;
      libfoo = libfoo;
      xyzzy = 1;
    }

  Note that for mutually recursive attribute set definitions (`rec
  {...}'), this also works, that is, `rec {inherit x;}' is equivalent
  to `let {fresh = x; body = rec {x = fresh;};}', *not*
  `rec {x = x}'.


											
										
										
											2004-02-02 21:39:33 +00:00
+								inherit     { return INHERIT; }
-												* Allow a default value in attribute selection by writing

    x.y.z or default

  (as originally proposed in
  https://mail.cs.uu.nl/pipermail/nix-dev/2009-September/002989.html).

  For instance, an expression like

    stdenv.lib.attrByPath ["features" "ckSched"] false args

  can now be written as

    args.features.ckSched or false



											
										
										
											2011-07-13 12:19:57 +00:00
+								or          { return OR_KW; }
-												* Added an experimental feature suggested by Andres: ellipses ("...")
  in attribute set pattern matches.  This allows defining a function
  that takes *at least* the listed attributes, while ignoring
  additional attributes.  For instance,

    {stdenv, fetchurl, fuse, ...}:
    
    stdenv.mkDerivation {
      ...
    };
    
  defines a function that requires an attribute set that contains the 
  specified attributes but ignores others.  The main advantage is that
  we can then write in all-packages.nix

    aefs = import ../bla/aefs pkgs;

  instead of

    aefs = import ../bla/aefs {
      inherit stdenv fetchurl fuse;
    };

  This saves a lot of typing (not to mention not having to update
  all-packages.nix with purely mechanical changes).  It saves as much
  typing as the "args: with args;" style, but has the advantage that
  the function arguments are properly declared (not implicit in what
  the body of the "with" uses).


											
										
										
											2008-08-14 14:00:44 +00:00
+								\.\.\.      { return ELLIPSIS; }
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
 								\=\=        { return EQ; }
 								\!\=        { return NEQ; }
-												Add comparison operators ‘<’, ‘<=’, ‘>’ and ‘>=’

											
										
										
											2013-08-02 16:39:40 +00:00
+								\<\=        { return LEQ; }
 								\>\=        { return GEQ; }
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
+								\&\&        { return AND; }
 								\|\|        { return OR; }
 								\-\>        { return IMPL; }
-												* An attribute set update operator (//).  E.g.,

  {x=1; y=2; z=3;} // {y=4;}  =>  {x=1; y=4; z=3;}


											
										
										
											2004-02-04 16:49:51 +00:00
+								\/\/        { return UPDATE; }
-												* Added a list concatenation operator:
    [1 2 3] ++ [4 5 6] => [1 2 3 4 5 6]


											
										
										
											2005-07-25 15:05:34 +00:00
+								\+\+        { return CONCAT; }
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
-												* Don't use ATerms for the abstract syntax trees anymore.  Not
  finished yet.


											
										
										
											2010-04-12 18:30:11 +00:00
+								{ID}        { yylval->id = strdup(yytext); return ID; }
-												Store Nix integers as longs

So on 64-bit systems, integers are now 64-bit.

Fixes #158.

											
										
										
											2013-08-19 10:35:03 +00:00
+								{INT}       { errno = 0;
 								              yylval->n = strtol(yytext, 0, 10);
 								              if (errno != 0)
-												Use proper quotes everywhere

											
										
										
											2014-08-20 15:00:17 +00:00
+								                  throw ParseError(format("invalid integer ‘%1%’") % yytext);
-												* Parse numbers again.
* Include missing files in distributions.


											
										
										
											2004-01-30 17:06:03 +00:00
+								              return INT;
 								            }
-												* String interpolation.  Expressions like

    "--with-freetype2-library=" + freetype + "/lib"

  can now be written as

    "--with-freetype2-library=${freetype}/lib"

  An arbitrary expression can be enclosed within ${...}, not just
  identifiers.

* Escaping in string literals: \n, \r, \t interpreted as in C, any
  other character following \ is interpreted as-is.
  
* Newlines are now allowed in string literals.


											
										
										
											2006-05-01 14:01:47 +00:00
-												Revert "next try for "don't abort when given unmatched '}' with 'start-condition stack underflow'. This fixes  #751""

This reverts commit ed23c8568e10d15196bb4ff2b79fc14191d28109. Let's
merge this *after* the 1.11.1 release.

											
										
										
											2016-01-19 23:05:28 +00:00
+								\$\{        { PUSH_STATE(INITIAL); return DOLLAR_CURLY; }
 								\{          { PUSH_STATE(INITIAL); return '{'; }
 								\}          { POP_STATE(); return '}'; }
-												Allow "bare" dynamic attrs

Now, in addition to a."${b}".c, you can write a.${b}.c (applicable
wherever dynamic attributes are valid).

Signed-off-by: Shea Levy <shea@shealevy.com>

											
										
										
											2014-01-06 15:27:26 +00:00
-												Revert "next try for "don't abort when given unmatched '}' with 'start-condition stack underflow'. This fixes  #751""

This reverts commit ed23c8568e10d15196bb4ff2b79fc14191d28109. Let's
merge this *after* the 1.11.1 release.

											
										
										
											2016-01-19 23:05:28 +00:00
+								\"          { PUSH_STATE(STRING); return '"'; }
-												Fix the parsing of "$"'s in strings.

											
										
										
											2015-07-02 21:53:04 +00:00
+								<STRING>([^\$\"\\]|\$[^\{\"\\]|\\.|\$\\.)*\$/\" |
 								<STRING>([^\$\"\\]|\$[^\{\"\\]|\\.|\$\\.)+ {
 								              /* It is impossible to match strings ending with '$' with one
 								                 regex because trailing contexts are only valid at the end
 								                 of a rule. (A sane but undocumented limitation.) */
-												* Optimise string constants by putting them in the symbol table.


											
										
										
											2010-10-23 21:11:59 +00:00
+								              yylval->e = unescapeStr(data->symbols, yytext);
-												* String interpolation.  Expressions like

    "--with-freetype2-library=" + freetype + "/lib"

  can now be written as

    "--with-freetype2-library=${freetype}/lib"

  An arbitrary expression can be enclosed within ${...}, not just
  identifiers.

* Escaping in string literals: \n, \r, \t interpreted as in C, any
  other character following \ is interpreted as-is.
  
* Newlines are now allowed in string literals.


											
										
										
											2006-05-01 14:01:47 +00:00
+								              return STR;
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
+								            }
-												Revert "next try for "don't abort when given unmatched '}' with 'start-condition stack underflow'. This fixes  #751""

This reverts commit ed23c8568e10d15196bb4ff2b79fc14191d28109. Let's
merge this *after* the 1.11.1 release.

											
										
										
											2016-01-19 23:05:28 +00:00
+								<STRING>\$\{  { /* Antiquotation inside a string: scan the embedded expression in INITIAL; STRING stays on the state stack for the matching '}'. */ PUSH_STATE(INITIAL); return DOLLAR_CURLY; }
-												Fix the hack that resets the scanner state.

											
										
										
											2015-07-02 16:39:02 +00:00
+								<STRING>\"  { /* Closing quote: leave STRING and return to whatever state was active when the string was opened. */ POP_STATE(); return '"'; }
-												* String interpolation.  Expressions like

    "--with-freetype2-library=" + freetype + "/lib"

  can now be written as

    "--with-freetype2-library=${freetype}/lib"

  An arbitrary expression can be enclosed within ${...}, not just
  identifiers.

* Escaping in string literals: \n, \r, \t interpreted as in C, any
  other character following \ is interpreted as-is.
  
* Newlines are now allowed in string literals.


											
										
										
											2006-05-01 14:01:47 +00:00
+								<STRING>.   return yytext[0]; /* catch-all required by %option nodefault: a character no other STRING rule accepts is handed to the parser as a one-character token; shouldn't be reached for well-formed input */
-												Revert "next try for "don't abort when given unmatched '}' with 'start-condition stack underflow'. This fixes  #751""

This reverts commit ed23c8568e10d15196bb4ff2b79fc14191d28109. Let's
merge this *after* the 1.11.1 release.

											
										
										
											2016-01-19 23:05:28 +00:00
+								\'\'(\ *\n)?     { /* '' opens an indented string; optional spaces followed by the first newline after the opener are swallowed together with it. */ PUSH_STATE(IND_STRING); return IND_STRING_OPEN; }
-												* Fix the parsing of

    ''
      '${foo}'
    ''
    
  where the antiquote should work as expected, instead of giving the
  string "'${foo}'".


											
										
										
											2008-02-05 13:38:07 +00:00
+								<IND_STRING>([^\$\']|\$[^\{\']|\'[^\'\$])+ {
-												* Indented strings.


											
										
										
											2010-04-12 22:03:27 +00:00
+								                   yylval->e = new ExprIndStr(yytext);
-												* Added a new kind of multi-line string literal delimited by two
  single quotes.  Example (from NixOS):

    job = ''
      start on network-interfaces

      start script

        rm -f /var/run/opengl-driver
        ${if videoDriver == "nvidia"        
          then "ln -sf ${nvidiaDrivers} /var/run/opengl-driver"
          else if cfg.driSupport
          then "ln -sf ${mesa} /var/run/opengl-driver"
          else ""
        }

        rm -f /var/log/slim.log

      end script
    '';

  This style has two big advantages:

  - \, ' and " aren't special, only '' and ${.  So you get a lot less
    escaping in shell scripts / configuration files in Nixpkgs/NixOS.
    The delimiter '' is rare in scripts (and can usually be written as
    "").  ${ is also fairly rare.

    Other delimiters such as <<...>>, {{...}} and <|...|> were also
    considered but this one appears to have the fewest drawbacks
    (thanks Martin).

  - Indentation is intelligently stripped so that multi-line strings
    can follow the nesting structure of the containing Nix
    expression.  E.g. in the example above 6 spaces are stripped from
    the start of each line.  This prevents unnecessary indentation in
    generated files (which sometimes even breaks things).

  See tests/lang/eval-okay-ind-string.nix for some examples.



											
										
										
											2007-11-30 16:48:45 +00:00
+								                   return IND_STR;
-												* Syntax to escape '', ${.


											
										
										
											2007-12-06 10:20:58 +00:00
+								                 }
 								<IND_STRING>\'\'\$ {
-												* Indented strings.


											
										
										
											2010-04-12 22:03:27 +00:00
+								                   yylval->e = new ExprIndStr("$");
-												* Syntax to escape '', ${.


											
										
										
											2007-12-06 10:20:58 +00:00
+								                   return IND_STR;
 								                 }
 								<IND_STRING>\'\'\' {
-												* Indented strings.


											
										
										
											2010-04-12 22:03:27 +00:00
+								                   yylval->e = new ExprIndStr("''");
-												* Syntax to escape '', ${.


											
										
										
											2007-12-06 10:20:58 +00:00
+								                   return IND_STR;
 								                 }
 								<IND_STRING>\'\'\\(.|\n) { /* ''\ escapes the next character; (.|\n) instead of '.' so that a line break after ''\ is taken as the escaped character rather than letting '' close the string. */
-												* Optimise string constants by putting them in the symbol table.


											
										
										
											2010-10-23 21:11:59 +00:00
+								                   yylval->e = unescapeStr(data->symbols, yytext + 2);
-												* Syntax to escape '', ${.


											
										
										
											2007-12-06 10:20:58 +00:00
+								                   return IND_STR;
-												* Added a new kind of multi-line string literal delimited by two
  single quotes.  Example (from NixOS):

    job = ''
      start on network-interfaces

      start script

        rm -f /var/run/opengl-driver
        ${if videoDriver == "nvidia"        
          then "ln -sf ${nvidiaDrivers} /var/run/opengl-driver"
          else if cfg.driSupport
          then "ln -sf ${mesa} /var/run/opengl-driver"
          else ""
        }

        rm -f /var/log/slim.log

      end script
    '';

  This style has two big advantages:

  - \, ' and " aren't special, only '' and ${.  So you get a lot less
    escaping in shell scripts / configuration files in Nixpkgs/NixOS.
    The delimiter '' is rare in scripts (and can usually be written as
    "").  ${ is also fairly rare.

    Other delimiters such as <<...>>, {{...}} and <|...|> were also
    considered but this one appears to have the fewest drawbacks
    (thanks Martin).

  - Indentation is intelligently stripped so that multi-line strings
    can follow the nesting structure of the containing Nix
    expression.  E.g. in the example above 6 spaces are stripped from
    the start of each line.  This prevents unnecessary indentation in
    generated files (which sometimes even breaks things).

  See tests/lang/eval-okay-ind-string.nix for some examples.



											
										
										
											2007-11-30 16:48:45 +00:00
+								                 }
-												Revert "next try for "don't abort when given unmatched '}' with 'start-condition stack underflow'. This fixes  #751""

This reverts commit ed23c8568e10d15196bb4ff2b79fc14191d28109. Let's
merge this *after* the 1.11.1 release.

											
										
										
											2016-01-19 23:05:28 +00:00
+								<IND_STRING>\$\{ { /* Antiquotation inside an indented string: scan the embedded expression in INITIAL; IND_STRING stays on the state stack for the matching '}'. */ PUSH_STATE(INITIAL); return DOLLAR_CURLY; }
-												Fix the hack that resets the scanner state.

											
										
										
											2015-07-02 16:39:02 +00:00
+								<IND_STRING>\'\' { /* A bare '' (not one of the longer ''$, ''' or ''\ escapes) ends the indented string. */ POP_STATE(); return IND_STRING_CLOSE; }
-												* Fix the parsing of

    ''
      '${foo}'
    ''
    
  where the antiquote should work as expected, instead of giving the
  string "'${foo}'".


											
										
										
											2008-02-05 13:38:07 +00:00
+								<IND_STRING>\'   {
-												* Indented strings.


											
										
										
											2010-04-12 22:03:27 +00:00
+								                   yylval->e = new ExprIndStr("'");
-												* Fix the parsing of

    ''
      '${foo}'
    ''
    
  where the antiquote should work as expected, instead of giving the
  string "'${foo}'".


											
										
										
											2008-02-05 13:38:07 +00:00
+								                   return IND_STR;
 								                 }
-												* Added a new kind of multi-line string literal delimited by two
  single quotes.  Example (from NixOS):

    job = ''
      start on network-interfaces

      start script

        rm -f /var/run/opengl-driver
        ${if videoDriver == "nvidia"        
          then "ln -sf ${nvidiaDrivers} /var/run/opengl-driver"
          else if cfg.driSupport
          then "ln -sf ${mesa} /var/run/opengl-driver"
          else ""
        }

        rm -f /var/log/slim.log

      end script
    '';

  This style has two big advantages:

  - \, ' and " aren't special, only '' and ${.  So you get a lot less
    escaping in shell scripts / configuration files in Nixpkgs/NixOS.
    The delimiter '' is rare in scripts (and can usually be written as
    "").  ${ is also fairly rare.

    Other delimiters such as <<...>>, {{...}} and <|...|> were also
    considered but this one appears to have the fewest drawbacks
    (thanks Martin).

  - Indentation is intelligently stripped so that multi-line strings
    can follow the nesting structure of the containing Nix
    expression.  E.g. in the example above 6 spaces are stripped from
    the start of each line.  This prevents unnecessary indentation in
    generated files (which sometimes even breaks things).

  See tests/lang/eval-okay-ind-string.nix for some examples.



											
										
										
											2007-11-30 16:48:45 +00:00
+								<IND_STRING>.    return yytext[0]; /* catch-all required by %option nodefault; just in case: shouldn't be reached. NOTE(review): it does look reachable for a '$' immediately followed by a single quote, which no other IND_STRING rule accepts -- confirm and consider a dedicated rule. */
-												* String interpolation.  Expressions like

    "--with-freetype2-library=" + freetype + "/lib"

  can now be written as

    "--with-freetype2-library=${freetype}/lib"

  An arbitrary expression can be enclosed within ${...}, not just
  identifiers.

* Escaping in string literals: \n, \r, \t interpreted as in C, any
  other character following \ is interpreted as-is.
  
* Newlines are now allowed in string literals.


											
										
										
											2006-05-01 14:01:47 +00:00
-												* Don't use ATerms for the abstract syntax trees anymore.  Not
  finished yet.


											
										
										
											2010-04-12 18:30:11 +00:00
+								{PATH}      { /* yytext is only valid until the next match, so the parser gets its own copy. NOTE(review): strdup allocates with malloc; confirm the consumer of yylval->path frees it. */ yylval->path = strdup(yytext); return PATH; }
-												Allow the leading component of a path to be a ~

											
										
										
											2015-02-19 13:05:16 +00:00
+								{HPATH}     { /* Path starting with "~/"; the text is copied because yytext is reused by the scanner. NOTE(review): confirm the strdup'd copy is freed by the consumer. */ yylval->path = strdup(yytext); return HPATH; }
-												* Add a Nix expression search path feature.  Paths between angle
  brackets, e.g.

    import <nixpkgs/pkgs/lib>

  are resolved by looking them up relative to the elements listed in
  the search path.  This allows us to get rid of hacks like

    import "${builtins.getEnv "NIXPKGS_ALL"}/pkgs/lib"

  The search path can be specified through the ‘-I’ command-line flag
  and through the colon-separated ‘NIX_PATH’ environment variable,
  e.g.,

    $ nix-build -I /etc/nixos ...

  If a file is not found in the search path, an error message is
  lazily thrown.


											
										
										
											2011-08-06 16:05:24 +00:00
+								{SPATH}     { /* Angle-bracket path; the copied text still includes the surrounding '<' and '>'. NOTE(review): confirm the strdup'd copy is freed by the consumer. */ yylval->path = strdup(yytext); return SPATH; }
-												* Don't use ATerms for the abstract syntax trees anymore.  Not
  finished yet.


											
										
										
											2010-04-12 18:30:11 +00:00
+								{URI}       { /* Unquoted URI literal; the text is copied because yytext is reused by the scanner. NOTE(review): confirm the strdup'd copy is freed by the consumer. */ yylval->uri = strdup(yytext); return URI; }
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
-												* Handle carriage returns.  Fixes NIX-53.


											
										
										
											2006-08-16 10:28:44 +00:00
+								[ \t\r\n]+    /* eat up whitespace, including bare carriage returns; no token is produced */
 								\#[^\r\n]*    /* single-line comments: '#' up to, but not including, the line ending */
-												* Bug fix in parsing of /* ... */ comments; due to longest match
  regexp there could be only one such comment per file.


											
										
										
											2004-10-27 13:00:31 +00:00
+								\/\*([^*]|\*+[^*/])*\*+\/  /* long comments; runs of '*' are matched as a unit so a comment whose closing '/' is preceded by several '*' ends there instead of running on to a later comment terminator */
-												* Replaced the SDF parser by a substantially faster Bison/Flex
  parser (roughly 80x faster).

  The absolutely latest version of Bison (1.875c) is required for
  reentrant GLR support, as well as a recent version of Flex (say,
  2.5.31).  Note that most Unix distributions ship with the
  prehistoric Flex 2.5.4, which doesn't support reentrancy.


											
										
										
											2004-01-30 15:21:42 +00:00
 								.           return yytext[0]; /* any other single character (operators, punctuation) is returned as its own token */
 								%%
-												* String interpolation.  Expressions like

    "--with-freetype2-library=" + freetype + "/lib"

  can now be written as

    "--with-freetype2-library=${freetype}/lib"

  An arbitrary expression can be enclosed within ${...}, not just
  identifiers.

* Escaping in string literals: \n, \r, \t interpreted as in C, any
  other character following \ is interpreted as-is.
  
* Newlines are now allowed in string literals.


											
										
										
											2006-05-01 14:01:47 +00:00