Blame src/lexer.hpp

Packit bfcc33
#ifndef SASS_LEXER_H
Packit bfcc33
#define SASS_LEXER_H
Packit bfcc33
Packit bfcc33
#include <cstring>
Packit bfcc33
Packit bfcc33
namespace Sass {
Packit bfcc33
  namespace Prelexer {
Packit bfcc33
Packit bfcc33
    //####################################
Packit bfcc33
    // BASIC CHARACTER MATCHERS
Packit bfcc33
    //####################################
Packit bfcc33
Packit bfcc33
    // Match standard control chars
    // Each function takes the current input position and returns a
    // `const char*`, the same shape as the `prelexer` function type.
    // NOTE(review): only the prototypes are visible in this header;
    // presumably each matches the one punctuation character it is named
    // after and returns 0 on a mismatch — confirm in the definitions.
Packit bfcc33
    const char* kwd_at(const char* src);
Packit bfcc33
    const char* kwd_dot(const char* src);
Packit bfcc33
    const char* kwd_comma(const char* src);
Packit bfcc33
    const char* kwd_colon(const char* src);
Packit bfcc33
    const char* kwd_star(const char* src);
Packit bfcc33
    const char* kwd_plus(const char* src);
Packit bfcc33
    const char* kwd_minus(const char* src);
Packit bfcc33
    const char* kwd_slash(const char* src);
Packit bfcc33
Packit bfcc33
    //####################################
Packit bfcc33
    // BASIC CLASS MATCHERS
Packit bfcc33
    //####################################
Packit bfcc33
Packit bfcc33
    // These are locale independent
    // Character class predicates: each inspects the single character
    // passed by const reference and answers with a bool.
    // NOTE(review): the exact character sets are defined outside this
    // header — confirm there before relying on a particular class.
Packit bfcc33
    bool is_space(const char& src);
Packit bfcc33
    bool is_alpha(const char& src);
Packit bfcc33
    bool is_punct(const char& src);
Packit bfcc33
    bool is_digit(const char& src);
Packit bfcc33
    bool is_alnum(const char& src);
Packit bfcc33
    bool is_xdigit(const char& src);
Packit bfcc33
    bool is_unicode(const char& src);
Packit bfcc33
    bool is_nonascii(const char& src);
Packit bfcc33
    bool is_character(const char& src);
Packit bfcc33
    bool is_uri_character(const char& src);
Packit bfcc33
    // Predicate overload; a matcher with the same name that takes a
    // `const char*` is declared further down in this header.
    bool escapable_character(const char& src);
Packit bfcc33
Packit bfcc33
    // Match a single ctype predicate.
    // These have the `prelexer` shape: input position in, `const char*`
    // out.
    // NOTE(review): presumably each returns the position after the one
    // matched character and 0 otherwise, like the templates in this
    // header — confirm in the definitions.
Packit bfcc33
    const char* space(const char* src);
Packit bfcc33
    const char* alpha(const char* src);
Packit bfcc33
    const char* digit(const char* src);
Packit bfcc33
    const char* xdigit(const char* src);
Packit bfcc33
    const char* alnum(const char* src);
Packit bfcc33
    const char* punct(const char* src);
Packit bfcc33
    const char* hyphen(const char* src);
Packit bfcc33
    const char* unicode(const char* src);
Packit bfcc33
    const char* nonascii(const char* src);
Packit bfcc33
    const char* character(const char* src);
Packit bfcc33
    const char* uri_character(const char* src);
Packit bfcc33
    // Matcher overload; the bool predicate of the same name takes a
    // `const char&` instead.
    const char* escapable_character(const char* src);
Packit bfcc33
Packit bfcc33
    // Match multiple ctype characters.
    // NOTE(review): whether these require at least one character is
    // decided by the definitions, which are not in this header — confirm.
Packit bfcc33
    const char* spaces(const char* src);
Packit bfcc33
    const char* digits(const char* src);
Packit bfcc33
    const char* hyphens(const char* src);
Packit bfcc33
Packit bfcc33
    // Whitespace handling.
    // `optional_spaces` is used by the `loosely` templates in this
    // header to skip leading whitespace before the actual match.
Packit bfcc33
    const char* no_spaces(const char* src);
Packit bfcc33
    const char* optional_spaces(const char* src);
Packit bfcc33
Packit bfcc33
    // Match any single character (/./).
Packit bfcc33
    const char* any_char(const char* src);
Packit bfcc33
Packit bfcc33
    // Assert word boundary (/\b/)
Packit bfcc33
    // This is a zero-width positive lookahead.
    // Used as the trailing check by the `keyword` and `word` templates
    // in this header.
Packit bfcc33
    const char* word_boundary(const char* src);
Packit bfcc33
Packit bfcc33
    // Match a single linebreak (/(?:\n|\r\n?)/).
Packit bfcc33
    const char* re_linebreak(const char* src);
Packit bfcc33
Packit bfcc33
    // Assert string boundaries (/\Z|\z|\A/)
Packit bfcc33
    // These are zero-width positive lookaheads.
Packit bfcc33
    const char* end_of_line(const char* src);
Packit bfcc33
Packit bfcc33
    // Assert end_of_file boundary (/\z/)
Packit bfcc33
    const char* end_of_file(const char* src);
Packit bfcc33
    // const char* start_of_string(const char* src);
Packit bfcc33
Packit bfcc33
    // Type definition for prelexer functions:
    // a pointer to a function that receives the current input position
    // and returns a `const char*`. The combinator templates in this
    // header treat a null result as "no match" and any other result as
    // the position to continue from.
Packit bfcc33
    typedef const char* (*prelexer)(const char*);
Packit bfcc33
Packit bfcc33
    //####################################
Packit bfcc33
    // BASIC "REGEX" CONSTRUCTORS
Packit bfcc33
    //####################################
Packit bfcc33
Packit bfcc33
    // Match one specific character.
    // Regex equivalent: /(?:x)/
    // Yields the position just past the character, or 0 when
    // the character at `src` is not `chr`.
    template <char chr>
    const char* exactly(const char* src) {
      if (*src != chr) return 0;
      return src + 1;
    }
Packit bfcc33
Packit bfcc33
    // Match a complete string literal.
    // Regex equivalent: /(?:literal)/
    // Yields the position just past the literal, or 0 when the input
    // does not start with it (or when either pointer is null).
    template <const char* str>
    const char* exactly(const char* src) {
      if (str == NULL || src == NULL) return 0;
      // the input may be shorter than the literal; the comparison
      // then fails on the input's terminator and ends the scan
      const char* lit = str;
      for (; *lit != 0 && *lit == *src; ++lit) ++src;
      // only a fully consumed literal counts as a match
      if (*lit != 0) return 0;
      return src;
    }
Packit bfcc33
Packit bfcc33
Packit bfcc33
    // Match the full string literal, ignoring ASCII case.
    // Regex equivalent: /(?:literal)/i
    // The literal must only define lower case alpha chars; an input
    // char matches when it equals the literal char, or when it is an
    // upper case ASCII letter whose lower case form equals it.
    // Returns the position after the literal, or 0 when the input
    // does not match (or when either pointer is null).
    template <const char* str>
    const char* insensitive(const char* src) {
      if (str == NULL) return 0;
      const char* pre = str;
      if (src == NULL) return 0;
      // there is a small chance that the search string
      // is longer than the rest of the string to look at
      while (*pre) {
        const char chr = *src;
        // Only A-Z may be folded. Shifting every char by 32 would
        // let ' ' match '@', '\r' match '-', '?' match '_' and so on.
        const bool is_upper = chr >= 'A' && chr <= 'Z';
        if (chr != *pre && !(is_upper && chr + 32 == *pre)) break;
        ++src, ++pre;
      }
      // did the matcher finish?
      return *pre == 0 ? src : 0;
    }
Packit bfcc33
Packit bfcc33
    // Match one character that is listed in the char class.
    // Regex equivalent: /[axy]/
    // Yields the position after the character, or 0 when the
    // character at `src` is not part of `char_class`.
    template <const char* char_class>
    const char* class_char(const char* src) {
      for (const char* member = char_class; *member != 0; ++member) {
        if (*member == *src) return src + 1;
      }
      // ran off the end of the class without finding the character
      return 0;
    }
Packit bfcc33
Packit bfcc33
    // Match for members of char class.
Packit bfcc33
    // Regex equivalent: /[axy]+/
Packit bfcc33
    template <const char* char_class>
Packit bfcc33
    const char* class_chars(const char* src) {
Packit bfcc33
      const char* p = src;
Packit bfcc33
      while (class_char<char_class>(p)) ++p;
Packit bfcc33
      return p == src ? 0 : p;
Packit bfcc33
    }
Packit bfcc33
Packit bfcc33
    // Match one character that is NOT listed in the char class.
    // Regex equivalent: /[^axy]/
    // Yields the position after the character, or 0 when the input
    // is at its terminator or the character is part of the class.
    template <const char* neg_char_class>
    const char* neg_class_char(const char* src) {
      const char current = *src;
      // never step over the end of the input
      if (current == 0) return 0;
      for (const char* excluded = neg_char_class; *excluded != 0; ++excluded) {
        if (*excluded == current) return 0;
      }
      return src + 1;
    }
Packit bfcc33
Packit bfcc33
    // Match for members of char class.
Packit bfcc33
    // Regex equivalent: /[^axy]+/
Packit bfcc33
    template <const char* neg_char_class>
Packit bfcc33
    const char* neg_class_chars(const char* src) {
Packit bfcc33
      const char* p = src;
Packit bfcc33
      while (neg_class_char<neg_char_class>(p)) ++p;
Packit bfcc33
      return p == src ? 0 : p;
Packit bfcc33
    }
Packit bfcc33
Packit bfcc33
    // Match any one character other than the supplied one.
    // Regex equivalent: /[^x]/
    // Fails (returns 0) at the end of the input as well.
    template <const char chr>
    const char* any_char_but(const char* src) {
      if (*src == 0 || *src == chr) return 0;
      return src + 1;
    }
Packit bfcc33
Packit bfcc33
    // Succeeds if the matcher fails.
Packit bfcc33
    // Aka. zero-width negative lookahead.
Packit bfcc33
    // Regex equivalent: /(?!literal)/
Packit bfcc33
    template <prelexer mx>
Packit bfcc33
    const char* negate(const char* src) {
Packit bfcc33
      return mx(src) ? 0 : src;
Packit bfcc33
    }
Packit bfcc33
Packit bfcc33
    // Succeeds if the matcher succeeds.
Packit bfcc33
    // Aka. zero-width positive lookahead.
Packit bfcc33
    // Regex equivalent: /(?=literal)/
Packit bfcc33
    // just hangs around until we need it
Packit bfcc33
    template <prelexer mx>
Packit bfcc33
    const char* lookahead(const char* src) {
Packit bfcc33
      return mx(src) ? src : 0;
Packit bfcc33
    }
Packit bfcc33
Packit bfcc33
    // Tries supplied matchers in order.
Packit bfcc33
    // Succeeds if one of them succeeds.
Packit bfcc33
    // Regex equivalent: /(?:FOO|BAR)/
Packit bfcc33
    template <const prelexer mx>
Packit bfcc33
    const char* alternatives(const char* src) {
Packit bfcc33
      const char* rslt;
Packit bfcc33
      if ((rslt = mx(src))) return rslt;
Packit bfcc33
      return 0;
Packit bfcc33
    }
Packit bfcc33
    // Recursive case: use the first matcher's result when it succeeds,
    // otherwise retry the remaining matchers at the same position.
    template <const prelexer mx1, const prelexer mx2, const prelexer... mxs>
    const char* alternatives(const char* src) {
      const char* matched = mx1(src);
      return matched ? matched : alternatives<mx2, mxs...>(src);
    }
Packit bfcc33
Packit bfcc33
    // Tries supplied matchers in order.
Packit bfcc33
    // Succeeds if all of them succeeds.
Packit bfcc33
    // Regex equivalent: /(?:FOO)(?:BAR)/
Packit bfcc33
    template <const prelexer mx1>
Packit bfcc33
    const char* sequence(const char* src) {
Packit bfcc33
      const char* rslt = src;
Packit bfcc33
      if (!(rslt = mx1(rslt))) return 0;
Packit bfcc33
      return rslt;
Packit bfcc33
    }
Packit bfcc33
    // Recursive case: the first matcher must succeed; the remaining
    // matchers then continue from the position it returned.
    template <const prelexer mx1, const prelexer mx2, const prelexer... mxs>
    const char* sequence(const char* src) {
      const char* rest = mx1(src);
      return rest ? sequence<mx2, mxs...>(rest) : 0;
    }
Packit bfcc33
Packit bfcc33
Packit bfcc33
    // Match a pattern or not. Always succeeds.
Packit bfcc33
    // Regex equivalent: /(?:literal)?/
Packit bfcc33
    template <prelexer mx>
Packit bfcc33
    const char* optional(const char* src) {
Packit bfcc33
      const char* p = mx(src);
Packit bfcc33
      return p ? p : src;
Packit bfcc33
    }
Packit bfcc33
Packit bfcc33
    // Match zero or more of the patterns.
Packit bfcc33
    // Regex equivalent: /(?:literal)*/
Packit bfcc33
    template <prelexer mx>
Packit bfcc33
    const char* zero_plus(const char* src) {
Packit bfcc33
      const char* p = mx(src);
Packit bfcc33
      while (p) src = p, p = mx(src);
Packit bfcc33
      return src;
Packit bfcc33
    }
Packit bfcc33
Packit bfcc33
    // Match one or more of the patterns.
Packit bfcc33
    // Regex equivalent: /(?:literal)+/
Packit bfcc33
    template <prelexer mx>
Packit bfcc33
    const char* one_plus(const char* src) {
Packit bfcc33
      const char* p = mx(src);
Packit bfcc33
      if (!p) return 0;
Packit bfcc33
      while (p) src = p, p = mx(src);
Packit bfcc33
      return src;
Packit bfcc33
    }
Packit bfcc33
Packit bfcc33
    // Match mx non-greedy until delimiter.
Packit bfcc33
    // Other prelexers are greedy by default.
Packit bfcc33
    // Regex equivalent: /(?:$mx)*?(?=$delim)\b/
Packit bfcc33
    template <prelexer mx, prelexer delim>
Packit bfcc33
    const char* non_greedy(const char* src) {
Packit bfcc33
      while (!delim(src)) {
Packit bfcc33
        const char* p = mx(src);
Packit bfcc33
        if (p == src) return 0;
Packit bfcc33
        if (p == 0) return 0;
Packit bfcc33
        src = p;
Packit bfcc33
      }
Packit bfcc33
      return src;
Packit bfcc33
    }
Packit bfcc33
Packit bfcc33
    //####################################
Packit bfcc33
    // ADVANCED "REGEX" CONSTRUCTORS
Packit bfcc33
    //####################################
Packit bfcc33
Packit bfcc33
    // Match with word boundary rule.
Packit bfcc33
    // Regex equivalent: /(?:$mx)\b/i
Packit bfcc33
    template <const char* str>
Packit bfcc33
    const char* keyword(const char* src) {
Packit bfcc33
      return sequence <
Packit bfcc33
               insensitive < str >,
Packit bfcc33
               word_boundary
Packit bfcc33
             >(src);
Packit bfcc33
    }
Packit bfcc33
Packit bfcc33
    // Match with word boundary rule.
Packit bfcc33
    // Regex equivalent: /(?:$mx)\b/
Packit bfcc33
    template <const char* str>
Packit bfcc33
    const char* word(const char* src) {
Packit bfcc33
      return sequence <
Packit bfcc33
               exactly < str >,
Packit bfcc33
               word_boundary
Packit bfcc33
             >(src);
Packit bfcc33
    }
Packit bfcc33
Packit bfcc33
    template <char chr>
Packit bfcc33
    const char* loosely(const char* src) {
Packit bfcc33
      return sequence <
Packit bfcc33
               optional_spaces,
Packit bfcc33
               exactly < chr >
Packit bfcc33
             >(src);
Packit bfcc33
    }
Packit bfcc33
    template <const char* str>
Packit bfcc33
    const char* loosely(const char* src) {
Packit bfcc33
      return sequence <
Packit bfcc33
               optional_spaces,
Packit bfcc33
               exactly < str >
Packit bfcc33
             >(src);
Packit bfcc33
    }
Packit bfcc33
Packit bfcc33
  }
Packit bfcc33
}
Packit bfcc33
Packit bfcc33
#endif