summaryrefslogtreecommitdiffstats
path: root/src/css.l
diff options
context:
space:
mode:
Diffstat (limited to 'src/css.l')
-rw-r--r--src/css.l167
1 files changed, 167 insertions, 0 deletions
diff --git a/src/css.l b/src/css.l
new file mode 100644
index 0000000..d6c34f6
--- /dev/null
+++ b/src/css.l
@@ -0,0 +1,167 @@
+%option case-insensitive
+%option noyywrap
+%option never-interactive
+%option nounput
+
+%top{
+/* config.h must precede flex's inclusion of <stdio.h>
+ in order for its _GNU_SOURCE definition to take effect. */
+#include <config.h>
+}
+
+%{
+/* Lex source for CSS tokenizing.
+ Taken from http://www.w3.org/TR/CSS21/grammar.html#q2
+ Copyright (C) 2006, 2009-2011, 2015, 2018 Free Software Foundation,
+ Inc.
+
+This file is part of GNU Wget.
+
+GNU Wget is free software; you can redistribute it and/or modify
+it under the terms of the GNU General Public License as published by
+the Free Software Foundation; either version 3 of the License, or (at
+your option) any later version.
+
+GNU Wget is distributed in the hope that it will be useful,
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with Wget. If not, see <http://www.gnu.org/licenses/>.
+
+Additional permission under GNU GPL version 3 section 7
+
+If you modify this program, or any covered work, by linking or
+combining it with the OpenSSL project's OpenSSL library (or a
+modified version of that library), containing parts covered by the
+terms of the OpenSSL or SSLeay licenses, the Free Software Foundation
+grants you additional permission to convey the resulting work.
+Corresponding Source for a non-source form of such a combination
+shall include the source code for the parts of OpenSSL used as well
+as that of the covered work. */
+
+#define YY_NO_INPUT
+
+#include "css-tokens.h"
+
+#if defined __clang__ || __GNUC__ > 4 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 5)
+ #pragma GCC diagnostic ignored "-Wunknown-pragmas" // clang mourns about the next one
+ #pragma GCC diagnostic ignored "-Wunused-function"
+ #pragma GCC diagnostic ignored "-Wunused-macros"
+ #pragma GCC diagnostic ignored "-Wunused-parameter"
+ #pragma GCC diagnostic ignored "-Wsign-compare"
+ #pragma GCC diagnostic ignored "-Wswitch-default"
+ #pragma GCC diagnostic ignored "-Wunreachable-code" // clang
+ #pragma clang diagnostic ignored "-Wshorten-64-to-32"
+ #ifndef __clang__
+ #pragma GCC diagnostic ignored "-Wsuggest-attribute=pure"
+ #endif
+#endif
+
+%}
+
+h [0-9a-f]
+nonascii [\240-\377]
+unicode \\{h}{1,6}(\r\n|[ \t\r\n\f])?
+escape {unicode}|\\[^\r\n\f0-9a-f]
+nmstart [_a-z]|{nonascii}|{escape}
+nmchar [_a-z0-9-]|{nonascii}|{escape}
+string1 \"([^\n\r\f\\"]|\\{nl}|{escape})*\"
+string2 \'([^\n\r\f\\']|\\{nl}|{escape})*\'
+badstring1 \"([^\n\r\f\\"]|\\{nl}|{escape})*\\?
+badstring2 \'([^\n\r\f\\']|\\{nl}|{escape})*\\?
+badcomment1 \/\*[^*]*\*+([^/*][^*]*\*+)*
+badcomment2 \/\*[^*]*(\*+[^/*][^*]*)*
+baduri1 url\({w}([!#$%&*-\[\]-~]|{nonascii}|{escape})*{w}
+baduri2 url\({w}{string}{w}
+baduri3 url\({w}{badstring}
+comment \/\*[^*]*\*+([^/*][^*]*\*+)*\/
+ident -?{nmstart}{nmchar}*
+name {nmchar}+
+num [0-9]+|[0-9]*"."[0-9]+
+string {string1}|{string2}
+badstring {badstring1}|{badstring2}
+badcomment {badcomment1}|{badcomment2}
+baduri {baduri1}|{baduri2}|{baduri3}
+url ([!#$%&*-~]|{nonascii}|{escape})*
+s [ \t\r\n\f]+
+w {s}?
+nl \n|\r\n|\r|\f
+
+A a|\\0{0,4}(41|61)(\r\n|[ \t\r\n\f])?
+C c|\\0{0,4}(43|63)(\r\n|[ \t\r\n\f])?
+D d|\\0{0,4}(44|64)(\r\n|[ \t\r\n\f])?
+E e|\\0{0,4}(45|65)(\r\n|[ \t\r\n\f])?
+G g|\\0{0,4}(47|67)(\r\n|[ \t\r\n\f])?|\\g
+H h|\\0{0,4}(48|68)(\r\n|[ \t\r\n\f])?|\\h
+I i|\\0{0,4}(49|69)(\r\n|[ \t\r\n\f])?|\\i
+K k|\\0{0,4}(4b|6b)(\r\n|[ \t\r\n\f])?|\\k
+L l|\\0{0,4}(4c|6c)(\r\n|[ \t\r\n\f])?|\\l
+M m|\\0{0,4}(4d|6d)(\r\n|[ \t\r\n\f])?|\\m
+N n|\\0{0,4}(4e|6e)(\r\n|[ \t\r\n\f])?|\\n
+O o|\\0{0,4}(4f|6f)(\r\n|[ \t\r\n\f])?|\\o
+P p|\\0{0,4}(50|70)(\r\n|[ \t\r\n\f])?|\\p
+R r|\\0{0,4}(52|72)(\r\n|[ \t\r\n\f])?|\\r
+S s|\\0{0,4}(53|73)(\r\n|[ \t\r\n\f])?|\\s
+T t|\\0{0,4}(54|74)(\r\n|[ \t\r\n\f])?|\\t
+U u|\\0{0,4}(55|75)(\r\n|[ \t\r\n\f])?|\\u
+X x|\\0{0,4}(58|78)(\r\n|[ \t\r\n\f])?|\\x
+Z z|\\0{0,4}(5a|7a)(\r\n|[ \t\r\n\f])?|\\z
+
+%%
+
+{s} {return S;}
+
+{comment} {return COMMENT;}
+#\/\*[^*]*\*+([^/*][^*]*\*+)*\/ /* ignore comments */
+{badcomment} /* unclosed comment at EOF */
+
+"<!--" {return CDO;}
+"-->" {return CDC;}
+"~=" {return INCLUDES;}
+"|=" {return DASHMATCH;}
+
+{string} {return STRING;}
+{badstring} {return BAD_STRING;}
+
+{ident} {return IDENT;}
+
+"#"{name} {return HASH;}
+
+@{I}{M}{P}{O}{R}{T} {return IMPORT_SYM;}
+@{P}{A}{G}{E} {return PAGE_SYM;}
+@{M}{E}{D}{I}{A} {return MEDIA_SYM;}
+"@charset " {return CHARSET_SYM;}
+
+"!"({w}|{comment})*{I}{M}{P}{O}{R}{T}{A}{N}{T} {return IMPORTANT_SYM;}
+
+{num}{E}{M} {return EMS;}
+{num}{E}{X} {return EXS;}
+{num}{P}{X} {return LENGTH;}
+{num}{C}{M} {return LENGTH;}
+{num}{M}{M} {return LENGTH;}
+{num}{I}{N} {return LENGTH;}
+{num}{P}{T} {return LENGTH;}
+{num}{P}{C} {return LENGTH;}
+{num}{D}{E}{G} {return ANGLE;}
+{num}{R}{A}{D} {return ANGLE;}
+{num}{G}{R}{A}{D} {return ANGLE;}
+{num}{M}{S} {return TIME;}
+{num}{S} {return TIME;}
+{num}{H}{Z} {return FREQ;}
+{num}{K}{H}{Z} {return FREQ;}
+{num}{ident} {return DIMENSION;}
+
+{num}% {return PERCENTAGE;}
+{num} {return NUMBER;}
+
+"url("{w}{string}{w}")" {return URI;}
+"url("{w}{url}{w}")" {return URI;}
+{baduri} {return BAD_URI;}
+
+{ident}"(" {return FUNCTION;}
+
+. {return *yytext;}
+
+%%