Add tools/check-css and tools/lib/css_parser.py.

`tools/lint-all` now calls the new `tools/check-css` The css_parser library parsers CSS into a data structure that remembers line numbers and columns of semantically meaningful tokens and adjoining white space/tokens. It is intended to be used for various linting tasks. The file `tools/check-css` runs a few files through the parser and makes sure they round trip. This has some value right away, as files that fail to parse will cause an exception to be thrown and thus alert developers to syntax errors. We expect to grow this into more advanced linting tasks eventually.
2025-10-24 08:33:43 +00:00 · 2016-07-31 10:37:20 -07:00
parent b82836a901
commit 3b5c187f55
3 changed files with 552 additions and 0 deletions
--- a/tools/check-css
+++ b/tools/check-css
@@ -0,0 +1,40 @@
+#!/usr/bin/env python
+from __future__ import absolute_import
+from __future__ import print_function
+from lib.css_parser import parse, CssParserException
+import os
+import sys
+import glob
+
+try:
+    import lister
+    from typing import cast, Callable, Dict, Iterable, List
+except ImportError as e:
+    print("ImportError: {}".format(e))
+    print("You need to run the Zulip linters inside a Zulip dev environment.")
+    print("If you are using Vagrant, you can `vagrant ssh` to enter the Vagrant guest.")
+    sys.exit(1)
+
+def validate(fn):
+    # type: (str) -> None
+    text = open(fn).read()
+    section_list = parse(text)
+    if text != section_list.text():
+        print('BOO! %s broken' % (fn,))
+        open('foo.txt', 'w').write(section_list.text())
+        os.system('diff %s foo.txt' % (fn,))
+        sys.exit(1)
+
+def check_our_files():
+    # type: () -> None
+    fns = glob.glob('static/styles/*.css')
+    for fn in fns:
+        try:
+            validate(fn)
+        except CssParserException as e:
+            print('CssParserException raised while parsing file %s' % (fn,))
+            print(e)
+            sys.exit(1)
+
+if __name__ == '__main__':
+    check_our_files()
--- a/tools/lib/css_parser.py
+++ b/tools/lib/css_parser.py
@@ -0,0 +1,506 @@
+from __future__ import absolute_import
+from __future__ import print_function
+from six.moves import range
+from typing import Callable, List, Tuple, Union
+
+####### Helpers
+
+class Token(object):
+    def __init__(self, s, line, col):
+        # type: (str, int, int) -> None
+        self.s = s
+        self.line = line
+        self.col = col
+
+class CssParserException(Exception):
+    # TODO: Have callers pass in line numbers.
+    pass
+
+def find_end_brace(tokens, i):
+    # type: (List[Token], int) -> int
+    depth = 0
+    while i < len(tokens):
+        s = tokens[i].s
+        if s == '{':
+            depth += 1
+        elif s == '}':
+            if depth == 0:
+                for t in tokens[i-5:i]: print(repr(t.s))
+                raise CssParserException('unexpected }')
+            elif depth == 1:
+                break
+            depth -= 1
+        i += 1
+    return i
+
+def get_whitespace_and_comments(tokens, i, line=None):
+    # type: (List[Token], int, int) -> Tuple[int, str]
+
+    def is_fluff_token(token):
+        # type: (Token) -> bool
+        s = token.s
+        if ws(s[0]):
+            return True
+        elif s.startswith('/*'):
+            # For CSS comments, the caller may pass in a line
+            # number to indicate that they only want to get
+            # comments on the same line.  (Subsequent comments
+            # will be attached to the next actual line of code.)
+            if line is None:
+                return True
+            if tokens[i].line == line:
+                return True
+        return False
+
+    text = ''
+    while (i < len(tokens)) and is_fluff_token(tokens[i]):
+        s = tokens[i].s
+        text += s
+        i += 1
+
+    return i, text
+
+
+############### Begin parsing here
+
+
+def parse_sections(tokens):
+    # type: (List[Token]) -> CssSectionList
+    i = 0
+    sections = []
+    while i < len(tokens):
+        start, pre_fluff = get_whitespace_and_comments(tokens, i)
+
+        i = find_end_brace(tokens, start)
+
+        section_tokens = tokens[start:i+1]
+        i, post_fluff = get_whitespace_and_comments(tokens, i+1)
+
+        if section_tokens:
+            section = parse_section(
+                tokens=section_tokens,
+                pre_fluff=pre_fluff,
+                post_fluff=post_fluff
+            )
+            sections.append(section)
+        else:
+            raise CssParserException('unexpected empty section')
+
+    section_list = CssSectionList(
+        tokens=tokens,
+        sections=sections,
+    )
+    return section_list
+
+def parse_section(tokens, pre_fluff, post_fluff):
+    # type: (List[Token], str, str) -> Union[CssNestedSection, CssSection]
+    assert not ws(tokens[0].s)
+    if tokens[-1].s != '}': # caller should strip trailing fluff
+        # for t in tokens: print(repr(t.s))
+        raise CssParserException('found extraneous stuff at the end of a section')
+
+    first_token = tokens[0].s
+    if first_token in ('@media', '@keyframes') or first_token.startswith('@-'):
+        i, selector_list = parse_selectors_section(tokens) # not technically selectors
+        body_tokens = tokens[i+1:-1]
+        section_list = parse_sections(body_tokens)
+        nested_section = CssNestedSection(
+            tokens=tokens,
+            selector_list=selector_list,
+            section_list=section_list,
+            pre_fluff=pre_fluff,
+            post_fluff=post_fluff,
+        )
+        return nested_section
+    else:
+        i, selector_list = parse_selectors_section(tokens)
+        declaration_block = parse_declaration_block(tokens[i:])
+        section = CssSection(
+            tokens=tokens,
+            selector_list=selector_list,
+            declaration_block=declaration_block,
+            pre_fluff=pre_fluff,
+            post_fluff=post_fluff,
+        )
+        return section
+
+def parse_selectors_section(tokens):
+    # type: (List[Token]) -> Tuple[int, CssSelectorList]
+    start, pre_fluff = get_whitespace_and_comments(tokens, 0)
+    assert pre_fluff == ''
+    i = start
+    text = ''
+    while i < len(tokens) and tokens[i].s != '{' :
+        s = tokens[i].s
+        text += s
+        i += 1
+    selector_list = parse_selectors(tokens[start:i])
+    return i, selector_list
+
+def parse_selectors(tokens):
+    # type: (List[Token]) -> CssSelectorList
+    i = 0
+    start = i
+    selectors = []
+    while i < len(tokens):
+        s = tokens[i].s
+        if s == ',':
+            selector = parse_selector(tokens[start:i])
+            selectors.append(selector)
+            i += 1
+            start = i
+        if s.startswith('/*'):
+            raise CssParserException('Comments in selector section are not allowed')
+        i += 1
+    selector = parse_selector(tokens[start:i])
+    selectors.append(selector)
+    selector_list = CssSelectorList(
+        tokens=tokens,
+        selectors=selectors,
+    )
+    return selector_list
+
+def parse_selector(tokens):
+    # type: (List[Token]) -> CssSelector
+    i, pre_fluff = get_whitespace_and_comments(tokens, 0)
+    levels = []
+    last_i = None
+    while i < len(tokens):
+        token = tokens[i]
+        i += 1
+        if not ws(token.s[0]):
+            last_i = i
+            levels.append(token)
+
+    if last_i is None:
+        print([repr(t.s) for t in tokens])
+
+    assert last_i is not None
+    start, post_fluff = get_whitespace_and_comments(tokens, last_i)
+    selector = CssSelector(
+        tokens=tokens,
+        pre_fluff=pre_fluff,
+        post_fluff=post_fluff,
+        levels=levels,
+    )
+    return selector
+
+def parse_declaration_block(tokens):
+    # type: (List[Token]) -> CssDeclarationBlock
+    assert tokens[0].s == '{' # caller should strip leading fluff
+    assert tokens[-1].s == '}' # caller should strip trailing fluff
+    tokens = tokens[1:-1]
+    i = 0
+    declarations = []
+    while i < len(tokens):
+        start = i
+        i, _ = get_whitespace_and_comments(tokens, i)
+        while (i < len(tokens)) and (tokens[i].s != ';'):
+            i += 1
+        if i < len(tokens):
+            i, _ = get_whitespace_and_comments(tokens, i+1, line=tokens[i].line)
+        declaration = parse_declaration(tokens[start:i])
+        declarations.append(declaration)
+
+    declaration_block = CssDeclarationBlock(
+        tokens=tokens,
+        declarations=declarations,
+    )
+    return declaration_block
+
+def parse_declaration(tokens):
+    # type: (List[Token]) -> CssDeclaration
+    i, pre_fluff = get_whitespace_and_comments(tokens, 0)
+    css_property = tokens[i].s
+    if tokens[i+1].s != ':':
+        print(css_property)
+        for t in tokens: print(repr(t.s))
+        raise CssParserException('We expect a colon here')
+    i += 2
+    start = i
+    while (i < len(tokens)) and (tokens[i].s != ';'):
+        i += 1
+    css_value = parse_value(tokens[start:i])
+    semicolon = (i < len(tokens)) and (tokens[i].s == ';')
+    if semicolon:
+        i += 1
+    _, post_fluff = get_whitespace_and_comments(tokens, i)
+    declaration = CssDeclaration(
+        tokens=tokens,
+        pre_fluff=pre_fluff,
+        post_fluff=post_fluff,
+        css_property=css_property,
+        css_value=css_value,
+        semicolon=semicolon,
+    )
+    return declaration
+
+def parse_value(tokens):
+    # type: (List[Token]) -> CssValue
+    i, pre_fluff = get_whitespace_and_comments(tokens, 0)
+    value = tokens[i]
+    i, post_fluff = get_whitespace_and_comments(tokens, i+1)
+    return CssValue(
+        tokens=tokens,
+        value=value,
+        pre_fluff=pre_fluff,
+        post_fluff=post_fluff,
+    )
+
+
+#### Begin CSS classes here
+
+class CssSectionList(object):
+    def __init__(self, tokens, sections):
+        # type: (List[Token], List[Union[CssNestedSection, CssSection]]) -> None
+        self.tokens = tokens
+        self.sections = sections
+
+    def text(self):
+        # type: () -> str
+        res = ''.join(section.text() for section in self.sections)
+        return res
+
+class CssNestedSection(object):
+    def __init__(self, tokens, selector_list, section_list, pre_fluff, post_fluff):
+        # type: (List[Token], CssSelectorList, CssSectionList, str, str) -> None
+        self.tokens = tokens
+        self.selector_list = selector_list
+        self.section_list = section_list
+        self.pre_fluff = pre_fluff
+        self.post_fluff = post_fluff
+
+    def text(self):
+        # type: () -> str
+        res = ''
+        res += self.pre_fluff
+        res += self.selector_list.text()
+        res += '{'
+        res += self.section_list.text()
+        res += '}'
+        res += self.post_fluff
+        return res
+
+class CssSection(object):
+    def __init__(self, tokens, selector_list, declaration_block, pre_fluff, post_fluff):
+        # type: (List[Token], CssSelectorList, CssDeclarationBlock, str, str) -> None
+        self.tokens = tokens
+        self.selector_list = selector_list
+        self.declaration_block = declaration_block
+        self.pre_fluff = pre_fluff
+        self.post_fluff = post_fluff
+
+    def text(self):
+        # type: () -> str
+        res = ''
+        res += self.pre_fluff
+        res += self.selector_list.text()
+        res += self.declaration_block.text()
+        res += self.post_fluff
+        return res
+
+class CssSelectorList(object):
+    def __init__(self, tokens, selectors):
+        # type: (List[Token], List[CssSelector]) -> None
+        self.tokens = tokens
+        self.selectors = selectors
+
+    def text(self):
+        # type: () -> str
+        res = ','.join(sel.text() for sel in self.selectors)
+        return res
+
+class CssSelector(object):
+    def __init__(self, tokens, pre_fluff, post_fluff, levels):
+        # type: (List[Token],str, str, List[Token]) -> None
+        self.tokens = tokens
+        self.pre_fluff = pre_fluff
+        self.post_fluff = post_fluff
+        self.levels = levels
+
+    def text(self):
+        # type: () -> str
+        res = ''
+        res += self.pre_fluff
+        res += ' '.join(level.s for level in self.levels)
+        res += self.post_fluff
+        return res
+
+class CssDeclarationBlock(object):
+    def __init__(self, tokens, declarations):
+        # type: (List[Token], List[CssDeclaration]) -> None
+        self.tokens = tokens
+        self.declarations = declarations
+
+    def text(self):
+        # type: () -> str
+        res = '{'
+        for declaration in self.declarations:
+            res += declaration.text()
+        res += '}'
+        return res
+
+class CssDeclaration(object):
+    def __init__(self, tokens, pre_fluff, post_fluff, css_property, css_value, semicolon):
+        # type: (List[Token], str, str, str, CssValue, bool) -> None
+        self.tokens = tokens
+        self.pre_fluff = pre_fluff
+        self.post_fluff = post_fluff
+        self.css_property = css_property
+        self.css_value = css_value
+        self.semicolon = semicolon
+
+    def text(self):
+        # type: () -> str
+        res = ''
+        res += self.pre_fluff
+        res += self.css_property
+        res += ':'
+        res += self.css_value.text()
+        if self.semicolon:
+            res += ';'
+        res += self.post_fluff
+        return res
+
+class CssValue(object):
+    def __init__(self, tokens, value, pre_fluff, post_fluff):
+        # type: (List[Token], Token, str, str) -> None
+        self.value = value
+        self.pre_fluff = pre_fluff
+        self.post_fluff = post_fluff
+        assert pre_fluff.strip() == ''
+
+    def text(self):
+        # type: () -> str
+        return self.pre_fluff + self.value.s + self.post_fluff
+
+def parse(text):
+    # type: (str) -> CssSectionList
+    tokens = tokenize(text)
+    section_list = parse_sections(tokens=tokens)
+    return section_list
+
+#### Begin tokenizer section here
+
+def ws(c):
+    # type: (str) -> bool
+    return c in ' \t\n'
+
+def tokenize(text):
+    # type: (str) -> List[Token]
+
+    class State(object):
+        def __init__(self):
+            # type: () -> None
+            self.i = 0
+            self.line = 1
+            self.col = 1
+
+    tokens = []
+    state = State()
+
+    def add_token(s, state):
+        # type: (str, State) -> None
+        # deep copy data
+        token = Token(s=s, line=state.line, col=state.col)
+        tokens.append(token)
+
+    def legal(offset):
+        # type: (int) -> bool
+        return state.i + offset < len(text)
+
+    def advance(n):
+        # type: (int) -> None
+        for _ in range(n):
+            state.i += 1
+            if state.i >= 0 and text[state.i - 1] == '\n':
+                state.line += 1
+                state.col = 1
+            else:
+                state.col += 1
+
+    def looking_at(s):
+        # type: (str) -> bool
+        return text[state.i:state.i+len(s)] == s
+
+    def get_field(terminator):
+        # type: (Callable[[str], bool]) -> str
+        offset = 0
+        paren_level = 0
+        while legal(offset) and (paren_level or not terminator(text[state.i + offset])):
+            c = text[state.i + offset]
+            if c == '(':
+                paren_level += 1
+            elif c == ')':
+                paren_level -= 1
+            offset += 1
+        return text[state.i:state.i+offset]
+
+    in_property = False
+    in_value = False
+    in_media_line = False
+    starting_media_section = False
+    while state.i < len(text):
+        c = text[state.i]
+
+        if c in '{};:,':
+            if c == ':':
+                in_property = False
+                in_value = True
+            elif c == ';':
+                in_property = True
+                in_value = False
+            elif c in '{':
+                if starting_media_section:
+                    starting_media_section = False
+                else:
+                    in_property = True
+            elif c == '}':
+                in_property = False
+            s = c
+
+        elif ws(c):
+            terminator = lambda c: not ws(c)
+            s = get_field(terminator)
+
+        elif looking_at('/*'):
+            # hacky
+            old_i = state.i
+            while (state.i < len(text)) and not looking_at('*/'):
+                state.i += 1
+            if not looking_at('*/'):
+                raise CssParserException('unclosed comment')
+            s = text[old_i:state.i+2]
+            state.i = old_i
+
+        elif looking_at('@media'):
+            s = '@media'
+            in_media_line = True
+            starting_media_section = True
+
+        elif in_media_line:
+            in_media_line = False
+            terminator = lambda c: c == '{'
+            s = get_field(terminator)
+            s = s.rstrip()
+
+        elif in_property:
+            terminator = lambda c: ws(c) or c in ':{'
+            s = get_field(terminator)
+
+        elif in_value:
+            in_value = False
+            in_property = True
+            terminator = lambda c: c in ';}'
+            s = get_field(terminator)
+            s = s.rstrip()
+
+        else:
+            terminator = lambda c: ws(c) or c == ','
+            s = get_field(terminator)
+
+        add_token(s, state)
+        advance(len(s))
+
+    return tokens
+
--- a/tools/lint-all
+++ b/tools/lint-all
@@ -399,6 +399,12 @@ try:
        result = subprocess.call(args)
        return result

+    @lint
+    def css():
+        # type: () -> int
+        result = subprocess.call(['tools/check-css'])
+        return result
+
    @lint
    def jslint():
        # type: () -> int