2016-05-25 15:53:13 +02:00
|
|
|
#!/usr/bin/env python
|
2016-03-10 18:22:27 +01:00
|
|
|
from __future__ import absolute_import
|
2016-07-08 22:25:20 +02:00
|
|
|
from __future__ import print_function
|
2016-07-08 22:40:24 +02:00
|
|
|
import optparse
|
2013-10-25 23:46:02 +02:00
|
|
|
import os
|
|
|
|
import sys
|
2013-11-08 22:45:20 +01:00
|
|
|
import subprocess
|
2016-03-10 18:22:27 +01:00
|
|
|
from six.moves import filter
|
2016-03-10 18:39:37 +01:00
|
|
|
from six.moves import map
|
2016-03-10 18:43:31 +01:00
|
|
|
from six.moves import range
|
2016-07-08 22:25:20 +02:00
|
|
|
try:
|
|
|
|
import lister
|
2016-07-24 15:24:48 +02:00
|
|
|
from typing import cast, Callable, Dict, Iterable, List
|
2016-07-08 22:25:20 +02:00
|
|
|
except ImportError as e:
|
|
|
|
print("ImportError: {}".format(e))
|
|
|
|
print("You need to run the Zulip linters inside a Zulip dev environment.")
|
|
|
|
print("If you are using Vagrant, you can `vagrant ssh` to enter the Vagrant guest.")
|
|
|
|
sys.exit(1)
|
2013-10-25 23:46:02 +02:00
|
|
|
|
2016-08-01 19:33:23 +02:00
|
|
|
class TokenizerState(object):
    """Mutable scan position shared by the tokenizer's helper closures."""

    def __init__(self):
        # type: () -> None
        # `i` starts at offset 0; `line` and `col` both start counting at 1.
        self.i, self.line, self.col = 0, 1, 1
|
2013-10-08 14:31:16 +02:00
|
|
|
|
2016-08-01 19:33:23 +02:00
|
|
|
class Token(object):
    """Plain record describing one tag found in a template.

    Attributes:
        kind: category label for the tag.
        s: the raw tag text.
        tag: the tag's name.
        line, col: position recorded for the tag.
    """

    def __init__(self, kind, s, tag, line, col):
        # Store the constructor arguments verbatim; no validation is done.
        self.kind, self.s, self.tag = kind, s, tag
        self.line, self.col = line, col
|
2013-10-08 14:31:16 +02:00
|
|
|
|
2016-08-01 19:33:23 +02:00
|
|
|
def tokenize(text):
    # type: (str) -> List[Token]
    """Scan `text` and return a Token for every template tag found.

    Six kinds of tags are recognized, tested in this order: HTML start
    (`<...>`), HTML end (`</...>`), Handlebars start (`{{#...}}` or
    `{{^...}}`), Handlebars end (`{{/...}}`), Django start (`{% ... %}`)
    and Django end (`{% end... %}`).  All other characters are skipped.

    Each token records the raw tag text, the tag name, and the 1-based
    line/column at which the tag begins.

    Raises whatever the get_*_tag helpers raise for an unterminated tag.
    """
    def advance(n):
        # type: (int) -> None
        # Consume n characters, keeping line/col in sync with the offset.
        for _ in range(n):
            consumed = text[state.i]
            state.i += 1
            if consumed == '\n':
                state.line += 1
                state.col = 1
            else:
                state.col += 1

    def looking_at(s):
        # type: (str) -> bool
        return text[state.i:state.i+len(s)] == s

    def looking_at_html_start():
        # type: () -> bool
        return looking_at("<") and not looking_at("</")

    def looking_at_html_end():
        # type: () -> bool
        return looking_at("</")

    def looking_at_handlebars_start():
        # type: () -> bool
        return looking_at("{{#") or looking_at("{{^")

    def looking_at_handlebars_end():
        # type: () -> bool
        return looking_at("{{/")

    def looking_at_django_start():
        # type: () -> bool
        return looking_at("{% ") and not looking_at("{% end")

    def looking_at_django_end():
        # type: () -> bool
        return looking_at("{% end")

    def tag_name(body):
        # type: (str) -> str
        # The name is the first whitespace-delimited word of the tag body.
        # An empty body yields '' instead of an IndexError, so the problem
        # is reported later with file/line context rather than crashing here.
        words = body.split()
        return words[0] if words else ''

    state = TokenizerState()
    tokens = []

    while state.i < len(text):
        if looking_at_html_start():
            s = get_html_tag(text, state.i)
            tag = tag_name(s[1:-1])
            kind = 'html_start'
        elif looking_at_html_end():
            s = get_html_tag(text, state.i)
            # Tolerate whitespace before '>' (e.g. '</div >').
            tag = tag_name(s[2:-1])
            kind = 'html_end'
        elif looking_at_handlebars_start():
            s = get_handlebars_tag(text, state.i)
            tag = tag_name(s[3:-2])
            kind = 'handlebars_start'
        elif looking_at_handlebars_end():
            s = get_handlebars_tag(text, state.i)
            # Tolerate padding inside the braces (e.g. '{{/if }}').
            tag = tag_name(s[3:-2])
            kind = 'handlebars_end'
        elif looking_at_django_start():
            s = get_django_tag(text, state.i)
            tag = tag_name(s[3:-2])
            kind = 'django_start'
        elif looking_at_django_end():
            s = get_django_tag(text, state.i)
            # Skip the '{% end' prefix and keep only the first word, so that
            # '{% endblock content %}' and '{% endif%}' both yield the name
            # of the tag being closed ('block' / 'if').
            tag = tag_name(s[6:-2])
            kind = 'django_end'
        else:
            advance(1)
            continue

        # Record the position *before* consuming the tag, so line/col point
        # at the tag's first character.
        token = Token(
            kind=kind,
            s=s,
            tag=tag,
            line=state.line,
            col=state.col,
        )
        tokens.append(token)
        advance(len(s))

    return tokens
|
|
|
|
|
|
|
|
def validate(fn, check_indent=True):
    # type: (str, bool) -> None
    """Check that the start and end tags in template file `fn` are balanced.

    The file is tokenized and its tags are matched like a stack: each start
    tag installs a matcher that the next end tag must satisfy.

    Args:
        fn: path of the template file to check.
        check_indent: when true, an end tag that is more than one line below
            its start tag must begin in the same column as the start tag.

    Raises:
        Exception: on an end tag with no open start tag, a mismatched
            start/end pair, bad indentation (if enabled), or a start tag
            that is still open at end of file.
    """
    # Close the file deterministically instead of leaking the handle until
    # garbage collection.
    with open(fn) as template_file:
        text = template_file.read()
    tokens = tokenize(text)

    class State(object):
        def __init__(self, func):
            # type: (Callable[[Token], None]) -> None
            self.depth = 0
            self.matcher = func

    def no_start_tag(token):
        # type: (Token) -> None
        # Bottom-of-stack matcher: any end tag reaching it is unmatched.
        raise Exception('''
            No start tag
            fn: %s
            end tag:
                %s
                line %d, col %d
            ''' % (fn, token.tag, token.line, token.col))

    state = State(no_start_tag)

    def start_tag_matcher(start_token):
        # type: (Token) -> None
        # "Push": remember the current matcher and install one that expects
        # the end tag corresponding to start_token.
        state.depth += 1
        start_tag = start_token.tag
        start_line = start_token.line
        start_col = start_token.col

        old_matcher = state.matcher

        def f(end_token):
            # type: (Token) -> None

            end_tag = end_token.tag
            end_line = end_token.line
            end_col = end_token.col

            problem = None
            if start_tag != end_tag:
                problem = 'Mismatched tag.'
            elif check_indent and end_line > start_line + 1 and end_col != start_col:
                problem = 'Bad indentation.'
            if problem:
                raise Exception('''
                    fn: %s
                    %s
                    start:
                        %s
                        line %d, col %d
                    end tag:
                        %s
                        line %d, col %d
                    ''' % (fn, problem, start_token.s, start_line, start_col, end_tag, end_line, end_col))
            # "Pop": restore whatever matcher was active before this tag.
            state.matcher = old_matcher
            state.depth -= 1
        state.matcher = f

    for token in tokens:
        kind = token.kind
        tag = token.tag
        s = token.s

        if kind == 'html_start':
            # Comments, self-closing tags and similar never get an end tag.
            if not is_special_html_tag(s, tag):
                start_tag_matcher(token)
        elif kind == 'html_end':
            state.matcher(token)

        elif kind == 'handlebars_start':
            start_tag_matcher(token)
        elif kind == 'handlebars_end':
            state.matcher(token)

        elif kind == 'django_start':
            # Only block tags have a corresponding {% end... %} tag.
            if is_django_block_tag(tag):
                start_tag_matcher(token)
        elif kind == 'django_end':
            state.matcher(token)

    null_token = Token(
        kind=None,
        s='(NO TAG)',
        tag='NO TAG',
        line=0,
        col=0,
    )

    # A non-zero depth means a start tag was never closed; feeding the
    # placeholder token to the pending matcher makes it report the problem.
    if state.depth != 0:
        state.matcher(null_token)
|
|
|
|
|
|
|
|
def is_special_html_tag(s, tag):
    # type: (str, str) -> bool
    """Return True if the HTML tag should not be paired with an end tag.

    `s` is the raw tag text and `tag` is its name.  A tag is special when
    it opens a comment, is self-closing, or is named link/meta/!DOCTYPE.
    """
    if s.startswith('<!--'):
        return True
    if s.endswith('/>'):
        return True
    unpaired_names = ['link', 'meta', '!DOCTYPE']
    return tag in unpaired_names
|
2013-10-08 14:31:16 +02:00
|
|
|
|
2014-02-27 22:59:36 +01:00
|
|
|
def is_django_block_tag(tag):
    # type: (str) -> bool
    """Return True if `tag` names a template tag that is closed by an
    `{% end... %}` tag, according to the fixed list below."""
    block_tag_names = (
        'autoescape',
        'block',
        'comment',
        'for',
        'if',
        'ifequal',
        'verbatim',
        'blocktrans',
        'trans',
        'raw',
    )
    return tag in block_tag_names
|
|
|
|
|
2014-02-27 17:21:36 +01:00
|
|
|
def get_handlebars_tag(text, i):
    # type: (str, int) -> str
    """Return the Handlebars tag that starts at offset `i` of `text`.

    The tag runs from `i` through the first '}' found at or after `i + 2`,
    and that '}' must be immediately followed by a second '}'.

    Raises:
        Exception: ('Tag missing }}') if no such terminator exists,
            including when the text ends right after a single '}'.
    """
    end = text.find('}', i + 2)
    # Compare a two-character slice rather than indexing text[end + 1]:
    # slicing cannot run past the end of the text, so a truncated tag gets
    # the intended error instead of an IndexError.
    if end == -1 or text[end:end + 2] != '}}':
        raise Exception('Tag missing }}')
    return text[i:end + 2]
|
|
|
|
|
2014-02-27 22:59:36 +01:00
|
|
|
def get_django_tag(text, i):
    # type: (str, int) -> str
    """Return the Django tag that starts at offset `i` of `text`.

    The tag runs from `i` through the first '%' found at or after `i + 2`,
    and that '%' must be immediately followed by '}'.

    Raises:
        Exception: ('Tag missing %}') if no such terminator exists,
            including when the text ends right after a lone '%'.
    """
    end = text.find('%', i + 2)
    # Compare a two-character slice rather than indexing text[end + 1]:
    # slicing cannot run past the end of the text, so a truncated tag gets
    # the intended error instead of an IndexError.
    if end == -1 or text[end:end + 2] != '%}':
        raise Exception('Tag missing %}')
    return text[i:end + 2]
|
|
|
|
|
2014-02-27 16:50:18 +01:00
|
|
|
def get_html_tag(text, i):
    # type: (str, int) -> str
    """Return the HTML tag that starts at offset `i` of `text`.

    The tag ends at the first '>' that is not inside a double-quoted
    section, so a '>' within an attribute value does not end the tag.

    Raises:
        Exception: ('Tag missing >') if the text ends before such a '>'.
    """
    inside_quotes = False
    pos = i + 1
    while pos < len(text):
        ch = text[pos]
        if ch == '>' and not inside_quotes:
            break
        if ch == '"':
            # Each double quote toggles between inside and outside a value.
            inside_quotes = not inside_quotes
        pos += 1
    if pos == len(text) or text[pos] != '>':
        raise Exception('Tag missing >')
    return text[i:pos + 1]
|
|
|
|
|
2014-02-27 16:41:47 +01:00
|
|
|
def check_our_files():
    # type: () -> None
    """Parse the command line, list the template files, and check them.

    Accepts `--modified` / `-m`; its value is forwarded to the file lister
    as `modified_only` and to both template checkers.
    """
    option_parser = optparse.OptionParser()
    option_parser.add_option(
        '--modified', '-m',
        action='store_true',
        default=False,
        help='Only check modified files')
    options, _ = option_parser.parse_args()

    listed = lister.list_files(
        modified_only=options.modified,
        ftypes=['handlebars', 'html'],
        group_by_ftype=True)
    files_by_type = cast(Dict[str, List[str]], listed)

    check_handlebar_templates(files_by_type['handlebars'], options.modified)
    check_html_templates(files_by_type['html'], options.modified)
|
2013-11-18 22:57:55 +01:00
|
|
|
|
2016-07-08 22:40:24 +02:00
|
|
|
def check_handlebar_templates(templates, modified_only):
    # type: (Iterable[str], bool) -> None
    """Validate every `.handlebars` file in `templates`, with indent checks.

    Paths without the `.handlebars` suffix are ignored.  Unless
    `modified_only` is set, at least 10 files must remain.
    """
    handlebars_files = []
    for path in templates:
        if path.endswith('.handlebars'):
            handlebars_files.append(path)

    # sanity check that we are actually doing work
    assert modified_only or len(handlebars_files) >= 10

    for path in handlebars_files:
        validate(path, check_indent=True)
|
|
|
|
|
2016-07-09 02:43:32 +02:00
|
|
|
def check_html_templates(templates, modified_only):
    # type: (Iterable[str], bool) -> None
    """Validate the `.html` templates in `templates`, in sorted order.

    Paths containing 'base.html' or 'casperjs' are skipped.  Unless
    `modified_only` is set, at least 10 files must remain.  Indentation is
    checked for every file except those listed in `bad_files`.
    """
    # Our files with .html extensions are usually for Django, but we also
    # have a few static .html files.
    # The file base.html has a bit of funny HTML that we can't parse here yet.
    #
    # We also have .html files that we vendored from Casper.
    # The casperjs files use HTML5 (whereas Zulip prefers XHTML), and
    # there are also cases where Casper deliberately uses invalid HTML,
    # so we exclude them from our linter.
    templates = sorted(
        fn for fn in templates
        if ('base.html' not in fn) and ('casperjs' not in fn))

    if not modified_only:
        assert len(templates) >= 10 # sanity check that we are actually doing work

    # Many of our Django templates have strange indentation.  The
    # indentation errors are often harmless, even stylistically
    # harmless, but they tend to be in files that might be old
    # and might eventually require more scrutiny for things like
    # localization.  See github #1236.
    #
    # Built once, outside the loop, as a frozenset: the collection does not
    # depend on the file being checked and is only used for membership tests.
    bad_files = frozenset([
        'static/html/5xx.html',
        'templates/500.html',
        'templates/confirmation/confirm.html',
        'templates/corporate/mit.html',
        'templates/corporate/privacy.html',
        'templates/corporate/terms-enterprise.html',
        'templates/corporate/zephyr-mirror.html',
        'templates/corporate/zephyr.html',
        'templates/zerver/accounts_home.html',
        'templates/zerver/accounts_send_confirm.html',
        'templates/zerver/api.html',
        'templates/zerver/api_endpoints.html',
        'templates/zerver/apps.html',
        'templates/zerver/create_realm.html',
        'templates/zerver/emails/followup/day1.html',
        'templates/zerver/emails/followup/day2.html',
        'templates/zerver/features.html',
        'templates/zerver/hello.html',
        'templates/zerver/home.html',
        'templates/zerver/integrations.html',
        'templates/zerver/invite_user.html',
        'templates/zerver/left-sidebar.html',
        'templates/zerver/login.html',
        'templates/zerver/markdown_help.html',
        'templates/zerver/register.html',
        'templates/zerver/right-sidebar.html',
        'templates/zerver/search_operators.html',
    ])

    for fn in templates:
        validate(fn, check_indent=(fn not in bad_files))
|
2014-02-27 16:41:47 +01:00
|
|
|
|
|
|
|
if __name__ == '__main__':
    # Run the template checks only when this file is executed as a script.
    check_our_files()
|