2017-02-15 05:39:42 +01:00
|
|
|
|
2017-03-03 19:01:52 +01:00
|
|
|
from typing import Any, Dict, List
|
2017-02-15 05:39:42 +01:00
|
|
|
|
|
|
|
from .template_parser import (
|
|
|
|
tokenize,
|
2017-02-23 18:12:52 +01:00
|
|
|
is_django_block_tag,
|
2017-02-15 05:39:42 +01:00
|
|
|
)
|
2017-05-24 08:46:44 +02:00
|
|
|
import subprocess
|
2017-02-15 05:39:42 +01:00
|
|
|
|
|
|
|
def pretty_print_html(html, num_spaces=4):
    # type: (str, int) -> str
    """Return ``html`` with the indentation of its lines normalized.

    The text is tokenized with ``tokenize`` and split on newlines.  While
    walking the tokens, a stack of "start" entries is maintained; when the
    matching end token arrives, a per-line offset is recorded for the lines
    the tag covers.  A positive offset means "prepend that many spaces", a
    negative one means "drop that many leading characters".  Finally the
    offsets are applied line by line.

    Args:
        html: The template text to re-indent.
        num_spaces: Number of spaces used for one level of depth.

    Returns:
        The re-indented text, joined with ``'\\n'``.  Lines consisting only
        of whitespace are emitted as empty strings.

    Raises:
        AssertionError: If applying a negative offset would remove
            non-whitespace characters from a line.
    """
    # We use 1-based indexing for both rows and columns.
    tokens = tokenize(html)
    lines = html.split('\n')

    # We will keep a stack of "start" tags so that we know
    # when HTML ranges end.  Note that some start tags won't
    # be blocks from an indentation standpoint.
    stack = []  # type: List[Dict[str, Any]]

    # Seed our stack with a pseudo entry to make depth calculations
    # easier.
    info = dict(
        block=False,
        depth=-1,
        line=-1,
        token_kind='html_start',
        tag='html',
        extra_indent=0,
        ignore_lines=[])  # type: Dict[str, Any]
    stack.append(info)

    # Our main job is to figure out offsets that we use to nudge lines
    # over by.
    offsets = {}  # type: Dict[int, int]

    # Loop through our start/end tokens, and calculate offsets.  As
    # we proceed, we will push/pop info dictionaries on/off a stack.
    for token in tokens:

        # Start tokens are ignored entirely while the innermost open tag
        # is a <pre>.
        if token.kind in ('html_start', 'handlebars_start', 'handlebars_singleton',
                          'html_singleton', 'django_start') and stack[-1]['tag'] != 'pre':
            # An HTML start tag should only cause a new indent if we
            # are on a new line.
            #
            # The listed tags, and django_start tokens for which
            # is_django_block_tag() is false, push nothing onto the stack.
            if (token.tag not in ('extends', 'include', 'else', 'elif') and
                    (is_django_block_tag(token.tag) or
                     token.kind != 'django_start')):
                is_block = token.line > stack[-1]['line']

                if is_block:
                    # A handlebars/django start nested directly inside a
                    # start of the same kind that is not yet indenting:
                    # bump the parent's depth and mark it as indenting.
                    #
                    # NOTE(review): entries pushed by the non-block branch
                    # below carry no 'indenting' key, so this lookup would
                    # raise KeyError if such an entry is on top of the
                    # stack here -- confirm whether that can occur.
                    if (((token.kind == 'handlebars_start' and
                          stack[-1]['token_kind'] == 'handlebars_start') or
                         (token.kind == 'django_start' and
                          stack[-1]['token_kind'] == 'django_start')) and
                            not stack[-1]['indenting']):
                        info = stack.pop()
                        info['depth'] = info['depth'] + 1
                        info['indenting'] = True
                        info['adjust_offset_until'] = token.line
                        stack.append(info)
                    new_depth = stack[-1]['depth'] + 1
                    extra_indent = stack[-1]['extra_indent']
                    line = lines[token.line - 1]
                    # 1-based column of the first non-whitespace character.
                    adjustment = len(line)-len(line.lstrip()) + 1
                    # Difference between the desired and the current
                    # starting column of this line.
                    offset = (1 + extra_indent + new_depth * num_spaces) - adjustment
                    info = dict(
                        block=True,
                        depth=new_depth,
                        actual_depth=new_depth,
                        line=token.line,
                        tag=token.tag,
                        token_kind=token.kind,
                        line_span=token.line_span,
                        offset=offset,
                        extra_indent=token.col - adjustment + extra_indent,
                        extra_indent_prev=extra_indent,
                        adjustment=adjustment,
                        indenting=True,
                        adjust_offset_until=token.line,
                        ignore_lines=[]
                    )
                    # Template block starts do not add a level of depth by
                    # themselves; 'actual_depth' keeps the unreduced value.
                    if token.kind in ('handlebars_start', 'django_start'):
                        info.update(dict(depth=new_depth - 1, indenting=False))
                else:
                    # Same line as the enclosing start tag: inherit its
                    # depth and extra indent, and record no offsets later.
                    info = dict(
                        block=False,
                        depth=stack[-1]['depth'],
                        actual_depth=stack[-1]['depth'],
                        line=token.line,
                        tag=token.tag,
                        token_kind=token.kind,
                        extra_indent=stack[-1]['extra_indent'],
                        ignore_lines=[]
                    )
                stack.append(info)
        # Inside a <pre>, only the closing 'pre' token is processed.
        elif (token.kind in ('html_end', 'handlebars_end', 'html_singleton_end',
                             'django_end', 'handlebars_singleton_end') and
                (stack[-1]['tag'] != 'pre' or token.tag == 'pre')):
            info = stack.pop()
            if info['block']:
                # We are at the end of an indentation block.  We
                # assume the whole block was formatted ok before, just
                # possibly at an indentation that we don't like, so we
                # nudge over all lines in the block by the same offset.
                start_line = info['line']
                end_line = token.line
                if token.tag == 'pre':
                    # Leave the <pre> boundary lines untouched and tell the
                    # enclosing entry to skip them in later adjustments.
                    offsets[start_line] = 0
                    offsets[end_line] = 0
                    stack[-1]['ignore_lines'].append(start_line)
                    stack[-1]['ignore_lines'].append(end_line)
                else:
                    offsets[start_line] = info['offset']
                    line = lines[token.line - 1]
                    adjustment = len(line)-len(line.lstrip()) + 1
                    if adjustment == token.col and token.kind != 'html_singleton_end':
                        # The end token is the first thing on its line.
                        offsets[end_line] = (info['offset'] +
                                             info['adjustment'] -
                                             adjustment +
                                             info['extra_indent'] -
                                             info['extra_indent_prev'])
                    elif (start_line + info['line_span'] - 1 == end_line and
                            info['line_span'] > 1):
                        # The end token sits on the last line spanned by a
                        # multi-line start tag.
                        offsets[end_line] = (1 + info['extra_indent'] +
                                             (info['depth'] + 1) * num_spaces) - adjustment
                        # We would like singleton tags and tags which spread over
                        # multiple lines to have 2 space indentation.
                        offsets[end_line] -= 2
                    elif token.line != info['line']:
                        offsets[end_line] = info['offset']
                if token.tag != 'pre' and token.tag != 'script':
                    for line_num in range(start_line + 1, end_line):
                        # Be careful not to override offsets that happened
                        # deeper in the HTML within our block.
                        if line_num not in offsets:
                            line = lines[line_num - 1]
                            new_depth = info['depth'] + 1
                            # else/elif lines use the opening tag's
                            # 'actual_depth' rather than the body depth.
                            if line.lstrip().startswith(('{{else}}', '{% else %}', '{% elif')):
                                new_depth = info['actual_depth']
                            extra_indent = info['extra_indent']
                            adjustment = len(line)-len(line.lstrip()) + 1
                            offset = (1 + extra_indent + new_depth * num_spaces) - adjustment
                            if line_num <= start_line + info['line_span'] - 1:
                                # We would like singleton tags and tags which spread over
                                # multiple lines to have 2 space indentation.
                                offset -= 2
                            offsets[line_num] = offset
                        elif (token.kind in ('handlebars_end', 'django_end') and
                                info['indenting'] and
                                line_num < info['adjust_offset_until'] and
                                line_num not in info['ignore_lines']):
                            # The entry was switched to indenting after
                            # these lines already received an offset, so
                            # push them one more level.
                            offsets[line_num] += num_spaces
                elif token.tag != 'pre':
                    # 'script' contents: shift every line by the same
                    # amount as the opening tag.
                    for line_num in range(start_line + 1, end_line):
                        if line_num not in offsets:
                            offsets[line_num] = info['offset']
                else:
                    # 'pre' contents: keep lines as they are and have the
                    # enclosing entry ignore them.
                    for line_num in range(start_line + 1, end_line):
                        if line_num not in offsets:
                            offsets[line_num] = 0
                            stack[-1]['ignore_lines'].append(line_num)

    # Now that we have all of our offsets calculated, we can just
    # join all our lines together, fixing up offsets as needed.
    formatted_lines = []
    for row, line in enumerate(lines, start=1):
        offset = offsets.get(row, 0)
        pretty_line = line
        if line.strip() == '':
            pretty_line = ''
        else:
            if offset > 0:
                pretty_line = (' ' * offset) + pretty_line
            elif offset < 0:
                pretty_line = pretty_line[-1 * offset:]
                # Dropping leading characters must only ever remove
                # whitespace.
                assert line.strip() == pretty_line.strip()
        formatted_lines.append(pretty_line)

    return '\n'.join(formatted_lines)
|
2017-03-12 22:24:26 +01:00
|
|
|
|
|
|
|
|
|
|
|
def validate_indent_html(fn):
    # type: (str) -> int
    """Check that the file ``fn`` is already indented as pretty_print_html wants.

    The file is read and passed through ``pretty_print_html``.  If the
    result differs from the file's contents, a message is printed and
    ``diff fn -`` is run with the re-indented text on its standard input,
    so the difference is shown to the user.

    Args:
        fn: Path of the file to check.

    Returns:
        0 if the file's indentation differs from the pretty-printed
        version, 1 if it matches.
    """
    # The context manager closes the file even if reading raises.
    with open(fn) as file:
        html = file.read()
    phtml = pretty_print_html(html)
    if not html.split('\n') == phtml.split('\n'):
        # flush=True so the message is written before the diff subprocess
        # produces its own output.
        print('Invalid Indentation detected in file: '
              '%s\nDiff for the file against expected indented file:' % (fn), flush=True)
        # stdout is not redirected, so the child writes to the parent's
        # stdout; its stderr is merged into that stream.
        with subprocess.Popen(
                ['diff', fn, '-'],
                stdin=subprocess.PIPE,
                stderr=subprocess.STDOUT,
                universal_newlines=True) as p:
            p.communicate(phtml)
        return 0
    return 1
|