# pmacs3/highlight2.py
# (288 lines, 10 KiB, Python)

import sys
import lex2
# Terminal colour table.
#
# color_list holds the escape sequences and color_names holds the matching
# names; the two lists are parallel (same length, same order):
#   index 0-7   -> '\033[3Nm'    (the eight base foreground colours)
#   index 8-15  -> '\033[3N;1m'  (the same eight with the bold/bright attribute)
#   index 16    -> '\033[0m'     (reset all attributes)
color_list = (
    ['\033[3%dm' % n for n in range(8)]
    + ['\033[3%d;1m' % n for n in range(8)]
    + ['\033[0m']
)

color_names = [
    'black', 'dred', 'dgreen', 'brown', 'dblue', 'dpurple', 'dcyan', 'lgrey',
    'dgrey', 'lred', 'lgreen', 'yellow', 'lblue', 'lpurple', 'lcyan', 'white',
    'unset',
]

# name -> escape sequence, built by pairing the two lists position by position
color_dict = dict(zip(color_names, color_list))
class Highlighter:
    """Keep a per-line table of lexer tokens and patch it as the text changes.

    ``self.tokens`` is a list with one entry per line; each entry is the list
    of tokens produced for that line.  ``self.line_contexts`` is a copy of the
    lexer's ``line_contexts`` taken by the last call to highlight().

    The lexer passed in must provide ``lex(lines, y, x)``, be iterable, offer
    a ``next()`` method raising StopIteration when exhausted, and expose a
    ``line_contexts`` mapping.  Tokens are expected to carry ``name``, ``y``,
    ``x`` and ``string`` attributes, an ``end_x()`` method, a ``copy()``
    method, and to support ``==``.
    """

    def __init__(self, lexer):
        """Remember the lexer and start with no tokens and no contexts."""
        self.lexer = lexer
        self.tokens = []
        self.line_contexts = {}

    def dump(self, fmt='(%3s, %2s) | %s'):
        """Print every stored token, one per row, grouped by line.

        ``fmt`` is a %-format taking three values: y, x and the token text.
        """
        # print(<single expression>) behaves the same as the print statement
        # on Python 2 and is also valid Python 3.
        print(fmt % ('y', 'x', 'string'))
        for i, group in enumerate(self.tokens):
            print('LINE %d' % i)
            for token in group:
                print(fmt % (token.y, token.x, token.string))

    def display(self, token_colors=None, debug=False):
        """Write the stored tokens to stdout, coloured by token name.

        ``token_colors`` maps token names (or dotted-name suffixes) to keys of
        the module-level ``color_dict``.  For a token named ``a.b.c`` the keys
        ``a.b.c``, ``b.c`` and ``c`` are tried in that order; the first one
        present wins.  A token with no match is drawn in 'white', unless
        ``debug`` is true, in which case an Exception is raised instead.
        """
        if token_colors is None:
            token_colors = {}

        for group in self.tokens:
            for token in group:
                color_name = None
                name_parts = token.name.split('.')
                for i in range(len(name_parts)):
                    key = '.'.join(name_parts[i:])
                    if key in token_colors:
                        color_name = token_colors[key]
                        break

                if color_name is None:
                    if debug:
                        raise Exception("no highlighting for %r" % token.name)
                    color_name = 'white'

                sys.stdout.write(color_dict[color_name])
                sys.stdout.write(token.string)
            sys.stdout.write('\n')

    def highlight(self, lines):
        """Lex ``lines`` from the very beginning and rebuild the token table."""
        self.tokens = [[] for _ in lines]
        self.lexer.lex(lines, y=0, x=0)
        for token in self.lexer:
            self.tokens[token.y].append(token)
        self.line_contexts = dict(self.lexer.line_contexts)

    # relexing
    # ======================
    def relex(self, lines, y1, x1, y2, x2):
        """Re-lex from the start of line ``y1`` and reconcile in place.

        The lexer is restarted at column 0 of line ``y1`` (``x1`` is accepted
        but not used here).  Each freshly lexed token is compared with the
        token stored at the current position: matching tokens are kept, stale
        ones deleted, missing ones inserted.  Once a matching token is found
        that lies on line ``y2`` or later and ends at column ``x2`` or later,
        the remaining stored tokens are assumed still valid and the process
        stops early.
        """
        # start the relexing process
        self.lexer.lex(lines, y1, 0)

        # these keep track of the current y coordinate, the current token
        # index on line[y], and the current "new token", respectively.
        y = y1
        i = 0
        getnext = True
        new_token = None

        # if we have overstepped our bounds, then exit!
        while y < len(lines):
            # if we need another new_token, then try to get it.
            if getnext:
                try:
                    new_token = self.lexer.next()
                except StopIteration:
                    # ok, so this means that ALL the rest of the tokens
                    # didn't show up, because we're done. so delete them and
                    # exit.  (only the current line is cut at i; every later
                    # line is emptied completely.)
                    for j in range(y, len(lines)):
                        del self.tokens[j][i:]
                        i = 0
                    break
                getnext = False

            # if our next token is on a future line, we need to just get rid
            # of all our old tokens until we get there
            while new_token.y > y:
                del self.tokens[y][i:]
                i = 0
                y += 1

            # ok, so see if we have current tokens on this line; if so get it
            if i < len(self.tokens[y]):
                old_token = self.tokens[y][i]
                assert old_token.y == y, "%d == %d" % (old_token.y, y)
            else:
                old_token = None

            if old_token is None:
                # since we don't have a previous token at this location, just
                # insert the new one
                self.tokens[y].insert(i, new_token)
                i += 1
                getnext = True
            elif old_token == new_token:
                # if they match, then leave the old one alone
                i += 1
                getnext = True
                if new_token.y >= y2 and new_token.end_x() >= x2:
                    # in this case, we can (probably) assume that the rest of
                    # the lines will lex the same way
                    break
            elif old_token.x < new_token.end_x():
                # ok, so we haven't gotten to this new token yet. obviously
                # this token never showed up in the new lexing, so delete it.
                # (new_token is kept and retried against the next old token.)
                del self.tokens[y][i]
            elif old_token.x >= new_token.end_x():
                # ok, this token is further out, so just insert the new token
                # ahead of it, move our counter out and continue
                self.tokens[y].insert(i, new_token)
                i += 1
                getnext = True
            else:
                # this should never happen
                raise Exception("this isn't happening")

    # deletion
    # ======================
    def update_del(self, lines, y1, x1, y2, x2):
        """Adjust the stored tokens for a deletion from (y1, x1) to (y2, x2).

        Tokens entirely before the deleted span are kept as they are, tokens
        entirely inside it are dropped, tokens straddling an edge are trimmed,
        and tokens after it are shifted up/left.  ``lines`` is only used for
        its length: to check ``y2`` and to size the new token table.
        """
        assert y1 >= 0
        assert y1 <= y2
        assert y2 < len(lines)

        xdelta = x2 - x1
        ydelta = y2 - y1

        # construct a new token data structure; it will have one list for
        # every y index in lines. also, fill in tokens before the change
        newtokens = [[] for _ in lines]
        for y in range(0, y1):
            newtokens[y] = self.tokens[y]

        # so for each line we currently have, we need to process every token,
        # transferring them from the old structure to the new, and modifying
        # them appropriately to take the change into account.
        for y in range(y1, len(self.tokens)):
            for token in self.tokens[y]:
                tx1 = token.x
                tx2 = token.x + len(token.string)

                # the notation "*|*| " refers to what the text spans, i.e.:
                #   before|during|after the deletion
                if (y, tx2) <= (y1, x1):
                    # *| |
                    newtokens[y].append(token)
                elif (y, tx1) >= (y2, x2):
                    # | |*
                    token.y -= ydelta
                    if y == y2:
                        # only the line the deletion ended on moves sideways
                        token.x -= xdelta
                    newtokens[token.y].append(token)
                elif (y, tx1) < (y1, x1):
                    if (y, tx2) <= (y2, x2):
                        # *|*|
                        token.string = token.string[:x1 - tx1]
                    else:
                        # *|*|*
                        token.string = (token.string[:x1 - tx1]
                                        + token.string[x2 - tx1:])
                    newtokens[y].append(token)
                elif (y, tx1) < (y2, x2):
                    if (y, tx2) <= (y2, x2):
                        # |*|   (entirely deleted: the token is dropped)
                        pass
                    else:
                        # |*|*
                        token.x = x1
                        token.y -= ydelta
                        token.string = token.string[x2 - tx1:]
                        newtokens[token.y].append(token)
                else:
                    raise Exception("this should never happen: %r" % token)

        # ok, now that we have built a correct new structure, store a
        # reference to it instead.
        self.tokens = newtokens

    def relex_del(self, lines, y1, x1, y2, x2):
        """Apply a deletion: fix up token offsets, then relex the region."""
        # first let's update our existing tokens to fix their offsets, etc.
        self.update_del(lines, y1, x1, y2, x2)

        # then let's do some relexing
        self.relex(lines, y1, x1, y2, x2)

    # addition
    # ======================
    def _insertion_end(self, y1, x1, newlines):
        """Return (y2, x2): where text inserted at (y1, x1) ends."""
        y2 = y1 + len(newlines) - 1
        if y2 == y1:
            x2 = x1 + len(newlines[0])
        else:
            x2 = len(newlines[-1])
        return y2, x2

    def update_add(self, lines, y1, x1, newlines):
        """Adjust the stored tokens for ``newlines`` inserted at (y1, x1).

        ``newlines`` is a non-empty list of strings; its first entry lands on
        line ``y1`` and each further entry on the following line.  Tokens
        before the insertion point are kept, a token straddling it is split
        into two copies, and tokens after it are moved to where the inserted
        text ends.  A placeholder ``lex2.Token`` named 'new' is stored for
        each inserted line.  ``lines`` is accepted but not used here.
        """
        assert y1 >= 0
        assert len(newlines) > 0

        y2, x2 = self._insertion_end(y1, x1, newlines)
        xdelta = x2 - x1
        ydelta = y2 - y1

        # construct a new token data structure, with the right number of lines
        newtokens = [[] for _ in range(len(self.tokens) + ydelta)]

        # copy the tokens that show up before the changed line
        for y in range(0, y1):
            newtokens[y] = self.tokens[y]

        # process the tokens that show up on the changed line
        post_change_list = []
        for t in self.tokens[y1]:
            tx1 = t.x
            tx2 = t.x + len(t.string)
            if tx2 <= x1:
                # '*| ' before the insertion
                newtokens[y1].append(t)
            elif tx1 >= x1:
                # ' |*' after the insertion
                t.x += xdelta
                t.y = y2
                post_change_list.append(t)
            else:
                # '*|*' around the insertion
                t1 = t.copy()
                t1.string = t.string[:x1 - tx1]
                newtokens[y1].append(t1)
                t2 = t.copy()
                t2.string = t.string[x1 - tx1:]
                t2.x = x2
                t2.y = y2
                post_change_list.append(t2)

        # add in the new data
        newtokens[y1].append(lex2.Token('new', '', y1, x1, newlines[0]))
        for i in range(1, len(newlines)):
            yi = y1 + i
            newtokens[yi].append(lex2.Token('new', '', yi, 0, newlines[i]))

        # add the post-change tokens back
        newtokens[y2].extend(post_change_list)

        # for each subsequent line, fix its tokens' y coordinates
        for y in range(y1 + 1, len(self.tokens)):
            for t in self.tokens[y]:
                t.y += ydelta
                newtokens[t.y].append(t)

        # ok, now that we have built a correct new structure, store a
        # reference to it instead.
        self.tokens = newtokens

    def relex_add(self, lines, y1, x1, newlines):
        """Apply an insertion: fix up token offsets, then relex the region."""
        # first let's update our existing tokens to fix their offsets, etc.
        self.update_add(lines, y1, x1, newlines)

        # create some extra info that we need
        y2, x2 = self._insertion_end(y1, x1, newlines)

        # now let's start the relexing process
        self.relex(lines, y1, x1, y2, x2)