1
0
Fork 0
mirror of https://github.com/suchmememanyskill/TegraExplorer.git synced 2024-11-22 11:56:42 +00:00

automation is here

automatically minifies scripts before embedding them
gotta save them bytes
This commit is contained in:
bleck9999 2021-07-27 00:01:46 +01:00
parent d4f95da062
commit e9fb276e46
No known key found for this signature in database
GPG key ID: D0CA0C41DB616843
2 changed files with 186 additions and 2 deletions

View file

@ -111,8 +111,11 @@ $(BUILDDIR)/$(TARGET)/script/builtin.o: $(BUILDDIR)/$(TARGET)/script/builtin.c
$(BUILDDIR)/$(TARGET)/script/builtin.c: scripts/*.te
@mkdir -p "$(@D)"
@mkdir -p "$(BUILDDIR)/$(TARGET)/scripts"
ifeq ($(OS),Windows_NT)
@py te2c.py "$(BUILDDIR)/$(TARGET)/script/builtin" scripts
@py ts-minifier.py --no-replace-functions -d "$(BUILDDIR)/$(TARGET)/scripts" $(wildcard scripts/*.te)
@py te2c.py "$(BUILDDIR)/$(TARGET)/script/builtin" "$(BUILDDIR)/$(TARGET)/scripts"
else
@python3 te2c.py "$(BUILDDIR)/$(TARGET)/script/builtin" scripts
@python3 ts-minifier.py --no-replace-functions -d "$(BUILDDIR)/$(TARGET)/scripts" $(wildcard scripts/*.te)
@python3 te2c.py "$(BUILDDIR)/$(TARGET)/script/builtin" "$(BUILDDIR)/$(TARGET)/scripts"
endif

181
ts-minifier.py Normal file
View file

@ -0,0 +1,181 @@
# Copyright (c) 2021 bleck9999
# https://github.com/bleck9999/ts-minifier
# Version: 92743efc
import argparse
import re
# if is not included because it's already 2 characters
sub_funcs = {'while': "_h", 'print': "_p", 'println': "_l", 'mountsys': "_s", 'mountemu': "_e", 'readsave': "_r",
'exit': "_q", 'break': "_b", 'dict': "_d", 'setpixel': "_y", 'readdir': "_i", 'copyfile': "_c",
'mkdir': "_k", 'memory': "_m", 'ncatype': "_n", 'pause': "_w", 'color': "_a", 'menu': "__", 'emu': "_u",
'clear': "_x", 'timer': "_t", 'deldir': "_g", 'fsexists': "_f", 'delfile': "_z", "copydir": "c_",
"movefile": "_v", "payload": "_j", "readfile": "_o", "writefile": "w_"}
replace_functions = True
def wantsumspace(s: str):
for c in s.lower():
if (ord(c) < 97 or ord(c) > 122) and (ord(c) != 95) and not (c.isnumeric()):
return False
return True
def commentstartswhere(s: str):
quoted = False
for c in range(len(s)):
if s[c] == '"':
quoted = not quoted
if s[c] == '#' and not quoted:
return c
return None
def minify(script: str):
# currently ts does not seem to allow 's to mark a quote
# (https://github.com/suchmememanyskill/TegraExplorer/blob/tsv3/source/script/parser.c#L173)
# im fine with that, it makes doing this a lot easier
# strings = script.split(sep='"')
str_reuse = {}
requires = ""
mcode = ""
stl_counts = {}.fromkeys(sub_funcs, 0)
# while part < len(strings):
for line in script.split(sep='\n'):
# maybe in future it'll shrink user defined names
# dont hold out hope for that because `a.files.foreach("b") {println(b)}` is valid syntax
# and i dont have the skill or patience to deal with that
# # in theory all the even numbered indexes should be outside quotes, so we ignore any parts with an odd index
# if part % 2 == 1:
# if strings[part] not in str_reuse:
# str_reuse[strings[part]] = 0
# else:
# str_reuse[strings[part]] += 1
# mcode += f'"{strings[part]}"'
start = commentstartswhere(line)
if start is None:
start = -1
if "REQUIRE " in line[start:]:
requires += line[start:] + '\n' # leave REQUIREs unmodified
# comments are terminated by a newline so we need to add one back in
# *deep breath*
# slicing is exclusive on the right side of the colon so the "no comment" value of start=-1 would cut off
# the last character of the line which would lead to several issues
# however this is desirable when there *is* a comment, since it being exclusive means there isn't a trailing #
# and if you're wondering about the above check that uses line[start:] this doesn't matter,
# one character cant contain an 8 character substring
if start != -1:
line = line[:start]
line = line.split(sep='"')
if len(line) % 2 == 0:
print("You appear to have string literals spanning multiple lines. Please seek professional help")
raise Exception("Too much hatred")
part = 0
while part < len(line):
# all the odd numbered indexes should be inside quotes
if part % 2 == 0:
if not line[part]:
break
for s in sub_funcs:
stl_counts[s] += len(re.findall("(?<!\\.)%s\\(" % s, line[part]))
mcode += line[part].replace('\t', '') + ' '
else:
if line[part] not in str_reuse:
str_reuse[line[part]] = 0
else:
str_reuse[line[part]] += 1
mcode += f'"{line[part]}"'
part += 1
# tsv3 is still an absolute nightmare
# so spaces have a couple edge cases
# 1. the - operator which requires space between the right operand
# yeah that's right only the right one
# thanks meme
# 2. between 2 letters
inquote = False
mmcode = ""
index = 0
newline = list(mcode)
while index < (len(mcode) - 3):
sec = mcode[index:index + 3]
if not inquote and sec[1] == '"':
inquote = True
elif inquote and sec[1] == '"':
inquote = False
if (sec[1] == ' ') and not inquote:
if wantsumspace(sec[0]) and wantsumspace(sec[2]):
pass
elif sec[0] == '-' and sec[2].isnumeric():
pass
else:
newline[index + 1] = ''
index += 1
mmcode += ''.join(newline).strip()
for func in sub_funcs:
# space saved here is given by n * (len(func) - len(min_func)) - (len(min_func)+1 + len(func))
# as such with one usage space is always lost (len(func)-2 is never > len(func)+3) so dont even try
if stl_counts[func] >= 2:
savings = stl_counts[func] * (len(func) - 2) - (len(func) + 3)
print(f"Replacing all {stl_counts[func]} usages of {func} would save {savings}byte{'s' if savings != 1 else ''}")
if (savings < 0) or not replace_functions:
print("Savings negative or automatic replacement disabled, continuing")
continue
func_min = sub_funcs[func] # now here we have to assume nobody is using any of our substitute vars
# should be a pretty safe assumption but knowing for sure would require about the same amount of effort
# as it would to replace all user defined variables
ucode = "" # this is rather hacky
sections = [0]
for m in re.finditer(r"(?<!\.)%s\(" % func, mmcode):
sections.append(m.span()[0])
sections.append(m.span()[1])
sections.append(len(mmcode))
i = 2 # change rather to very
while i < len(sections):
ucode += mmcode[sections[i-2]:sections[i-1]] + func_min + '('
i += 2
ucode += mmcode[sections[i-2]:]
ucode = f"{func_min}={func}\n" + ucode
mmcode = ucode
# a space isn't any shorter than \n so why not use \n
for string, count in str_reuse.items():
if count >= 2:
# we can't auto replace strings without a full parser
# unlike with the stdlib functions we cant make a lookup table ahead of time
# and generating shorter names on the fly sounds like an absolute nightmare no thanks
print(f'Warning: string "{string}" of len {len(string)} reused {count} times')
return requires + mmcode.strip()
if __name__ == '__main__':
parser = argparse.ArgumentParser(description="Minify tsv3 scripts, useful for embedding",
formatter_class=argparse.RawTextHelpFormatter)
parser.add_argument("source", type=str, nargs='+', help="source files to minify")
parser.add_argument("-d", type=str, nargs='?', help="destination folder for minified scripts"
"\ndefault: ./", default='./')
parser.add_argument("--replace-functions", action=argparse.BooleanOptionalAction,
help="if false, warn if functions are reused instead of replacing them\ndefault: true")
args = parser.parse_args()
files = args.source
dest = args.d[:-1] if args.d[-1] == '/' else args.d
replace_functions = args.replace_functions if args.replace_functions is not None else True
for file in files:
print(f"Minifying {file}")
with open(file, 'r') as f:
r = minify(f.read())
file = file.split(sep='.')[0].split(sep='/')[-1]
f = open(f"{dest}/{file}_min.te", 'w')
f.write(r)