forked from CensoredUsername/unrpyc
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathunrpyc.py
executable file
·315 lines (259 loc) · 13.1 KB
/
unrpyc.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
#!/usr/bin/env python2
# Copyright (c) 2012 Yuri K. Schlesner
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in
# all copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.
import argparse
from os import path, walk
import codecs
import glob
import itertools
import traceback
import struct
from multiprocessing import Pool, Lock, cpu_count
from operator import itemgetter
import decompiler
from decompiler import magic, astdump, translate
# special definitions for special classes
class PyExpr(magic.FakeStrict, unicode):
    """Stand-in for ``renpy.ast.PyExpr``: a unicode string tagged with its origin.

    Besides the text itself, every instance carries the ``filename`` and
    ``linenumber`` it was constructed with.
    """

    __module__ = "renpy.ast"

    def __new__(cls, s, filename, linenumber):
        # unicode is immutable, so the text has to be supplied when the object
        # is allocated; the location attributes are attached afterwards.
        instance = unicode.__new__(cls, s)
        instance.filename, instance.linenumber = filename, linenumber
        return instance

    def __getnewargs__(self):
        # The arguments __new__ has to receive to rebuild this object when it
        # is pickled again.
        return (unicode(self), self.filename, self.linenumber)
class PyCode(magic.FakeStrict):
    """Stand-in for ``renpy.ast.PyCode`` that keeps the source and no bytecode."""

    __module__ = "renpy.ast"

    def __setstate__(self, state):
        # The pickled state is a 4-tuple whose first element is ignored here.
        _, source, location, mode = state
        self.source = source
        self.location = location
        self.mode = mode
        # No bytecode is restored for the stand-in.
        self.bytecode = None
class RevertableList(magic.FakeStrict, list):
    """Stand-in for ``renpy.python.RevertableList`` backed by a builtin list."""

    __module__ = "renpy.python"

    def __new__(cls):
        # Allocate through list directly; no constructor arguments are taken.
        return list.__new__(cls)
class RevertableDict(magic.FakeStrict, dict):
    """Stand-in for ``renpy.python.RevertableDict`` backed by a builtin dict."""

    __module__ = "renpy.python"

    def __new__(cls):
        # Allocate through dict directly; no constructor arguments are taken.
        return dict.__new__(cls)
class RevertableSet(magic.FakeStrict, set):
    """Stand-in for ``renpy.python.RevertableSet`` backed by a builtin set."""

    __module__ = "renpy.python"

    def __new__(cls):
        # Allocate through set directly; no constructor arguments are taken.
        return set.__new__(cls)

    def __setstate__(self, state):
        # Two state layouts are accepted: a tuple whose first element exposes
        # the members through .keys(), or anything else, which is handed to
        # set.update() unchanged.
        members = state[0].keys() if isinstance(state, tuple) else state
        self.update(members)
class Sentinel(magic.FakeStrict, object):
    """Stand-in for ``renpy.object.Sentinel``: a bare object carrying a name."""

    __module__ = "renpy.object"

    def __new__(cls, name):
        # The name is attached at allocation time, as there is no __init__.
        sentinel = object.__new__(cls)
        sentinel.name = name
        return sentinel
# Class factory passed to the magic load helpers used in this file
# (magic.safe_loads / magic.loads); it is built from the stand-in classes
# defined above.
# NOTE(review): the second argument is presumably the base used for every
# class without a dedicated stand-in -- confirm against decompiler.magic.
class_factory = magic.FakeClassFactory((PyExpr, PyCode, RevertableList, RevertableDict, RevertableSet, Sentinel), magic.FakeStrict)
# Lock held around console output (see the `with printlock:` blocks below).
# sharelock() rebinds this name to the lock it is given.
printlock = Lock()
# needs class_factory
# NOTE(review): presumably deobfuscate reads class_factory from this module,
# which is why the import sits here instead of at the top of the file --
# confirm before moving it.
import deobfuscate
# API
def read_ast_from_file(in_file):
    """Read an open .rpyc file and return the statements stored in it.

    in_file is a file object opened in binary mode; it is read to the end.
    Both the bare layout (the whole file is the compressed pickle) and the
    "RENPY RPC2" container layout are handled.

    Returns the second element of the unpickled (data, statements) pair.
    """
    # .rpyc files are just zlib compressed pickles of a tuple of some data and
    # the actual AST of the file
    payload = in_file.read()

    if payload.startswith("RENPY RPC2"):
        # Container layout: right after the 10 byte magic comes a table of
        # 12 byte (slot, start, length) records, closed by a record whose
        # slot is 0. Each record points at a chunk elsewhere in the file.
        slots = {}
        offset = 10
        while True:
            slot, start, length = struct.unpack_from("III", payload, offset)
            if slot == 0:
                break
            slots[slot] = payload[start:start + length]
            offset += 12
        # Slot 1 is the chunk that gets decompressed and unpickled.
        payload = slots[1]

    pickled = payload.decode('zlib')
    _, stmts = magic.safe_loads(pickled, class_factory, {"_ast", "collections"})
    return stmts
def decompile_rpyc(input_filename, overwrite=False, dump=False, decompile_python=False,
                   comparable=False, no_pyexpr=False, translator=None, tag_outside_block=False,
                   init_offset=False, try_harder=False):
    """Decompile (or dump) one compiled script file next to its input.

    The output path is the input path with its extension replaced: ".txt"
    when dump is set, ".rpym" for ".rpymc" inputs and ".rpy" otherwise.

    overwrite   -- replace an already existing output file
    dump        -- write astdump.pprint output instead of decompiled code
    try_harder  -- read the AST through deobfuscate.read_ast instead of
                   read_ast_from_file
    decompile_python, comparable, no_pyexpr are forwarded to astdump.pprint;
    decompile_python, translator, tag_outside_block, init_offset are
    forwarded to decompiler.pprint.

    Returns True once the output has been written, False when the output
    file already exists and overwrite is not set.
    """
    # Output filename is input filename but with .rpy extension
    base, ext = path.splitext(input_filename)
    if dump:
        suffix = ".txt"
    elif ext == ".rpymc":
        suffix = ".rpym"
    else:
        suffix = ".rpy"
    out_filename = base + suffix

    # Both messages are printed under the lock so they stay together.
    with printlock:
        print("Decompiling %s to %s..." % (input_filename, out_filename))

        if not overwrite and path.exists(out_filename):
            print("Output file already exists. Pass --clobber to overwrite.")
            # Don't stop decompiling if one file already exists
            return False

    reader = deobfuscate.read_ast if try_harder else read_ast_from_file
    with open(input_filename, 'rb') as in_file:
        ast = reader(in_file)

    with codecs.open(out_filename, 'w', encoding='utf-8') as out_file:
        if dump:
            astdump.pprint(out_file, ast,
                           decompile_python=decompile_python,
                           comparable=comparable,
                           no_pyexpr=no_pyexpr)
        else:
            decompiler.pprint(out_file, ast,
                              decompile_python=decompile_python,
                              printlock=printlock,
                              translator=translator,
                              tag_outside_block=tag_outside_block,
                              init_offset=init_offset)

    return True
def extract_translations(input_filename, language):
    """Collect the translations for `language` found in one compiled script.

    Returns a pair: the translator's dialogue serialised with
    magic.safe_dumps, and the translator's strings as they are.
    """
    with printlock:
        print("Extracting translations from %s..." % input_filename)

    with open(input_filename, 'rb') as in_file:
        ast = read_ast_from_file(in_file)

    collector = translate.Translator(language, True)
    collector.translate_dialogue(ast)

    # we pickle and unpickle this manually because the regular unpickler will choke on it
    pickled_dialogue = magic.safe_dumps(collector.dialogue)
    return pickled_dialogue, collector.strings
def worker(t):
    """Process one (args, filename, filesize) job.

    With args.write_translation_file set, the result of
    extract_translations() is returned. Otherwise the file is decompiled and
    the result of decompile_rpyc() is returned. Any Exception raised on the
    way is printed with its traceback and turned into a False return value.
    """
    args, filename, filesize = t
    try:
        if args.write_translation_file:
            return extract_translations(filename, args.language)

        translator = None
        if args.translation_file is not None:
            # Rebuild the translator from the raw contents of the translation
            # file, which travel with the job as args.translations.
            translator = translate.Translator(None)
            (translator.language,
             translator.dialogue,
             translator.strings) = magic.loads(args.translations, class_factory)

        return decompile_rpyc(filename, args.clobber, args.dump,
                              decompile_python=args.decompile_python,
                              no_pyexpr=args.no_pyexpr,
                              comparable=args.comparable,
                              translator=translator,
                              tag_outside_block=args.tag_outside_block,
                              init_offset=args.init_offset,
                              try_harder=args.try_harder)
    except Exception:
        # One broken file must not take the remaining jobs down with it.
        with printlock:
            print("Error while decompiling %s:" % filename)
            print(traceback.format_exc())
        return False
def sharelock(lock):
    """Rebind the module level ``printlock`` to `lock`.

    main() passes this function to Pool as the process initializer.
    """
    global printlock
    printlock = lock
def _build_arg_parser():
    """Create the command line parser describing every unrpyc option."""
    parser = argparse.ArgumentParser(description="Decompile .rpyc/.rpymc files")

    parser.add_argument('-c', '--clobber', dest='clobber', action='store_true',
                        help="overwrites existing output files")

    parser.add_argument('-d', '--dump', dest='dump', action='store_true',
                        help="instead of decompiling, pretty print the ast to a file")

    # type=int makes argparse reject a non-numeric value with a usage error
    # instead of a traceback later on.
    parser.add_argument('-p', '--processes', dest='processes', action='store', type=int,
                        default=cpu_count(),
                        help="use the specified number of processes to decompile")

    parser.add_argument('-t', '--translation-file', dest='translation_file', action='store', default=None,
                        help="use the specified file to translate during decompilation")

    parser.add_argument('-T', '--write-translation-file', dest='write_translation_file', action='store', default=None,
                        help="store translations in the specified file instead of decompiling")

    parser.add_argument('-l', '--language', dest='language', action='store', default='english',
                        help="if writing a translation file, the language of the translations to write")

    parser.add_argument('--sl1-as-python', dest='decompile_python', action='store_true',
                        help="Only dumping and for decompiling screen language 1 screens. "
                        "Convert SL1 Python AST to Python code instead of dumping it or converting it to screenlang.")

    parser.add_argument('--comparable', dest='comparable', action='store_true',
                        help="Only for dumping, remove several false differences when comparing dumps. "
                        "This suppresses attributes that are different even when the code is identical, such as file modification times. ")

    parser.add_argument('--no-pyexpr', dest='no_pyexpr', action='store_true',
                        help="Only for dumping, disable special handling of PyExpr objects, instead printing them as strings. "
                        "This is useful when comparing dumps from different versions of Ren'Py. "
                        "It should only be used if necessary, since it will cause loss of information such as line numbers.")

    parser.add_argument('--tag-outside-block', dest='tag_outside_block', action='store_true',
                        help="Always put SL2 'tag's on the same line as 'screen' rather than inside the block. "
                        "This will break compiling with Ren'Py 7.3 and above, but is needed to get correct line numbers "
                        "from some files compiled with older Ren'Py versions.")

    parser.add_argument('--init-offset', dest='init_offset', action='store_true',
                        help="Attempt to guess when init offset statements were used and insert them. "
                        "This is always safe to enable if the game's Ren'Py version supports init offset statements, "
                        "and the generated code is exactly equivalent, only less cluttered.")

    parser.add_argument('file', type=str, nargs='+',
                        help="The filenames to decompile. "
                        "All .rpyc files in any directories passed or their subdirectories will also be decompiled.")

    parser.add_argument('--try-harder', dest="try_harder", action="store_true",
                        help="Tries some workarounds against common obfuscation methods. This is a lot slower.")

    return parser


def _collect_script_files(patterns):
    """Expand wildcard `patterns` into the list of files to process.

    A pattern without any match is reported on stdout. Matched directories
    are walked recursively and contribute their .rpyc/.rpymc files; every
    other match is taken as is.
    """
    matches = []
    for pattern in patterns:
        found = glob.glob(pattern)
        if not found:
            print("File not found: " + pattern)
        matches.extend(found)

    files = []
    for entry in matches:
        if path.isdir(entry):
            # Recursively add script files from any directories passed
            for dirpath, dirnames, filenames in walk(entry):
                files.extend(path.join(dirpath, name) for name in filenames
                             if name.endswith(('.rpyc', '.rpymc')))
        else:
            files.append(entry)
    return files


def main():
    """Command line entry point.

    Parses sys.argv, gathers the requested script files and hands each of
    them to worker(), either in a process pool or sequentially. Afterwards
    the collected translations are written out (-T) or a summary of
    successes and failures is printed. Returns None.
    """
    # unrpyc.py [-c] [-d] [-p N] [-t FILE] [-T FILE] [-l LANG] [options] file [file ...]
    args = _build_arg_parser().parse_args()

    if args.write_translation_file and not args.clobber and path.exists(args.write_translation_file):
        # Fail early to avoid wasting time going through the files
        print("Output translation file already exists. Pass --clobber to overwrite.")
        return

    if args.translation_file:
        # Read once here; the raw contents travel to the workers inside args.
        with open(args.translation_file, 'rb') as in_file:
            args.translations = in_file.read()

    files = _collect_script_files(args.file)

    # Check if we actually have files. Don't worry about
    # no parameters passed, since ArgumentParser catches that
    if not files:
        print("No script files to decompile.")
        return

    # Each job is (args, filename, filesize); the size is only used to order
    # the jobs below.
    files = [(args, name, path.getsize(name)) for name in files]
    processes = args.processes
    if processes > 1:
        # If a big file starts near the end, there could be a long time with
        # only one thread running, which is inefficient. Avoid this by starting
        # big files first.
        files.sort(key=itemgetter(2), reverse=True)
        pool = Pool(processes, sharelock, [printlock])
        try:
            results = pool.map(worker, files, 1)
        except BaseException:
            # Bailing out: do not wait for work that is still queued.
            pool.terminate()
            raise
        else:
            pool.close()
        finally:
            # Reap the worker processes instead of leaving them to
            # interpreter shutdown.
            pool.join()
    else:
        # Decompile in the order Ren'Py loads in
        files.sort(key=itemgetter(1))
        results = [worker(job) for job in files]

    if args.write_translation_file:
        print("Writing translations to %s..." % args.write_translation_file)
        translated_dialogue = {}
        translated_strings = {}
        good = 0
        bad = 0
        for result in results:
            if not result:
                # worker() returns False for a file it could not process
                bad += 1
                continue
            good += 1
            translated_dialogue.update(magic.loads(result[0], class_factory))
            translated_strings.update(result[1])
        with open(args.write_translation_file, 'wb') as out_file:
            magic.safe_dump((args.language, translated_dialogue, translated_strings), out_file)
    else:
        # Check per file if everything went well and report back
        good = results.count(True)
        bad = results.count(False)

    if bad == 0:
        print("Decompilation of %d script file%s successful" % (good, 's' if good > 1 else ''))
    elif good == 0:
        print("Decompilation of %d file%s failed" % (bad, 's' if bad > 1 else ''))
    else:
        print("Decompilation of %d file%s successful, but decompilation of %d file%s failed" % (good, 's' if good > 1 else '', bad, 's' if bad > 1 else ''))
if __name__ == '__main__':
main()