-
Notifications
You must be signed in to change notification settings - Fork 226
Expand file tree
/
Copy pathBytecodeLoader.java
More file actions
318 lines (296 loc) · 13.1 KB
/
BytecodeLoader.java
File metadata and controls
318 lines (296 loc) · 13.1 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
// Copyright (c) Corporation for National Research Initiatives
package org.python.core;
import org.objectweb.asm.ClassReader;
import java.io.ByteArrayInputStream;
import java.io.IOException;
import java.io.ObjectInputStream;
import java.lang.reflect.Constructor;
import java.lang.reflect.Field;
import java.net.URL;
import java.net.URLClassLoader;
import java.util.LinkedList;
import java.util.List;
/**
* Utility class for loading compiled Python modules and Java classes defined in Python modules.
*/
public class BytecodeLoader {
/**
* Turn the Java class file data into a Java class.
*
* @param name fully-qualified binary name of the class
* @param data a class file as a byte array
* @param referents super-classes and interfaces that the new class will reference.
*/
@SuppressWarnings("unchecked")
public static Class<?> makeClass(String name, byte[] data, Class<?>... referents) {
@SuppressWarnings("resource")
Loader loader = new Loader();
for (Class<?> referent : referents) {
try {
loader.addParent(referent.getClassLoader());
} catch (SecurityException e) {}
}
Class<?> c = loader.loadClassFromBytes(name, data);
if (ContainsPyBytecode.class.isAssignableFrom(c)) {
try {
fixPyBytecode((Class<? extends ContainsPyBytecode>) c);
} catch (IllegalAccessException | NoSuchFieldException | ClassNotFoundException
| IOException e) {
throw new RuntimeException(e);
}
}
BytecodeNotification.notify(name, data, c);
return c;
}
/**
* Turn the Java class file data into a Java class.
*
* @param name the name of the class
* @param referents super-classes and interfaces that the new class will reference.
* @param data a class file as a byte array
*/
public static Class<?> makeClass(String name, List<Class<?>> referents, byte[] data) {
if (referents != null) {
return makeClass(name, data, referents.toArray(new Class[referents.size()]));
}
return makeClass(name, data);
}
private static PyCode parseSerializedCode(String code_str)
throws IOException, ClassNotFoundException {
// From Java 8 use: byte[] b = Base64.getDecoder().decode(code_str);
byte[] b = base64decode(code_str);
ByteArrayInputStream bi = new ByteArrayInputStream(b);
ObjectInputStream si = new ObjectInputStream(bi);
PyBytecode meth_code = (PyBytecode) si.readObject();
si.close();
bi.close();
return meth_code;
}
/**
* Implement a restricted form of base64 decoding compatible with the encoding in Module. This
* decoder treats characters outside the set of 64 necessary to encode data as errors, including
* the pad "=". As a result, the length of the argument exactly determines the size of array
* returned.
*
* @param src to decode
* @return a new byte array
* @throws IllegalArgumentException if src has an invalid character or impossible length.
*/
private static byte[] base64decode(String src) throws IllegalArgumentException {
// Length L is a multiple of 4 plus 0, 2 or 3 tail characters (bearing 0, 8, or 16 bits)
final int L = src.length();
final int tail = L % 4; // 0 to 3 where 1 (an extra 6 bits) is invalid.
if (tail == 1) {
throw new IllegalArgumentException("Input length invalid (4n+1)");
}
// src encodes exactly this many bytes:
final int N = (L / 4) * 3 + (tail > 0 ? tail - 1 : 0);
byte[] data = new byte[N];
// Work through src in blocks of 4
int s = 0, b = 0, quantum;
while (s <= L - 4) {
// Process src[s:s+4]
quantum = (base64CharToBits(src.charAt(s++)) << 18)
+ (base64CharToBits(src.charAt(s++)) << 12)
+ (base64CharToBits(src.charAt(s++)) << 6) + base64CharToBits(src.charAt(s++));
data[b++] = (byte) (quantum >> 16);
data[b++] = (byte) (quantum >> 8);
data[b++] = (byte) quantum;
}
// Now deal with 2 or 3 tail characters, generating one or two bytes.
if (tail >= 2) {
// Repeat the loop body, but everything is 8 bits to the right.
quantum = (base64CharToBits(src.charAt(s++)) << 10)
+ (base64CharToBits(src.charAt(s++)) << 4);
data[b++] = (byte) (quantum >> 8);
if (tail == 3) {
quantum += (base64CharToBits(src.charAt(s++)) >> 2);
data[b++] = (byte) quantum;
}
}
return data;
}
/**
* Helper for {@link #base64decode(String)}, converting one character.
*
* @param c to convert
* @return value 0..63
* @throws IllegalArgumentException if not a base64 character
*/
private static int base64CharToBits(char c) throws IllegalArgumentException {
if (c >= 'a') {
if (c <= 'z') {
return c - 71; // c - 'a' + 26
}
} else if (c >= 'A') {
if (c <= 'Z') {
return c - 'A';
}
} else if (c >= '0') {
if (c <= '9') {
return c + 4; // c - '0' + 52
}
} else if (c == '+') {
return 62;
} else if (c == '/') {
return 63;
}
throw new IllegalArgumentException("Invalid character " + c);
}
/**
* This method looks for Python-Bytecode stored in String literals.
* While Java supports rather long strings, constrained only by
* int-addressing of arrays, it supports only up to 65535 characters
* in literals (not sure how escape-sequences are counted).
* To circumvent this limitation, the code is automatically splitted
* into several literals with the following naming-scheme.
*
* - The marker-interface 'ContainsPyBytecode' indicates that a class
* contains (static final) literals of the following scheme:
* - a prefix of '___' indicates a bytecode-containing string literal
* - a number indicating the number of parts follows
* - '0_' indicates that no splitting occurred
* - otherwise another number follows, naming the index of the literal
* - indexing starts at 0
*
* Examples:
* ___0_method1 contains bytecode for method1
* ___2_0_method2 contains first part of method2's bytecode
* ___2_1_method2 contains second part of method2's bytecode
*
* Note that this approach is provisional. In future, Jython might contain
* the bytecode directly as bytecode-objects. The current approach was
* feasible with much less complicated JVM bytecode-manipulation, but needs
* special treatment after class-loading.
*/
public static void fixPyBytecode(Class<? extends ContainsPyBytecode> c)
throws IllegalAccessException, NoSuchFieldException, java.io.IOException,
ClassNotFoundException {
Field[] fields = c.getDeclaredFields();
for (Field fld: fields) {
String fldName = fld.getName();
if (fldName.startsWith("___")) {
fldName = fldName.substring(3);
String[] splt = fldName.split("_");
if (splt[0].equals("0")) {
fldName = fldName.substring(2);
Field codeField = c.getDeclaredField(fldName);
if (codeField.get(null) == null) {
codeField.set(null, parseSerializedCode((String) fld.get(null)));
}
} else {
if (splt[1].equals("0")) {
fldName = fldName.substring(splt[0].length()+splt[1].length()+2);
Field codeField = c.getDeclaredField(fldName);
if (codeField.get(null) == null) {
// assemble original code-string:
int len = Integer.parseInt(splt[0]);
StringBuilder blt = new StringBuilder((String) fld.get(null));
int pos = 1, pos0;
String partName;
while (pos < len) {
pos0 = pos;
for (Field fldPart: fields) {
partName = fldPart.getName();
if (partName.length() != fldName.length() &&
partName.startsWith("___") &&
partName.endsWith(fldName)) {
String[] splt2 = partName.substring(3).split("_");
if (Integer.parseInt(splt2[1]) == pos) {
blt.append((String) fldPart.get(null));
pos += 1;
if (pos == len) {
break;
}
}
}
}
if (pos0 == pos) {
throw new RuntimeException(
"Invalid PyBytecode splitting in " + c.getName()
+ ":\nSplit-index " + pos + " wasn't found.");
}
}
codeField.set(null, parseSerializedCode(blt.toString()));
}
}
}
}
}
}
/**
* Turn the Java class file data for a compiled Python module into a {@code PyCode} object, by
* constructing an instance of the named class and calling the instance's
* {@link PyRunnable#getMain()}.
*
* @param name fully-qualified binary name of the class
* @param data a class file as a byte array
* @param filename to provide to the constructor of the named class
* @return the {@code PyCode} object produced by the named class' {@code getMain}
*/
public static PyCode makeCode(String name, byte[] data, String filename) {
try {
Class<?> c = makeClass(name, data);
// A compiled module has a constructor taking a String filename argument.
Constructor<?> cons = c.getConstructor(new Class<?>[] {String.class});
Object instance = cons.newInstance(new Object[] {filename});
PyCode result = ((PyRunnable) instance).getMain();
return result;
} catch (Exception e) {
throw Py.JavaError(e);
}
}
public static class Loader extends URLClassLoader {
private LinkedList<ClassLoader> parents = new LinkedList<>();
public Loader() {
super(new URL[0]);
parents.add(imp.getSyspathJavaLoader());
}
/** Add given loader at the front of the list of the parent list (if not {@code null}). */
public void addParent(ClassLoader referent) {
if (referent != null && !parents.contains(referent)) {
parents.addFirst(referent);
}
}
@Override
protected Class<?> loadClass(String name, boolean resolve) throws ClassNotFoundException {
Class<?> c = findLoadedClass(name);
if (c != null) {
return c;
}
for (ClassLoader loader : parents) {
try {
return loader.loadClass(name);
} catch (ClassNotFoundException cnfe) {}
}
// couldn't find the .class file on sys.path
throw new ClassNotFoundException(name);
}
/**
* Define the named class using the class file data provided, and resolve it. (See JVM
* specification.) For class names ending "$py", this method may adjust that name to that
* found in the class file itself.
*
* @param name fully-qualified binary name of the class
* @param data a class file as a byte array
* @return the defined and resolved class
*/
public Class<?> loadClassFromBytes(String name, byte[] data) {
if (name.endsWith("$py")) {
try {
// Get the real class name: we might request a 'bar'
// Jython module that was compiled as 'foo.bar', or
// even 'baz.__init__' which is compiled as just 'baz'
ClassReader cr = new ClassReader(data);
name = cr.getClassName().replace('/', '.');
} catch (RuntimeException re) {
// Probably an invalid .class, fallback to the
// specified name
}
}
Class<?> c = defineClass(name, data, 0, data.length, getClass().getProtectionDomain());
resolveClass(c);
return c;
}
}
}