511 lines
16 KiB
Java
511 lines
16 KiB
Java
import java.io.File;
|
|
import java.io.FileInputStream;
|
|
import java.nio.ByteBuffer;
|
|
import java.nio.ByteOrder;
|
|
import java.nio.channels.Channels;
|
|
import java.util.ArrayList;
|
|
import java.util.Arrays;
|
|
import java.util.List;
|
|
|
|
public class Jocaml {
|
|
private static String TRAILER_MAGIC = "Caml1999X028";
|
|
private static long MARSHAL_MAGIC_SMALL = 0x8495A6BE;
|
|
private static long MARSHAL_MAGIC_BIG = 0x8495A6BF;
|
|
|
|
private static enum CamlInst {
|
|
ACC0(0, 0),
|
|
ACC1(1, 0),
|
|
ACC2(2, 0),
|
|
ACC3(3, 0),
|
|
ACC4(4, 0),
|
|
ACC5(5, 0),
|
|
ACC6(6, 0),
|
|
ACC7(7, 0),
|
|
ACC(8, 1),
|
|
PUSH(9, 0),
|
|
PUSHACC0(10, 0),
|
|
PUSHACC1(11, 0),
|
|
PUSHACC2(12, 0),
|
|
PUSHACC3(13, 0),
|
|
PUSHACC4(14, 0),
|
|
PUSHACC5(15, 0),
|
|
PUSHACC6(16, 0),
|
|
PUSHACC7(17, 0),
|
|
PUSHACC(18, 1),
|
|
POP(19, 1),
|
|
ASSIGN(20, 1),
|
|
ENVACC1(21, 0),
|
|
ENVACC2(22, 0),
|
|
ENVACC3(23, 0),
|
|
ENVACC4(24, 0),
|
|
ENVACC(25, 1),
|
|
PUSHENVACC1(26, 0),
|
|
PUSHENVACC2(27, 0),
|
|
PUSHENVACC3(28, 0),
|
|
PUSHENVACC4(29, 0),
|
|
PUSHENVACC(30, 1),
|
|
PUSH_RETADDR(31, 1),
|
|
APPLY(32, 1),
|
|
APPLY1(33, 0),
|
|
APPLY2(34, 0),
|
|
APPLY3(35, 0),
|
|
APPTERM(36, 2),
|
|
APPTERM1(37, 1),
|
|
APPTERM2(38, 1),
|
|
APPTERM3(39, 1),
|
|
RETURN(40, 1),
|
|
RESTART(41, 0),
|
|
GRAB(42, 1),
|
|
CLOSURE(43, 2),
|
|
CLOSUREREC(44, 2),
|
|
OFFSETCLOSUREM2(45, 0),
|
|
OFFSETCLOSURE0(46, 0),
|
|
OFFSETCLOSURE2(47, 0),
|
|
OFFSETCLOSURE(48, 1),
|
|
PUSHOFFSETCLOSUREM2(49, 0),
|
|
PUSHOFFSETCLOSURE0(50, 0),
|
|
PUSHOFFSETCLOSURE2(51, 0),
|
|
PUSHOFFSETCLOSURE(52, 1),
|
|
GETGLOBAL(53, 1),
|
|
PUSHGETGLOBAL(54, 1),
|
|
GETGLOBALFIELD(55, 2),
|
|
PUSHGETGLOBALFIELD(56, 2),
|
|
SETGLOBAL(57, 1),
|
|
ATOM0(58, 0),
|
|
ATOM(59, 1),
|
|
PUSHATOM0(60, 0),
|
|
PUSHATOM(61, 1),
|
|
MAKEBLOCK(62, 2),
|
|
MAKEBLOCK1(63, 1),
|
|
MAKEBLOCK2(64, 1),
|
|
MAKEBLOCK3(65, 1),
|
|
MAKEFLOATBLOCK(66, 1),
|
|
GETFIELD0(67, 0),
|
|
GETFIELD1(68, 0),
|
|
GETFIELD2(69, 0),
|
|
GETFIELD3(70, 0),
|
|
GETFIELD(71, 1),
|
|
GETFLOATFIELD(72, 1),
|
|
SETFIELD0(73, 0),
|
|
SETFIELD1(74, 0),
|
|
SETFIELD2(75, 0),
|
|
SETFIELD3(76, 0),
|
|
SETFIELD(77, 1),
|
|
SETFLOATFIELD(78, 1),
|
|
VECTLENGTH(79, 0),
|
|
GETVECTITEM(80, 0),
|
|
SETVECTITEM(81, 0),
|
|
GETBYTESCHAR(82, 0),
|
|
SETBYTESCHAR(83, 0),
|
|
BRANCH(84, 1),
|
|
BRANCHIF(85, 1),
|
|
BRANCHIFNOT(86, 1),
|
|
SWITCH(87, 2),
|
|
BOOTNOT(88, 0),
|
|
PUSHTRAP(89, 1),
|
|
POPTRAP(90, 0),
|
|
RAISE(91, 0),
|
|
CHECK_SIGNALS(92, 0),
|
|
C_CALL1(93, 1),
|
|
C_CALL2(94, 1),
|
|
C_CALL3(95, 1),
|
|
C_CALL4(96, 1),
|
|
C_CALL5(97, 1),
|
|
C_CALLN(98, 2),
|
|
CONST0(99, 0),
|
|
CONST1(100, 0),
|
|
CONST2(101, 0),
|
|
CONST3(102, 0),
|
|
CONSTINT(103, 1),
|
|
PUSHCONST0(104, 0),
|
|
PUSHCONST1(105, 0),
|
|
PUSHCONST2(106, 0),
|
|
PUSHCONST3(107, 0),
|
|
PUSHCONSTINT(108, 1),
|
|
NEGINT(109, 0),
|
|
ADDINT(110, 0),
|
|
SUBINT(111, 0),
|
|
MULINT(112, 0),
|
|
DIVINT(113, 0),
|
|
MODINT(114, 0),
|
|
ANDINT(115, 0),
|
|
ORINT(116, 0),
|
|
XORINT(117, 0),
|
|
LSLINT(118, 0),
|
|
LSRINT(119, 0),
|
|
ASRINT(120, 0),
|
|
EQ(121, 0),
|
|
NEQ(122, 0),
|
|
LTINT(123, 0),
|
|
LEINT(124, 0),
|
|
GTINT(125, 0),
|
|
GEINT(126, 0),
|
|
OFFSETINT(127, 1),
|
|
OFFSETREF(128, 1),
|
|
ISINT(129, 0),
|
|
GETMETHOD(130, 0),
|
|
BEQ(131, 2),
|
|
BNEQ(132, 2),
|
|
BLTINT(133, 2),
|
|
BLEINT(134, 2),
|
|
BGTINT(135, 2),
|
|
BGEINT(136, 2),
|
|
ULTINT(137, 0),
|
|
UGEINT(138, 0),
|
|
BULTINT(139, 2),
|
|
BUGEINT(140, 2),
|
|
GETPUBMET(141, 2),
|
|
GETDYNMET(142, 0),
|
|
STOP(143, 0),
|
|
EVENT(144, 0),
|
|
BREAK(145, 0),
|
|
|
|
RERAISE(146, 0), // ???
|
|
RAISE_NOTRACE(147, 0),
|
|
GETSTRINGCHAR(148, 0);
|
|
|
|
public final int code;
|
|
public final int numArgs;
|
|
CamlInst(int code, int numArgs) {
|
|
this.code = code;
|
|
this.numArgs = numArgs;
|
|
}
|
|
|
|
static {
|
|
for (int i = 0; i < CamlInst.values().length; i++) {
|
|
if (CamlInst.values()[i].code != i) {
|
|
throw new RuntimeException("what");
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
private static class CodeOffset {
|
|
public final int offset;
|
|
|
|
public CodeOffset(int offset) {
|
|
this.offset = offset;
|
|
}
|
|
|
|
public String toString() {
|
|
return "CodeOffset<" + offset + ">";
|
|
}
|
|
|
|
public boolean equals(Object other) {
|
|
return other instanceof CodeOffset && ((CodeOffset) other).offset == this.offset;
|
|
}
|
|
|
|
public int hashCode() {
|
|
return offset * 13;
|
|
}
|
|
}
|
|
|
|
private static class Block {
|
|
public final int tag;
|
|
public final List<Object> contents;
|
|
|
|
public Block(int tag, List<Object> contents) {
|
|
this.tag = tag;
|
|
this.contents = contents;
|
|
}
|
|
|
|
public String toString() {
|
|
return "Block<" + tag + ": " + contents.toString() + ">";
|
|
}
|
|
}
|
|
|
|
private static class Section {
|
|
String name;
|
|
ByteBuffer data;
|
|
|
|
public Section(String name, ByteBuffer data) {
|
|
this.name = name;
|
|
this.data = data;
|
|
}
|
|
|
|
public String toString() {
|
|
return "Section<name=" + name + ", length=" + data.capacity() + ">";
|
|
}
|
|
|
|
public List<String> unstring() {
|
|
List<String> strings = new ArrayList<>();
|
|
for (int i = 0; i < this.data.capacity();) {
|
|
StringBuffer buf = new StringBuffer();
|
|
while (this.data.get(i) != 0) {
|
|
buf.append((char) this.data.get(i));
|
|
i += 1;
|
|
}
|
|
strings.add(buf.toString());
|
|
i += 1;
|
|
}
|
|
return strings;
|
|
}
|
|
|
|
private Object parseNextObject(List<Object> shared) throws Exception {
|
|
int nextTag = this.data.get() & (short) 0xff;
|
|
switch (nextTag) {
|
|
// integers
|
|
case 0x00: {
|
|
byte value = this.data.get();
|
|
return Long.valueOf(value);
|
|
}
|
|
case 0x01: {
|
|
short value = this.data.getShort();
|
|
return Long.valueOf(value);
|
|
}
|
|
case 0x02: {
|
|
int value = this.data.getInt();
|
|
return Long.valueOf(value);
|
|
}
|
|
case 0x03: {
|
|
long value = this.data.getLong();
|
|
return Long.valueOf(value);
|
|
}
|
|
|
|
// shared elements
|
|
case 0x04: {
|
|
long offset = this.data.get() & (long) 0xff;
|
|
return shared.get(shared.size() - 1 - (int) offset);
|
|
}
|
|
case 0x05: {
|
|
long offset = this.data.getShort() & (long) 0xff;
|
|
return shared.get(shared.size() - 1 - (int) offset);
|
|
}
|
|
case 0x06: {
|
|
long offset = this.data.getInt() & (long) 0xff;
|
|
return shared.get(shared.size() - 1 - (int) offset);
|
|
}
|
|
|
|
// blocks
|
|
case 0x08: {
|
|
long header = this.data.getInt() & (long) 0xff;
|
|
int tag = (int) header & 0xff;
|
|
long size = header >> 10;
|
|
List<Object> elems = new ArrayList<>();
|
|
Block block = new Block(tag, elems);
|
|
if (size > 0) {
|
|
shared.add(block);
|
|
for (int i = 0; i < size; i++) {
|
|
elems.add(parseNextObject(shared));
|
|
}
|
|
}
|
|
return block;
|
|
}
|
|
case 0x13: {
|
|
throw new Exception("long block not supported");
|
|
}
|
|
|
|
// string
|
|
case 0x09: {
|
|
int len = this.data.get() & (short) 0xff;
|
|
byte[] buf = new byte[len];
|
|
this.data.get(buf);
|
|
String s = new String(buf);
|
|
shared.add(s);
|
|
return s;
|
|
}
|
|
case 0x0a: {
|
|
long len = this.data.getInt() & (long) 0xff;
|
|
byte[] buf = new byte[(int)len];
|
|
this.data.get(buf);
|
|
String s = new String(buf);
|
|
shared.add(s);
|
|
return s;
|
|
}
|
|
|
|
// float
|
|
case 0x0b:
|
|
case 0x0c: {
|
|
Double obj = Double.valueOf(this.data.getDouble());
|
|
shared.add(obj);
|
|
return obj;
|
|
}
|
|
case 0x0D:
|
|
case 0x0E: {
|
|
throw new Exception("double array not supported");
|
|
}
|
|
case 0x07:
|
|
case 0x0f: {
|
|
throw new Exception("double array not supported");
|
|
}
|
|
|
|
// misc
|
|
case 0x10: {
|
|
throw new Exception("code pointer with checksum");
|
|
}
|
|
case 0x11: {
|
|
throw new Exception("code pointer with closure");
|
|
}
|
|
case 0x12:
|
|
case 0x18:
|
|
case 0x19: {
|
|
StringBuffer buf = new StringBuffer();
|
|
while (true) {
|
|
int next = this.data.get() & (short) 0xff;
|
|
if (next == 0) {
|
|
break;
|
|
}
|
|
buf.append((char) next);
|
|
}
|
|
String name = buf.toString();
|
|
switch (name) {
|
|
// int64
|
|
case "_j": {
|
|
long v = Long.valueOf(this.data.getLong());
|
|
shared.add(v);
|
|
return v;
|
|
}
|
|
default:
|
|
throw new Exception("unknown custom op: " + name);
|
|
}
|
|
}
|
|
default: {
|
|
if (nextTag < 0x20) {
|
|
throw new Exception("invalid tag " + nextTag);
|
|
} else if (nextTag < 0x40) {
|
|
int length = nextTag & 0x1f;
|
|
byte[] buf = new byte[(int)length];
|
|
this.data.get(buf);
|
|
String s = new String(buf);
|
|
shared.add(s);
|
|
return s;
|
|
} else if (nextTag < 0x80) {
|
|
Long value = Long.valueOf(nextTag & 0x3f);
|
|
return value;
|
|
} else {
|
|
long size = (nextTag >> 4) & 0x07;
|
|
int tag = nextTag & 0x0f;
|
|
List<Object> elems = new ArrayList<>();
|
|
Block block = new Block(tag, elems);
|
|
if (size > 0) {
|
|
shared.add(block);
|
|
for (int i = 0; i < size; i++) {
|
|
elems.add(parseNextObject(shared));
|
|
}
|
|
}
|
|
return block;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
public List<Object> unmarshal() throws Exception {
|
|
this.data.order(ByteOrder.BIG_ENDIAN);
|
|
int magic = this.data.getInt(0);
|
|
if (magic != MARSHAL_MAGIC_SMALL) {
|
|
throw new Exception("bad marshal magic");
|
|
}
|
|
|
|
// int byteLength = this.data.getInt(4);
|
|
int numObjs = this.data.getInt(8);
|
|
System.out.println(numObjs);
|
|
|
|
List<Object> shared = new ArrayList<>();
|
|
List<Object> objs = new ArrayList<>();
|
|
|
|
this.data.position(20);
|
|
|
|
while (this.data.position() < this.data.capacity()) {
|
|
Object next = parseNextObject(shared);
|
|
objs.add(next);
|
|
}
|
|
|
|
System.out.println(shared.size());
|
|
return objs;
|
|
}
|
|
|
|
public void disassemble(List<String> prim) throws Exception {
|
|
this.data.order(ByteOrder.LITTLE_ENDIAN);
|
|
this.data.position(0);
|
|
while (this.data.position() < this.data.capacity()) {
|
|
int pc = this.data.position() / 4;
|
|
int op = this.data.getInt();
|
|
String rep = null;
|
|
try {
|
|
CamlInst inst = CamlInst.values()[op];
|
|
rep = inst.name();
|
|
if (inst == CamlInst.C_CALL1 || inst == CamlInst.C_CALL2
|
|
|| inst == CamlInst.C_CALL3 || inst == CamlInst.C_CALL4
|
|
|| inst == CamlInst.C_CALL5 || inst == CamlInst.C_CALLN) {
|
|
int p = this.data.getInt();
|
|
rep += " " + prim.get(p);
|
|
if (inst == CamlInst.C_CALLN) {
|
|
int n = this.data.getInt();
|
|
rep += " " + n;
|
|
}
|
|
} else if (inst == CamlInst.CLOSUREREC) {
|
|
int nfuncs = this.data.getInt();
|
|
int nargs = this.data.getInt();
|
|
rep += " " + nfuncs + " " + nargs;
|
|
for (int i = 0; i < nfuncs; i++) {
|
|
rep += " " + this.data.getInt();
|
|
}
|
|
} else {
|
|
for (int i = 0; i < inst.numArgs; i++) {
|
|
rep += " " + this.data.getInt();
|
|
}
|
|
}
|
|
} catch (ArrayIndexOutOfBoundsException e) {
|
|
rep = "<UNKNOWN " + op + ">";
|
|
}
|
|
System.out.printf("%05d: ", pc);
|
|
System.out.println(rep);
|
|
}
|
|
}
|
|
}
|
|
|
|
public static Section findSection(Section[] sections, String name) {
|
|
for (Section section : sections) {
|
|
if (section.name.equals(name)) {
|
|
return section;
|
|
}
|
|
}
|
|
return null;
|
|
}
|
|
|
|
public static void main(String[] args) throws Exception {
|
|
ByteBuffer buf;
|
|
int len;
|
|
{
|
|
FileInputStream in = new FileInputStream(new File(args[0]));
|
|
len = in.available();
|
|
buf = ByteBuffer.allocate(len);
|
|
Channels.newChannel(in).read(buf);
|
|
}
|
|
|
|
for (int i = 0; i < 12; i++) {
|
|
if (buf.get(len - 12 + i) != (byte) TRAILER_MAGIC.charAt(i)) {
|
|
throw new Exception("invalid trailer");
|
|
}
|
|
}
|
|
|
|
int numSections = buf.getInt(len - 16);
|
|
Section[] sections = new Section[numSections];
|
|
|
|
for (int i = numSections - 1, sectionBase = len - 16 - (numSections * 8); i >= 0; i--) {
|
|
int base = len - 16 - (numSections * 8) + (i * 8);
|
|
char[] name = new char[4];
|
|
name[0] = (char) buf.get(base + 0);
|
|
name[1] = (char) buf.get(base + 1);
|
|
name[2] = (char) buf.get(base + 2);
|
|
name[3] = (char) buf.get(base + 3);
|
|
int sectionLength = buf.getInt(base + 4);
|
|
sectionBase -= sectionLength;
|
|
byte[] data = new byte[sectionLength];
|
|
buf.position(sectionBase);
|
|
buf.get(data);
|
|
sections[i] = new Section(new String(name), ByteBuffer.wrap(data));
|
|
}
|
|
|
|
System.out.println(Arrays.toString(sections));
|
|
List<Object> symb = findSection(sections, "SYMB").unmarshal();
|
|
System.out.println(symb);
|
|
List<Object> crcs = findSection(sections, "CRCS").unmarshal();
|
|
System.out.println(crcs);
|
|
List<Object> data = findSection(sections, "DATA").unmarshal();
|
|
System.out.println(data);
|
|
List<String> prim = findSection(sections, "PRIM").unstring();
|
|
findSection(sections, "CODE").disassemble(prim);
|
|
}
|
|
}
|