gitweb on Svarog

projekti pod git sistemom za održavanje verzija -- projects under the git version control system
274bb7e448cd0d90f883ecab19e0093b868ac04a
[mjc2wsl.git] / src / mjc2wsl.java
1 import java.io.*;
2 import java.util.*;
4 /**
5 * This program converts file from compiled MicroJava bytecode to WSL language
6 * which is a part of the FermaT Transformation system. MicroJava is a subset
7 * used in Compiler Construction courses by Hanspeter Moessenboeck, not
8 * "Java ME".
9 *
10 * @author Doni Pracner, http://perun.dmi.rs/pracner http://quemaster.com
11 */
12 public class mjc2wsl{
13 public static String versionN = "0.1.4";
15 public static final int M_ERR = 2, M_WAR = 1, M_DEB = 0;
17 private int printLevel = M_ERR;
19 private int[] messageCounters = new int[M_ERR+1];
21 private void message(String mes, int level){
22 if (level>=printLevel)
23 System.out.println(mes);
24 messageCounters[level]++;
25 }
27 private void printMessageCounters(){
28 printMessageCounters(System.out);
29 }
31 private void printMessageCounters(PrintStream out){
32 out.println("total errors:"+messageCounters[M_ERR]+" warnings:"+messageCounters[M_WAR]);
33 }
35 private boolean genPauseAfterEachAddress=false,
36 genPrintForEachAddress = false,
37 genPrintEStackOnChange = false;
/**
 * Comment type marker: a regular comment. This is the type used by
 * {@link #createComment(String)} when no type is given.
 */
public static final char C_REG = ' ';
/**
 * Comment type marker: the comment holds the original code, inserted in
 * the output next to its translation.
 */
public static final char C_OC = '#';
/** Comment type marker: a special note produced by the translator itself. */
public static final char C_SPEC = '&';
/** Comment type marker: an error message produced by the translator. */
public static final char C_ERR = '!';
51 /** instruction code in MicroJava bytecode. */
52 public static final int
53 load = 1,
54 load_0 = 2,
55 load_1 = 3,
56 load_2 = 4,
57 load_3 = 5,
58 store = 6,
59 store_0 = 7,
60 store_1 = 8,
61 store_2 = 9,
62 store_3 = 10,
63 getstatic = 11,
64 putstatic = 12,
65 getfield = 13,
66 putfield = 14,
67 const_0 = 15,
68 const_1 = 16,
69 const_2 = 17,
70 const_3 = 18,
71 const_4 = 19,
72 const_5 = 20,
73 const_m1 = 21,
74 const_ = 22,
75 add = 23,
76 sub = 24,
77 mul = 25,
78 div = 26,
79 rem = 27,
80 neg = 28,
81 shl = 29,
82 shr = 30,
83 inc = 31,
84 new_ = 32,
85 newarray = 33,
86 aload = 34,
87 astore = 35,
88 baload = 36,
89 bastore = 37,
90 arraylength = 38,
91 pop = 39,
92 dup = 40,
93 dup2 = 41,
94 jmp = 42,
95 jeq = 43,
96 jne = 44,
97 jlt = 45,
98 jle = 46,
99 jgt = 47,
100 jge = 48,
101 call = 49,
102 return_ = 50,
103 enter = 51,
104 exit = 52,
105 read = 53,
106 print = 54,
107 bread = 55,
108 bprint = 56,
109 trap = 57;
111 public String getStandardStart(){
112 return getStandardStart(10);
115 public String getStandardStart(int numWords){
116 StringBuilder ret = new StringBuilder(
117 "C:\" This file automatically converted from microjava bytecode\";\n"
118 +"C:\" with mjc2wsl v "+versionN+"\";\n");
120 ret.append("VAR < tempa := 0, tempb := 0, tempres :=0,\n\t");
121 ret.append("mjvm_locals := ARRAY(1,0), ");
122 ret.append("\n\tmjvm_statics := ARRAY("+numWords+",0), ");
123 ret.append("\n\tmjvm_arrays := < >, ");
124 ret.append("\n\tmjvm_objects := < >, ");
125 ret.append("\n mjvm_estack := < >, mjvm_mstack := < >, ");
126 ret.append("\n mjvm_fp := 0, mjvm_sp := 0,");
127 ret.append("\n t_e_m_p := 0 > :");
129 return ret.toString();
132 public String getStandardEnd(){
133 return "SKIP\nENDVAR";
/** When true, the original opcode of each instruction is written as a comment before its translation. */
private boolean originalInComments = false;

/** Table from opcode number to its description; stays null until getOpMap() is first called. */
private HashMap<Integer,String> opMap = null;

/** Name of the resource, looked up relative to this class, that holds the opcode descriptions. */
private String opCodeFile = "mj-bytecodes.properties";
142 private HashMap<Integer,String> getOpMap() {
143 if (opMap==null) {
144 opMap = new HashMap<Integer, String> (60, 0.98f);
145 try{
146 BufferedReader in = new BufferedReader(
147 new InputStreamReader(getClass().getResourceAsStream(opCodeFile)));
148 String str = in.readLine();
149 while (str != null) {
150 String[] ss = str.split("=");
151 opMap.put(Integer.parseInt(ss[0]),ss[1]);
152 str = in.readLine();
154 in.close();
155 }catch (Exception ex) {
156 ex.printStackTrace();
159 return opMap;
162 public String getOpString(int op) {
163 return getOpMap().get(op);
166 public String describeOpCode(int op) {
167 return op + " (" + getOpString(op) + ")";
/** Stream the bytecode is currently read from; set by convertStream(). */
private InputStream mainIn;
/** Writer that receives the generated WSL code; null until an output is chosen. */
private PrintWriter out = null;
/** Incremented by every get() call; starts at -1, so after a read it is the zero-based index of that byte. */
private int counter = -1;
174 private void pr(int i){
175 out.print(i);
178 private void pr(char i){
179 out.print(i);
182 private void pr(String i){
183 out.print(i);
186 private void prl(String i){
187 out.println(i);
190 private int get() {
191 int res = -1;
192 try {
193 res = mainIn.read();
194 if (res >= 0)
195 res = res << 24 >>> 24;
196 } catch (IOException ex) {
197 ex.printStackTrace();
199 counter++;
200 return res;
203 private int get2() {
204 return (get() * 256 + get()) << 16 >> 16;
207 private int get4() {
208 return (get2() << 16) + (get2() << 16 >>> 16);
211 private String loc(int i){
212 //arrays start at 1 in WSL, so we need an offset
213 return "mjvm_locals[" + (i+1)+"]";
216 private String genStatic(int i){
217 return "mjvm_statics[" + (i+1)+"]";
220 private String genArray(int i){
221 return "mjvm_arrays["+ i +"]";
224 private String genArray(String i){
225 return "mjvm_arrays["+ i+"]";
228 private String genObject(String i){
229 return "mjvm_objects["+ i+"]";
232 /**
233 * Creates a WSL comment with care to quote chars.
234 */
235 public static String createComment(String str){
236 return createComment(str, C_REG);
239 /**
240 * Creates a WSL comment with care to quote chars, of the
241 * given type. Types are given as char constants. They can be
242 * default comments, comments that contain the original code
243 * in them, or additional comments regarding the translation
244 * process.
245 */
246 public static String createComment(String str, char type) {
247 return "C:\"" + type + str.replace("\"", "''") + "\";";
250 //Expression stack
252 private String cmdToEStack(int i) {
253 String res = "mjvm_estack := <" + i + " > ++ mjvm_estack;";
254 if (genPrintEStackOnChange) res +="PRINT(\"eStack\",mjvm_estack);";
255 return res;
258 private String cmdToEStack(String i) {
259 String res = "mjvm_estack := <" + i + " > ++ mjvm_estack;";
260 if (genPrintEStackOnChange) res +="PRINT(\"eStack\",mjvm_estack);";
261 return res;
264 private String cmdFromEStack(String st) {
265 String res = st + " := HEAD(mjvm_estack); mjvm_estack := TAIL(mjvm_estack);";
266 if (genPrintEStackOnChange) res +="PRINT(\"eStack\",mjvm_estack);";
267 return res;
270 private String cmdPopEStack() {
271 String res = "mjvm_estack := TAIL(mjvm_estack);";
272 if (genPrintEStackOnChange) res +="PRINT(\"eStack\",mjvm_estack);";
273 return res;
277 private String getTopTwo(){
278 return cmdFromEStack("tempa") + "\n" + cmdFromEStack("tempb");
281 private String getTop() {
282 return cmdFromEStack("tempa");
285 //Method stack
287 private String cmdToMStack(int i) {
288 return "mjvm_mstack := <" + i + " > ++ mjvm_mstack;";
291 private String cmdToMStack(String i) {
292 return "mjvm_mstack := <" + i + " > ++ mjvm_mstack;";
295 private String cmdFromMStack(String st) {
296 return st + " := HEAD(mjvm_mstack); mjvm_mstack := TAIL(mjvm_mstack);";
299 private String getRelationFor(int opcode) throws Exception {
300 switch (opcode) {
301 case jeq: return "=";
302 case jne: return "<>";
303 case jlt: return "<";
304 case jle: return "<=";
305 case jgt: return ">";
306 case jge: return ">=";
308 throw new Exception("Wrong opcode for a relation");
311 private boolean isJumpCode(int opcode) {
312 return (opcode>=jmp) && (opcode<=jge);
315 public void convertStream(InputStream ins) throws Exception{
316 mainIn = ins;
317 //process start
318 byte m = (byte) get();
319 byte j = (byte) get();
320 if (m!='M' || j !='J')
321 throw new Exception("Wrong start of bytecode file");
322 int codesize = get4();
323 int numberOfWords = get4();
324 int mainAdr = get4();
326 prl(getStandardStart(numberOfWords));
327 prl("SKIP;\n ACTIONS A_S_start:\n A_S_start == CALL a"+(14+mainAdr)+" END");
328 int op = get();
329 while (op >= 0) {
330 if (originalInComments)
331 prl(createComment(describeOpCode(op), C_OC));
332 prl("a" + counter + " == ");
333 if (genPrintForEachAddress) {
334 prl("PRINT(\"a"+counter+"\");");
335 if (genPauseAfterEachAddress)
336 prl("debug_disposable_string := @Read_Line(Standard_Input_Port);");
338 switch (op) {
339 case load: {
340 prl(cmdToEStack(loc(get())));
341 break;
343 case load_0:
344 case load_1:
345 case load_2:
346 case load_3: {
347 prl(cmdToEStack(loc(op - load_0)));
348 break;
350 case store: {
351 prl(cmdFromEStack(loc(get())));
352 break;
354 case store_0:
355 case store_1:
356 case store_2:
357 case store_3: {
358 prl(cmdFromEStack(loc(op - store_0)));
359 break;
362 case getstatic:{
363 prl(cmdToEStack(genStatic(get2())));
364 break;
365 }
366 case putstatic: {
367 prl(cmdFromEStack(genStatic(get2())));
368 break;
371 case getfield:{
372 int f = get2();
373 prl(getTop());
374 prl(cmdToEStack(genObject("tempa")+"["+(f+1)+"]"));
375 break;
377 case putfield:{
378 int f = get2();
379 //we need to use a temparray as a pointer, WSL
380 //otherwise tries to access it as a list of lists and fails
381 prl(getTopTwo());
382 prl("VAR < tempArray := "+genObject("tempb")+" > :");
383 prl("tempArray["+(f+1)+"]:=tempa ENDVAR;");
384 break;
387 case const_: {
388 prl(cmdToEStack(get4()));
389 break;
392 case const_0:
393 case const_1:
394 case const_2:
395 case const_3:
396 case const_4:
397 case const_5: {
398 prl(cmdToEStack(op - const_0));
399 break;
402 case add: {
403 prl(getTopTwo());
404 prl("tempres := tempb + tempa;");
405 prl(cmdToEStack("tempres"));
406 break;
408 case sub: {
409 prl(getTopTwo());
410 prl("tempres := tempb - tempa;");
411 prl(cmdToEStack("tempres"));
412 break;
414 case mul: {
415 prl(getTopTwo());
416 prl("tempres := tempb * tempa;");
417 prl(cmdToEStack("tempres"));
418 break;
420 case div: {
421 prl(getTopTwo());
422 prl("IF tempa = 0 THEN ERROR(\"division by zero\") FI;");
423 prl("tempres := tempb DIV tempa;");
424 prl(cmdToEStack("tempres"));
425 break;
427 case rem: {
428 prl(getTopTwo());
429 prl("IF tempa = 0 THEN ERROR(\"division by zero\") FI;");
430 prl("tempres := tempb MOD tempa;");
431 prl(cmdToEStack("tempres"));
432 break;
435 case neg :{
436 prl(getTop());
437 prl(cmdToEStack("-tempa"));
438 break;
439 }
440 //TODO shl, shr
442 case inc : {
443 int b1 = get(), b2 = get();
444 prl(loc(b1)+" := " +loc(b1)+" + "+b2+";");
445 break;
448 case new_ :{
449 int size = get2();
450 //TODO maybe objects and arrays should be in the same list?
451 prl("mjvm_objects := mjvm_objects ++ < ARRAY("+size+",0) >;");
452 prl(cmdToEStack("LENGTH(mjvm_objects)"));
453 break;
455 case newarray :{
456 get();// 0 - bytes, 1 - words; ignore for now
457 //TODO take into consideration 0/1
458 prl(getTop());
459 prl("mjvm_arrays := mjvm_arrays ++ < ARRAY(tempa,0) >;");
460 prl(cmdToEStack("LENGTH(mjvm_arrays)"));
461 break;
464 case aload:
465 case baload:{
466 prl(getTopTwo());
467 prl(cmdToEStack(genArray("tempb")+"[tempa+1]"));
468 break;
470 case astore:
471 case bastore:{
472 prl(cmdFromEStack("tempres"));
473 prl(getTopTwo());
474 //we need to use a temparray as a pointer, WSL
475 //otherwise tries to access it as a list of lists and fails
476 prl("VAR < tempArray := "+genArray("tempb")+" > :");
477 prl("tempArray[tempa+1]:=tempres ENDVAR;");
478 break;
480 case arraylength :{
481 prl(getTop());
482 //TODO make an array length function of some sort!
483 prl(createComment("array length not known - LENGTH not aplicable to arrays",C_ERR));
484 message("array length not known - LENGTH not aplicable to arrays",M_ERR);
485 prl(createComment("put 1 on the stack for consistency",C_SPEC));
486 prl(cmdToEStack(1));
487 break;
490 case dup : {
491 prl(getTop());
492 prl(cmdToEStack("tempa"));
493 prl(cmdToEStack("tempa"));
494 break;
496 case dup2 : {
497 prl(getTopTwo());
498 prl(cmdToEStack("tempb"));
499 prl(cmdToEStack("tempa"));
500 prl(cmdToEStack("tempb"));
501 prl(cmdToEStack("tempa"));
502 break;
505 case pop : {
506 prl(cmdPopEStack());
507 break;
510 case jmp: {
511 prl("CALL a" + (counter + get2()) + ";");
512 break;
515 case jeq:
516 case jne:
517 case jlt:
518 case jle:
519 case jgt:
520 case jge: {
521 prl(getTopTwo());
522 prl("IF tempb "+ getRelationFor(op)
523 +" tempa THEN CALL a" + (counter + get2())
524 +" ELSE CALL a" + (counter+1)
525 + " FI;");
526 break;
529 case call: {
530 prl("CALL a" + (counter + get2()) + ";");
531 break;
534 case return_: {
535 //we let the actions return
536 // there is nothing to clean up
537 prl("SKIP END b"+counter+" ==");
538 break;
540 case enter: {
541 int parameters = get();
543 int locals = get();
544 prl(cmdToMStack("mjvm_locals"));
545 prl("mjvm_locals := ARRAY("+locals+",0);");
546 for (int i = parameters-1; i >= 0; i--)
547 prl(cmdFromEStack(loc(i)));
548 break;
550 case exit: {
551 prl(cmdFromMStack("mjvm_locals"));
552 break;
555 // read, print
556 case bread:{
557 //TODO make it a char for read
558 message("char is read like a number", M_WAR);
559 prl(createComment("char is read like a number",C_SPEC));
561 case read: {
562 prl("tempa := @String_To_Num(@Read_Line(Standard_Input_Port));");
563 prl(cmdToEStack("tempa"));
564 break;
567 // the prints
568 case bprint:{
569 // TODO need to make it a char on print
570 message("chars will be printed as number codes", M_WAR);
571 prl(createComment("char will be printed as a number code",C_SPEC));
573 case print: {
574 // TODO printing numbers needs different lengths of spacing
575 prl(getTopTwo());
576 pr(createComment("print spacing",C_SPEC));
577 prl("IF tempa>1 THEN FOR i:=2 TO tempa STEP 1 DO PRINFLUSH(\" \") OD FI;");
578 prl("PRINFLUSH(tempb);");
579 break;
582 case trap: {
583 prl("ERROR(\"Runtime error: trap("+get()+")\");");
584 break;
588 default:
589 prl(createComment("unknown op error: " + op, C_ERR));
590 message("unknown op error: "+ op, M_ERR);
591 break;
594 boolean wasJump = isJumpCode(op);
595 op = get();
596 if (op >= 0)
597 if (wasJump)
598 prl("SKIP END");
599 else
600 prl("CALL a" + counter + " END");
602 prl("CALL Z;\nSKIP END\nENDACTIONS;\n");
603 prl(getStandardEnd());
607 public void convertFile(File f) {
608 try {
609 convertStream(new FileInputStream(f));
610 } catch (Exception ex) {
611 ex.printStackTrace();
615 public void printHelp() {
616 System.out.println("MicroJava bytecode to WSL converter. v " + versionN
617 + ", by Doni Pracner");
618 System.out.println("usage:\n\t mjc2wsl {options} filename [outfile]");
619 System.out.println("options:\n\t--screen print output to screen");
620 System.out.println("\t-o --oc[+-] include original code in comments");
621 System.out.println("\t-v verbose, print warning messages");
622 System.out.println("\t-q don't print even the error messages");
623 System.out.println("\t-d print detailed debug messages");
626 public String makeDefaultOutName(String inname){
627 String rez = inname;
628 if (inname.endsWith(".obj"))
629 rez = rez.substring(0, rez.length() - 4);
630 return rez + ".wsl";
633 public void run(String[] args) {
634 if (args.length == 0) {
635 printHelp();
636 } else {
637 int i = 0;
638 while (i < args.length && args[i].charAt(0) == '-') {
639 if (args[i].compareTo("-h") == 0) {
640 printHelp();
641 return;
642 } else if (args[i].compareTo("-o") == 0
643 || args[i].startsWith("--oc")) {
644 if (args[i].length() == 2)
645 originalInComments = true;
646 else if (args[i].length() == 5)
647 originalInComments = args[i].charAt(4) == '+';
648 else
649 originalInComments = true;
650 } else if (args[i].compareTo("--screen") == 0) {
651 out = new PrintWriter(System.out);
652 } else if (args[i].compareTo("-d") == 0) {
653 printLevel = M_DEB;//print debug info
654 } else if (args[i].compareTo("-v") == 0) {
655 printLevel = M_WAR;//print warnings
656 } else if (args[i].compareTo("-q") == 0) {
657 printLevel = M_ERR+1;//no printing
658 } else if (args[i].compareToIgnoreCase("--genEStackPrint") == 0) {
659 genPrintEStackOnChange = true;
660 } else if (args[i].compareToIgnoreCase("--genAddrPause") == 0) {
661 genPauseAfterEachAddress = true;
662 } else if (args[i].compareToIgnoreCase("--genAddrPrint") == 0) {
663 genPrintForEachAddress = true;
664 } else if (args[i].compareToIgnoreCase("--genAddr") == 0) {
665 genPrintForEachAddress = true;
666 genPauseAfterEachAddress = true;
667 } else if (args[i].compareToIgnoreCase("--genAll") == 0) {
668 genPrintEStackOnChange = true;
669 genPrintForEachAddress = true;
670 genPauseAfterEachAddress = true;
671 }i++;
674 if (i >= args.length) {
675 System.out.println("no filename supplied");
676 System.exit(2);
678 File f = new File(args[i]);
680 if (i + 1 < args.length) {
681 try {
682 out = new PrintWriter(args[i + 1]);
683 } catch (Exception e) {
684 System.err.println("error in opening out file:");
685 e.printStackTrace();
688 if (out == null) {
689 // if not set to screen, or a file, make a default filename
690 try {
691 out = new PrintWriter(makeDefaultOutName(args[i]));
692 } catch (Exception e) {
693 System.err.println("error in opening out file:");
694 e.printStackTrace();
697 if (f.exists()) {
698 Calendar now = Calendar.getInstance();
699 convertFile(f);
700 long mili = Calendar.getInstance().getTimeInMillis()
701 - now.getTimeInMillis();
702 System.out.println("conversion time:" + mili + " ms");
703 printMessageCounters();
704 out.close();
705 } else
706 System.out.println("file does not exist");
710 public static void main(String[] args) {
711 new mjc2wsl().run(args);
Svarog.pmf.uns.ac.rs/gitweb maintenance Doni Pracner