// Listing metadata: 457 lines, 14 KiB, C#
|
using System;
|
|||
|
using System.Collections.Generic;
|
|||
|
using System.IO;
|
|||
|
using System.Linq;
|
|||
|
using System.Text;
|
|||
|
using System.Text.RegularExpressions;
|
|||
|
using System.Threading.Tasks;
|
|||
|
|
|||
|
namespace CompilerVVM
|
|||
|
{
|
|||
|
/// <summary>
/// Holds two integer positions. ByteCode.PositionAnalyse stores the index of a
/// ".proc" line in <see cref="start"/> and the index of the matching ".endp"
/// line in <see cref="end"/>.
/// </summary>
class pair
{
    public int start, end;

    /// <summary>Creates a pair from its two positions.</summary>
    /// <param name="one">Value stored in <see cref="start"/>.</param>
    /// <param name="two">Value stored in <see cref="end"/>.</param>
    public pair(int one, int two)
    {
        this.start = one;
        this.end = two;
    }
}
|
|||
|
|
|||
|
/// <summary>
/// Header record for the constants section: a two-byte signature followed by
/// three 32-bit integers (version, number of constants, total size of the
/// constant data).
/// </summary>
class str_header
{
    public byte[] signature { get; set; }

    public int version { get; set; }

    public int const_count { get; set; }

    public int size_const { get; set; }

    /// <summary>
    /// Initialises the signature to 0xBA 0xBA and the version to 100.
    /// The counters keep their default value of zero.
    /// </summary>
    public str_header()
    {
        signature = new byte[] { 0xBA, 0xBA };
        version = 100;
    }

    /// <summary>
    /// Produces the binary form of the header: the raw signature bytes, then
    /// version, const_count and size_const as written by <see cref="BinaryWriter"/>.
    /// </summary>
    /// <returns>A new array containing the serialized header.</returns>
    public byte[] Serialize()
    {
        MemoryStream buffer = new MemoryStream();
        using (BinaryWriter output = new BinaryWriter(buffer))
        {
            output.Write(signature);
            output.Write(version);
            output.Write(const_count);
            output.Write(size_const);
        }

        // MemoryStream.ToArray is still usable after the writer closed the stream.
        return buffer.ToArray();
    }
}
|
|||
|
|
|||
|
/// <summary>
/// Header shared by all functions: a 16-bit start id and the number of
/// functions. ByteCode.GenerateByteCode fills it with the id of "main" and the
/// count of procedures found in the source.
/// </summary>
class funcH_common
{
    public ushort start_id { get; set; }

    public int count_of_funcs { get; set; }

    /// <summary>Creates the header from its two values.</summary>
    /// <param name="id">Value stored in <see cref="start_id"/>.</param>
    /// <param name="count">Value stored in <see cref="count_of_funcs"/>.</param>
    public funcH_common(ushort id, int count)
    {
        this.start_id = id;
        this.count_of_funcs = count;
    }

    /// <summary>
    /// Produces the binary form of the header: start_id (2 bytes) followed by
    /// count_of_funcs (4 bytes), as written by <see cref="BinaryWriter"/>.
    /// </summary>
    /// <returns>A new array containing the serialized header.</returns>
    public byte[] Serialize()
    {
        MemoryStream buffer = new MemoryStream();
        using (BinaryWriter output = new BinaryWriter(buffer))
        {
            output.Write(start_id);
            output.Write(count_of_funcs);
        }

        return buffer.ToArray();
    }
}
|
|||
|
|
|||
|
/// <summary>
/// Per-function size record: total function size, bytecode size and signature
/// size, each stored as a 32-bit integer.
/// </summary>
class funcH_signature
{
    public int size_func { get; set; }

    public int size_bytecode { get; set; }

    public int size_signature { get; set; }

    /// <summary>
    /// Produces the binary form of the record: size_func, size_bytecode and
    /// size_signature in that order, as written by <see cref="BinaryWriter"/>.
    /// </summary>
    /// <returns>A new 12-byte array containing the serialized record.</returns>
    public byte[] Serialize()
    {
        MemoryStream buffer = new MemoryStream();
        using (BinaryWriter output = new BinaryWriter(buffer))
        {
            output.Write(size_func);
            output.Write(size_bytecode);
            output.Write(size_signature);
        }

        return buffer.ToArray();
    }
}
|
|||
|
|
|||
|
/// <summary>
/// Per-function bytecode record: a 16-bit function id followed by the number
/// of locals and the number of arguments as 32-bit integers.
/// </summary>
class funcH_bytecode
{
    public ushort id { get; set; }

    public int count_locals { get; set; }

    public int count_args { get; set; }

    /// <summary>Creates a record with zero locals and zero arguments.</summary>
    public funcH_bytecode()
    {
        this.count_locals = 0;
        this.count_args = 0;
    }

    /// <summary>
    /// Produces the binary form of the record: id (2 bytes), count_locals
    /// (4 bytes) and count_args (4 bytes), as written by <see cref="BinaryWriter"/>.
    /// </summary>
    /// <returns>A new 10-byte array containing the serialized record.</returns>
    public byte[] Serialize()
    {
        MemoryStream buffer = new MemoryStream();
        using (BinaryWriter output = new BinaryWriter(buffer))
        {
            output.Write(id);
            output.Write(count_locals);
            output.Write(count_args);
        }

        return buffer.ToArray();
    }
}
|
|||
|
|
|||
|
public class ByteCode
|
|||
|
{
|
|||
|
/// <summary>
/// Translates the given source lines into a binary file.
/// The output consists of the constants header and constant data (written by
/// HeaderAnalyse), a <see cref="funcH_common"/> header whose start id is
/// CRC16_alg("main") and whose count is the number of procedures found, and
/// then one record per procedure (written by FuncAnalyse).
/// </summary>
/// <param name="code">Source lines to translate.</param>
/// <param name="outname">Path of the file to write. An existing file is replaced.</param>
/// <exception cref="ArgumentNullException"><paramref name="code"/> is null.</exception>
public static void GenerateByteCode(string[] code, string outname)
{
    if (code == null)
    {
        throw new ArgumentNullException("code");
    }

    Dictionary<int, string> ConstID_VALUE = new Dictionary<int, string>();
    Dictionary<string, int> ConstKEY_ID = new Dictionary<string, int>();
    Dictionary<string, int> CodeMARK_POS = new Dictionary<string, int>();

    List<pair> FuncPos = new List<pair>();

    // pos_d[0] / pos_d[1] receive the indices of the ".data" and ".endd" lines.
    int[] pos_d = new int[2] { 0, 0 };
    List<string> src = PositionAnalyse(code, ref pos_d, ref FuncPos, ref CodeMARK_POS);

    // FileMode.Create truncates an existing file. With OpenOrCreate, overwriting a
    // longer file from a previous run would leave its stale tail after the new data.
    using (var bw = new BinaryWriter(File.Open(outname, FileMode.Create)))
    {
        HeaderAnalyse(src, pos_d, bw, ref ConstID_VALUE, ref ConstKEY_ID);

        funcH_common FuncCommonH = new funcH_common(CRC16_alg("main"), FuncPos.Count);
        bw.Write(FuncCommonH.Serialize());

        foreach (pair func in FuncPos)
        {
            FuncAnalyse(src, func, bw, ConstKEY_ID, CodeMARK_POS);
        }
    }
}
|
|||
|
|
|||
|
/// <summary>
/// Scans the raw source lines once and produces the cleaned line list used by
/// the later passes, together with the positions of the sections in that list.
/// </summary>
/// <remarks>
/// Null, empty and whitespace-only lines are skipped. Inside a procedure, a line
/// matching <c>\w+:</c> is treated as a jump mark: it is not copied to the result
/// and is recorded in <paramref name="marks"/> with the current line counter,
/// which is reset to 0 on each ".proc" line and incremented for every copied
/// line. Every other line is copied with surrounding spaces and tabs removed.
/// </remarks>
/// <param name="input">Raw source lines.</param>
/// <param name="posD">Element 0 receives the index of the ".data" line, element 1 the index of the ".endd" line.</param>
/// <param name="posC">Receives one <see cref="pair"/> per procedure (index of ".proc", index of ".endp").</param>
/// <param name="marks">Receives mark name to line counter value; a repeated mark name throws <see cref="ArgumentException"/>.</param>
/// <returns>The cleaned lines; all recorded indices refer to this list.</returns>
private static List<string> PositionAnalyse(string[] input, ref int[] posD, ref List<pair> posC, ref Dictionary<string, int> marks)
{
    List<string> src = new List<string>();
    bool insideProc = false;
    int procStart = 0, numline = 0;

    foreach (string s in input)
    {
        // Blank lines carry no information. Letting them through would add empty
        // entries that later fail in Enum.Parse (inside a procedure) or Substring
        // (inside the data section).
        if (string.IsNullOrWhiteSpace(s))
        {
            continue;
        }

        if (insideProc && Regex.IsMatch(s, @"\w+:"))
        {
            marks.Add(s.Trim(' ', '\t', ':'), numline);
            continue;
        }

        src.Add(s.Trim(' ', '\t'));
        int index = src.Count - 1;

        if (s.Contains(".data"))
        {
            posD[0] = index;
        }

        if (s.Contains(".endd"))
        {
            posD[1] = index;
        }

        if (s.Contains(".proc"))
        {
            numline = 0;
            procStart = index;
            insideProc = true;
        }

        // An ".endp" without a preceding ".proc" is ignored.
        if (s.Contains(".endp") && insideProc)
        {
            insideProc = false;
            posC.Add(new pair(procStart, index));
        }

        numline++;
    }

    return src;
}
|
|||
|
/// <summary>
/// Processes the data section (the lines strictly between the ".data" and
/// ".endd" positions) and writes the constants header followed by the constant
/// values to <paramref name="bw"/>.
/// </summary>
/// <remarks>
/// Each line is expected to be a name, a space, and a double-quoted text. The
/// text has its surrounding quotes removed, the two-character sequences \n and
/// \r replaced by the corresponding control characters, and a terminating NUL
/// appended. Values are written ASCII-encoded. Ids are assigned from 1 in
/// source order.
/// </remarks>
/// <param name="src">Cleaned source lines.</param>
/// <param name="pos">pos[0] is the index of the ".data" line, pos[1] the index of the ".endd" line.</param>
/// <param name="bw">Destination writer.</param>
/// <param name="id_v">Receives id to constant value (including the trailing NUL).</param>
/// <param name="k_id">Receives constant name to id.</param>
/// <exception cref="FormatException">A data line contains no space separating name and value.</exception>
private static void HeaderAnalyse(List<string> src, int[] pos, BinaryWriter bw, ref Dictionary<int, string> id_v, ref Dictionary<string, int> k_id)
{
    str_header ConstH = new str_header();
    const string pattern = "\".*\"";
    List<byte[]> encoded = new List<byte[]>();
    int nextId = 1;

    for (int i = pos[0] + 1; i < pos[1]; i++)
    {
        string line = src[i];
        int position = line.IndexOf(' ');
        if (position < 0)
        {
            // Without this check Substring(0, -1) fails with a message that does
            // not identify the offending source line.
            throw new FormatException("Malformed constant declaration (expected a name, a space and a quoted value): " + line);
        }

        string key = line.Substring(0, position);
        string value = Regex.Match(line, pattern).ToString().Trim('"').Replace(@"\n", "\n").Replace(@"\r", "\r") + "\0";

        // Encode once and take the size from the encoded bytes, so the header
        // always states exactly the number of bytes written below.
        byte[] bytes = Encoding.ASCII.GetBytes(value);

        id_v.Add(nextId, value);
        k_id.Add(key, nextId);
        nextId++;

        encoded.Add(bytes);
        ConstH.const_count++;
        ConstH.size_const += bytes.Length;
    }

    bw.Write(ConstH.Serialize());
    foreach (byte[] bytes in encoded)
    {
        bw.Write(bytes);
    }
}
|
|||
|
/// <summary>
/// Assembles one procedure and writes its record to <paramref name="bw"/>:
/// the <see cref="funcH_signature"/> sizes, the NUL-terminated ASCII name, the
/// <see cref="funcH_bytecode"/> record and finally the bytecode itself.
/// </summary>
/// <remarks>
/// The ".proc" line has the form <c>.proc name [locals [args]]</c>. Every line
/// between it and ".endp" is one instruction: a mnemonic naming an
/// <see cref="opcode"/> member (case-insensitive) optionally followed by operands.
/// Tokens may be separated by any run of spaces or tabs. All numbers are parsed
/// with the invariant culture so that the same source assembles identically
/// regardless of the machine's regional settings.
/// </remarks>
/// <param name="code">Cleaned source lines.</param>
/// <param name="pos">Indices of the procedure's ".proc" and ".endp" lines in <paramref name="code"/>.</param>
/// <param name="bw">Destination writer.</param>
/// <param name="dictStr">Constant name to constant id, used for SLOAD operands.</param>
/// <param name="dictJmp">Mark name to instruction number, used for jump operands.</param>
/// <exception cref="FormatException">The ".proc" line has an unexpected number of tokens, or an instruction line is empty.</exception>
private static void FuncAnalyse(List<string> code, pair pos, BinaryWriter bw, Dictionary<string, int> dictStr, Dictionary<string, int> dictJmp)
{
    IFormatProvider invariant = System.Globalization.CultureInfo.InvariantCulture;
    char[] separators = { ' ', '\t' };

    funcH_signature sign = new funcH_signature();
    funcH_bytecode bc = new funcH_bytecode();

    string[] current_str = code[pos.start].Split(separators, StringSplitOptions.RemoveEmptyEntries);
    if (current_str.Length < 2 || current_str.Length > 4)
    {
        // Previously such a line silently produced a procedure with an empty name.
        throw new FormatException("Malformed procedure header (expected '.proc name [locals [args]]'): " + code[pos.start]);
    }

    string name = current_str[1];
    if (current_str.Length >= 3)
    {
        bc.count_locals = Convert.ToInt32(current_str[2], invariant);
    }

    if (current_str.Length == 4)
    {
        bc.count_args = Convert.ToInt32(current_str[3], invariant);
    }

    // The id is computed from the bare name, before the terminator is appended.
    bc.id = CRC16_alg(name);
    byte[] nameBytes = Encoding.ASCII.GetBytes(name + "\0");
    sign.size_signature = nameBytes.Length;

    byte[] bcode;
    using (MemoryStream body = new MemoryStream())
    using (BinaryWriter writer = new BinaryWriter(body))
    {
        // j is the 1-based number of the current instruction within the procedure;
        // it is the same numbering PositionAnalyse uses for jump marks.
        int j = 1;
        for (int i = pos.start + 1; i < pos.end; i++)
        {
            current_str = code[i].Split(separators, StringSplitOptions.RemoveEmptyEntries);
            if (current_str.Length == 0)
            {
                throw new FormatException("Empty instruction line inside procedure '" + name + "'.");
            }

            // ToUpperInvariant: culture-sensitive upper-casing maps 'i' to a dotted
            // capital under Turkish settings, which would break every I* mnemonic.
            opcode current_opc = (opcode)Enum.Parse(typeof(opcode), current_str[0].ToUpperInvariant());
            writer.Write((byte)current_opc);

            if (current_opc == opcode.DLOAD)
            {
                writer.Write(Convert.ToDouble(current_str[1], invariant));
            }
            else if (current_opc == opcode.ILOAD)
            {
                writer.Write(Convert.ToInt64(current_str[1], invariant));
            }
            else if (current_opc == opcode.SLOAD)
            {
                writer.Write((ushort)dictStr[current_str[1]]);
            }
            else if (current_opc == opcode.CALL)
            {
                writer.Write(CRC16_alg(current_str[1]));
            }
            else if (threebytes.Contains(current_opc))
            {
                writer.Write(ushort.Parse(current_str[1], invariant));
            }
            else if (fivebytes.Contains(current_opc))
            {
                writer.Write(CRC16_alg(current_str[1]));
                writer.Write(ushort.Parse(current_str[2], invariant));
            }
            else if (jumps.Contains(current_opc))
            {
                writer.Write(FindOffset(code, pos, j, ((ushort)dictJmp[current_str[1]] - j)));
            }

            j++;
        }

        writer.Flush();
        bcode = body.ToArray();
    }

    sign.size_bytecode = bcode.Length;

    // 22 = 12 bytes of funcH_signature (three ints) + 10 bytes of funcH_bytecode
    // (one ushort and two ints).
    sign.size_func = 22 + sign.size_bytecode + sign.size_signature;

    bw.Write(sign.Serialize());
    bw.Write(nameBytes);
    bw.Write(bc.Serialize());
    bw.Write(bcode);
}
|
|||
|
|
|||
|
/// <summary>
/// Converts a jump distance expressed in instructions into a distance in bytes.
/// </summary>
/// <remarks>
/// For a forward jump (<paramref name="off"/> &gt; 0) the result is the total
/// encoded size of the instructions strictly between the jump and its target.
/// Otherwise the result is the negated total size of the instructions from the
/// target up to and including the jump itself.
/// </remarks>
/// <param name="code">Cleaned source lines.</param>
/// <param name="pos">Indices of the procedure's ".proc" and ".endp" lines in <paramref name="code"/>.</param>
/// <param name="curr_pos">1-based number of the jump instruction within the procedure.</param>
/// <param name="off">Target instruction number minus <paramref name="curr_pos"/>.</param>
/// <returns>The signed byte offset.</returns>
/// <exception cref="OverflowException">The byte offset does not fit into a 16-bit signed integer.</exception>
private static short FindOffset(List<string> code, pair pos, int curr_pos, int off)
{
    // Accumulate in int and narrow once at the end, so an offset that does not
    // fit the 16-bit operand is reported instead of silently wrapping around.
    int total = 0;

    if (off > 0)
    {
        for (int i = curr_pos + 1; i < curr_pos + off; i++)
        {
            string mnemonic = code[pos.start + i].Split(' ', '\t')[0];
            total += OpCodeSize((opcode)Enum.Parse(typeof(opcode), mnemonic.ToUpperInvariant()));
        }
    }
    else
    {
        for (int i = curr_pos; i >= curr_pos + off; i--)
        {
            string mnemonic = code[pos.start + i].Split(' ', '\t')[0];
            total -= OpCodeSize((opcode)Enum.Parse(typeof(opcode), mnemonic.ToUpperInvariant()));
        }
    }

    return checked((short)total);
}
|
|||
|
|
|||
|
/// <summary>
/// Returns the encoded size in bytes of an instruction, including its opcode byte.
/// </summary>
/// <param name="opc">The instruction's opcode.</param>
/// <returns>
/// 3 for members of <c>jumps</c> or <c>threebytes</c>, 5 for members of
/// <c>fivebytes</c>, 9 for members of <c>ninebytes</c>, and 1 for everything else.
/// </returns>
private static short OpCodeSize(opcode opc)
{
    if (jumps.Contains(opc) || threebytes.Contains(opc))
    {
        return 3;
    }

    if (fivebytes.Contains(opc))
    {
        return 5;
    }

    if (ninebytes.Contains(opc))
    {
        return 9;
    }

    return 1;
}
|
|||
|
|
|||
|
/// <summary>
/// Computes the 16-bit checksum used as a function identifier.
/// </summary>
/// <remarks>
/// The text is ASCII-encoded. Starting from 0xFFFF, each byte is XOR-ed into the
/// high half of the register, then eight times the register is shifted right by
/// one and, if the lowest bit after the shift is set, XOR-ed with 0xA001.
/// NOTE(review): this sequence differs from the common table-less CRC-16
/// formulations (the bit is tested after the shift). The resulting values are
/// written into the output file as function ids, so presumably the consumer
/// computes them the same way - do not "correct" the algorithm without
/// confirming that.
/// </remarks>
/// <param name="msg">Text to hash.</param>
/// <returns>The checksum; 0xFFFF for an empty string.</returns>
private static ushort CRC16_alg(string msg)
{
    const ushort polinom = 0xa001;
    ushort crc = 0xffff;

    foreach (byte symbol in Encoding.ASCII.GetBytes(msg))
    {
        crc = (ushort)(crc ^ (ushort)(symbol << 8));

        for (int bit = 0; bit < 8; bit++)
        {
            crc = (ushort)(crc >> 1);
            if ((crc & 0x01) != 0)
            {
                crc = (ushort)(crc ^ polinom);
            }
        }
    }

    return crc;
}
|
|||
|
|
|||
|
/*static List<opcode> onebyte = new List<opcode>{opcode.INVALID, opcode.DLOAD0, opcode.ILOAD0, opcode.SLOAD0, opcode.DLOAD1, opcode.ILOAD1, opcode.DLOADM1,
|
|||
|
opcode.ILOADM1, opcode.DADD, opcode.IADD, opcode.DSUB, opcode.ISUB, opcode.DMUL, opcode.IMUL, opcode.DDIV, opcode.IDIV, opcode.IMOD, opcode.DNEG,
|
|||
|
opcode.INEG, opcode.IAOR, opcode.IAAND, opcode.IAXOR, opcode.IPRINT, opcode.DPRINT, opcode.SPRINT, opcode.I2D, opcode.D2I, opcode.S2I, opcode.SWAP,
|
|||
|
opcode.POP, opcode.LOADDVAR0, opcode.LOADDVAR1, opcode.LOADDVAR2, opcode.LOADDVAR3, opcode.LOADIVAR0, opcode.LOADIVAR1, opcode.LOADIVAR2, opcode.LOADIVAR3,
|
|||
|
opcode.LOADSVAR0, opcode.LOADSVAR1, opcode.LOADSVAR2, opcode.LOADSVAR3, opcode.STOREDVAR0, opcode.STOREDVAR1, opcode.STOREDVAR2, opcode.STOREDVAR3,
|
|||
|
opcode.STOREIVAR0, opcode.STOREIVAR1, opcode.STOREIVAR2, opcode.STOREIVAR3, opcode.STORESVAR0, opcode.STORESVAR1, opcode.STORESVAR2, opcode.STORESVAR3,
|
|||
|
opcode.ICMP, opcode.DCMP, opcode.DUMP, opcode.STOP, opcode.RETURN, opcode.BREAK};*/
|
|||
|
|
|||
|
/// <summary>Opcodes encoded in 9 bytes: the opcode byte plus an 8-byte value (double or Int64).</summary>
private static readonly List<opcode> ninebytes = new List<opcode>
{
    opcode.DLOAD,
    opcode.ILOAD
};

/// <summary>Opcodes encoded in 3 bytes: the opcode byte plus one 16-bit operand.</summary>
private static readonly List<opcode> threebytes = new List<opcode>
{
    opcode.LOADDVAR,
    opcode.LOADIVAR,
    opcode.LOADSVAR,
    opcode.STOREDVAR,
    opcode.STOREIVAR,
    opcode.STORESVAR,
    opcode.SLOAD,
    opcode.CALL
};

/// <summary>Opcodes encoded in 5 bytes: the opcode byte plus two 16-bit operands.</summary>
private static readonly List<opcode> fivebytes = new List<opcode>
{
    opcode.LOADCTXDVAR,
    opcode.LOADCTXIVAR,
    opcode.LOADCTXSVAR,
    opcode.STORECTXDVAR,
    opcode.STORECTXIVAR,
    opcode.STORECTXSVAR
};

/// <summary>Jump opcodes, encoded in 3 bytes: the opcode byte plus a 16-bit signed byte offset.</summary>
private static readonly List<opcode> jumps = new List<opcode>
{
    opcode.JA,
    opcode.IFICMPE,
    opcode.IFICMPG,
    opcode.IFICMPGE,
    opcode.IFICMPL,
    opcode.IFICMPLE,
    opcode.IFICMPNE
};
|
|||
|
}
|
|||
|
|
|||
|
/// <summary>
/// Instruction set. The numeric value of each member is its position in this
/// list (starting at 0) and is what ByteCode.FuncAnalyse writes as the opcode
/// byte, so members must not be reordered, inserted or removed.
/// </summary>
enum opcode
{
    INVALID,

    // Loads with an inline or constant-table operand.
    DLOAD, ILOAD, SLOAD,

    // Loads without an operand.
    DLOAD0, ILOAD0, SLOAD0,
    DLOAD1, ILOAD1,
    DLOADM1, ILOADM1,

    // Arithmetic and bitwise operations.
    DADD, IADD,
    DSUB, ISUB,
    DMUL, IMUL,
    DDIV, IDIV,
    IMOD,
    DNEG, INEG,
    IAOR, IAAND, IAXOR,

    // Output.
    IPRINT, DPRINT, SPRINT,

    // Conversions.
    I2D, D2I, S2I,

    // Stack manipulation.
    SWAP, POP,

    // Variable access without an operand (slot number is part of the mnemonic).
    LOADDVAR0, LOADDVAR1, LOADDVAR2, LOADDVAR3,
    LOADIVAR0, LOADIVAR1, LOADIVAR2, LOADIVAR3,
    LOADSVAR0, LOADSVAR1, LOADSVAR2, LOADSVAR3,
    STOREDVAR0, STOREDVAR1, STOREDVAR2, STOREDVAR3,
    STOREIVAR0, STOREIVAR1, STOREIVAR2, STOREIVAR3,
    STORESVAR0, STORESVAR1, STORESVAR2, STORESVAR3,

    // Variable access with one 16-bit operand.
    LOADDVAR, LOADIVAR, LOADSVAR,
    STOREDVAR, STOREIVAR, STORESVAR,

    // Variable access with two 16-bit operands.
    LOADCTXDVAR, LOADCTXIVAR, LOADCTXSVAR,
    STORECTXDVAR, STORECTXIVAR, STORECTXSVAR,

    // Comparisons.
    DCMP, ICMP,

    // Jumps.
    JA,
    IFICMPNE, IFICMPE,
    IFICMPG, IFICMPGE,
    IFICMPL, IFICMPLE,

    // Miscellaneous.
    DUMP,
    STOP,
    CALL,
    RETURN,
    BREAK
}
|
|||
|
}
|