This commit is contained in:
2025-10-11 23:42:21 +02:00
commit 0e549b6e0a
32 changed files with 584 additions and 0 deletions

201
Program.cs Normal file
View File

@ -0,0 +1,201 @@
using System;
using System.IO;
using System.Text;
using System.Collections.Generic;
class Program {
static int Main(string[] args) {
if (args.Length < 2) {
Console.WriteLine("Usage: StEmitter <input.st> <output.bin>");
return 1;
}
var input = File.ReadAllText(args[0]);
var parser = new StParser(input);
var prog = parser.ParseProgram();
var emitter = new BytecodeEmitter();
emitter.Compile(prog);
File.WriteAllBytes(args[1], emitter.BuildBinary());
Console.WriteLine($"Wrote {args[1]}: consts={emitter.ConstantsCount}, vars={emitter.VarCount}, code={emitter.CodeLength}");
return 0;
}
}
// === AST & TYPES ===
public enum VarType { Int8=1, Int16=2, Int32=3, Byte=4, Bool=5 }
public abstract class StNode{}
public class ProgramNode:StNode{ public List<VarDecl> Vars=new(); public List<Stmt> Stmts=new(); }
public class VarDecl:StNode{ public string Name; public VarType Type; public Expr? Init; }
public abstract class Stmt:StNode{}
public class AssignStmt:Stmt{ public string Target; public Expr Expr; }
public abstract class Expr:StNode{}
public class IntExpr:Expr{ public int Value; public IntExpr(int v){Value=v;} }
public class VarExpr:Expr{ public string Name; public VarExpr(string n){Name=n;} }
public class BinaryExpr:Expr{ public Expr L; public Expr R; public TokType Op; public BinaryExpr(Expr l,TokType op,Expr r){L=l;Op=op;R=r;} }
// === LEXER ===
public enum TokType { IDENT, INT, ASSIGN, SEMI, LPAREN, RPAREN, PLUS, MINUS, MUL, DIV, PROGRAM, VAR, END_VAR, END_PROGRAM, EOF }
public class Token { public TokType Type; public string Text; public Token(TokType t,string s){Type=t;Text=s;} }
public class StLexer {
private readonly string src; private int i;
public StLexer(string s){src=s;}
char Peek()=> i<src.Length?src[i]:'\0';
char Next()=> i<src.Length?src[i++]:'\0';
public Token NextToken(){
while(char.IsWhiteSpace(Peek())) Next();
if (Peek()=='\0') return new Token(TokType.EOF,"");
if (char.IsLetter(Peek())||Peek()=='_'){
var sb=new StringBuilder();
while(char.IsLetterOrDigit(Peek())||Peek()=='_') sb.Append(Next());
var s=sb.ToString();
switch(s.ToUpperInvariant()){
case "PROGRAM":return new Token(TokType.PROGRAM,s);
case "VAR":return new Token(TokType.VAR,s);
case "END_VAR":return new Token(TokType.END_VAR,s);
case "END_PROGRAM":return new Token(TokType.END_PROGRAM,s);
default:return new Token(TokType.IDENT,s);
}
}
if (char.IsDigit(Peek())){
var sb=new StringBuilder();
while(char.IsDigit(Peek())) sb.Append(Next());
return new Token(TokType.INT,sb.ToString());
}
if (Peek()==':'){ Next(); if(Peek()=='='){Next(); return new Token(TokType.ASSIGN,":=");} }
char c=Next();
return c switch {
';'=>new Token(TokType.SEMI,";"),
'('=>new Token(TokType.LPAREN,"("),
')'=>new Token(TokType.RPAREN,")"),
'+'=>new Token(TokType.PLUS,"+"),
'-'=>new Token(TokType.MINUS,"-"),
'*'=>new Token(TokType.MUL,"*"),
'/'=>new Token(TokType.DIV,"/"),
_=>throw new Exception($"Unexpected char '{c}'")
};
}
}
// === PARSER ===
public class StParser {
StLexer lex; Token cur;
public StParser(string s){lex=new StLexer(s);cur=lex.NextToken();}
void Next()=>cur=lex.NextToken();
void Expect(TokType t){if(cur.Type!=t)throw new Exception($"Expected {t}, got {cur.Type}");Next();}
public ProgramNode ParseProgram(){
var p=new ProgramNode();
Expect(TokType.PROGRAM);
if(cur.Type==TokType.IDENT) Next();
if(cur.Type==TokType.VAR){
Next();
while(cur.Type==TokType.IDENT) p.Vars.Add(ParseVarDecl());
Expect(TokType.END_VAR);
}
while(cur.Type!=TokType.END_PROGRAM&&cur.Type!=TokType.EOF)
p.Stmts.Add(ParseStmt());
Expect(TokType.END_PROGRAM);
return p;
}
VarDecl ParseVarDecl(){
string name=cur.Text; Expect(TokType.IDENT);
string tname=cur.Text.ToLowerInvariant(); Expect(TokType.IDENT);
VarType vt=tname switch {
"int8"=>VarType.Int8,"int16"=>VarType.Int16,"int32"=>VarType.Int32,
"byte"=>VarType.Byte,"bool"=>VarType.Bool,_=>throw new Exception($"Unknown type {tname}")
};
Expr? init=null;
if(cur.Type==TokType.ASSIGN){Next();init=ParseExpr();}
Expect(TokType.SEMI);
return new VarDecl{Name=name,Type=vt,Init=init};
}
Stmt ParseStmt(){
if(cur.Type==TokType.IDENT){
var n=cur.Text;Next();Expect(TokType.ASSIGN);
var e=ParseExpr();Expect(TokType.SEMI);
return new AssignStmt{Target=n,Expr=e};
}
throw new Exception($"Invalid stmt start {cur.Type}");
}
Expr ParseExpr(){return ParseAddSub();}
Expr ParseAddSub(){var l=ParseMulDiv();while(cur.Type==TokType.PLUS||cur.Type==TokType.MINUS){var op=cur.Type;Next();var r=ParseMulDiv();l=new BinaryExpr(l,op,r);}return l;}
Expr ParseMulDiv(){var l=ParsePrimary();while(cur.Type==TokType.MUL||cur.Type==TokType.DIV){var op=cur.Type;Next();var r=ParsePrimary();l=new BinaryExpr(l,op,r);}return l;}
Expr ParsePrimary(){
if(cur.Type==TokType.INT){int v=int.Parse(cur.Text);Next();return new IntExpr(v);}
if(cur.Type==TokType.IDENT){string n=cur.Text;Next();return new VarExpr(n);}
if(cur.Type==TokType.LPAREN){Next();var e=ParseExpr();Expect(TokType.RPAREN);return e;}
throw new Exception($"Unexpected token {cur.Type}");
}
}
// === BYTECODE EMITTER ===
public class BytecodeEmitter {
List<int> consts=new(); Dictionary<string,Symbol> syms=new(); List<byte> code=new();
class Symbol{public string Name;public VarType Type;public int Index;}
public int ConstantsCount=>consts.Count; public int VarCount=>syms.Count; public int CodeLength=>code.Count;
public void Compile(ProgramNode p){
int idx=0;
// Pass 1: Definiere Variablen (ohne Init)
foreach(var v in p.Vars)
syms[v.Name]=new Symbol{Name=v.Name,Type=v.Type,Index=idx++};
// Pass 2: Generiere Initialisierungscode
foreach(var v in p.Vars){
if(v.Init!=null){
EmitExpr(v.Init);
EmitByte(0x03); EmitU16((ushort)syms[v.Name].Index);
}
}
// Main-Code
foreach(var s in p.Stmts)
EmitStmt(s);
EmitByte(0xF0);
}
void EmitStmt(Stmt s){
if(s is AssignStmt a){
EmitExpr(a.Expr);
EmitByte(0x03); EmitU16((ushort)syms[a.Target].Index);
}
}
void EmitExpr(Expr e){
switch(e){
case IntExpr ie:
int ci=AddConst(ie.Value); EmitByte(0x01); EmitU16((ushort)ci); break;
case VarExpr ve:
if(!syms.ContainsKey(ve.Name))
throw new Exception($"Unknown variable {ve.Name}");
int vi=syms[ve.Name].Index; EmitByte(0x02); EmitU16((ushort)vi); break;
case BinaryExpr be:
EmitExpr(be.L); EmitExpr(be.R);
EmitByte(be.Op switch {
TokType.PLUS=>0x10, TokType.MINUS=>0x11, TokType.MUL=>0x12, TokType.DIV=>0x13,
_=>throw new Exception("bad op")
});
break;
default: throw new Exception("bad expr");
}
}
int AddConst(int v){int i=consts.IndexOf(v);if(i>=0)return i;consts.Add(v);return consts.Count-1;}
void EmitByte(byte b)=>code.Add(b);
void EmitU16(ushort v){code.Add((byte)(v&0xFF));code.Add((byte)(v>>8));}
public byte[] BuildBinary(){
using var ms=new MemoryStream();
var w=new BinaryWriter(ms);
w.Write(Encoding.ASCII.GetBytes("STBC"));
w.Write((ushort)1);
w.Write((ushort)consts.Count);
foreach(var c in consts) w.Write(c);
w.Write((ushort)syms.Count);
var types=new byte[syms.Count];
foreach(var kv in syms) types[kv.Value.Index]=(byte)kv.Value.Type;
foreach(var b in types) w.Write(b);
w.Write((ushort)code.Count); w.Write(code.ToArray());
return ms.ToArray();
}
}