From 3b390967e7c2ee4ac6d1a67c77f40ed43005e012 Mon Sep 17 00:00:00 2001 From: tomsmeding Date: Sun, 20 Nov 2016 11:27:07 +0100 Subject: Initial --- .gitignore | 3 + Makefile | 26 ++++ ast.cpp | 244 ++++++++++++++++++++++++++++++++++++ ast.h | 85 +++++++++++++ environment.cpp | 383 ++++++++++++++++++++++++++++++++++++++++++++++++++++++++ environment.h | 34 +++++ error.cpp | 13 ++ error.h | 19 +++ global.h | 20 +++ indirect.cpp | 11 ++ indirect.h | 157 +++++++++++++++++++++++ main.cpp | 29 +++++ prelude.cpp | 68 ++++++++++ prelude.h | 6 + 14 files changed, 1098 insertions(+) create mode 100644 .gitignore create mode 100644 Makefile create mode 100644 ast.cpp create mode 100644 ast.h create mode 100644 environment.cpp create mode 100644 environment.h create mode 100644 error.cpp create mode 100644 error.h create mode 100644 global.h create mode 100644 indirect.cpp create mode 100644 indirect.h create mode 100644 main.cpp create mode 100644 prelude.cpp create mode 100644 prelude.h diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..740a324 --- /dev/null +++ b/.gitignore @@ -0,0 +1,3 @@ +*.o +*.dSYM +main diff --git a/Makefile b/Makefile new file mode 100644 index 0000000..591ace8 --- /dev/null +++ b/Makefile @@ -0,0 +1,26 @@ +CXX = g++ +CXXFLAGS = -Wall -Wextra -std=c++11 -fwrapv -Werror=switch +BIN = main +DEBUG = 1 +ifneq ($(DEBUG),) + CXXFLAGS += -g +else + CXXFLAGS += -O2 +endif + + +.PHONY: all clean remake + +all: $(BIN) + +clean: + rm -rf $(BIN) *.o *.dSYM + +remake: clean all + + +$(BIN): $(patsubst %.cpp,%.o,$(wildcard *.cpp)) + $(CXX) -o $@ $^ $(LDFLAGS) + +%.o: %.cpp $(wildcard *.h) + $(CXX) $(CXXFLAGS) -c -o $@ $< diff --git a/ast.cpp b/ast.cpp new file mode 100644 index 0000000..88d716a --- /dev/null +++ b/ast.cpp @@ -0,0 +1,244 @@ +#include +#include +#include "ast.h" + +using namespace std; + + +ParseError::ParseError(const string &what_arg) + :runtime_error(what_arg){} +ParseError::ParseError(const char *what_arg) + :runtime_error(what_arg){} + + +Lambda::Lambda(){} +Lambda::Lambda(const Name &arg,const AST &ast) + :arg(arg),body(ast){} + + +AST::AST() + :type(Type::tuple){} + +AST AST::makeNumber(Number numval){ + AST ast; ast.type=AST::Type::number; ast.numval=numval; return ast; +} +AST AST::makeString(String strval){ + AST ast; ast.type=AST::Type::string; ast.strval=strval; return ast; +} +AST AST::makeName(Name nameval){ + AST ast; ast.type=AST::Type::name; ast.nameval=nameval; return ast; +} +AST AST::makeIndex(Index indexval){ + AST ast; ast.type=AST::Type::index; ast.indexval=indexval; return ast; +} +AST AST::makeTuple(Terms terms){ + AST ast; ast.type=AST::Type::tuple; ast.terms=terms; return ast; +} +AST AST::makeLambda(Lambda lambdaval){ + AST ast; ast.type=AST::Type::lambda; ast.lambdaval=lambdaval; return ast; +} +AST AST::makeLambda(const Name &arg,const AST &body){ + AST ast; ast.type=AST::Type::lambda; ast.lambdaval.arg=arg; ast.lambdaval.body=body; return ast; +} +AST AST::makeNative(const Native &native){ + AST ast; ast.type=AST::Type::native; ast.nativeval=native; return ast; +} + + +bool iswordchar(char c){ + return isalpha(c)||isdigit(c)||strchr("!$%&*+,-./:;<=>?@^_|~",c)!=nullptr; +} + +class AST::Tokeniser{ + const string source; + const i64 size; + i64 index=0,nextat=0; + +public: + Tokeniser(const string &source) + :source(source),size(source.size()){ + // cerr<<"Tokeniser: initialised with <<"<>"<>"<>"<>"<1&&token[0]=='-'&&isdigit(token[1]))){ + // cerr<<"AST::parse: type = number"<=32&&c<=126){ + os< +#include +#include +#include +#include "global.h" +#include "indirect.h" + +using namespace std; + + +class AST; + + +using Number = i64; +using String = string; +using Name = string; +using Index = i64; +class Terms : public vector{ +public: + using vector::vector; + using vector::operator=; +}; +class Lambda{ +public: + Name arg; // if empty, then can only be referred to with indices + Indirect body=Indirect::makeEmpty(); + + Lambda(); + Lambda(const Name &arg,const AST &ast); +}; +using Native = function; + + + +class ParseError : public runtime_error{ +public: + explicit ParseError(const string &what_arg); + explicit ParseError(const char *what_arg); +}; + +class AST{ +public: + enum class Type{ + number, + string, + name, + index, + tuple, + lambda, + native, + }; + + Type type; + Number numval; + String strval; + Name nameval; + Index indexval; + Terms terms; + Lambda lambdaval; + Native nativeval; + + bool quoted=false; + +private: + class Tokeniser; + AST& parse(Tokeniser &tokeniser); + +public: + AST(); // initialises to nil value () + explicit AST(const string &source); // parses source + explicit AST(const char *source); // parses source + + static AST makeNumber(Number numval); + static AST makeString(String strval); + static AST makeName(Name nameval); + static AST makeIndex(Index indexval); + static AST makeTuple(Terms terms); + static AST makeLambda(Lambda lambdaval); + static AST makeLambda(const Name &arg,const AST &body); + static AST makeNative(const Native &native); +}; + +ostream& operator<<(ostream &os,const AST &ast); diff --git a/environment.cpp b/environment.cpp new file mode 100644 index 0000000..1d2c657 --- /dev/null +++ b/environment.cpp @@ -0,0 +1,383 @@ +#include +#include +#include "environment.h" +#include "error.h" + +using namespace std; + +#undef DEBUG + + +void Environment::load(const Environment &other){ + defs.insert(other.defs.begin(),other.defs.end()); + hooks.insert(other.hooks.begin(),other.hooks.end()); +} + +void Environment::define(const Name &name,const AST &ast){ + defs.insert({name,ast}); +} + +void Environment::define(const Name &name,const Hook &hook){ + hooks.insert({name,hook}); +} + +void Environment::define2(const Name &name,const Hook2 &hook2){ + hooks.insert({name,[hook2](Environment &env,const AST &arg1) -> AST { + return AST::makeNative([&env,arg1,hook2](const AST &arg2) -> AST { + return hook2(env,arg1,arg2); + }); + }}); +} + +AST Environment::get(const Name &name){ + auto it=defs.find(name); + if(it==defs.end()){ + auto it=hooks.find(name); + if(it==hooks.end()){ + throw NameError(name); + } + Hook hook=it->second; + return AST::makeNative([this,hook](const AST &ast){ + return hook(*this,ast); + }); + } + return it->second; +} + + +// ------------------------------------------------------------ + + +void indexReplace(AST &ast,const Name &name,Index index){ + if(ast.quoted){ + return; + } + + switch(ast.type){ + case AST::Type::number: + case AST::Type::string: + case AST::Type::index: + case AST::Type::native: + break; + + case AST::Type::name: + if(ast.nameval==name){ + ast.type=AST::Type::index; + ast.indexval=index; + } + break; + + case AST::Type::tuple: + for(AST &term : ast.terms){ + indexReplace(term,name,index); + } + break; + + case AST::Type::lambda: + if(ast.lambdaval.arg!=name){ + indexReplace(*ast.lambdaval.body,name,index+1); + } + break; + } +} + + +void indexify(AST &ast){ + if(ast.quoted){ + return; + } + + switch(ast.type){ + case AST::Type::number: + case AST::Type::string: + case AST::Type::name: + case AST::Type::index: + case AST::Type::native: + break; + + case AST::Type::tuple: + for(AST &term : ast.terms){ + indexify(term); + } + break; + + case AST::Type::lambda: + indexReplace(*ast.lambdaval.body,ast.lambdaval.arg,1); + ast.lambdaval.arg=""; + indexify(*ast.lambdaval.body); + break; + } +} + +void singlify(AST &ast){ + if(ast.quoted){ + return; + } + + switch(ast.type){ + case AST::Type::number: + case AST::Type::string: + case AST::Type::name: + case AST::Type::index: + case AST::Type::native: + break; + + case AST::Type::lambda: + singlify(*ast.lambdaval.body); + break; + + case AST::Type::tuple: + if(ast.terms.size()==0){ + break; + } + if(ast.terms.size()==1){ + AST newast=ast.terms[0]; + ast=newast; + singlify(ast); + break; + } + while(ast.terms.size()>2){ + AST two=AST::makeTuple({ast.terms[0],ast.terms[1]}); + ast.terms.erase(ast.terms.begin()+1); + ast.terms[0]=move(two); + } + if(ast.terms.size()==2){ + singlify(ast.terms[0]); + singlify(ast.terms[1]); + } + break; + } +} + + +AST Environment::run(const AST &astinput){ + AST ast(astinput); + indexify(ast); +#ifdef DEBUG + cerr<<"indexify gave "<> &nodes){ + if(ast.quoted){ + return; + } + + switch(ast.type){ + case AST::Type::number: + case AST::Type::string: + case AST::Type::name: + case AST::Type::native: + break; + + case AST::Type::index: + if(ast.indexval==index){ + nodes.emplace_back(&ast,index); + } + break; + + case AST::Type::tuple: + for(AST &term : ast.terms){ + recursiveFindLevel(term,index,nodes); + } + break; + + case AST::Type::lambda: + recursiveFindLevel(*ast.lambdaval.body,index+1,nodes); + break; + } +} + + +void increaseFree(AST &ast,Index amount,Index fromIndex){ + if(ast.quoted){ + return; + } + + switch(ast.type){ + case AST::Type::number: + case AST::Type::string: + case AST::Type::name: + case AST::Type::native: + break; + + case AST::Type::index: + if(ast.indexval>=fromIndex){ + ast.indexval+=amount; + } + break; + + case AST::Type::tuple: + for(AST &term : ast.terms){ + increaseFree(term,amount,fromIndex); + } + break; + + case AST::Type::lambda: + increaseFree(*ast.lambdaval.body,amount,fromIndex+1); + break; + } +} + + +bool hasFree(AST &ast,Index fromIndex){ + if(ast.quoted){ + return false; + } + + switch(ast.type){ + case AST::Type::number: + case AST::Type::string: + case AST::Type::native: + return false; + + case AST::Type::name: + return true; + + case AST::Type::index: + return ast.indexval>=fromIndex; + + case AST::Type::tuple: + for(AST &term : ast.terms){ + if(hasFree(term,fromIndex)){ + return true; + } + } + return false; + + case AST::Type::lambda: + return hasFree(*ast.lambdaval.body,fromIndex+1); + } +} + + +#ifdef DEBUG +static string indent(i64 depth){ + string s(2*depth,' '); + for(i64 i=0;i &p : repl){ + *p.first=ast.terms[1]; + increaseFree(*p.first,p.second-1,1); + } + newterm=ast.terms[0]; + ast=newterm; + success=true; + } else if(ast.terms[0].type==AST::Type::native){ + reduce(ast.terms[1],depth+1); + ast=ast.terms[0].nativeval(ast.terms[1]); + success=true; + } else if(ast.terms[0].type==AST::Type::name&&ast.terms[0].nameval=="do"){ + reduce(ast.terms[1],depth+1); + ast=ast.terms[0]; + success=true; + } else { + success=false; + } + +#ifdef DEBUG + cerr< "<0); + if(ast.type==AST::Type::name){ + // TODO: this is really dodgy; why is this necessary? + reduce(ast,depth+1); + } + break; + } +#ifdef DEBUG + cerr< "< +#include +#include +#include "ast.h" +#include "global.h" + +using namespace std; + + +class Environment{ +public: + using Hook = function; + using Hook2 = function; + +private: + unordered_map defs; + unordered_map hooks; + + void reduce(AST &ast,i64 depth=0); + bool betareduce(AST &ast,i64 depth); + +public: + void load(const Environment &other); + + AST run(const AST &ast); + + void define(const Name &name,const AST &ast); + void define(const Name &name,const Hook &hook); + void define2(const Name &name,const Hook2 &hook2); + + AST get(const Name &name); +}; diff --git a/error.cpp b/error.cpp new file mode 100644 index 0000000..2084319 --- /dev/null +++ b/error.cpp @@ -0,0 +1,13 @@ +#include "error.h" + +using namespace std; + +NameError::NameError(const string &what_arg) + :runtime_error("Name '"+what_arg+"' not found"){} +NameError::NameError(const char *what_arg) + :NameError(string(what_arg)){} + +TypeError::TypeError(const string &what_arg) + :runtime_error(what_arg){} +TypeError::TypeError(const char *what_arg) + :runtime_error(what_arg){} diff --git a/error.h b/error.h new file mode 100644 index 0000000..02aafec --- /dev/null +++ b/error.h @@ -0,0 +1,19 @@ +#pragma once + +#include +#include + +using namespace std; + + +class NameError : public runtime_error{ +public: + NameError(const string &what_arg); + NameError(const char *what_arg); +}; + +class TypeError : public runtime_error{ +public: + TypeError(const string &what_arg); + TypeError(const char *what_arg); +}; diff --git a/global.h b/global.h new file mode 100644 index 0000000..522dd1f --- /dev/null +++ b/global.h @@ -0,0 +1,20 @@ +#pragma once + +#include + +using i64 = int64_t; +using u64 = uint64_t; + +#define TYPESUBCLASS(parenttype,newtype) \ + class newtype : public parenttype{ \ + public: \ + using parenttype::parenttype; \ + using parenttype::operator=; \ + } + +#define TYPESUBCLASSTEMPLATE(parenttype,parenttemplate,newtype) \ + class newtype : public parenttype parenttemplate{ \ + public: \ + using parenttype parenttemplate::parenttype; \ + using parenttype parenttemplate::operator=; \ + } diff --git a/indirect.cpp b/indirect.cpp new file mode 100644 index 0000000..75d35be --- /dev/null +++ b/indirect.cpp @@ -0,0 +1,11 @@ +#include "indirect.h" + +using namespace std; + + +NullIndirectError::NullIndirectError() + :runtime_error("NullIndirectError()"){} +NullIndirectError::NullIndirectError(const string &what_arg) + :runtime_error(what_arg){} +NullIndirectError::NullIndirectError(const char *what_arg) + :runtime_error(what_arg){} diff --git a/indirect.h b/indirect.h new file mode 100644 index 0000000..da93955 --- /dev/null +++ b/indirect.h @@ -0,0 +1,157 @@ +#pragma once + +#include + +using namespace std; + + +class NullIndirectError : public runtime_error{ +public: + NullIndirectError(); + NullIndirectError(const string &what_arg); + NullIndirectError(const char *what_arg); +}; + + +template +class Indirect{ + T *ptr; + + class Dummy{}; + + Indirect(Dummy); + +public: + template + Indirect(Args... args); + + Indirect(const Indirect &other); + Indirect(Indirect &&other); + + ~Indirect(); + + Indirect& operator=(const T &value); + Indirect& operator=(T &&value); + + Indirect& operator=(const Indirect &other); + Indirect& operator=(Indirect &&other); + + bool isEmpty() const; + + T& operator*(); + const T& operator*() const; + + static Indirect makeEmpty(); +}; + +template +Indirect::Indirect(Dummy) + :ptr(nullptr){} + +template +Indirect Indirect::makeEmpty(){ + return Indirect(Indirect::Dummy()); +}; + + +template +template +Indirect::Indirect(Args... args) + :ptr(new T(args...)){} + +template +Indirect::Indirect(const Indirect &other){ + if(!other.ptr){ + ptr=nullptr; + } else { + ptr=new T(*other.ptr); + } +} + +template +Indirect::Indirect(Indirect &&other){ + if(!other.ptr){ + ptr=nullptr; + } else { + ptr=new T(move(*other.ptr)); + other.ptr=nullptr; + } +} + +template +Indirect::~Indirect(){ + if(ptr){ + delete ptr; + } +} + + +template +Indirect& Indirect::operator=(const T &value){ + if(!ptr){ + ptr=new T(value); + } else { + *ptr=value; + } + return *this; +} + +template +Indirect& Indirect::operator=(T &&value){ + if(!ptr){ + ptr=new T(value); + } else { + *ptr=value; + } + return *this; +} + + +template +Indirect& Indirect::operator=(const Indirect &other){ + if(ptr){ + delete ptr; + } + if(!other.ptr){ + ptr=nullptr; + } else { + ptr=new T(*other.ptr); + } + return *this; +} + +template +Indirect& Indirect::operator=(Indirect &&other){ + if(ptr){ + delete ptr; + } + if(!other.ptr){ + ptr=nullptr; + } else { + ptr=new T(move(*other.ptr)); + other.ptr=nullptr; + } + return *this; +} + + +template +bool Indirect::isEmpty() const { + return ptr!=nullptr; +} + +template +T& Indirect::operator*(){ + if(!ptr){ + throw NullIndirectError(); + } + return *ptr; +} + +template +const T& Indirect::operator*() const { + if(!ptr){ + throw NullIndirectError(); + } + return *ptr; +} diff --git a/main.cpp b/main.cpp new file mode 100644 index 0000000..1918874 --- /dev/null +++ b/main.cpp @@ -0,0 +1,29 @@ +#include +#include "ast.h" +#include "environment.h" +#include "error.h" +#include "prelude.h" + +using namespace std; + + +int main(){ + Environment env; + env.load(prelude); + // cerr<<"Global env = "<<&env< "; + while(getline(cin,line)){ + try { + AST parsed(line); + cerr<<"Parsed: "< "; + } + return 0; +} diff --git a/prelude.cpp b/prelude.cpp new file mode 100644 index 0000000..eb503b0 --- /dev/null +++ b/prelude.cpp @@ -0,0 +1,68 @@ +#include +#include +#include +#include "error.h" +#include "prelude.h" + +using namespace std; + + +Environment prelude; + +const AST afterBootstrap=AST(R"RAW( +(do + (def '. \f \g \x (f (g x))) + (def 'flip \f \a \b (f b a)) + (def 'id \x x) + (def 'const \x \y x) + (def 'print (. putstr repr))) +)RAW"); + +class PreludeInit{ +public: + PreludeInit(Environment &intoEnv){ + intoEnv.define("repr",AST::makeNative([](const AST &ast) -> AST { + stringstream ss; + ss< AST { + if(ast.type!=AST::Type::string){ + throw TypeError("Argument to 'putstr' is not a String"); + } + cout< AST { + return AST::makeNative([&env,arg1](const AST &arg2) -> AST { + if(arg1.type!=AST::Type::name){ + throw TypeError("First argument to 'def' is not a Name"); + } + env.define(arg1.nameval,arg2); + return AST(); + }); + }); + + intoEnv.define("do",AST::makeNative([](const AST&) -> AST { + throw logic_error("'do' stub called; this should not happen"); + })); + + intoEnv.define2("+",[](Environment&,const AST &arg1,const AST &arg2) -> AST { + if(arg1.type!=arg2.type){ + throw TypeError("Unequal types in '+'"); + } + if(arg1.type==AST::Type::number){ + return AST::makeNumber(arg1.numval+arg2.numval); + } else if(arg1.type==AST::Type::string){ + return AST::makeString(arg1.strval+arg2.strval); + } else { + throw TypeError("Arguments to '+' neither Number nor String"); + } + }); + + intoEnv.run(afterBootstrap); + } +} preludeInit(prelude); diff --git a/prelude.h b/prelude.h new file mode 100644 index 0000000..643eb43 --- /dev/null +++ b/prelude.h @@ -0,0 +1,6 @@ +#pragma once + +#include "environment.h" + + +extern Environment prelude; -- cgit v1.2.3-70-g09d2