123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188 |
- -module(scheme).
- -export([compile/1, lex/1, parse/1]).
- %%% CONSTANTS %%%
- % Mostly used for built-in Scheme functions.
- -define(PRELUDE, ["+", "-", "*", "/", "=", "<", ">", "<=", ">=",
- "cons", "list", "append", "car", "cdr", "map",
- "filter", "member", "list-ref"]).
- %%% LEXING %%%
- % Lex a string representing Scheme code into a list.
- lex(S) -> lists:filter(fun(Match) -> (Match /= "") and
- (re:run(Match, "[ \n]+") == nomatch) end,
- re:split(S, "(\()|(\))|(')|([^ \n()']+)", [{return, list}])).
- %%% PARSING %%%
- % String -> Regex -> Bool
- % true if Regex matches the entirety of Str; false otherwise.
- string_matches(Str, Regex) -> case re:run(Str, Regex, [{capture, first, list}]) of
- {match, [S]} -> S == Str;
- _ -> false
- end.
- % String -> Bool
- % true if Str consists entirely of number characters; false otherwise.
- is_number_string(Str) -> string_matches(Str, "[0-9]+").
- % [String] -> Heterogeneous List
- % Returns the tuple { Parsed, Unparsed } consisting of a deep list of
- % parsed tokens and a flat list of unparsed tokens.
- parse([]) -> [];
- parse(["(" | Rest]) -> parse_list(Rest);
- parse([")" | _]) -> error;
- parse(["'" | Rest]) -> case parse(Rest) of
- {Dat, R} ->
- {[{atom, "quote"}, Dat], R};
- error ->
- error
- end;
- parse([S | Rest]) -> case is_number_string(S) of
- true ->
- {{number, S}, Rest};
- false ->
- {{atom, S}, Rest}
- end.
- parse_list([]) -> {[], []};
- parse_list([")" | Rest]) -> {[], Rest};
- parse_list(S) -> case parse(S) of
- {L, R} -> case parse_list(R) of
- {List, Rest} -> {lists:append([L], List),
- Rest};
- error -> error
- end;
- error -> error
- end.
- %%% COMPILATION %%%
- % Char -> String
- % converts a Scheme character to an Erlang character for identifiers; converts
- % certain special characters to three-character equivalents.
- char_convert(C) -> case C of
- $* -> "_ml";
- $+ -> "_pl";
- $/ -> "_dv";
- $- -> "_mn";
- $_ -> "_us";
- $< -> "_lt";
- $> -> "_gt";
- $= -> "_eq";
- $! -> "_ex";
- $? -> "_qs";
- $: -> "_cn";
- X -> [X]
- end.
- % a -> Bool
- % Well; "string" is more properly "is a list of non-lists", which also (in this case)
- % includes strings and lists of integers indistinguishably. With that caveat--
- % recogizes whether something is a "string".
- is_string(S) ->
- is_list(S) and lists:foldl(fun(X, Y) -> X and Y end, true,
- lists:map(fun(X) -> not(is_list(X)) end, S)).
- % Heterogeneous List of Strings -> String
- deep_string_append(L) ->
- string:join(lists:map(fun(M) -> case is_string(M) of
- true -> M;
- false -> deep_string_append(M)
- end end, L),
- "").
- % String -> String
- % Convert a string representing a Scheme identifier to a string representing
- % an Erlang function identifier or an atom, i.e. lower-case
- to_erlang_atom([S|XS]) ->
- lists:foldr(fun(X, Y) -> X ++ Y end, "",
- lists:map(fun(C) -> char_convert(C) end,
- [string:to_lower(S)|XS]));
- to_erlang_atom({atom, X}) -> to_erlang_atom(X).
- % Convert a string representing a Scheme identifier to a string representing
- % an Erlang variable, i.e. upper-case.
- to_erlang_variable([S|XS]) ->
- lists:foldr(fun(X, Y) -> X ++ Y end, "",
- lists:map(fun(C) -> char_convert(C) end,
- [string:to_upper(S)|XS]));
- to_erlang_variable({atom, X}) -> to_erlang_variable(X).
- % Heterogeneous List -> String
- generate([{atom, "define"} |
- [ [Name | Args] | Body]], Vars, Variadics) ->
- [to_erlang_atom(Name),
- " ( ", string:join(
- lists:map(fun(X) -> to_erlang_variable(X) end, Args),
- " , "), " ) -> ",
- string:join(lists:map(fun(X) -> generate(X, Vars ++ Args, Variadics) end,
- Body), " ; "),
- " . "];
- generate([{atom, "lambda"} | [Args | Body]], Vars, Variadics) ->
- ["fun (",
- string:join(
- lists:map(fun(X) -> to_erlang_variable(X) end, Args),
- " , "),
- ") -> ",
- string:join(lists:map(fun(X) -> generate(X, Vars ++ Args, Variadics) end,
- Body), " ; "),
- "end"];
- generate([{atom, "if"}
- | [ Condition
- | [ Then_Case
- | [ Else_Case ]]]], Vars, Variadics) ->
- ["case scheme_prelude:is_true( ",
- generate(Condition, Vars, Variadics),
- ") of true -> ",
- generate(Then_Case, Vars, Variadics),
- " ; false -> ",
- generate(Else_Case, Vars, Variadics),
- " end "];
- generate([{atom, "quote"} | [Rest]], _, _) ->
- generate_quoted(Rest);
- generate([{atom, Func} | Args], Vars, Variadics) ->
- case lists:member(Func, Variadics) of
- true -> [generate({atom, Func}, Vars, Variadics),
- " ([ ",
- string:join(lists:map(fun(X) -> generate(X, Vars, Variadics) end, Args),
- [" , "]),
- " ]) "];
- false -> [generate({atom, Func}, Vars, Variadics),
- " ( ",
- string:join(lists:map(fun(X) -> generate(X, Vars, Variadics) end, Args),
- [" , "]),
- " ) "]
- end;
- generate({number, X}, _, _) -> [X];
- generate({atom, X}, Vars, _) ->
- [case lists:member(X, Vars) of
- true -> to_erlang_variable(X);
- false -> case lists:member(X, ?PRELUDE) of
- true -> ["scheme_prelude:", to_erlang_variable(X)];
- false -> to_erlang_variable(X)
- end
- end].
- generate_quoted({atom, X}) ->
- [to_erlang_atom(X)];
- generate_quoted({number, X}) ->
- [X];
- generate_quoted(List) ->
- [" [ ", string:join(lists:map(fun(X) -> generate_quoted(X) end,
- List), [" , "]),
- " ] "].
- % String -> String
- % Compiles a string representing Scheme code into a string representing an
- % Erlang module.
- compile(S) -> case parse_list(lex(S)) of
- {[X|_], _} -> deep_string_append(generate(X,
- [],
- ["-", "+", "*", "list"]));
- _ -> "NOTHING"
- end.
|