Tonksy-fmt
This commit is contained in:
parent
d6a547bdcb
commit
5d78d5f823
|
@ -1,29 +1,29 @@
|
|||
(ns ludus.parser
|
||||
(:require
|
||||
[ludus.token :as token]
|
||||
[ludus.scanner :as scanner]
|
||||
[ludus.ast :as ast]
|
||||
[clojure.pprint :as pp]))
|
||||
(:require
|
||||
[ludus.token :as token]
|
||||
[ludus.scanner :as scanner]
|
||||
[ludus.ast :as ast]
|
||||
[clojure.pprint :as pp]))
|
||||
|
||||
;; a parser map and some functions to work with them
|
||||
(defn- parser
  "Builds a fresh parser map for `tokens`: the token sequence itself, a
  cursor (`::token`) starting at index 0, and an empty `::ast`."
  [tokens]
  (assoc {}
         ::tokens tokens
         ::token 0
         ::ast {}))
|
||||
|
||||
(defn- current
  "Returns the token under the parser's cursor, or nil when the cursor
  points outside the token sequence."
  [parser]
  (let [{tokens ::tokens
         idx ::token} parser]
    (nth tokens idx nil)))
|
||||
|
||||
(defn- peek
  "Returns the token one position after the cursor without moving the
  cursor, or nil when that position is outside the token sequence."
  [parser]
  (let [next-idx (inc (::token parser))]
    (nth (::tokens parser) next-idx nil)))
|
||||
|
||||
(defn- at-end?
  "True when there is no current token, or when the current token's type
  is `::token/eof`."
  [parser]
  (let [tok (current parser)]
    (cond
      (nil? tok) true
      :else (= ::token/eof (::token/type tok)))))
|
||||
|
||||
(defn- advance
  "Returns the parser with its cursor moved forward by one token. Every
  other key of the parser map is left untouched."
  [parser]
  (assoc parser ::token (inc (::token parser))))
|
||||
|
||||
(defn- token-type
  "Returns the `::token/type` of the current token, or nil when there is
  no current token."
  [parser]
  (-> parser
      current
      ::token/type))
|
||||
|
||||
;; some forward declarations
|
||||
(declare parse-expr)
|
||||
|
@ -31,265 +31,265 @@
|
|||
|
||||
;; various parsing functions
|
||||
(defn- parse-atom
  "Consumes one token and sets the parser's `::ast` to an atom node whose
  `:value` is the `::token/literal` of `token`."
  [parser token]
  (let [node {::ast/type ::ast/atom
              :value (::token/literal token)}]
    (assoc (advance parser) ::ast node)))
|
||||
|
||||
;; just a quick and dirty map to associate atomic words with values
|
||||
(def atomic-words
  "Lookup table from the token type of an atomic word to the Clojure
  value it stands for."
  {::token/false false
   ::token/true true
   ::token/nil nil})
|
||||
|
||||
(defn parse-atomic-word
  "Consumes one token and sets the parser's `::ast` to an atom node whose
  `:value` is looked up in `atomic-words` by the type of `token`."
  [parser token]
  (let [value (atomic-words (::token/type token))]
    (assoc (advance parser)
           ::ast {::ast/type ::ast/atom
                  :value value})))
|
||||
|
||||
|
||||
(defn- add-member
  "Appends `member` to `members` unless `member` is nil, in which case
  `members` is returned unchanged."
  [members member]
  (cond-> members
    (some? member) (conj member)))
|
||||
|
||||
(defn- parse-tuple
  "Parses a parenthesised tuple. The cursor is expected to sit on the
  opening token, which is skipped. Members are separated by commas or
  newlines. On the closing `::token/rparen` the parser is returned with a
  tuple node (`:members` plus `:length`) in `::ast`.

  If the input ends before the closing paren, the parser is returned with
  a poison node instead of looping forever."
  [parser]
  (loop [parser (advance parser)
         members []
         current_member nil]
    (if (at-end? parser)
      ;; Without this guard the default branch below would keep calling
      ;; parse-expr past the end of the tokens and never terminate.
      (assoc parser ::ast {::ast/type ::ast/poison
                           :message "Unterminated tuple"})
      (case (::token/type (current parser))
        ::token/rparen
        (let [ms (add-member members current_member)]
          (assoc (advance parser) ::ast
                 {::ast/type ::ast/tuple
                  :length (count ms)
                  :members ms}))

        (::token/comma ::token/newline)
        (recur (advance parser) (add-member members current_member) nil)

        ;; Anything else starts a member expression. It is only added to
        ;; `members` once a separator or the closing paren is reached.
        (let [parsed (parse-expr parser)]
          (recur parsed members (::ast parsed)))))))
|
||||
|
||||
(defn- parse-list
  "Parses a bracketed list. The cursor is expected to sit on the opening
  token, which is skipped. Members are separated by commas or newlines.
  On the closing `::token/rbracket` the parser is returned with a list
  node (`:members`) in `::ast`.

  If the input ends before the closing bracket, the parser is returned
  with a poison node instead of looping forever."
  [parser]
  (loop [parser (advance parser)
         members []
         current_member nil]
    (if (at-end? parser)
      ;; Without this guard the default branch below would keep calling
      ;; parse-expr past the end of the tokens and never terminate.
      (assoc parser ::ast {::ast/type ::ast/poison
                           :message "Unterminated list"})
      (case (::token/type (current parser))
        ::token/rbracket
        (let [ms (add-member members current_member)]
          (assoc (advance parser) ::ast
                 {::ast/type ::ast/list
                  :members ms}))

        (::token/comma ::token/newline)
        (recur (advance parser) (add-member members current_member) nil)

        ;; Anything else starts a member expression. It is only added to
        ;; `members` once a separator or the closing bracket is reached.
        (let [parsed (parse-expr parser)]
          (recur parsed members (::ast parsed)))))))
|
||||
|
||||
(defn- parse-set
  "Parses a set literal. The cursor is expected to sit on the opening
  token, which is skipped. Members are separated by commas or newlines.
  On the closing `::token/rbrace` the parser is returned with a set node
  (`:members`, kept as a vector in source order) in `::ast`.

  If the input ends before the closing brace, the parser is returned with
  a poison node instead of looping forever."
  [parser]
  (loop [parser (advance parser)
         members []
         current_member nil]
    (if (at-end? parser)
      ;; Without this guard the default branch below would keep calling
      ;; parse-expr past the end of the tokens and never terminate.
      (assoc parser ::ast {::ast/type ::ast/poison
                           :message "Unterminated set"})
      (case (::token/type (current parser))
        ::token/rbrace
        (let [ms (add-member members current_member)]
          (assoc (advance parser) ::ast
                 {::ast/type ::ast/set
                  :members ms}))

        (::token/comma ::token/newline)
        (recur (advance parser) (add-member members current_member) nil)

        ;; Anything else starts a member expression. It is only added to
        ;; `members` once a separator or the closing brace is reached.
        (let [parsed (parse-expr parser)]
          (recur parsed members (::ast parsed)))))))
|
||||
|
||||
(defn- parse-block
  "Parses a brace-delimited block. The opening token is skipped, then
  expressions separated by semicolons or newlines are collected until
  `::token/rbrace`. An empty block yields a poison node, as does a second
  expression that follows another without a separator."
  [parser]
  (loop [state (advance parser)
         done []
         pending nil]
    (let [kind (::token/type (current state))]
      (cond
        ;; closing brace: finish the block, or poison it when it is empty
        (= kind ::token/rbrace)
        (let [node (if (or (seq done) (some? pending))
                     {::ast/type ::ast/block :exprs (add-member done pending)}
                     {::ast/type ::ast/poison :message "Blocks must have at least one expression"})]
          (assoc (advance state) ::ast node))

        ;; separator: commit the pending expression, if any
        (contains? #{::token/semicolon ::token/newline} kind)
        (recur (advance state) (add-member done pending) nil)

        ;; an expression is already pending and no separator followed it
        pending
        (assoc (advance state)
               ::ast {::ast/type ::ast/poison :message "Expected end of expression"})

        :else
        (let [parsed (parse-expr state)]
          (recur parsed done (::ast parsed)))))))
|
||||
|
||||
(defn- parse-script
  "Parses a whole script: expressions separated by semicolons or newlines
  are collected until `::token/eof`, at which point the parser is
  returned with a script node in `::ast`. An expression that follows
  another without a separator yields a poison node."
  [parser]
  (loop [state parser
         done []
         pending nil]
    (let [kind (::token/type (current state))]
      (cond
        ;; end of input: the cursor is not moved past the eof token
        (= kind ::token/eof)
        (assoc state
               ::ast {::ast/type ::ast/script :exprs (add-member done pending)})

        ;; separator: commit the pending expression, if any
        (contains? #{::token/semicolon ::token/newline} kind)
        (recur (advance state) (add-member done pending) nil)

        ;; an expression is already pending and no separator followed it
        pending
        (assoc (advance state)
               ::ast {::ast/type ::ast/poison :message "Expected end of expression"})

        :else
        (let [parsed (parse-expr state)]
          (recur parsed done (::ast parsed)))))))
|
||||
|
||||
(defn- parse-synthetic
  "Parses a synthetic expression: a run of keyword, word and tuple terms.
  Terms are collected in order until a token of any other type is seen,
  then the parser is returned with a synthetic node (`:terms`) in
  `::ast`."
  [parser]
  (loop [state parser
         acc []]
    (let [tok (current state)]
      (case (::token/type tok)
        ::token/keyword
        (let [term (::ast (parse-atom state tok))]
          (recur (advance state) (conj acc term)))

        ::token/word
        (let [term (::ast (parse-word state))]
          (recur (advance state) (conj acc term)))

        ;; a tuple spans several tokens, so continue from where it ended
        ::token/lparen
        (let [after (parse-tuple state)]
          (recur after (conj acc (::ast after))))

        (assoc state ::ast {::ast/type ::ast/synthetic :terms acc})))))
|
||||
|
||||
(defn- parse-word
  "Consumes one token and sets the parser's `::ast` to a word node whose
  `:word` is the `::token/lexeme` of the token that was current."
  [parser]
  (let [lexeme (::token/lexeme (current parser))
        node {::ast/type ::ast/word :word lexeme}]
    (assoc (advance parser) ::ast node)))
|
||||
|
||||
(defn- parse-pattern
  "Parses a pattern. A word token is parsed as a word; number, string and
  keyword tokens are parsed as atoms. Any other token is consumed and
  replaced by a poison node."
  [parser]
  (let [tok (current parser)
        kind (::token/type tok)]
    (cond
      (= ::token/word kind)
      (parse-word parser)

      (contains? #{::token/number ::token/string ::token/keyword} kind)
      (parse-atom parser tok)

      :else
      (assoc (advance parser)
             ::ast {::ast/type ::ast/poison :message "Expected pattern"}))))
|
||||
|
||||
(defn- expect
  "Consumes the current token. When its type equals `token` the advanced
  parser is returned with its `::ast` unchanged; otherwise the advanced
  parser is returned with a poison node carrying `message`."
  [token message parser]
  (let [moved (advance parser)]
    (if (= token (::token/type (current parser)))
      moved
      (assoc moved ::ast {::ast/type ::ast/poison :message message}))))
|
||||
|
||||
(defn- accept
  "Consumes the current token only when its type equals `token`;
  otherwise returns the parser unchanged."
  [token parser]
  (cond-> parser
    (= token (::token/type (current parser))) (advance)))
|
||||
|
||||
(defn- accept-many
  "Skips every consecutive token of type `token`, starting at the cursor,
  and returns the parser positioned on the first token of another type.
  Returns the parser unchanged when the current token does not match."
  [token parser]
  ;; Loop over the parser itself. Looping over the current token and
  ;; recurring with a parser never skips anything, because the original,
  ;; un-advanced parser is what ends up being returned.
  (loop [parser parser]
    (if (= token (::token/type (current parser)))
      (recur (advance parser))
      parser)))
|
||||
|
||||
|
||||
(defn- parse-let
  "Parses `let <pattern> = <expr>`. The cursor is expected to sit on the
  `let` token, which is skipped. Returns the parser positioned after the
  bound expression with a let node (`:pattern`, `:expr`) in `::ast`.

  If any step produced a poison node, the first such node is propagated
  in `::ast`, so callers always get a usable parser back rather than nil."
  [parser]
  (let [pattern (parse-pattern (advance parser))
        equals (expect ::token/equals "Expected assignment" pattern)
        expr (parse-expr equals)
        ;; earliest poison node among the intermediate results, if any
        poisoned (first (filter #(= ::ast/poison (::ast/type %))
                                (map ::ast [pattern equals expr])))]
    (assoc expr ::ast
           (or poisoned
               {::ast/type ::ast/let
                :pattern (::ast pattern)
                :expr (::ast expr)}))))
|
||||
|
||||
(defn- parse-if
  "Parses `if <expr> then <expr> else <expr>`. The cursor is expected to
  sit on the `if` token, which is skipped. A single newline is tolerated
  before `then` and before `else`. Returns the parser positioned after
  the else branch with an if node (`:if-expr`, `:then-expr`,
  `:else-expr`) in `::ast`.

  If any step produced a poison node, the first such node is propagated
  in `::ast`, so callers always get a usable parser back rather than nil."
  [parser]
  (let [if-expr (parse-expr (advance parser))
        then (expect ::token/then "Expected then" (accept ::token/newline if-expr))
        then-expr (parse-expr then)
        else (expect ::token/else "Expected else" (accept ::token/newline then-expr))
        else-expr (parse-expr else)
        ;; earliest poison node among the intermediate results, if any
        poisoned (first (filter #(= ::ast/poison (::ast/type %))
                                (map ::ast [if-expr then then-expr else else-expr])))]
    (assoc else-expr ::ast
           (or poisoned
               ;; tag the node as an `if`, not as a `let`
               {::ast/type ::ast/if
                :if-expr (::ast if-expr)
                :then-expr (::ast then-expr)
                :else-expr (::ast else-expr)}))))
|
||||
|
||||
(defn- parse-expr
  "Parses one expression, dispatching on the type of the current token.
  Keywords followed by `(`, and words followed by `(` or a keyword, are
  parsed as synthetic expressions. A token that cannot start an
  expression is consumed and replaced by a poison node."
  [parser]
  (let [tok (current parser)
        ;; type of the token after the current one, computed on demand
        following-type #(::token/type (peek parser))]
    (case (::token/type tok)
      (::token/string ::token/number)
      (parse-atom parser tok)

      ::token/keyword
      (if (= ::token/lparen (following-type))
        (parse-synthetic parser)
        (parse-atom parser tok))

      ::token/word
      (if (contains? #{::token/lparen ::token/keyword} (following-type))
        (parse-synthetic parser)
        (parse-word parser))

      (::token/false ::token/true ::token/nil)
      (parse-atomic-word parser tok)

      ::token/lparen (parse-tuple parser)

      ::token/lbracket (parse-list parser)

      ::token/startset (parse-set parser)

      ::token/lbrace (parse-block parser)

      ::token/let (parse-let parser)

      ::token/if (parse-if parser)

      (assoc (advance parser)
             ::ast {::ast/type ::ast/poison :message "Expected expression"}))))
|
||||
|
||||
(do
|
||||
(def source "if let foo = :foo
|
||||
(def source "if let foo = :foo
|
||||
then {
|
||||
bar (baz) :quux
|
||||
}
|
||||
|
@ -301,13 +301,13 @@
|
|||
(false, nil, ())
|
||||
]")
|
||||
|
||||
(def tokens (:tokens (scanner/scan source)))
|
||||
(def tokens (:tokens (scanner/scan source)))
|
||||
|
||||
(def p (parser tokens))
|
||||
(def p (parser tokens))
|
||||
|
||||
(-> (parse-script p)
|
||||
(::ast)
|
||||
(pp/pprint)))
|
||||
(-> (parse-script p)
|
||||
(::ast)
|
||||
(pp/pprint)))
|
||||
|
||||
(comment "
|
||||
Further thoughts/still to do:
|
||||
|
|
Loading…
Reference in New Issue
Block a user