Tidying up and polishing prior to publication.

This commit is contained in:
Simon Brooke 2013-11-09 08:51:04 +00:00
parent f9af58889e
commit 6d59b813de
4 changed files with 19 additions and 9 deletions

View file

@ -1,10 +1,10 @@
(defproject milkwood-clj "0.1.0-SNAPSHOT" (defproject milkwood-clj "0.1.0"
:description "Reimplementation of the Milkwood rule driven nonsense generator in Clojure" :description "Rule driven nonsense generator in Clojure"
:url "http://example.com/FIXME" :url "http://example.com/FIXME"
:license {:name "Eclipse Public License" :license {:name "Eclipse Public License"
:url "http://www.eclipse.org/legal/epl-v10.html"} :url "http://www.eclipse.org/legal/epl-v10.html"}
:dependencies [[org.clojure/clojure "1.5.1"] :dependencies [[org.clojure/clojure "1.5.1"]
[org.clojure/tools.cli "0.2.4"]] [org.clojure/tools.cli "0.2.4"]]
:main milkwood-clj.core
:jvm-opts ["-Xss4m"] :jvm-opts ["-Xss4m"]
:profiles {:uberjar {:aot :all}}) :profiles {:uberjar
{:main milkwood-clj.core :aot :all}})

View file

@ -4,6 +4,12 @@
[clojure.set :as set]) [clojure.set :as set])
(:gen-class)) (:gen-class))
(def token-pattern
"Regular expression used to split input into tokens."
;; #"\w+\'[stdm]|\w+|\p{Punct}"
#"\w+['-]\w+|\w+|\p{Punct}"
)
(defn compose-rule (defn compose-rule
"Compose a new rule tree (containing (obviously) only one rule) from this path. "Compose a new rule tree (containing (obviously) only one rule) from this path.
@ -57,6 +63,4 @@
depth: the depth of rules/length of window we're considering" depth: the depth of rules/length of window we're considering"
[file depth] [file depth]
(analyse-tokens nil nil (analyse-tokens nil nil
(map (re-seq token-pattern (slurp file)) depth))
(fn [string] (.toLowerCase string))
(re-seq #"\w+\'[stdm]|\w+|\p{Punct}" (slurp file))) depth))

View file

@ -10,7 +10,10 @@
(defn -main (defn -main
"Parse command line arguments and kick off the process." "Parse command line arguments and kick off the process."
[& args] [& args]
(let [[arguments _ banner] (cli args ["-f" "--file" "The path name of the file to analyse (string)"] (let [[arguments _ banner] (cli args
"Rule driven nonsense generator.
See http://codekata.pragprog.com/2007/01/kata_fourteen_t.html"
["-f" "--file" "The path name of the file to analyse (string)"]
["-l" "--output-length" ["-l" "--output-length"
"The length in tokens of the output to generate (integer)" "The length in tokens of the output to generate (integer)"
:parse-fn #(Integer. %) :parse-fn #(Integer. %)

View file

@ -4,7 +4,10 @@
(:gen-class)) (:gen-class))
(def end-magic-token "END") (def end-magic-token
"A token to mark the end of the generated test, used to
distinguish completion from failure."
"ENDMAGICTOKEN")
(defn next-tokens (defn next-tokens
"Given these rules and this path, return a list of valid next tokens to emit. "Given these rules and this path, return a list of valid next tokens to emit.