%classpath config resolver snapshots https://repository.apache.org/content/repositories/snapshots
%classpath config resolver vendredi https://repository.hellonico.info/repository/hellonico/
%classpath config resolver staging https://repository.apache.org/content/repositories/staging
Added new repo: snapshots Added new repo: vendredi Added new repo: staging
%classpath add mvn org.apache.mxnet.contrib.clojure clojure-mxnet-linux-cpu 1.4.0
%classpath add mvn origami origami 4.0.0-7
(require '[clojure.java.io :as io])
;; MXNet namespaces
(require '[org.apache.clojure-mxnet.image :as mx-img])
(require '[org.apache.clojure-mxnet.ndarray :as ndarray])
(require '[org.apache.clojure-mxnet.shape :as mx-shape])
;; OpenCV namespaces
(require '[opencv4.colors.rgb :as rgb])
(require '[opencv4.mxnet :as mx-cv])
(require '[opencv4.core :as cv])
(require '[opencv4.utils :as cvu])
(import org.opencv.core.Mat)
(import java.awt.image.DataBufferByte)
class java.awt.image.DataBufferByte
(defn download!
"Download `uri` and store it in `filename` on disk"
[uri filename]
(with-open [in (io/input-stream uri)
out (io/output-stream filename)]
(io/make-parents filename)
(io/copy in out)))
#'beaker_clojure_shell_130355d5-3a4d-45b3-b4dd-681b29f5432e/download!
;; Download a cat image from a `uri` and save it into `images/cat.jpg`
(download! "https://raw.githubusercontent.com/dmlc/web-data/master/mxnet/doc/tutorials/python/predict_image/cat.jpg" "images/cat.jpg")
;; Download a dog image from a `uri` and save it into `images/dog.jpg`
(download! "https://github.com/dmlc/web-data/blob/master/mxnet/doc/tutorials/python/predict_image/dog.jpg?raw=true" "images/dog.jpg")
null
(-> "images/dog.jpg"
;; Convert filename to NDArray
(mx-img/read-image {:to-rgb true}) ;; option :to-rgb, true by default
;; Resizing image to height = 400, width = 400
(mx-img/resize-image 400 400)
;; Convert to BufferedImage
(mx-img/to-image)
;; Saving BufferedImage to disk
(javax.imageio.ImageIO/write "jpg" (java.io.File. "test2.jpg")))
true
(defn mat->ndarray
"Convert a `mat` from OpenCV to an MXNet `ndarray`"
[mat]
(let [h (.height mat)
w (.width mat)
c (.channels mat)]
(-> mat
cvu/mat->flat-rgb-array
(ndarray/array [c h w]))))
(defn ndarray->mat
"Convert a `ndarray` to an OpenCV `mat`"
[ndarray]
(let [shape (mx-shape/->vec ndarray)
[h w _ _] (mx-shape/->vec (ndarray/shape ndarray))
bytes (byte-array shape)
mat (cv/new-mat h w cv/CV_8UC3)]
(.put mat 0 0 bytes)
mat))
#'beaker_clojure_shell_130355d5-3a4d-45b3-b4dd-681b29f5432e/ndarray->mat
(defn filename->ndarray!
"Convert an image stored on disk `filename` into an `ndarray`
`filename`: string representing the image on disk
`shape-vec`: is the actual shape of the returned `ndarray`
return: ndarray"
[filename shape-vec]
(-> filename
(cv/imread)
(mat->ndarray)))
#'beaker_clojure_shell_130355d5-3a4d-45b3-b4dd-681b29f5432e/filename->ndarray!
(defn draw-bounding-box!
"Draw bounding box on `img` given the `top-left` and `bottom-right` coordonates.
Add `label` when provided.
returns: nil"
[img {:keys [label top-left bottom-right]}]
(let [[x0 y0] top-left
[x1 y1] bottom-right
top-left-point (cv/new-point x0 y0)
bottom-right-point (cv/new-point x1 y1)]
(cv/rectangle img top-left-point bottom-right-point rgb/white 1)
(when label
(cv/put-text! img label top-left-point cv/FONT_HERSHEY_DUPLEX 1.0 rgb/white 1))))
#'beaker_clojure_shell_130355d5-3a4d-45b3-b4dd-681b29f5432e/draw-bounding-box!
(defn draw-predictions!
"Draw all predictions on an `img` passing `results` which is a collection
of bounding boxes data.
returns: nil"
[img results]
(doseq [{:keys [label top-left bottom-right] :as result} results]
(draw-bounding-box! img result)))
#'beaker_clojure_shell_130355d5-3a4d-45b3-b4dd-681b29f5432e/draw-predictions!
(require '[clojure.string :as string])
;; MXNet namespaces
(require '[org.apache.clojure-mxnet.module :as m])
(require '[org.apache.clojure-mxnet.ndarray :as ndarray])
;; OpenCV namespaces
(require '[opencv4.core :as cv])
(require '[opencv4.utils :as cvu])
java.io.FileNotFoundException: Could not locate org/apache/clojure_mxnet/module__init.class or org/apache/clojure_mxnet/module.clj on classpath. Please check that namespaces with dashes use underscores in the Clojure file name. at clojure.lang.RT.load(RT.java:463) at clojure.lang.RT.load(RT.java:426) at clojure.core$load$fn__6548.invoke(core.clj:6046) at clojure.core$load.invokeStatic(core.clj:6045) at clojure.core$load.doInvoke(core.clj:6029) at clojure.lang.RestFn.invoke(RestFn.java:408) at clojure.core$load_one.invokeStatic(core.clj:5848) at clojure.core$load_one.invoke(core.clj:5843) at clojure.core$load_lib$fn__6493.invoke(core.clj:5888) at clojure.core$load_lib.invokeStatic(core.clj:5887) at clojure.core$load_lib.doInvoke(core.clj:5868) at clojure.lang.RestFn.applyTo(RestFn.java:142) at clojure.core$apply.invokeStatic(core.clj:659) at clojure.core$load_libs.invokeStatic(core.clj:5925) at clojure.core$load_libs.doInvoke(core.clj:5909) at clojure.lang.RestFn.applyTo(RestFn.java:137) at clojure.core$apply.invokeStatic(core.clj:659) at clojure.core$require.invokeStatic(core.clj:5947) at clojure.core$require.doInvoke(core.clj:5947) at clojure.lang.RestFn.invoke(RestFn.java:408) at beaker_clojure_shell_a443d272_058c_4787_9d4d_a0e0eb8d09ba$eval161.invokeStatic(Unknown Source) at beaker_clojure_shell_a443d272_058c_4787_9d4d_a0e0eb8d09ba$eval161.invoke(Unknown Source) at clojure.lang.Compiler.eval(Compiler.java:7062) at clojure.lang.Compiler.load(Compiler.java:7514) at clojure.lang.Compiler.load(Compiler.java:7461) at clojure.core$load_reader.invokeStatic(core.clj:4053) at clojure.core$load_string.invokeStatic(core.clj:4055) at clojure.core$load_string.invoke(core.clj:4055) at beaker_clojure_shell_a443d272_058c_4787_9d4d_a0e0eb8d09ba$run_str_a443d272_058c_4787_9d4d_a0e0eb8d09ba.invokeStatic(Unknown Source) at beaker_clojure_shell_a443d272_058c_4787_9d4d_a0e0eb8d09ba$run_str_a443d272_058c_4787_9d4d_a0e0eb8d09ba.invoke(Unknown Source) at clojure.lang.Var.invoke(Var.java:381) at com.twosigma.beakerx.clojure.evaluator.ClojureEvaluator.runCode(ClojureEvaluator.java:164) at com.twosigma.beakerx.clojure.evaluator.ClojureCodeRunner.call(ClojureCodeRunner.java:47) at com.twosigma.beakerx.clojure.evaluator.ClojureCodeRunner.call(ClojureCodeRunner.java:28) at java.util.concurrent.FutureTask.run(FutureTask.java:266) at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1142) at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:617) at java.lang.Thread.run(Thread.java:745)
(require '[org.apache.clojure-mxnet.dtype :as d])
null
(def model-dir "model/")
(def h 224) ;; Image height
(def w 224) ;; Image width
(def c 3) ;; Number of channels: Red, Green, Blue
(defonce vgg-16-mod
(-> {:prefix (str model-dir "vgg16") :epoch 0}
(m/load-checkpoint)
;; Define the shape of input data and bind the name of the input layer
;; to "data"
(m/bind {:for-training false
:data-shapes [{:name "data" :shape [1 c h w]}]})))
(defonce inception-mod
(-> {:prefix (str model-dir "Inception-BN") :epoch 0}
(m/load-checkpoint)
;; Define the shape of input data and bind the name of the input layer
;; to "data"
(m/bind {:for-training false
:data-shapes [{:name "data" :shape [1 c h w]}]})))
#'beaker_clojure_shell_130355d5-3a4d-45b3-b4dd-681b29f5432e/inception-mod
(defonce image-net-labels
(-> (str model-dir "/synset.txt")
(slurp)
(string/split #"\n")))
;; ImageNet 1000 Labels check
(assert (= 1000 (count image-net-labels)))
java.lang.RuntimeException: No such namespace: string at clojure.lang.Util.runtimeException(Util.java:221) at clojure.lang.Compiler.resolveIn(Compiler.java:7269) at clojure.lang.Compiler.resolve(Compiler.java:7243) at clojure.lang.Compiler.analyzeSymbol(Compiler.java:7204) at clojure.lang.Compiler.analyze(Compiler.java:6752) at clojure.lang.Compiler.analyze(Compiler.java:6729) at clojure.lang.Compiler$InvokeExpr.parse(Compiler.java:3813) at clojure.lang.Compiler.analyzeSeq(Compiler.java:7005) at clojure.lang.Compiler.analyze(Compiler.java:6773) at clojure.lang.Compiler.analyzeSeq(Compiler.java:6991) at clojure.lang.Compiler.analyze(Compiler.java:6773) at clojure.lang.Compiler.access$300(Compiler.java:38) at clojure.lang.Compiler$DefExpr$Parser.parse(Compiler.java:595) at clojure.lang.Compiler.analyzeSeq(Compiler.java:7003) at clojure.lang.Compiler.analyze(Compiler.java:6773) at clojure.lang.Compiler.analyze(Compiler.java:6729) at clojure.lang.Compiler$BodyExpr$Parser.parse(Compiler.java:6100) at clojure.lang.Compiler.analyzeSeq(Compiler.java:7003) at clojure.lang.Compiler.analyze(Compiler.java:6773) at clojure.lang.Compiler.analyze(Compiler.java:6729) at clojure.lang.Compiler$IfExpr$Parser.parse(Compiler.java:2830) at clojure.lang.Compiler.analyzeSeq(Compiler.java:7003) at clojure.lang.Compiler.analyze(Compiler.java:6773) at clojure.lang.Compiler.analyzeSeq(Compiler.java:6991) at clojure.lang.Compiler.analyze(Compiler.java:6773) at clojure.lang.Compiler.analyze(Compiler.java:6729) at clojure.lang.Compiler$BodyExpr$Parser.parse(Compiler.java:6100) at clojure.lang.Compiler$LetExpr$Parser.parse(Compiler.java:6420) at clojure.lang.Compiler.analyzeSeq(Compiler.java:7003) at clojure.lang.Compiler.analyze(Compiler.java:6773) at clojure.lang.Compiler.analyze(Compiler.java:6729) at clojure.lang.Compiler$BodyExpr$Parser.parse(Compiler.java:6100) at clojure.lang.Compiler$FnMethod.parse(Compiler.java:5460) at clojure.lang.Compiler$FnExpr.parse(Compiler.java:4022) at clojure.lang.Compiler.analyzeSeq(Compiler.java:7001) at clojure.lang.Compiler.analyze(Compiler.java:6773) at clojure.lang.Compiler.eval(Compiler.java:7059) at clojure.lang.Compiler.load(Compiler.java:7514) at clojure.lang.Compiler.load(Compiler.java:7461) at clojure.core$load_reader.invokeStatic(core.clj:4053) at clojure.core$load_string.invokeStatic(core.clj:4055) at clojure.core$load_string.invoke(core.clj:4055) at beaker_clojure_shell_a443d272_058c_4787_9d4d_a0e0eb8d09ba$run_str_a443d272_058c_4787_9d4d_a0e0eb8d09ba.invokeStatic(Unknown Source) at beaker_clojure_shell_a443d272_058c_4787_9d4d_a0e0eb8d09ba$run_str_a443d272_058c_4787_9d4d_a0e0eb8d09ba.invoke(Unknown Source) at clojure.lang.Var.invoke(Var.java:381) at com.twosigma.beakerx.clojure.evaluator.ClojureEvaluator.runCode(ClojureEvaluator.java:164) at com.twosigma.beakerx.clojure.evaluator.ClojureCodeRunner.call(ClojureCodeRunner.java:47) at com.twosigma.beakerx.clojure.evaluator.ClojureCodeRunner.call(ClojureCodeRunner.java:28) at java.util.concurrent.FutureTask.run(FutureTask.java:266) at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1142) at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:617) at java.lang.Thread.run(Thread.java:745)
(defn preprocess-img-mat
"Preprocessing steps on an `img-mat` from OpenCV to feed into the Model"
[img-mat]
(-> img-mat
;; Resize image to (w, h)
(cv/resize! (cv/new-size w h))
;; Maps pixel values from [-128, 128] to [0, 127]
(cv/convert-to! cv/CV_8SC3 0.5)
;; Substract mean pixel values from ImageNet dataset
(cv/add! (cv/new-scalar -103.939 -116.779 -123.68))
;; Flatten matrix
(cvu/mat->flat-rgb-array)
;; Reshape to (1, c, h, w)
(ndarray/array [1 c h w])))
#'beaker_clojure_shell_1adc332d-8bd2-42c6-8038-38d33cd15c5d/preprocess-img-mat
(defn- top-k
"Return top `k` from prob-maps with :prob key"
[k prob-maps]
(->> prob-maps
(sort-by :prob)
(reverse)
(take k)))
(defn predict
"Predict with `model` the top `k` labels from `labels` of the ndarray `x`"
([model labels x]
(predict model labels x 5))
([model labels x k]
(let [probs (-> model
(m/forward {:data [x]})
(m/outputs)
(ffirst)
(ndarray/->vec))
prob-maps (mapv (fn [p l] {:prob p :label l}) probs labels)]
(top-k k prob-maps))))
#'beaker_clojure_shell_1adc332d-8bd2-42c6-8038-38d33cd15c5d/predict
(->> "images/cat.jpg"
(cv/imread)
(preprocess-img-mat)
(predict inception-mod image-net-labels))
(comment (->> "images/cat.jpg"
(cv/imread)
(preprocess-img-mat)
(predict vgg-16-mod image-net-labels)))
(defonce image-net-labels
(-> (str model-dir "/synset.txt")
(slurp)
(string/split #"\n")))
;; ImageNet 1000 Labels check
(assert (= 1000 (count image-net-labels)))
(defn preprocess-img-mat
"Preprocessing steps on an `img-mat` from OpenCV to feed into the Model"
[img-mat]
(-> img-mat
;; Resize image to (w, h)
(cv/resize! (cv/new-size w h))
;; Maps pixel values from [-128, 128] to [0, 127]
(cv/convert-to! cv/CV_8SC3 0.5)
;; Substract mean pixel values from ImageNet dataset
(cv/add! (cv/new-scalar -103.939 -116.779 -123.68))
;; Flatten matrix
(cvu/mat->flat-rgb-array)
;; Reshape to (1, c, h, w)
(ndarray/array [1 c h w])))
First getting the dependencies from maven (might take some time, so one has to wait until the final output before going further).
%classpath add mvn rhizome rhizome 0.2.9
%classpath add mvn instaparse instaparse 1.4.9
;; with leiningen one would have a project.clj with
;;
;;(defproject languages "0.1.0-SNAPSHOT"
;; :description "FIXME: write description"
;; :url "http://example.com/FIXME"
;; :license {:name "Eclipse Public License"
;; :url "http://www.eclipse.org/legal/epl-v10.html"}
;; :dependencies [[org.clojure/clojure "1.8.0"]
;; [instaparse "1.4.9"]
;; [rhizome "0.2.9"]])
null
If we only ever wanted to parse integers, of course we would just use Integer.pasreInt()
or actually Long.parseLong()
. However, as this is just a stepping stone to more interesting languages, we will use the same infrastructure of parsing and then interpreting or compiling.
When represented as a string of characters, integers are a string of one or more digits possibly prefixed by a minus sign for negative numbers.
One could write the following parsing rule using only literal terminals :
number= '-'? ('0'|'1'|'2'|'3'|'4'|'5'|'6'|'7'|'8'|'9')+
Note that this will accept leading zeros while we could also want to forbid them.
Parsing the string "-123"
would give the following result :[:number "-" "1" "2" "3"]
So it would be up to the AST processing step to collate those strings before turning them into a number.
In order to speed both the parsing and the processing of our numbers, we can /tokenize/ them with a regular expression instead :
NUMBER= #'-?[0-9]+'
In Clojure, we can build the parser using the instaparse library :
(use 'instaparse.core)
(def const-parser
(instaparse.core/parser
"PROG= NUMBER
NUMBER= #'-?[0-9]+'"))
(prn (const-parser "-123"))
[:PROG [:NUMBER "-123"]]
null
(System/setProperty "java.awt.headless" "true");; required for the notebook
(use 'rhizome.viz)
(instaparse.core/visualize (const-parser "-256") :output-file :buffered-image )
But this minimal parser fails to parse strings that we would want to consider valid :
(prn (const-parser " -123456 "))
Parse error at line 1, column 1: -123456 ^ Expected: #"-?[0-9]+" (followed by end-of-string)
null
As we want to handle spaces before and after the number, we have to modify the grammar accordingly. For efficiency reasons, we also handle the plurality of consecutive spaces at the lexing stage with a regular expression :
(def const-parser
(instaparse.core/parser
"prog= spaces number spaces
number=#'-?[0-9]+'
<spaces> = <#'[ ]'*>"))
(instaparse.core/visualize (const-parser " -123456 ") :output-file :buffered-image )
Exercice : What if we remove the angle brackets in the grammar rules ?
The simplest interpreter would be something like :
(defn const-interpreter [ast]
(instaparse.core/transform {:number #(Long/parseLong %)} ast))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/const-interpreter
(prn (-> "-123" const-parser const-interpreter))
[:prog -123]
null
However, as we will want reuse code between the various languages, we will separate the language specific transform map and a generic function to turn an AST into a clojure function.
The generic function taking a transform map and returning the function turning an AST into a clojure function :
(defn dynamic-eval [interpreter]
(fn[ast]
(fn[]
(instaparse.core/transform interpreter ast))))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/dynamic-eval
We can use this function for our const language to create a const-eval
function that will turn an AST into a clojure function:
(def const-interpreting
{:prog identity
:number #(Long/parseLong %)})
(def const-eval (dynamic-eval const-interpreting))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/const-eval
This function can be called on the result of parsing a string :
(def const-eval-test (-> "-123 " const-parser const-eval))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/const-eval-test
The result can then be called like any other clojure function :
(const-eval-test)
-123
The compiler will be implemented in two steps :
As we will be processing an AST, we can do this with a transform map :
(def const-compiling
{:prog (fn[& instrs](conj (reduce into [[:loadi 0]] instrs)[:reti]))
:number #(vector [:loadi (Long/parseLong %)])})
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/const-compiling
The first [:loadi 0]
will be useful when we allow empty programs : we will
then always have a 0 on the stack, to return if nothing has been put on the
stack by the program.
(prn (->> "-123" const-parser (instaparse.core/transform const-compiling)))
[[:loadi 0] [:loadi -123] [:reti]]
null
The actual bytecode will be generated by reducing a function over our sequence of bytecode instructions, calling the relevant method from a MethodVisitor object. The simplest way to implement it is the following :
(import '(clojure.asm Opcodes Type ClassWriter))
(import '(clojure.asm.commons Method GeneratorAdapter))
class clojure.asm.commons.GeneratorAdapter
(defn const-instr-generating [mv instr]
"Generate the method call to an org.objectweb.asm.MethodVisitor for a given instruction."
(do
(condp = (first instr)
:loadi (.visitLdcInsn mv (int (second instr)))
:reti (.visitInsn mv Opcodes/IRETURN)
)
mv))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/const-instr-generating
A compiled
function will take care of creating class with a given class name,
generating the bytecode in a static method called run
and returning a clojure
function calling the static method. We will be forward thinking by taking a
number of arguments as a parameter, even if this argument will be 0 for all of
our languages until lang1. The bytecode-generator
will be a function calling
the reducing function over the sequence of bytecode instructions, taking the
MethodVisitor
as argument :
(defn compiled [n-args class-name bytecode-generator]
(let [cw (ClassWriter. (+ ClassWriter/COMPUTE_FRAMES ClassWriter/COMPUTE_MAXS ))
init (Method/getMethod "void <init>()")
meth-name "run"
meth-sig (str "(" (apply str (repeat n-args "I")) ")I")]
(.visit cw Opcodes/V1_6 Opcodes/ACC_PUBLIC (.replace class-name \. \/) nil "java/lang/Object" nil)
(doto (GeneratorAdapter. Opcodes/ACC_PUBLIC init nil nil cw)
(.visitCode)
(.loadThis)
(.invokeConstructor (Type/getType Object) init)
(.returnValue)
(.endMethod))
(doto (.visitMethod cw (+ Opcodes/ACC_PUBLIC Opcodes/ACC_STATIC) meth-name meth-sig nil nil )
(.visitCode)
(bytecode-generator)
(.visitMaxs 0 0 )
(.visitEnd))
(.visitEnd cw)
(let [b (.toByteArray cw)
cl (clojure.lang.DynamicClassLoader.)]
(.defineClass cl class-name b nil))
(fn [& args] (clojure.lang.Reflector/invokeStaticMethod class-name meth-name (into-array args))))
)
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/compiled
It can be used in a bytecode-generating-eval
function to create a compiler
that will take an ast as argument and return the function created with compiled
:
(defn bytecode-generating-eval [n-args class-name compiling instr-generating]
(fn[ast]
(let[instrs (instaparse.core/transform compiling ast)
generate-prog (fn[mv] (reduce instr-generating mv instrs))]
(compiled n-args class-name generate-prog))))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/bytecode-generating-eval
Using this function for our const language would be :
(def const-compiler (bytecode-generating-eval 0 "ConstCompiler" const-compiling const-instr-generating))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/const-compiler
Such a compiler can then be used like :
(def const-compiler-test (-> "-123" const-parser const-compiler ))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/const-compiler-test
And the resulting function is a normal clojure function :
(const-compiler-test)
-123
The const-instr-generating
function defined above works perfectly fine. In
order to define other languages, we could just replace it with new functions
adding cases to the condp
expression. However, it can also be rewritten to be
extended rather than replaced, by using dynamic dispatching on the instruction
type. This can easily be done in clojure with a multimethod. A dispatching
implementation could use a generate-instr
multimethod :
(defmulti generate-instr (fn [mv [instr & args]] instr))
(defn dispatching-bytecode-generating-eval [n-args class-name compiling]
(fn[ast]
(let[instrs (instaparse.core/transform compiling ast)
generate-prog (fn[mv] (reduce generate-instr mv instrs))]
(compiled n-args class-name generate-prog))))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/dispatching-bytecode-generating-eval
The generate-instr
multimethod is defined as dispatching according to the
value of the first element of the vector argument (which will be the keyword
indicating the kind of bytecode instruction).
For our const language, we only need two implementation mirroring the two
cases of the condp
in const-instr-generating
:
(defmethod generate-instr :loadi [mv [instr & args]]
(doto mv
(.visitLdcInsn (int (first args)))))
(defmethod generate-instr :reti [mv [instr & args]]
(doto mv
(.visitInsn Opcodes/IRETURN)))
clojure.lang.MultiFn@15db8da9
The new implementation is called exactly in the same way :
(def const-compiler (dispatching-bytecode-generating-eval 0 "ConstCompiler" const-compiling))
(def const-compiler-test (-> "-123" const-parser const-compiler))
(const-compiler-test)
-123
(def addsub-parser
(instaparse.core/parser
"prog= spaces add-sub spaces
<add-sub>= number | add | sub
add= add-sub spaces <'+'> spaces number
sub= add-sub spaces <'-'> spaces number
number= #'-?[0-9]+'
<spaces>= <#'\\s*'>"))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/addsub-parser
The parser can be used on a sample string :
(-> "1+2-3-1" addsub-parser (instaparse.core/visualize :output-file :buffered-image ))
We can define our interpreting transform map by adding the functions to process
the new :add
and :sub
nodes in the AST :
(def addsub-interpreting
(assoc const-interpreting :add + :sub -))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/addsub-interpreting
We can then reuse our previous functions :
(def addsub-eval (dynamic-eval addsub-interpreting))
(def addsub-eval-test (-> "1+2-3-1" addsub-parser addsub-eval))
(addsub-eval-test)
-1
The bytecode sequence for a binary operation is the concatenation of the
bytecode sequence for the first operand, the bytecode sequence for the second
operand, and the specific bytecode for the given operation. We define a function
assoc-binary-op
to add such function to a transform map turning an AST into a
sequence of bytecode instructions. The op
argument is the AST node and the
instr
argument is the keyword representing bytecode instruction :
(defn assoc-binary-op [m [op instr]]
(let[binary-op-compiling (fn[op]
(fn[instrs-v0 instrs-v1]
(conj (into instrs-v0 instrs-v1) [op])))]
(assoc m op (binary-op-compiling instr))))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/assoc-binary-op
We can use it to create our addsub
transform map :
(def addsub-compiling
(reduce assoc-binary-op const-compiling [[:add :addi][:sub :subi]]))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/addsub-compiling
We can test it :
(str (->> "1+2-3-1" addsub-parser (instaparse.core/transform addsub-compiling)))
[[:loadi 0] [:loadi 1] [:loadi 2] [:addi] [:loadi 3] [:subi] [:loadi 1] [:subi] [:reti]]
We just have to add the multimethod definitions for the new instructions :
(defmethod generate-instr :addi [mv [instr & args]]
(doto mv
(.visitInsn Opcodes/IADD)))
(defmethod generate-instr :subi [mv [instr & args]]
(doto mv
(.visitInsn Opcodes/ISUB)))
clojure.lang.MultiFn@15db8da9
The addsub compiler can then be created reusing our previous functions :
(def addsub-compiler (dispatching-bytecode-generating-eval 0 "AddsubCompiler" addsub-compiling))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/addsub-compiler
We can use it as usual :
(def addsub-compiler-test (-> "1+ 2 - 3 - 1" addsub-parser addsub-compiler))
(addsub-compiler-test)
-1
(def addmult-parser
(instaparse.core/parser
"prog= spaces add-sub spaces
<add-sub>= mult-div | add | sub
add= add-sub spaces <'+'> spaces mult-div
sub= add-sub spaces <'-'> spaces mult-div
<mult-div>= number | mult | div
mult= mult-div spaces <'*'> spaces number
div= mult-div spaces <'/'> spaces number
number= #'-?[0-9]+'
<spaces>= <#'\\s*'>"))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/addmult-parser
We can use this parser on a sample program :
(-> "1 + 3 * -2 -1" addmult-parser (instaparse.core/visualize :output-file :buffered-image ))
We can add the new AST node types to the transform map :
(def addmult-interpreting (assoc addsub-interpreting :mult * :div /))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/addmult-interpreting
And reuse our previous functions :
(def addmult-eval (dynamic-eval addmult-interpreting ))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/addmult-eval
The interpreter can be used as usual :
(def addmult-eval-test (-> "1 + 3 * -2 -1" addmult-parser addmult-eval))
(addmult-eval-test)
-6
We can easily add the two new binary operations :
(def addmult-compiling
(reduce assoc-binary-op addsub-compiling [[:mult :multi][:div :divi]]))
(defmethod generate-instr :multi [mv [instr & args]]
(doto mv
(.visitInsn Opcodes/IMUL)))
(defmethod generate-instr :divi [mv [instr & args]]
(doto mv
(.visitInsn Opcodes/IDIV)))
clojure.lang.MultiFn@15db8da9
And then reuse the previous functions :
(def addmult-compiler (dispatching-bytecode-generating-eval 0 "AddmultCompiler" addmult-compiling))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/addmult-compiler
This compiler can be used as usual :
(def addmult-compiler-test (-> "1 + 3 * -2 - 1" addmult-parser addmult-compiler))
(addmult-compiler-test)
-6
(def arith-parser
(instaparse.core/parser
"prog = spaces add-sub spaces
<add-sub> = mult-div | add | sub
add = add-sub spaces <'+'> spaces mult-div
sub = add-sub spaces <'-'> spaces mult-div
<mult-div> = term | mult | div
mult = mult-div spaces <'*'> spaces term
div = mult-div spaces <'/'> spaces term
<term> = number | <'('> add-sub <')'>
<spaces> = <#'\\s'*>
number = #'-?[0-9]+'"))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/arith-parser
We can use this grammar on a sample program :
(-> "(1 + 3) * -2 -1" arith-parser (instaparse.core/visualize :output-file :buffered-image ))
The AST containts exactly the same kind of nodes as for the addmult language (neither the new (
and )
symbols nor the new term
rule produce any node), so the interpreter is exactly the same:
(def arith-eval-test (-> "(1 + 3) * -2 -1" arith-parser addmult-eval))
(arith-eval-test)
-9
For exactly the same reason, the compiler is exactly the same as the addmult compiler:
(def arith-compiler-test (-> "1 + 3 * (-2 - 1)" arith-parser addmult-compiler))
(arith-compiler-test)
-8
We update the parser to define :
varget
or assignments (the value of the assignment expression is the assigned value)(def lang0-parser
(instaparse.core/parser
"prog = (spaces expr spaces <';'> spaces)*
<expr> = assig | add-sub
assig = varname spaces <'='> spaces expr
<add-sub> = mult-div | add | sub
add = add-sub spaces <'+'> spaces mult-div
sub = add-sub spaces <'-'> spaces mult-div
<mult-div> = factor | mult |div
mult = mult-div spaces <'*'> spaces factor
div = mult-div spaces <'/'> spaces factor
<factor> = number | <'('> spaces expr spaces <')'> | varget |assig
<spaces> = <#'\\s*'>
number = #'-?[0-9]+'
varget = varname
varname = #'[a-zA-Z]\\w*'"))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/lang0-parser
The parser can be used on a sample program :
(-> "a=1+1*3;b=a-2; a+b;" lang0-parser (instaparse.core/visualize :output-file :buffered-image ))
Now, our interpreter must be able to access an environment, so that assignments
can have an effect. This environment is a map, mapping from variable names (as
keywords) to values, with a special key :_ret
for the current value of an
expression. When evaluating the nodes of an AST with a transform map, each node
will evaluate to the new environment. The first transform map just reduces the actual
transform map over the environment :
(defn make-interpreting [make-instr-interpreting init-env]
{:prog (fn [& instrs] (:_ret (reduce
(fn[env instr]
(instaparse.core/transform (make-instr-interpreting env) instr))
init-env
instrs)))})
(defn make-lang0-instr-interpreting [env]
{ :assig (fn[{varname :_ret :as env1} {value :_ret :as env2}]
(assoc (merge env1 env2) varname value :_ret value))
:add (fn[{v1 :_ret :as env1} {v2 :_ret :as env2}]
(assoc (merge env1 env2) :_ret (+ v1 v2)))
:sub (fn[{v1 :_ret :as env1} {v2 :_ret :as env2}]
(assoc (merge env1 env2) :_ret (- v1 v2)))
:mult (fn[{v1 :_ret :as env1} {v2 :_ret :as env2}]
(assoc (merge env1 env2) :_ret (* v1 v2)))
:div (fn[{v1 :_ret :as env1} {v2 :_ret :as env2}]
(assoc (merge env1 env2) :_ret (quot v1 v2)))
:number #(assoc env :_ret (Integer/parseInt %))
:varname #(assoc env :_ret (keyword %))
:varget (fn [{varname :_ret :as env1}]
(assoc env1 :_ret (varname env1)))})
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/make-lang0-instr-interpreting
We can reuse the previous functions :
(def lang0-interpret (dynamic-eval (make-interpreting make-lang0-instr-interpreting {:_ret 0})))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/lang0-interpret
And test our interpreter as usual:
(def lang0-interpret-test (->> "a=1+1*3;b=a-2; a+b;" lang0-parser lang0-interpret))
(lang0-interpret-test)
6
We update the transform map :
(def lang0-compiling
(assoc addmult-compiling
:varget #(vector [:load %])
:assig (fn[var instrs](conj instrs [:store var]))))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/lang0-compiling
But we also have to replace variable names with numbers (the JVM bytecode numbers arguments and local variables in the order they appear in a method). We are forward thinking by taking a =nb-args= argument even if for now we will number our variables starting with 0.
(use 'clojure.set)
;; helper function that replaces all the values in map m with the given value v
(defn replace-vals [m v]
(into {} (map vector (keys m) (repeat v ))))
(defn to-numeric-vars[nb-args ast]
(let[varnames
(instaparse.core/transform
(assoc (replace-vals
lang0-compiling
(fn[& instrs] (apply clojure.set/union (filter set? instrs))))
:varname (fn[varname]#{varname}))
ast)
name->num (into {} (map vector varnames (iterate inc nb-args)))]
(instaparse.core/transform {:varname #(get name->num %)} ast)))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/to-numeric-vars
We can test this helper function :
(str (->> "a=1+1*3;b=a-2; a+b;" lang0-parser (to-numeric-vars 0)))
[:prog [:assig 0 [:add [:number "1"] [:mult [:number "1"] [:number "3"]]]] [:assig 1 [:sub [:varget 0] [:number "2"]]] [:add [:varget 0] [:varget 1]]]
And see how it works when called before compiling to bytecode representation :
(str (->> "a=1+1*3;b=a-2; a+b;" lang0-parser (to-numeric-vars 0) (instaparse.core/transform lang0-compiling)))
[[:loadi 0] [:loadi 1] [:loadi 1] [:loadi 3] [:multi] [:addi] [:store 0] [:load 0] [:loadi 2] [:subi] [:store 1] [:load 0] [:load 1] [:addi] [:reti]]
We also have to provide the new implementations for the generate-instr
multimethod.
For the assignment, we first duplicate the value at the top of the stack (that
will be assigned) so that it will still be there after the assignment (store
instruction). This enables us to use assignments as expressions : the value of
the assignment expression is the assigned value.
(defmethod generate-instr :load [mv [instr & args]]
(doto mv
(.visitVarInsn Opcodes/ILOAD (int (first args)))))
(defmethod generate-instr :store [mv [instr & args]]
(doto mv
(.visitInsn Opcodes/DUP)
(.visitVarInsn Opcodes/ISTORE (int (first args)))))
clojure.lang.MultiFn@15db8da9
We can then reuse our previous functions :
(def lang0-compiler (dispatching-bytecode-generating-eval 0 "Lang0Compiler" lang0-compiling))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/lang0-compiler
And test our compiler as usual :
(def lang0-compiler-test (->> "a=1 + 3 * (-2 - 1);b= 0 - a;" lang0-parser (to-numeric-vars 0) lang0-compiler))
(lang0-compiler-test)
8
(def lang1-parser
(instaparse.core/parser
"prog = (spaces expr spaces <';'> spaces)*
<expr> = assig | add-sub
assig = varname spaces <'='> spaces expr
<add-sub> = mult-div | add | sub
add = add-sub spaces <'+'> spaces mult-div
sub = add-sub spaces <'-'> spaces mult-div
<mult-div> = factor | mult |div
mult = mult-div spaces <'*'> spaces factor
div = mult-div spaces <'/'> spaces factor
<factor> = number | <'('> spaces expr spaces <')'> | varget |assig
<spaces> = <#'\\s*'>
number = #'-?[0-9]+'
varget = varname | argument
varname = #'[a-zA-Z]\\w*'
argument= <'%'>#'[0-9]+'"))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/lang1-parser
We can test this parser on a sample program :
(-> "a=%0;a + %1 *3;" lang1-parser (instaparse.core/visualize :output-file :buffered-image ))
Instead of starting with an empty environment, we fill the initial environment with arguments :
(defn args-to-env[args]
(into {} (map-indexed #(vector (keyword (str "%" %1)) %2) args)))
(defn dynamic-eval-args [make-interpreter]
(fn[ast]
(fn[& args]
(instaparse.core/transform (make-interpreting make-interpreter
(assoc (args-to-env args)
:_ret 0))
ast))))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/dynamic-eval-args
We can easily update the transform map from lang0 :
(defn make-lang1-instr-interpreting [env]
(assoc (make-lang0-instr-interpreting env)
:argument #(assoc env :_ret (keyword (str "%" %)))))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/make-lang1-instr-interpreting
And define our interpreter :
(def lang1-interpret (dynamic-eval-args make-lang1-instr-interpreting))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/lang1-interpret
The interpreter can be called as usual, except that now we can pass arguments to our function when we call it :
(def lang1-interpret-test (->> "a=%0;a + %1 *3;" lang1-parser lang1-interpret))
(lang1-interpret-test 2 3)
11
In order to implement the compiler, we will first have to be able to know how many arguments are used in a program. This can be easily done with a transform map :
(defn nb-args[ast]
(inc (instaparse.core/transform (assoc (replace-vals
lang0-compiling (fn[& args]
(apply max (conj (filter number? args)
-1))))
:argument #(Integer/parseInt %))
ast)))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/nb-args
We can test this function :
(->> "a=%0;a + %1 *3;" lang1-parser nb-args)
2
Then we add an AST transformation step to replace the :argument
nodes with the
value of the argument number:
(defn args->varnum[ast]
(instaparse.core/transform {:argument #(Integer/parseInt %)} ast))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/args->varnum
As a few steps in the compilation chain will depend on the number of arguments, we define a new function instead of just piping our AST through the various stages :
(defn lang1-compiler-chain[class-name ast]
(let[n-args (nb-args ast)
compiler (dispatching-bytecode-generating-eval n-args class-name lang0-compiling)]
(->> ast args->varnum (to-numeric-vars n-args) compiler)))
#'beaker_clojure_shell_24f2c611-5642-4afc-b5bf-59a032bac84a/lang1-compiler-chain
We can then use this function after parsing as follows :
(def lang1-compiler-test (->> "a=%0;a + %1 *3;" lang1-parser (lang1-compiler-chain "Lang1Compiler")))
(lang1-compiler-test 2 5)
17
;; TODO parser should be defined here
null
;; TODO test the parser
null
In order to reuse the functions used for the lang1 interpreter, we have to define a transform map. Also this transform map will have to take the modulo factor into account.
;; TODO function creating the transform map and defining the modulo-interpret function.
null
;; TODO test the interpreter
null
In order to reuse the functions used for the lang1 compiler, we have to redefine the multimethods.
;; TODO redefine multimethods and define the modulo-compiler-chain function
null
;; TODO test the compiler
null