|
1 | 1 | (load-string (slurp "https://raw.githubusercontent.com/scicloj/clojure-data-tutorials/main/header.edn")) |
2 | | -;; --------------- |
3 | 2 |
|
4 | | -;; This tutorial demonstrates using |
5 | | -;; the probabilistic programming library PyMC |
6 | | -;; from Clojure. |
7 | | - |
8 | | -;; We follow the linear regression example from |
9 | | -;; the [Introductory Overview of PyMC](https://www.pymc.io/projects/docs/en/stable/learn/core_notebooks/pymc_overview.html). |
10 | | - |
11 | | -;; ## Setup |
12 | | - |
13 | | -;; Relevant Clojure namespaces: |
14 | | - |
15 | | -(ns index |
16 | | - (:require [libpython-clj2.require :refer [require-python]] |
17 | | - [libpython-clj2.python :refer [py. py.. py.-] :as py] |
18 | | - [fastmath.random :as random] |
19 | | - [tablecloth.api :as tc] |
20 | | - [tablecloth.column.api :as tcc] |
21 | | - [tech.v3.datatype :as dtype] |
22 | | - [scicloj.hanamicloth.v1.plotlycloth :as ploclo] |
23 | | - [scicloj.kind-pyplot.v1.api :as pyplot] |
24 | | - [scicloj.kindly.v4.kind :as kind])) |
25 | | - |
26 | | -;; Relevant Python modules: |
27 | | - |
28 | | -(require-python '[builtins :as python] |
29 | | - 'operator |
30 | | - '[arviz :as az] |
31 | | - '[arviz.style :as az.style] |
32 | | - '[pandas :as pd] |
33 | | - '[matplotlib.pyplot :as plt] |
34 | | - '[numpy :as np] |
35 | | - '[numpy.random :as np.random] |
36 | | - '[pymc :as pm]) |
37 | | - |
38 | | -;; Some convenience functions to access Python idioms: |
39 | | - |
(defn brackets
  "Pythonic square-bracket access: returns `obj[entry]` by invoking
  the Python `__getitem__` protocol on `obj`."
  [obj entry]
  (py. obj __getitem__ entry))
42 | | - |
(def colon
  "The all-elements Python slice — what a bare `:` means in Python
  indexing, i.e. `slice(None, None)`."
  (python/slice nil nil))
45 | | - |
46 | | -;; Theme for ArViZ visualizations: |
47 | | - |
48 | | -(arviz.style/use "arviz-darkgrid") |
49 | | - |
50 | | -;; ## Synthetic data |
51 | | - |
52 | | -(def random-seed 8927) |
53 | | - |
54 | | -(def dataset-size 101) |
55 | | - |
(def true-parameter-values
  "Ground-truth parameters used to synthesize the data:
  intercept `:alpha`, noise scale `:sigma`, and the two regression
  coefficients `:beta` (for :x1 and :x2 respectively)."
  {:alpha 1
   :sigma 1
   :beta  [1 2.5]})
60 | | - |
61 | | -;; We will generate a dataset by the following recipe: |
62 | | - |
(defn gen-dataset
  "Generate a synthetic linear-regression dataset of `size` rows.

  Columns:
  - :x1, :x2 — predictors drawn from a seeded RNG (:x2 scaled by 0.2)
  - :y       — alpha + beta0*x1 + beta1*x2 + sigma*noise

  All randomness now comes from the :isaac RNG seeded with
  `random-seed`, so the dataset is fully reproducible.
  (The previous version drew the noise term from Clojure's unseeded
  `rand` inside a `dtype/make-reader`, which both broke
  reproducibility and re-evaluated `(rand)` on every element read.)"
  [{:keys [size random-seed alpha sigma beta]}]
  (let [rng   (random/rng :isaac random-seed)
        ;; each call realizes `size` fresh draws from the stateful rng
        draw  (fn [] (vec (take size (random/->seq rng))))
        x1    (draw)
        x2    (tcc/* (draw) 0.2)
        noise (draw)]
    (-> (tc/dataset {:x1 x1 :x2 x2})
        (tc/add-column :y
                       (fn [ds]
                         (tcc/+ alpha
                                (tcc/* (beta 0) (:x1 ds))
                                (tcc/* (beta 1) (:x2 ds))
                                (tcc/* sigma noise)))))))
| 3 | +^:kindly/hide-code |
| 4 | +(ns index) |
77 | 5 |
|
(def dataset
  "The synthetic dataset used throughout this tutorial, generated
  from the ground-truth parameters with a fixed seed and size."
  (gen-dataset (merge {:random-seed random-seed
                       :size        dataset-size}
                      true-parameter-values)))
| 6 | +;; # Preface |
82 | 7 |
|
83 | | -(tc/head dataset) |
84 | | - |
85 | | -;; Let us visualize our dataset: |
86 | | - |
;; One scatter layer per predictor column. The plotted column must be
;; the one we map over — the previous version hard-coded :x1 for both
;; plots, so the :x2 panel silently showed :x1 again.
(->> [:x1 :x2]
     (mapv (fn [x]
             (-> dataset
                 (ploclo/layer-point
                  {:=x x}))))
     kind/fragment)
93 | | - |
94 | | -;; ## Using PyMC |
95 | | - |
96 | | -pm/__version__ |
97 | | - |
98 | | -;; Let us define a Bayesian model for our data: |
99 | | - |
100 | | -(def basic-model (pm/Model)) |
101 | | - |
;; Model specification, following the PyMC introductory overview:
;;   alpha ~ Normal(0, 10)
;;   beta  ~ Normal(0, 10), shape 2
;;   sigma ~ HalfNormal(1)
;;   mu    = alpha + beta[0]*x1 + beta[1]*x2
;;   y_obs ~ Normal(mu, sigma), observed on y
;; (Fixed: the x2 term previously multiplied by beta[0] instead of
;; beta[1], making the second coefficient unidentifiable.)
(py/with [_ basic-model]
         (let [{:keys [x1 x2 y]} (-> dataset
                                     (update-vals np/array))
               alpha (pm/Normal "alpha"
                                :mu 0
                                :sigma 10)
               beta (pm/Normal "beta"
                               :mu 0
                               :sigma 10
                               :shape 2)
               sigma (pm/HalfNormal "sigma"
                                    :sigma 1)
               mu (operator/add alpha
                                (operator/mul (brackets beta 0)
                                              x1)
                                (operator/mul (brackets beta 1)
                                              x2))
               y_obs (pm/Normal "y_obs"
                                :mu mu
                                :sigma sigma
                                :observed y)]))
123 | | - |
124 | | -;; Now we can sample from the posterior: |
125 | | - |
(def idata
  "Posterior samples drawn from `basic-model` with PyMC's default
  NUTS sampler."
  (py/with [_ basic-model]
           (pm/sample)))
129 | | - |
130 | | -;; Here is the resulting structure: |
131 | | - |
132 | | -(-> idata |
133 | | - (py.- posterior) |
134 | | - (py.- alpha) |
135 | | - (py. sel :draw (python/slice 0 4))) |
136 | | - |
137 | | -;; Alternatively, we could also use the Slice sampling algorithm
138 | | -;; instead of the default NUTS. |
139 | | - |
(def slice-idata
  "Posterior samples drawn from `basic-model` using the Slice
  sampling step method rather than the default NUTS."
  (py/with [_ basic-model]
           (pm/sample 5000 :step (pm/Slice))))
144 | | - |
145 | | -slice-idata |
146 | | - |
147 | | -;; ## Posterior analysis |
148 | | - |
149 | | -;; Let us plot our sampling using ArViZ: |
| 8 | +;; These tutorials demonstrate using |
| 9 | +;; the probabilistic programming library [PyMC](https://www.pymc.io/) |
| 10 | +;; from Clojure. |
150 | 11 |
|
;; Trace plot of the NUTS posterior, with chains combined:
(pyplot/pyplot
 (fn []
   (az/plot_trace idata :combined true)))
| 12 | +;; * [Intro](./intro.html) |
0 commit comments