Commit 0b47e94

update more examples

1 parent 4b3eb8c commit 0b47e94
File tree: 5 files changed (+1090, -459 lines)

examples/diagnostics_and_criticism/model_averaging.ipynb

Lines changed: 1 addition & 1 deletion
@@ -759,7 +759,7 @@
 "name": "python",
 "nbconvert_exporter": "python",
 "pygments_lexer": "ipython3",
-"version": "3.13.5"
+"version": "3.11.5"
 }
 },
 "nbformat": 4,
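The hunk above only changes the notebook's recorded interpreter version. That value lives under `metadata.language_info` in the `.ipynb` JSON, so it can be inspected with the standard library alone. A minimal sketch; the JSON string is a hypothetical stand-in for a real notebook file:

```python
import json

# Hypothetical stand-in for the tail of an .ipynb file; real notebooks
# record the interpreter version in the same metadata.language_info slot.
nb_json = '{"metadata": {"language_info": {"name": "python", "version": "3.11.5"}}, "nbformat": 4}'

nb = json.loads(nb_json)
version = nb["metadata"]["language_info"]["version"]
# version == "3.11.5"
```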

examples/survival_analysis/bayes_param_survival.ipynb

Lines changed: 849 additions & 167 deletions
Large diffs are not rendered by default.

examples/survival_analysis/bayes_param_survival.myst.md

Lines changed: 55 additions & 51 deletions
@@ -5,7 +5,7 @@ jupytext:
     format_name: myst
     format_version: 0.13
 kernelspec:
-  display_name: default
+  display_name: pymc
   language: python
   name: python3
 ---
@@ -17,12 +17,12 @@ kernelspec:
 ```{code-cell} ipython3
 import warnings
 
-import arviz as az
+import arviz.preview as az
 import numpy as np
 import pymc as pm
 import pytensor.tensor as pt
 import scipy as sp
-import seaborn as sns
+import xarray as xr
 
 from matplotlib import pyplot as plt
 from matplotlib.ticker import StrMethodFormatter
@@ -33,7 +33,7 @@ print(f"Running on PyMC v{pm.__version__}")
 
 ```{code-cell} ipython3
 %config InlineBackend.figure_format = 'retina'
-az.style.use("arviz-darkgrid")
+az.style.use("arviz-variat")
 warnings.filterwarnings("ignore")
 ```
 
@@ -45,9 +45,6 @@ This post illustrates a parametric approach to Bayesian survival analysis in PyM
 We will analyze the [mastectomy data](https://vincentarelbundock.github.io/Rdatasets/doc/HSAUR/mastectomy.html) from `R`'s [`HSAUR`](https://cran.r-project.org/web/packages/HSAUR/index.html) package.
 
 ```{code-cell} ipython3
-sns.set()
-blue, green, red, purple, gold, teal = sns.color_palette(n_colors=6)
-
 pct_formatter = StrMethodFormatter("{x:.1%}")
 ```
 
@@ -228,19 +225,19 @@ with weibull_model:
 The energy plot and Bayesian fraction of missing information give no cause for concern about poor mixing in NUTS.
 
 ```{code-cell} ipython3
-az.plot_energy(weibull_trace, fill_color=("C0", "C1"));
+az.plot_energy(weibull_trace);
 ```
 
 The $\hat{R}$ statistics also indicate convergence.
 
 ```{code-cell} ipython3
-max(np.max(gr_stats) for gr_stats in az.rhat(weibull_trace).values())
+az.rhat(weibull_trace).to_array().max()
 ```
 
 Below we plot posterior distributions of the parameters.
 
 ```{code-cell} ipython3
-az.plot_forest(weibull_trace, figsize=(10, 4));
+az.plot_forest(weibull_trace);
 ```
 
 These are somewhat interesting (especially the fact that the posterior of $\beta_1$ is fairly well-separated from zero), but the posterior predictive survival curves will be much more interpretable.
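The new `az.rhat(...).to_array().max()` call summarizes convergence with the largest $\hat{R}$ across all parameters. As a rough illustration of the underlying idea only (ArviZ actually uses a rank-normalized split-$\hat{R}$, not this formula), the classic Gelman-Rubin statistic compares between-chain and within-chain variance using nothing but the standard library:

```python
import statistics

def gelman_rubin(chains):
    # Classic (non-rank-normalized) R-hat for equal-length chains:
    # the pooled variance estimate divided by the mean within-chain variance.
    n = len(chains[0])
    chain_means = [statistics.fmean(c) for c in chains]
    within = statistics.fmean(statistics.variance(c) for c in chains)
    between_over_n = statistics.variance(chain_means)
    var_hat = (n - 1) / n * within + between_over_n
    return (var_hat / within) ** 0.5

# Chains exploring the same region give R-hat near (or just under) 1 ...
good = gelman_rubin([[1.0, 2.0, 3.0, 4.0], [1.5, 2.5, 2.0, 3.5]])
# ... while chains stuck in separate regions give R-hat far above 1.
bad = gelman_rubin([[0.0, 0.1, -0.1, 0.05], [10.0, 10.1, 9.9, 10.05]])
```

Values well above 1 indicate the chains have not mixed; hypothetical toy chains are used here in place of a real trace.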
@@ -268,34 +265,32 @@ with weibull_model:
 The posterior predictive survival times show that, on average, patients whose cancer had not metastized survived longer than those whose cancer had metastized.
 
 ```{code-cell} ipython3
-t_plot = np.linspace(0, 230, 100)
+t_plot = xr.DataArray(np.linspace(0, 230, 100), dims=["time"])
+pp_samples = az.extract(pp_weibull_trace.posterior_predictive["events"])
 
-weibull_pp_surv = np.greater_equal.outer(
-    np.exp(
-        y.mean()
-        + y.std() * az.extract(pp_weibull_trace.posterior_predictive["events"])["events"].values
-    ),
-    t_plot,
-)
-weibull_pp_surv_mean = weibull_pp_surv.mean(axis=1)
+linear_pred = y.mean() + y.std() * pp_samples
+
+weibull_pp_surv = np.exp(linear_pred) >= t_plot
+
+weibull_pp_surv_mean = weibull_pp_surv.mean(dim="sample")
 ```
 
 ```{code-cell} ipython3
 fig, ax = plt.subplots(figsize=(8, 6))
 
 
-ax.plot(t_plot, weibull_pp_surv_mean[0], c=blue, label="Not metastized")
-ax.plot(t_plot, weibull_pp_surv_mean[1], c=red, label="Metastized")
-
-ax.set_xlim(0, 230)
-ax.set_xlabel("Weeks since mastectomy")
+ax.plot(t_plot, weibull_pp_surv_mean[0], label="Not metastized")
+ax.plot(t_plot, weibull_pp_surv_mean[1], label="Metastized")
 
-ax.set_ylim(top=1)
+ax.set(
+    xlabel="Weeks since mastectomy",
+    ylabel="Survival probability",
+    title="Weibull survival regression model",
+    xlim=(0, 230),
+    ylim=(0, 1),
+)
+ax.legend()
 ax.yaxis.set_major_formatter(pct_formatter)
-ax.set_ylabel("Survival probability")
-
-ax.legend(loc=1)
-ax.set_title("Weibull survival regression model");
 ```
 
 ### Log-logistic survival regression
@@ -342,11 +337,11 @@ with log_logistic_model:
 All of the sampling diagnostics look good for this model.
 
 ```{code-cell} ipython3
-az.plot_energy(log_logistic_trace, fill_color=("C0", "C1"));
+az.plot_energy(log_logistic_trace);
 ```
 
 ```{code-cell} ipython3
-max(np.max(gr_stats) for gr_stats in az.rhat(log_logistic_trace).values())
+az.rhat(log_logistic_trace).to_array().max()
 ```
 
 Again, we calculate the posterior expected survival functions for this model.
@@ -360,35 +355,35 @@ with log_logistic_model:
 ```
 
 ```{code-cell} ipython3
-log_logistic_pp_surv = np.greater_equal.outer(
-    np.exp(
-        y.mean()
-        + y.std()
-        * az.extract(pp_log_logistic_trace.posterior_predictive["events"])["events"].values
-    ),
-    t_plot,
-)
-log_logistic_pp_surv_mean = log_logistic_pp_surv.mean(axis=1)
+pp_samples = az.extract(pp_log_logistic_trace.posterior_predictive["events"])
+
+linear_pred = y.mean() + y.std() * pp_samples
+
+log_logistic_pp_surv = np.exp(linear_pred) >= t_plot
+
+log_logistic_pp_surv_mean = log_logistic_pp_surv.mean(dim="sample")
 ```
 
 ```{code-cell} ipython3
 fig, ax = plt.subplots(figsize=(8, 6))
 
-ax.plot(t_plot, weibull_pp_surv_mean[0], c=blue, label="Weibull, not metastized")
-ax.plot(t_plot, weibull_pp_surv_mean[1], c=red, label="Weibull, metastized")
+ax.plot(t_plot, weibull_pp_surv_mean[0], c="C0", label="Weibull, not metastized")
+ax.plot(t_plot, weibull_pp_surv_mean[1], c="C1", label="Weibull, metastized")
 
-ax.plot(t_plot, log_logistic_pp_surv_mean[0], "--", c=blue, label="Log-logistic, not metastized")
-ax.plot(t_plot, log_logistic_pp_surv_mean[1], "--", c=red, label="Log-logistic, metastized")
+ax.plot(t_plot, log_logistic_pp_surv_mean[0], "--", c="C0", label="Log-logistic, not metastized")
+ax.plot(t_plot, log_logistic_pp_surv_mean[1], "--", c="C1", label="Log-logistic, metastized")
 
-ax.set_xlim(0, 230)
-ax.set_xlabel("Weeks since mastectomy")
 
-ax.set_ylim(top=1)
-ax.yaxis.set_major_formatter(pct_formatter)
-ax.set_ylabel("Survival probability")
+ax.set(
+    xlabel="Weeks since mastectomy",
+    ylabel="Survival probability",
+    title="Weibull and log-logistic\nsurvival regression models",
+    xlim=(0, 230),
+    ylim=(0, 1),
+)
 
-ax.legend(loc=1)
-ax.set_title("Weibull and log-logistic\nsurvival regression models");
+ax.legend()
+ax.yaxis.set_major_formatter(pct_formatter)
 ```
 
 This post has been a short introduction to implementing parametric survival regression models in PyMC with a fairly simple data set. The modular nature of probabilistic programming with PyMC should make it straightforward to generalize these techniques to more complex and interesting data set.
@@ -400,8 +395,17 @@ This post has been a short introduction to implementing parametric survival regr
 - Originally authored as a blog post by [Austin Rochford](https://austinrochford.com/posts/2017-10-02-bayes-param-survival.html) on October 2, 2017.
 - Updated by [George Ho](https://eigenfoo.xyz/) on July 18, 2018.
 - Updated by @fonnesbeck on September 11, 2024.
+- Updated by Osvaldo Martin in December 2025.
 
 ```{code-cell} ipython3
 %load_ext watermark
 %watermark -n -u -v -iv -w
 ```
+
+```{code-cell} ipython3
+pp_weibull_dt = az.convert_to_datatree(pp_weibull_trace)
+```
+
+```{code-cell} ipython3
+pp_weibull_dt.posterior_predictive
+```
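The refactor in the hunks above swaps `np.greater_equal.outer` for xarray broadcasting over named dimensions, but the estimator itself is unchanged: the posterior-predictive survival probability at time $t$ is the fraction of sampled survival times that reach $t$. A toy pure-Python sketch of that computation, with hypothetical numbers in place of real posterior draws:

```python
# Posterior-predictive survival curve, the quantity the refactored cell computes:
# S(t) is estimated by the fraction of sampled survival times that are >= t.
sampled_times = [12.0, 45.0, 80.0, 200.0, 31.0]  # hypothetical posterior draws
t_grid = [0, 50, 100, 150, 200]

surv = [sum(t_i >= t for t_i in sampled_times) / len(sampled_times) for t in t_grid]
# surv == [1.0, 0.4, 0.2, 0.2, 0.2]
```

In the notebook the same comparison runs over a `sample` dimension and a `time` dimension at once, which is why `np.exp(linear_pred) >= t_plot` yields a 2-D boolean array to average over `sample`.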

examples/survival_analysis/censored_data.ipynb

Lines changed: 158 additions & 219 deletions
Large diffs are not rendered by default.

examples/survival_analysis/censored_data.myst.md

Lines changed: 27 additions & 21 deletions
@@ -22,19 +22,18 @@ kernelspec:
 ```{code-cell} ipython3
 from copy import copy
 
-import arviz as az
+import arviz.preview as az
 import matplotlib.pyplot as plt
 import numpy as np
 import pymc as pm
-import seaborn as sns
 
 from numpy.random import default_rng
 ```
 
 ```{code-cell} ipython3
 %config InlineBackend.figure_format = 'retina'
 rng = default_rng(1234)
-az.style.use("arviz-darkgrid")
+az.style.use("arviz-variat")
 ```
 
 [This example notebook on Bayesian survival
@@ -59,7 +58,7 @@ Censored data arises in many modelling problems. Two common examples are:
    range of temperatures.
 
 This example notebook presents two different ways of dealing with censored data
-in PyMC3:
+in PyMC:
 
 1. An imputed censored model, which represents censored data as parameters and
    makes up plausible values for all censored values. As a result of this
@@ -101,8 +100,8 @@ censored = censor(samples, low, high)
 # Visualize uncensored and censored data
 _, ax = plt.subplots(figsize=(10, 3))
 edges = np.linspace(-5, 35, 30)
-ax.hist(samples, bins=edges, density=True, histtype="stepfilled", alpha=0.2, label="Uncensored")
-ax.hist(censored, bins=edges, density=True, histtype="stepfilled", alpha=0.2, label="Censored")
+ax.hist(samples, bins=edges, density=True, histtype="stepfilled", alpha=0.4, label="Uncensored")
+ax.hist(censored, bins=edges, density=True, histtype="stepfilled", alpha=0.4, label="Censored")
 [ax.axvline(x=x, c="k", ls="--") for x in [low, high]]
 ax.legend();
 ```
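The `censor` helper called in the hunk above (defined earlier in that notebook) clips draws to the observation bounds. A plain-Python sketch of the idea, with hypothetical values, also shows why naive point estimates computed on censored data shrink toward the bounds:

```python
import statistics

def censor(values, low, high):
    # Clip observations outside [low, high] to the bounds (interval censoring).
    return [min(max(v, low), high) for v in values]

samples = [-8.0, 2.0, 10.0, 18.0, 40.0]  # hypothetical uncensored draws
censored = censor(samples, low=-5.0, high=35.0)
# censored == [-5.0, 2.0, 10.0, 18.0, 35.0]

# The spread of the censored data understates the true spread, which is
# exactly the bias the censored models below are designed to remove.
naive_spread = statistics.pstdev(censored)  # < statistics.pstdev(samples)
```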
@@ -124,13 +123,16 @@ We should predict that running the uncensored model on uncensored data, we will
 uncensored_model_1 = uncensored_model(samples)
 with uncensored_model_1:
     idata = pm.sample()
+```
 
-az.plot_posterior(idata, ref_val=[true_mu, true_sigma], round_to=3);
+```{code-cell} ipython3
+pc = az.plot_dist(idata)
+az.add_lines(pc, {"mu": true_mu, "sigma": true_sigma});
 ```
 
 And that is exactly what we find.
 
-The problem however, is that in censored data contexts, we do not have access to the true values. If we were to use the same uncensored model on the censored data, we would anticipate that our parameter estimates will be biased. If we calculate point estimates for the mean and std, then we can see that we are likely to underestimate the mean and std for this particular dataset and censor bounds.
+The problem, however, is that in censored data contexts, we do not have access to the true values. If we were to use the same uncensored model on the censored data, we would anticipate that our parameter estimates will be biased. If we calculate point estimates for the mean and standard deviation, then we can see that we are likely to underestimate the mean and standard deviation for this particular dataset and censor bounds.
 
 ```{code-cell} ipython3
 print(f"mean={np.mean(censored):.2f}; std={np.std(censored):.2f}")
@@ -140,15 +142,18 @@ print(f"mean={np.mean(censored):.2f}; std={np.std(censored):.2f}")
 uncensored_model_2 = uncensored_model(censored)
 with uncensored_model_2:
     idata = pm.sample()
-
-az.plot_posterior(idata, ref_val=[true_mu, true_sigma], round_to=3);
 ```
 
-The figure above confirms this.
+As expected, we see that both the mean and standard deviation are underestimated when using the uncensored model on censored data.
+
+```{code-cell} ipython3
+pc = az.plot_dist(idata)
+az.add_lines(pc, {"mu": true_mu, "sigma": true_sigma});
+```
 
 ## Censored data models
 
-The models below show 2 approaches to dealing with censored data. First, we need to do a bit of data pre-processing to count the number of observations that are left or right censored. We also also need to extract just the non-censored data that we observe.
+The models below show two approaches to dealing with censored data. First, we need to do a bit of data pre-processing to count the number of observations that are left or right censored. We also need to extract just the non-censored data that we observe.
 
 +++
 
@@ -187,11 +192,14 @@ with pm.Model() as imputed_censored_model:
     )
     observed = pm.Normal("observed", mu=mu, sigma=sigma, observed=uncensored, shape=int(n_observed))
     idata = pm.sample()
+```
 
-az.plot_posterior(idata, var_names=["mu", "sigma"], ref_val=[true_mu, true_sigma], round_to=3);
+```{code-cell} ipython3
+pc = az.plot_dist(idata, var_names=["mu", "sigma"])
+az.add_lines(pc, {"mu": true_mu, "sigma": true_sigma});
 ```
 
-We can see that the bias in the estimates of the mean and variance (present in the uncensored model) have been largely removed.
+We can see that the bias in the estimates of the mean and standard deviation (present in the uncensored model) has been largely removed.
 
 +++
 
@@ -205,15 +213,12 @@ with pm.Model() as unimputed_censored_model:
     sigma = pm.HalfNormal("sigma", sigma=(high - low) / 2.0)
     y_latent = pm.Normal.dist(mu=mu, sigma=sigma)
    obs = pm.Censored("obs", y_latent, lower=low, upper=high, observed=censored)
+    idata = pm.sample()
 ```
 
-Sampling
-
 ```{code-cell} ipython3
-with unimputed_censored_model:
-    idata = pm.sample()
-
-az.plot_posterior(idata, var_names=["mu", "sigma"], ref_val=[true_mu, true_sigma], round_to=3);
+pc = az.plot_dist(idata, var_names=["mu", "sigma"])
+az.add_lines(pc, {"mu": true_mu, "sigma": true_sigma});
 ```
 
 Again, the bias in the estimates of the mean and variance (present in the uncensored model) have been largely removed.
@@ -231,7 +236,8 @@ As we can see, both censored models appear to capture the mean and variance of t
 - Originally authored by [Luis Mario Domenzain](https://github.com/domenzain) on Mar 7, 2017.
 - Updated by [George Ho](https://github.com/eigenfoo) on Jul 14, 2018.
 - Updated by [Benjamin Vincent](https://github.com/drbenvincent) in May 2021.
-- Updated by [Benjamin Vincent](https://github.com/drbenvincent) in May 2022 to PyMC v4.
+- Updated by [Benjamin Vincent](https://github.com/drbenvincent) in May 2022.
+- Updated by [Osvaldo Martin](https://github.com/aloctavodia) in Dec 2025.
 
 +++
 
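The `pm.Censored` wrapper used in the hunk above assigns an interval-censored observation the probability mass beyond the bound, rather than the density at the clipped value. A rough single-observation sketch of that likelihood for a normal latent variable, using only the standard library (this is an illustration of the principle, not PyMC's implementation):

```python
import math

def normal_cdf(x, mu, sigma):
    # Standard normal CDF via the error function.
    return 0.5 * (1.0 + math.erf((x - mu) / (sigma * math.sqrt(2.0))))

def censored_normal_loglik(obs, mu, sigma, low, high):
    # Observations at (or clipped to) a bound contribute the tail probability;
    # interior observations contribute the ordinary normal log-density.
    if obs <= low:
        return math.log(normal_cdf(low, mu, sigma))
    if obs >= high:
        return math.log(1.0 - normal_cdf(high, mu, sigma))
    z = (obs - mu) / sigma
    return -0.5 * z * z - math.log(sigma * math.sqrt(2.0 * math.pi))
```

Summing this over the data gives the model's likelihood without imputing latent values, which is why the unimputed model above needs no per-observation censored parameters.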
