import os
os.environ["JAX_PLATFORMS"] = "cpu"
import numpy as np
import jax.numpy as jnp
import jax
import numpyro
numpyro.set_host_device_count(4)
from numpyro.infer import MCMC, NUTS, Predictive
import numpyro.distributions as dist
from numpyro import handlers
from typing import Optional
import pandas as pd
import pyro_util
import arviz as az

# Toy dataset: six observations, two per year, for three years.
year = [0, 0, 1, 1, 2, 2]
x = np.random.randn(6)
# One random offset per year, drawn with standard deviation 2.
bases = 2 * np.random.randn(3)
df = pd.DataFrame(
    {
        'year': pd.CategoricalIndex(year),
        'x': x,
        # Response = x (unit slope) + the row's year offset + unit Gaussian noise.
        'y': x + np.take(bases, year) + np.random.randn(6),
    }
)

def model(**kwargs):
    """Declare the regression ``y ~ year + x`` on the module-level ``df``.

    All keyword arguments are forwarded unchanged to ``pyro_util.glm``;
    elsewhere in this file the model is invoked with ``predictive=True`` or
    ``predictive=False``.
    """
    formula = 'y ~ year + x'
    pyro_util.glm(formula, df, **kwargs)

# Fit the model with the project's NUTS helper. The returned object is later
# handed to az.from_numpyro and queried with .get_samples().
# NOTE(review): chain/warmup/draw counts are chosen inside pyro_util.fit_nuts,
# which is not visible here -- confirm there before relying on them.
mcmc = pyro_util.fit_nuts(model)

  0%|          | 0/1500 [00:00<?, ?it/s]

  0%|          | 0/1500 [00:00<?, ?it/s]

  0%|          | 0/1500 [00:00<?, ?it/s]

  0%|          | 0/1500 [00:00<?, ?it/s]

# Baseline conversion to ArviZ with no `dims` mapping: array-valued sites get
# auto-generated dimension names (mu_dim_0, year_dim_0 in the output below).
az.from_numpyro(mcmc)

<xarray.Dataset> Size: 184kB
Dimensions:     (chain: 4, draw: 1000, mu_dim_0: 6, year_dim_0: 2)
Coordinates:
  * chain       (chain) int64 32B 0 1 2 3
  * draw        (draw) int64 8kB 0 1 2 3 4 5 6 7 ... 993 994 995 996 997 998 999
  * mu_dim_0    (mu_dim_0) int64 48B 0 1 2 3 4 5
  * year_dim_0  (year_dim_0) int64 16B 0 1
Data variables:
    Intercept   (chain, draw) float32 16kB 0.7586 2.631 2.299 ... 0.3715 1.361
    mu          (chain, draw, mu_dim_0) float32 96kB 0.4586 0.5923 ... 4.705
    sigma       (chain, draw) float32 16kB 1.11 2.791 1.157 ... 1.344 1.259
    x           (chain, draw) float32 16kB 0.4241 -0.2606 ... -0.1037 0.2269
    year        (chain, draw, year_dim_0) float32 32kB -3.399 2.84 ... 3.188
Attributes:
    created_at:                 2025-01-08T00:36:28.626591
    arviz_version:              0.17.1
    inference_library:          numpyro
    inference_library_version:  0.15.1

array([0, 1, 2, 3])

array([  0,   1,   2, ..., 997, 998, 999])

array([0, 1, 2, 3, 4, 5])

array([0, 1])

array([[0.75857586, 2.63063   , 2.298524  , ..., 3.1893117 , 3.930863  ,
        3.8521183 ],
       [1.9285047 , 2.3176327 , 2.7241917 , ..., 1.4848075 , 2.2841883 ,
        0.445622  ],
       [1.6812876 , 1.2485336 , 3.1172335 , ..., 2.9870203 , 2.2174242 ,
        2.4899802 ],
       [0.71638304, 4.1856446 , 1.1233672 , ..., 0.37151736, 0.37151736,
        1.360693  ]], dtype=float32)

array([[[ 0.45856354,  0.5922939 , -2.8679502 , -2.8879251 ,
          4.6079144 ,  3.8916883 ],
        [ 2.8149552 ,  2.7327924 , -0.9055467 , -0.8932743 ,
          2.4330864 ,  2.87313   ],
        [ 1.6159793 ,  1.9202234 , -4.572874  , -4.618318  ,
          5.7492843 ,  4.11983   ],
        ...,
        [ 1.5307113 ,  2.270032  , -2.035584  , -2.146014  ,
          4.7721424 ,  0.81252915],
        [ 3.215802  ,  3.5345402 , -2.1341548 , -2.1817636 ,
          3.4110792 ,  1.7039983 ],
        [ 2.772389  ,  3.2536778 , -2.1255581 , -2.1974466 ,
          5.390095  ,  2.8124337 ]],

       [[ 0.69686633,  1.2458688 , -2.3627958 , -2.4447985 ,
          5.8813186 ,  2.9410012 ],
        [ 1.4136187 ,  1.8165826 , -1.7210183 , -1.7812077 ,
          4.7406635 ,  2.5824907 ],
        [ 1.9081947 ,  2.2719252 , -3.1131928 , -3.167522  ,
          4.145621  ,  2.1975734 ],
...
        [ 3.0342183 ,  3.0131798 , -2.8795478 , -2.8764055 ,
          4.5105057 ,  4.623183  ],
        [ 1.9625264 ,  2.076147  , -3.5765648 , -3.5935361 ,
          3.2034104 ,  2.5948875 ],
        [ 1.3551953 ,  1.8610253 , -2.1033273 , -2.1788814 ,
          3.9322953 ,  1.2231984 ]],

       [[-1.151205  , -0.31872818, -4.4340568 , -4.558401  ,
          5.3482323 ,  0.88969857],
        [ 2.9539907 ,  3.503     , -1.0877671 , -1.169771  ,
          6.680791  ,  3.7404366 ],
        [-0.39626086,  0.28111288, -1.8339602 , -1.9351373 ,
          5.0932326 ,  1.4653913 ],
        ...,
        [ 0.44488862,  0.4121834 , -2.4801948 , -2.4753096 ,
          3.3946764 ,  3.569837  ],
        [ 0.44488862,  0.4121834 , -2.4801948 , -2.4753096 ,
          3.3946764 ,  3.569837  ],
        [ 1.2001832 ,  1.2717304 , -2.7713392 , -2.782026  ,
          5.0885663 ,  4.7053776 ]]], dtype=float32)

array([[1.1102884, 2.7913005, 1.1571234, ..., 1.2137805, 2.4473596,
        2.3534856],
       [1.1564898, 1.1613271, 1.3617151, ..., 1.5085388, 2.4395025,
        1.8731871],
       [1.5024555, 1.733058 , 3.1805377, ..., 1.0380949, 1.0931878,
        1.9955833],
       [1.8776833, 1.9939799, 1.4786174, ..., 1.3440568, 1.3440568,
        1.2591903]], dtype=float32)

array([[ 0.42414588, -0.2605919 ,  0.9649554 , ...,  2.3448656 ,
         1.0109258 ,  1.5264798 ],
       [ 1.741243  ,  1.2780603 ,  1.1536251 , ...,  1.6887498 ,
        -1.4377515 ,  0.1342758 ],
       [ 2.5390055 ,  3.2143846 , -0.13694805, ..., -0.06672669,
         0.36036456,  1.6043153 ],
       [ 2.640324  ,  1.7412649 ,  2.1483917 , ..., -0.10372945,
        -0.10372945,  0.2269226 ]], dtype=float32)

array([[[-3.3992376 ,  2.8397505 ],
        [-3.675821  ,  0.42273918],
        [-6.354304  ,  1.1538917 ],
        ...,
        [-3.9683442 , -3.9986172 ],
        [-5.523289  , -2.926075  ],
        [-5.159676  , -2.0954797 ]],

       [[-3.3582144 , -0.19184045],
        [-3.3537722 , -0.6191169 ],
        [-5.2191873 , -1.3245273 ],
        ...,
        [-3.6180646 ,  0.09287859],
        [-5.2057524 ,  4.7405696 ],
        [-3.2393632 ,  3.7050037 ]],

       [[-2.0643342 , -3.6393173 ],
        [-0.9636353 , -0.5539977 ],
        [-9.473647  , -1.3633595 ],
        ...,
        [-5.902325  ,  1.6823144 ],
        [-5.600879  ,  0.12821612],
        [-3.7335973 , -2.3764122 ]],

       [[-3.7355597 , -1.652874  ],
        [-4.340314  , -1.6495602 ],
        [-1.806061  , -1.1439186 ],
        ...,
        [-2.907298  ,  3.2700646 ],
        [-2.907298  ,  3.2700646 ],
        [-4.0104303 ,  3.187733  ]]], dtype=float32)

class extract_dims(handlers.Messenger):
    """
    Effect handler that records which plates enclose each site.

    While active, every "sample" or "deterministic" message is inspected and
    `self.dims` is updated to map the site name to the names of the frames in
    its `cond_indep_stack`, listed in reverse stack order.
    """
    def __init__(self, fn=None):
        # Site name -> list of plate names; filled in by process_message.
        self.dims = {}
        super().__init__(fn)

    def process_message(self, msg):
        # Only sample and deterministic sites are recorded.
        if msg["type"] not in ("sample", "deterministic"):
            return
        stack = msg['cond_indep_stack']
        self.dims[msg['name']] = [frame.name for frame in reversed(stack)]

dimwrap = extract_dims()
# Run the model once under a fixed seed so each site reports its plates to
# the handler; no inference happens here.
with dimwrap, handlers.seed(rng_seed=1):
    model(predictive=False)

# Display the collected site -> plate-name mapping.
dimwrap.dims

{'Intercept': [],
 'year': ['years'],
 'x': [],
 'sigma': [],
 'mu': ['obs'],
 'y': ['obs']}

def from_numpyro(df, model, mcmc, *args):
    """Convert ``mcmc`` to ArviZ using dimension names taken from the model's plates.

    The model is executed once under a fixed seed inside ``extract_dims`` so
    that each site's plate names can be passed to ``az.from_numpyro`` as
    ``dims``.

    Args:
        df: Accepted for signature compatibility; not used by this version.
        model: Model callable; invoked as ``model(*args, predictive=False)``.
        mcmc: Fitted MCMC object handed to ``az.from_numpyro``.
        *args: Positional arguments forwarded to ``model``.

    Returns:
        The object returned by ``az.from_numpyro``.

    Note:
        A later definition with the same name in this file rebinds
        ``from_numpyro``.
    """
    tracer = extract_dims()
    with tracer, handlers.seed(rng_seed=1):
        model(*args, predictive=False)
    return az.from_numpyro(mcmc, dims=tracer.dims)

def from_numpyro(df, model, mcmc, *args):
    """Convert ``mcmc`` to ArviZ with prior, posterior predictive and input data.

    In addition to the posterior, the result carries:

    * posterior predictive draws generated from ``mcmc.get_samples()``,
    * 1000 prior draws,
    * dimension names taken from the model's plates (via ``extract_dims``),
    * a ``constant_data`` group built from ``df``.

    Args:
        df: pandas DataFrame holding the model's input data; stored as the
            ``constant_data`` group.
        model: Model callable; invoked with ``*args`` and a ``predictive``
            keyword (``True`` for the Predictive runs, ``False`` for the
            plate-extraction run).
        mcmc: Fitted MCMC object.
        *args: Positional arguments forwarded to ``model``.

    Returns:
        The ``InferenceData`` returned by ``az.from_numpyro``, with the
        ``constant_data`` group added.
    """
    # Fixed, distinct PRNG keys keep both predictive runs reproducible.
    post_pred = Predictive(model, mcmc.get_samples())(
        jax.random.PRNGKey(1), *args, predictive=True
    )
    prior = Predictive(model, num_samples=1000)(
        jax.random.PRNGKey(2), *args, predictive=True
    )

    # One seeded execution of the model is enough to learn each site's plates.
    dimwrap = extract_dims()
    with dimwrap, handlers.seed(rng_seed=1):
        model(*args, predictive=False)

    result = az.from_numpyro(
        mcmc,
        prior=prior,
        posterior_predictive=post_pred,
        dims=dimwrap.dims,
    )

    # `df.to_xarray()` builds the same Dataset as `xr.Dataset.from_dataframe(df)`
    # without needing the `xr` name, which this file never imports. The group
    # is registered through the public API rather than by appending to the
    # private `_groups` list.
    result.add_groups({"constant_data": df.to_xarray()})
    return result