add source

lanl · Jan 14, 2025 · be0b357 · be0b357
1 parent c215b3f
commit be0b357
Show file tree

Hide file tree

Showing 37 changed files with 21,816 additions and 1 deletion.
diff --git a/.github/workflows/CI.yml b/.github/workflows/CI.yml
@@ -0,0 +1,30 @@
+name: CI
+
+on: [push]
+
+jobs:
+  build:
+    runs-on: ${{ matrix.os }}
+    continue-on-error: ${{ matrix.os == 'windows-latest' }}
+    strategy:
+      matrix:
+        os: [ubuntu-latest, macos-latest, windows-latest]
+        python-version:
+          - "3.10"
+          - "3.12"
+          - "3.13"
+          - "3.13t"
+        # NOTE: Example for excluding specific python versions for an different OS's.
+        # exclude:
+        #   - os: windows-latest
+        #     python-version: 3.6
+        #   - os: macos-latest
+        #     python-version: 3.8
+    steps:
+    - uses: actions/checkout@v4
+    - name: Install uv and set the python version
+      uses: astral-sh/setup-uv@v5
+      with:
+        python-version: ${{ matrix.python-version }}
+    - name: Run tests
+      run: uv run pytest -s
diff --git a/.gitignore b/.gitignore
@@ -0,0 +1,12 @@
+# Python-generated files
+__pycache__/
+*.py[oc]
+build/
+dist/
+wheels/
+*.egg-info
+
+# Virtual environments
+.venv
+
+demos/emcee.ipynb
diff --git a/.python-versions b/.python-versions
@@ -0,0 +1,3 @@
+3.10
+3.13
+3.13t
diff --git a/LICENSE b/LICENSE
@@ -1,6 +1,6 @@
 MIT License
 
-Copyright (c) 2025 Los Alamos National Laboratory
+Copyright (c) 2024 Los Alamos National Laboratory
 
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal

diff --git a/README.md b/README.md
@@ -0,0 +1,181 @@
+# Arianna
+A probabilistic programming language for python built on numpy.
+
+## Installation
+**pip**
+```
+pip install git+https://github.com/lanl/arianna.git
+```
+
+**uv**
+```
+uv add  git+https://github.com/lanl/arianna.git
+```
+
+## Usage
+
+**Model Specification (linear regression)**
+```python
+from typing import Optional
+
+import numpy as np
+from numpy.random import default_rng
+
+from arianna.distributions import Gamma, Normal
+from arianna.ppl.context import Context, Predictive
+from arianna.ppl.inference import (
+    AIES,
+    AffineInvariantMCMC,
+    Chain,
+    LaplaceApproximation,
+    ParallelAIES,
+    RandomWalkMetropolis,
+)
+
+# Type annotation are, of course, optional. Provided only for clarity.
+def linear_regression(
+    ctx: Context,
+    X: np.ndarray,
+    y: Optional[np.ndarray]=None,
+    bias: bool=True
+) -> None:
+    _, p = X.shape
+    beta = ctx.rv("beta", Normal(np.zeros(p), 10))
+    sigma = ctx.rv("sigma", Gamma(1, 1))
+    mu = ctx.cached("mu", X @ beta)
+    if bias:
+        alpha = ctx.rv("alpha", Normal(0, 10))
+        mu += alpha
+
+    ctx.rv("y", Normal(mu, sigma), obs=y)
+```
+
+**Simulate data from Prior Predictive**
+```python
+nobs = 100
+rng = np.random.default_rng(0)
+
+# Generate random predictors (X).
+X = rng.normal(0, 1, (nobs, 1))
+
+# Simulate from prior predictive using Predictive.
+sim_truth = Predictive.run(
+    linear_regression,  # supplied model here.
+    state=dict(sigma=0.7),
+    rng=rng,
+    X=X,
+    # since y is None, the returned dictionary will contain y sampled from it's
+    # predictive distributions.
+    y=None,
+    # Not return cached values, so the sim_truth will contain only parameters
+    # and y.
+    return_cached=False,  
+)
+
+# pop y so that sim_truth contains only model parameters.
+y = sim_truth.pop("y")
+
+# Now sim_truth is a dict containing ("beta", "sigma", "alpha").
+```
+
+**Affine invariant ensemble sampler**
+```python
+aies = AIES(
+    linear_regression,  # model function.
+    nwalkers=10,  # number of walkers.
+    # Whether or not to transform parameters into unconstrained space.
+    transform=True,  # Set to true when possible.
+    # Random number generator for reproducibility.
+    rng=default_rng(0),
+    # Provide data.
+    X=X, y=y,
+)
+
+# Does 3000 steps, with 10 walkers, after burning for 3000, and thins by 1. At
+# the end, 3000 = 3000*10 samples will be aggregated from all 10 walkers. Then,
+# by default, these samples are passed into an importance sampler to reweight
+# the samples, yielding 3000 samples.
+chain = aies.fit(nsteps=3000, burn=3000, thin=1)
+```
+
+`chain` is an object that contains posterior samples (states).
+You can iterate over `chain`.
+
+```python
+for state in chain:
+    print(state)  # state is a e.g., dict(alpha=1.3, beta=2.5, sigma=0.6, mu=some_long_array)
+    break # just print the first one.
+```
+
+You can convert `chain` into a large dict with `bundle = chain.bundle`,
+which is a `dict[str, ndarray]`.
+
+You can also get the samples directly with `chain.samples`.
+
+**Parallel Affine invariant ensemble sampler**
+Works only in python 3.13t. But 3.13t does not yet work with `jupyter`.
+
+```python
+from concurrent.futures import ThreadPoolExecutor
+
+paies = ParallelAIES(
+    linear_regression,  # model function.
+    ThreadPoolExecutor(4)  # use 4 cores.
+    nwalkers=10,  # number of walkers.
+    # Whether or not to transform parameters into unconstrained space.
+    transform=True,  # Set to true when possible.
+    # Random number generator for reproducibility.
+    rng=default_rng(0),
+    # Provide data.
+    X=X, y=y,
+)
+
+# Same as non-parallel version, but will be faster in python 3.13t.
+# Will be slightly slower than the non-parallel version in GIL enabled python
+# builds, i.e. python 3.9, 3.10, 3.11, 3.12, 3.13.
+chain = paies.fit(nsteps=3000, burn=3000, thin=1)
+```
+
+**Laplace Approximation**
+```python
+la = LaplaceApproximation(
+    linear_regression,
+    transform=True,
+    rng=default_rng(0),
+    X=X, y=y,
+)
+
+# The MAP estimate and inverse Hessian are computed via L-BFGS optimization.
+# Those estimates are used to construct a MvNormal object. 3000 samples are
+# drawn from that resulting MvNormal.
+chain = la.fit(nsamples=3000)
+```
+
+**Posterior Predictive**
+```python
+rng = default_rng
+xnew = np.linspace(-3, 3, 50)
+Xnew = xnew.reshape(-1, 1)
+ynew = Chain(
+    Predictive.run(
+        linear_regression, state=state, rng=rng, X=Xnew, y=None
+    )
+    for state in chain
+).get("y")
+```
+
+See [demos](demos/).
+
+## Threading
+As of 8 Jan 2025, `jupyter` does not work with the threaded version of python
+3.13 (3.13t). You can install `arianna` with python 3.13 or python 3.13t but
+you cannot install `jupyter` also. If you must use `jupyter`, use python 3.12.
+
+## Developer Notes
+
+### Updating versions
+1. Update version in `pyproject.toml`
+2. `uv sync`
+3. `git commit -am 'some message'`
+4. Update git tag 
+5. `git push --tags`
diff --git a/demos/friedman.ipynb b/demos/friedman.ipynb
diff --git a/demos/linear-regression.ipynb b/demos/linear-regression.ipynb
diff --git a/docs/arianna.html b/docs/arianna.html
diff --git a/docs/arianna/distributions.html b/docs/arianna/distributions.html
diff --git a/docs/arianna/distributions/abstract.html b/docs/arianna/distributions/abstract.html
diff --git a/docs/arianna/distributions/distributions.html b/docs/arianna/distributions/distributions.html
diff --git a/docs/arianna/ppl.html b/docs/arianna/ppl.html
diff --git a/docs/arianna/ppl/context.html b/docs/arianna/ppl/context.html
diff --git a/docs/arianna/ppl/diagnostics.html b/docs/arianna/ppl/diagnostics.html
diff --git a/docs/arianna/ppl/inference.html b/docs/arianna/ppl/inference.html
diff --git a/docs/arianna/ppl/shaper.html b/docs/arianna/ppl/shaper.html
diff --git a/docs/arianna/types.html b/docs/arianna/types.html
diff --git a/docs/index.html b/docs/index.html
@@ -0,0 +1,7 @@
+<!doctype html>
+<html>
+<head>
+    <meta charset="utf-8">
+    <meta http-equiv="refresh" content="0; url=./arianna.html"/>
+</head>
+</html>
diff --git a/docs/search.js b/docs/search.js
diff --git a/justfile b/justfile
@@ -0,0 +1,83 @@
+alias ta := test-all
+alias tl := test-lowest-versions
+alias th := test-highest-versions
+alias tt := test-nogil
+alias t := test
+alias w := watch
+alias p := python
+alias d := docs
+alias s := serve
+alias r := recover-uvlock
+alias f := fmt
+alias c := clean
+
+@default:
+    just -u -l
+
+watch *flags:
+    uv run --frozen -- watchmedo shell-command \
+      --patterns='*.py' \
+      --recursive \
+      --command='just test {{ flags }}' \
+      --verbose \
+      src/ tests/
+
+# Disable warnings by adding `--disable-warnings`.
+test *flags:
+    uv run --frozen -- \
+    pytest -s tests/ {{ if flags == "-dw" { "--disable-warnings" } else { "" } }}
+
+test-all *flags:
+    just test-lowest-versions {{ flags }}
+    just test-highest-versions {{ flags }}
+    just test-nogil {{ flags }}
+
+test-lowest-versions *flags:
+    uv run --resolution=lowest-direct --python=3.10 --isolated -- \
+    pytest -s {{ if flags == "-dw" { "--disable-warnings" } else { "" } }}
+    just recover-uvlock
+
+test-highest-versions *flags:
+    uv run --resolution=highest --python=3.13 --isolated -- \
+    pytest -s {{ if flags == "-dw" { "--disable-warnings" } else { "" } }}
+    just recover-uvlock
+
+test-nogil *flags:
+    uv run --resolution=highest --python=3.13t --isolated -- \
+    pytest -s {{ if flags == "-dw" { "--disable-warnings" } else { "" } }}
+    just recover-uvlock
+
+sync:
+    uv sync --frozen
+
+python:
+    uv run --frozen -- ipython --no-autoindent
+
+docs:
+    rm -rf docs/*
+    uv run --frozen pdoc --math ./src/arianna -o ./docs --docformat numpy
+
+serve:
+    # uv run --frozen python -m http.server -d ./docs 8000
+    uv run --frozen pdoc --docformat numpy --math -p 8000 ./src/arianna
+
+fmt-self:
+    just --fmt --unstable
+
+recover-uvlock:
+    git checkout uv.lock
+    uv sync --frozen
+
+# uv run --resolution=lowest-direct --python=3.10 --isolated -- pytest -s
+
+fmt-py:
+    ruff format
+
+fmt: fmt-self fmt-py
+
+lint:
+  ruff check --fix
+
+clean:
+  rm -rf src/*.egg-info src/arianna/__pycache__ src/arianna/*/__pycache__
+  rm -rf dist
-Original file line number
+Diff line change
@@ -0,0 +1,3 @@
+.10
+.13
+.13t