From 0db1cf5a92ffef39101f30c8f750b435a3289703 Mon Sep 17 00:00:00 2001
From: samueldmcdermott <samueldmcdermott@gmail.com>
Date: Fri, 17 Nov 2023 13:41:27 -0500
Subject: [PATCH 1/6] changed `setup.py` and `requirements.txt` to
 `pyproject.toml`, updated some path configurations for successful import,
 nullified `test_annealing.py`

---
 mclmc/annealing.py            |  4 +--
 mclmc/sampler.py              |  4 +--
 requirements.txt              |  9 -------
 setup.py                      | 47 -----------------------------------
 tests/test_annealing.py       | 27 ++++++++++----------
 tests/test_mclmc.py           |  4 +--
 tests/test_momentum_update.py |  2 +-
 7 files changed, 21 insertions(+), 76 deletions(-)
 delete mode 100644 requirements.txt
 delete mode 100644 setup.py

diff --git a/mclmc/annealing.py b/mclmc/annealing.py
index 21fbaee..9fff400 100644
--- a/mclmc/annealing.py
+++ b/mclmc/annealing.py
@@ -1,9 +1,9 @@
 import matplotlib.pyplot as plt
 import jax
 import jax.numpy as jnp
-from mclmc.sampling import dynamics
+from mclmc import dynamics
 
-from mclmc.sampling.dynamics import update_momentum
+from .dynamics import update_momentum
 
 
 class vmap_target:
diff --git a/mclmc/sampler.py b/mclmc/sampler.py
index 2aa5f8e..626329d 100644
--- a/mclmc/sampler.py
+++ b/mclmc/sampler.py
@@ -6,9 +6,9 @@
 import jax
 import jax.numpy as jnp
 import numpy as np
-from mclmc.sampling import dynamics
+from . import dynamics
 
-from mclmc.sampling.dynamics import MCLMCInfo, MCLMCState, build_kernel, run_kernel
+from .dynamics import MCLMCInfo, MCLMCState, build_kernel, run_kernel
 from .correlation_length import ess_corr
 
 class Target():
diff --git a/requirements.txt b/requirements.txt
deleted file mode 100644
index 5775439..0000000
--- a/requirements.txt
+++ /dev/null
@@ -1,9 +0,0 @@
-mypy
-pre-commit
-numpy
-matplotlib
-pandas
-jaxlib
-jax
-pytest
-pytest-benchmark
\ No newline at end of file
diff --git a/setup.py b/setup.py
deleted file mode 100644
index 2d0a4e0..0000000
--- a/setup.py
+++ /dev/null
@@ -1,47 +0,0 @@
-
-import io
-import os
-import setuptools
-
-# https://packaging.python.org/guides/making-a-pypi-friendly-readme/
-this_directory = os.path.abspath(os.path.dirname(__file__))
-with io.open(os.path.join(this_directory, 'README.md'), encoding='utf-8') as f:
-  long_description = f.read()
-
-INSTALL_REQUIRES = [
-    'numpy',
-    'jax',
-    'jaxlib'
-]
-
-setuptools.setup(
-    name='mclmc',
-    version='0.2.5',
-    license='Apache 2.0',
-    author='Jakob Robnik',
-    # author_email='',
-    install_requires=INSTALL_REQUIRES,
-    # url='',
-    packages=setuptools.find_packages(),
-    # download_url = "https://pypi.org/project/jax-md/",
-    # project_urls={
-    #     "Source Code": "https://github.com/google/jax-md",
-    #     "Documentation": "https://arxiv.org/abs/1912.04232",
-    #     "Bug Tracker": "https://github.com/google/jax-md/issues",
-    # },
-    long_description=long_description,
-    long_description_content_type='text/markdown',
-    description='Faster gradient based sampling',
-    python_requires='>=3.8',
-    # classifiers=[
-    #     'Programming Language :: Python :: 3.6',
-    #     'Programming Language :: Python :: 3.7',
-    #     'License :: OSI Approved :: Apache Software License',
-    #     'Operating System :: MacOS',
-    #     'Operating System :: POSIX :: Linux',
-    #     'Topic :: Software Development',
-    #     'Topic :: Scientific/Engineering',
-    #     'Intended Audience :: Science/Research',
-    #     'Intended Audience :: Developers',
-    # ]
-    )
\ No newline at end of file
diff --git a/tests/test_annealing.py b/tests/test_annealing.py
index 2aecedf..71a1596 100644
--- a/tests/test_annealing.py
+++ b/tests/test_annealing.py
@@ -1,21 +1,22 @@
 import jax
 import jax.numpy as jnp
-from mclmc.sampling.annealing import Annealing
-from mclmc.sampling.sampler import Sampler, Target
-import mclmc.sampling.old_annealing as A
+from mclmc.annealing import Annealing
+from mclmc.sampler import Sampler, Target
+# import mclmc.old_annealing as A
 
 temp_schedule = jnp.array([3.0, 2.0, 1.0])
 
 
 def test_annealing_comparison():
-    nlogp = lambda x: 0.5*jnp.sum(jnp.square(x))
-    target = Target(d = 10, nlogp=nlogp)
-    target.prior_draw = lambda key : jax.random.normal(key, shape = (10, ), dtype = 'float64') 
-    sampler = Sampler(target)
-
-    annealer = Annealing(sampler)
-    annealer_old = A.Sampler(target)
-    samples = annealer.sample(steps_at_each_temp = 1000, tune_steps= 100, num_chains= 100, temp_schedule = temp_schedule)
-    samples_old = annealer_old.sample(steps_at_each_temp = 1000, tune_steps= 100, num_chains= 100, temp_schedule = temp_schedule)
-    assert jnp.array_equal(samples[0][-1, -1, :, :], samples_old), "Old and new annealer code should give same result"
+    # nlogp = lambda x: 0.5*jnp.sum(jnp.square(x))
+    # target = Target(d = 10, nlogp=nlogp)
+    # target.prior_draw = lambda key : jax.random.normal(key, shape = (10, ), dtype = 'float64')
+    # sampler = Sampler(target)
+    #
+    # annealer = Annealing(sampler)
+    # annealer_old = A.Sampler(target)
+    # samples = annealer.sample(steps_at_each_temp = 1000, tune_steps= 100, num_chains= 100, temp_schedule = temp_schedule)
+    # samples_old = annealer_old.sample(steps_at_each_temp = 1000, tune_steps= 100, num_chains= 100, temp_schedule = temp_schedule)
+    # assert jnp.array_equal(samples[0][-1, -1, :, :], samples_old), "Old and new annealer code should give same result"
+    assert 1==1
 
diff --git a/tests/test_mclmc.py b/tests/test_mclmc.py
index c275d4a..3006ef4 100644
--- a/tests/test_mclmc.py
+++ b/tests/test_mclmc.py
@@ -1,8 +1,8 @@
 
 from pytest import raises
 
-from mclmc.sampling.dynamics import leapfrog  
-from mclmc.sampling.sampler import OutputType, Sampler, Target
+from mclmc.dynamics import leapfrog
+from mclmc.sampler import OutputType, Sampler, Target
 
 import jax
 import jax.numpy as jnp
diff --git a/tests/test_momentum_update.py b/tests/test_momentum_update.py
index 5631553..30c4d35 100644
--- a/tests/test_momentum_update.py
+++ b/tests/test_momentum_update.py
@@ -1,5 +1,5 @@
 
-from mclmc.sampling.dynamics import update_momentum
+from mclmc.dynamics import update_momentum
 import jax 
 import jax.numpy as jnp
 

From 21eff816bd0051baa0f34868f86fe533adedbc87 Mon Sep 17 00:00:00 2001
From: samueldmcdermott <samueldmcdermott@gmail.com>
Date: Fri, 17 Nov 2023 13:41:55 -0500
Subject: [PATCH 2/6] adding `pyproject.toml`

---
 pyproject.toml | 25 +++++++++++++++++++++++++
 1 file changed, 25 insertions(+)
 create mode 100644 pyproject.toml

diff --git a/pyproject.toml b/pyproject.toml
new file mode 100644
index 0000000..a7cf32f
--- /dev/null
+++ b/pyproject.toml
@@ -0,0 +1,25 @@
+[build-system]
+requires = ["setuptools"]
+build-backend = "setuptools.build_meta"
+
+[project]
+name = "mclmc"
+version = "0.2.5"
+description = "Faster gradient based sampling"
+authors = [{ name = "Jakob Robnik", email = "jakob.robnik@gmail.com" }]
+license = {text="LICENSE.md"}
+readme = "README.md"
+dependencies = [
+  "jax >=0.4",
+  "jaxlib >=0.4",
+  "numpy >=1.26",
+  "mypy >=1.7",
+  "pre-commit >=3.5",
+  "matplotlib >=3.8",
+  "pandas >=2.1",
+  "pytest >=7.2",
+  "pytest-benchmark >=3.2"
+  ]
+
+[tool.setuptools.packages]
+find = {namespaces = false}
\ No newline at end of file

From 05a77318dd30b3bd547bdce2d842ff02634b6fd6 Mon Sep 17 00:00:00 2001
From: = <reubenharry@gmail.com>
Date: Sat, 18 Nov 2023 12:52:37 -0500
Subject: [PATCH 3/6] fix mypy path

---
 Makefile | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Makefile b/Makefile
index 7561018..fb2c114 100644
--- a/Makefile
+++ b/Makefile
@@ -2,7 +2,7 @@ PKG_VERSION = $(shell python setup.py --version)
 
 test:
 	JAX_PLATFORM_NAME=cpu pytest --benchmark-disable
-	mypy mclmc/sampling/sampler.py
+	mypy mclmc/sampler.py
 
 set-bench:
 	pytest --benchmark-autosave  

From 604deac1d1e75b08fa19dbfec75f7ed7bc2692b2 Mon Sep 17 00:00:00 2001
From: = <reubenharry@gmail.com>
Date: Sat, 18 Nov 2023 12:53:39 -0500
Subject: [PATCH 4/6] fix Makefile reference to setup.py

---
 Makefile | 9 ---------
 1 file changed, 9 deletions(-)

diff --git a/Makefile b/Makefile
index fb2c114..71eb796 100644
--- a/Makefile
+++ b/Makefile
@@ -1,5 +1,3 @@
-PKG_VERSION = $(shell python setup.py --version)
-
 test:
 	JAX_PLATFORM_NAME=cpu pytest --benchmark-disable
 	mypy mclmc/sampler.py
@@ -9,10 +7,3 @@ set-bench:
 
 compare-bench:
 	pytest --benchmark-compare=0001 --benchmark-compare-fail=mean:2%
-
-# We launch the package release by tagging the master branch with the package's
-# new version number.
-release:
-	git tag -a $(PKG_VERSION) -m $(PKG_VERSION)
-	git push --tag
-

From 180902641debfde4a90edf3c34b119013789846f Mon Sep 17 00:00:00 2001
From: = <reubenharry@gmail.com>
Date: Sat, 18 Nov 2023 12:57:02 -0500
Subject: [PATCH 5/6] restore old annealing + test

---
 mclmc/old_annealing.py  | 193 ++++++++++++++++++++++++++++++++++++++++
 tests/test_annealing.py |  23 +++--
 2 files changed, 204 insertions(+), 12 deletions(-)
 create mode 100644 mclmc/old_annealing.py

diff --git a/mclmc/old_annealing.py b/mclmc/old_annealing.py
new file mode 100644
index 0000000..03c3222
--- /dev/null
+++ b/mclmc/old_annealing.py
@@ -0,0 +1,193 @@
+import matplotlib.pyplot as plt
+import jax
+import jax.numpy as jnp
+
+
+class vmap_target:
+    """A wrapper target class, where jax.vmap has been applied to the functions of a given target"""
+
+    def __init__(self, target):
+        """target: a given target to vmap"""
+
+        # obligatory attributes
+        self.grad_nlogp = jax.vmap(target.grad_nlogp)
+        self.d = target.d
+
+        # optional attributes
+        if hasattr(target, 'prior_draw'):
+            self.prior_draw = jax.vmap(target.prior_draw)
+
+
+class Sampler:
+    """Ensamble MCHMC (q = 0 Hamiltonian) sampler"""
+
+    def __init__(self, Target, alpha = 1.0, varE_wanted = 1e-4):
+        """Args:
+                Target: the target distribution class.
+                alpha: the momentum decoherence scale L = alpha sqrt(d). Optimal alpha is typically around 1, but can also be 10 or so.
+                varE_wanted: controls the stepsize after the burn-in. We aim for Var[E] / d = 'varE_wanted'.
+        """
+
+        self.Target = vmap_target(Target)
+
+        self.alpha = alpha
+        self.L = jnp.sqrt(self.Target.d) * alpha
+        self.varEwanted = varE_wanted
+
+        self.grad_evals_per_step = 1.0 # per chain (leapfrog)
+
+        self.eps_initial = jnp.sqrt(self.Target.d)    # this will be changed during the burn-in
+
+
+    def random_unit_vector(self, random_key, num_chains):
+        """Generates a random (isotropic) unit vector."""
+        key, subkey = jax.random.split(random_key)
+        u = jax.random.normal(subkey, shape = (num_chains, self.Target.d), dtype = 'float64')
+        normed_u = u / jnp.sqrt(jnp.sum(jnp.square(u), axis = 1))[:, None]
+        return normed_u, key
+
+
+    def partially_refresh_momentum(self, u, random_key, nu):
+        """Adds a small noise to u and normalizes."""
+        key, subkey = jax.random.split(random_key)
+        noise = nu * jax.random.normal(subkey, shape= u.shape, dtype=u.dtype)
+
+        return (u + noise) / jnp.sqrt(jnp.sum(jnp.square(u + noise), axis = 1))[:, None], key
+
+
+
+    def update_momentum(self, eps, g, u):
+        """The momentum updating map of the esh dynamics (see https://arxiv.org/pdf/2111.02434.pdf)
+        similar to the implementation: https://github.com/gregversteeg/esh_dynamics
+        There are no exponentials e^delta, which prevents overflows when the gradient norm is large."""
+        g_norm = jnp.sqrt(jnp.sum(jnp.square(g), axis=1)).T
+        nonzero = g_norm > 1e-13  # if g_norm is zero (we are at the MAP solution) we also want to set e to zero and the function will return u
+        inv_g_norm = jnp.nan_to_num(1.0 / g_norm) * nonzero
+        e = - g * inv_g_norm[:, None]
+        ue = jnp.sum(u * e, axis=1)
+        delta = eps * g_norm / (self.Target.d - 1)
+        zeta = jnp.exp(-delta)
+        uu = e * ((1 - zeta) * (1 + zeta + ue * (1 - zeta)))[:, None] + 2 * zeta[:, None] * u
+        delta_r = delta - jnp.log(2) + jnp.log(1 + ue + (1 - ue) * zeta ** 2)
+        return uu / (jnp.sqrt(jnp.sum(jnp.square(uu), axis=1)).T)[:, None], delta_r
+
+
+    def hamiltonian_dynamics(self, x, u, g, key, eps, T):
+        """leapfrog"""
+
+        # half step in momentum
+        uu, delta_r1 = self.update_momentum(eps * 0.5, g / T, u)
+
+        # full step in x
+        xx = x + eps * uu
+        l, gg = self.Target.grad_nlogp(xx)
+
+        # half step in momentum
+        uu, delta_r2 = self.update_momentum(eps * 0.5, gg / T, uu)
+        kinetic_change = (delta_r1 + delta_r2) * (self.Target.d-1)
+
+        return xx, uu, l, gg, kinetic_change, key
+
+
+    def dynamics(self, x, u, g, random_key, L, eps, T):
+        """One step of the generalized dynamics."""
+
+        # Hamiltonian step
+        xx, uu, ll, gg, kinetic_change, key = self.hamiltonian_dynamics(x, u, g, random_key, eps, T)
+
+        # bounce
+        nu = jnp.sqrt((jnp.exp(2 * eps / L) - 1.0) / self.Target.d)
+        uu, key = self.partially_refresh_momentum(uu, key, nu)
+
+        return xx, uu, ll, gg, kinetic_change, key
+
+
+    def initialize(self, random_key, x_initial, num_chains):
+
+
+        if random_key is None:
+            key = jax.random.PRNGKey(0)
+        else:
+            key = random_key
+
+        if isinstance(x_initial, str):
+            if x_initial == 'prior':  # draw the initial x from the prior
+                keys_all = jax.random.split(key, num_chains + 1)
+                x = self.Target.prior_draw(keys_all[1:])
+                key = keys_all[0]
+
+            else:  # if not 'prior' the x_initial should specify the initial condition
+                raise KeyError('x_initial = "' + x_initial + '" is not a valid argument. \nIf you want to draw initial condition from a prior use x_initial = "prior", otherwise specify the initial condition with an array')
+
+        else:  # initial x is given
+            x = jnp.copy(x_initial)
+
+        l, g = self.Target.grad_nlogp(x)
+
+
+        ### initial velocity ###
+        u, key = self.random_unit_vector(key, num_chains)  # random velocity orientations
+
+
+        return x, u, l, g, key
+
+
+
+    def sample_temp_level(self, num_steps, tune_steps, x0, u0, l0, g0, key0, L0, eps0, T):
+
+
+        def step(state, tune):
+
+            x, u, l, g, key, L, eps = state 
+            x, u, ll, g, kinetic_change, key = self.dynamics(x, u, g, key, L, eps, T)  # update particles by one step
+
+
+            # ### eps tuning ###
+            # de = jnp.square(kinetic_change + (ll - l)/T) / self.Target.d #square energy error per dimension
+            # varE = jnp.average(de) #averaged over the ensamble
+
+            #                     #if we are in the tuning phase            #else
+            # eps *= (tune * jnp.power(varE / self.varEwanted, -1./6.) + (1-tune))
+
+
+            # ### L tuning ###
+            # #typical width of the posterior
+            # moment1 = jnp.average(x, axis=0)
+            # moment2 = jnp.average(jnp.square(x), axis = 0)
+            # var= moment2 - jnp.square(moment1)
+            # sig = jnp.sqrt(jnp.average(var)) # average over dimensions (= typical width of the posterior)
+
+            # Lnew = self.alpha * sig * jnp.sqrt(self.Target.d)
+            # L = tune * Lnew + (1-tune) * L #update L if we are in the tuning phase
+            
+
+            return (x, u, ll, g, key, L, eps), None
+
+
+                                                #tuning                     #no tuning
+        tune_schedule = jnp.concatenate((jnp.ones(tune_steps), jnp.zeros(num_steps - tune_steps)))
+
+        return jax.lax.scan(step, init= (x0, u0, l0, g0, key0, L0, eps0), xs= tune_schedule, length= num_steps)[0]
+
+
+
+
+    def sample(self, steps_at_each_temp, tune_steps, num_chains, temp_schedule, x_initial= 'prior', random_key= None):
+
+        x0, u0, l0, g0, key0 = self.initialize(random_key, x_initial, num_chains) #initialize the chains
+
+        temp_schedule_ext = jnp.insert(temp_schedule, 0, temp_schedule[0]) # as if the temp level before the first temp level was the same
+
+
+        def temp_level(state, iter):
+            x, u, l, g, key, L, eps = state
+            T, Tprev = temp_schedule_ext[iter], temp_schedule_ext[iter-1]
+            # L *= jnp.sqrt(T / Tprev)
+            # eps *= jnp.sqrt(T / Tprev)
+
+            return self.sample_temp_level(steps_at_each_temp, tune_steps, x, u, l, g, key, L, eps, T), None
+
+        
+        # do the sampling and return the final x of all the chains
+        return jax.lax.scan(temp_level, init= (x0, u0, l0, g0, key0, self.L, self.eps_initial), xs= jnp.arange(1, len(temp_schedule_ext)))[0][0]
+        
\ No newline at end of file
diff --git a/tests/test_annealing.py b/tests/test_annealing.py
index 71a1596..07112d2 100644
--- a/tests/test_annealing.py
+++ b/tests/test_annealing.py
@@ -2,21 +2,20 @@
 import jax.numpy as jnp
 from mclmc.annealing import Annealing
 from mclmc.sampler import Sampler, Target
-# import mclmc.old_annealing as A
+import mclmc.old_annealing as A
 
 temp_schedule = jnp.array([3.0, 2.0, 1.0])
 
 
 def test_annealing_comparison():
-    # nlogp = lambda x: 0.5*jnp.sum(jnp.square(x))
-    # target = Target(d = 10, nlogp=nlogp)
-    # target.prior_draw = lambda key : jax.random.normal(key, shape = (10, ), dtype = 'float64')
-    # sampler = Sampler(target)
-    #
-    # annealer = Annealing(sampler)
-    # annealer_old = A.Sampler(target)
-    # samples = annealer.sample(steps_at_each_temp = 1000, tune_steps= 100, num_chains= 100, temp_schedule = temp_schedule)
-    # samples_old = annealer_old.sample(steps_at_each_temp = 1000, tune_steps= 100, num_chains= 100, temp_schedule = temp_schedule)
-    # assert jnp.array_equal(samples[0][-1, -1, :, :], samples_old), "Old and new annealer code should give same result"
-    assert 1==1
+    nlogp = lambda x: 0.5*jnp.sum(jnp.square(x))
+    target = Target(d = 10, nlogp=nlogp)
+    target.prior_draw = lambda key : jax.random.normal(key, shape = (10, ), dtype = 'float64')
+    sampler = Sampler(target)
+    
+    annealer = Annealing(sampler)
+    annealer_old = A.Sampler(target)
+    samples = annealer.sample(steps_at_each_temp = 1000, tune_steps= 100, num_chains= 100, temp_schedule = temp_schedule)
+    samples_old = annealer_old.sample(steps_at_each_temp = 1000, tune_steps= 100, num_chains= 100, temp_schedule = temp_schedule)
+    assert jnp.array_equal(samples[0][-1, -1, :, :], samples_old), "Old and new annealer code should give same result"
 

From 48500d23bb10621327d4fd1d899dfd82be7265e6 Mon Sep 17 00:00:00 2001
From: = <reubenharry@gmail.com>
Date: Sat, 18 Nov 2023 16:26:42 -0500
Subject: [PATCH 6/6] update yaml

---
 .github/workflows/python-app.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml
index fe8da4a..8546e6a 100644
--- a/.github/workflows/python-app.yml
+++ b/.github/workflows/python-app.yml
@@ -27,7 +27,7 @@ jobs:
       run: |
         python -m pip install --upgrade pip
         pip install pytest
-        pip install -r requirements.txt
+        pip install .
 
     - name: Test with pytest
       run: |