├── poetry.toml ├── docs ├── assets │ └── iclogo.png ├── index.md ├── .icons │ └── logos │ │ └── iclogo.svg └── 5-Parallel-Euler-Maruyama-Class.ipynb ├── requirements.txt ├── src └── euler_maruyama │ ├── __init__.py │ ├── plotting.py │ ├── parallel_euler_maruyama.py │ ├── coefficients.py │ └── euler_maruyama.py ├── .github └── workflows │ ├── docs.yml │ └── tests_workflow.yaml ├── .gitignore ├── pyproject.toml ├── LICENSE.md ├── tests ├── test_coefficients.py ├── test_parallel_euler_maruyama.py └── test_euler_maruyama.py ├── mkdocs.yml └── README.md /poetry.toml: -------------------------------------------------------------------------------- 1 | [virtualenvs] 2 | in-project = true -------------------------------------------------------------------------------- /docs/assets/iclogo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ImperialCollegeLondon/ReCoDe-Euler-Maruyama/HEAD/docs/assets/iclogo.png -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | 2 | mkdocs-jupyter==0.21.0 3 | mkdocs==1.3.0 4 | mkdocs-material==8.3.9 5 | python-markdown-math==0.8 6 | mkdocs-include-markdown-plugin==3.5.2 7 | poetry 8 | numpy 9 | matplotlib 10 | jupyter 11 | joblib 12 | -------------------------------------------------------------------------------- /src/euler_maruyama/__init__.py: -------------------------------------------------------------------------------- 1 | from .coefficients import ( 2 | ConstantDiffusion, 3 | LinearDrift, 4 | MeanReversionDrift, 5 | MultiplicativeNoiseDiffusion, 6 | ) 7 | from .euler_maruyama import EulerMaruyama 8 | from .parallel_euler_maruyama import ParallelEulerMaruyama 9 | from .plotting import plot_approximation 10 | -------------------------------------------------------------------------------- /docs/index.md: 
-------------------------------------------------------------------------------- 1 | 7 | 8 | {% 9 | include-markdown "../README.md" 10 | 11 | %} 12 | 13 | 15 | -------------------------------------------------------------------------------- /.github/workflows/docs.yml: -------------------------------------------------------------------------------- 1 | name: docs 2 | on: 3 | push: 4 | branches: 5 | - main 6 | - gnikit/changes 7 | jobs: 8 | deploy: 9 | name: Deploy Mkdocs to gh-pages branch 10 | runs-on: ubuntu-latest 11 | steps: 12 | - uses: actions/checkout@v2 13 | - uses: actions/setup-python@v2 14 | with: 15 | python-version: 3.x 16 | - name: Install dependencies 17 | run: pip install -r requirements.txt 18 | - name: Deploy Mkdocs 19 | run: mkdocs gh-deploy --force 20 | -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- 1 | # Byte-compiled / optimized / DLL files 2 | __pycache__/ 3 | *.py[cod] 4 | *$py.class 5 | 6 | # C extensions 7 | *.so 8 | 9 | # Distribution / packaging 10 | .Python 11 | env/ 12 | .venv/ 13 | .idea/ 14 | build/ 15 | develop-eggs/ 16 | dist/ 17 | downloads/ 18 | eggs/ 19 | .eggs/ 20 | lib/ 21 | lib64/ 22 | parts/ 23 | sdist/ 24 | var/ 25 | *.egg-info/ 26 | .installed.cfg 27 | *.egg 28 | *dist/ 29 | pip-wheel-metadata/ 30 | .python-version 31 | 32 | # Installer logs 33 | pip-log.txt 34 | pip-delete-this-directory.txt 35 | 36 | # Unit test / coverage reports 37 | htmlcov/ 38 | .tox/ 39 | .coverage_report/ 40 | .coverage.* 41 | .coverage 42 | .cache 43 | nosetests.xml 44 | coverage.xml 45 | *,cover 46 | .pytest_cache/ 47 | .mypy_cache/ 48 | .ruff_cache/ 49 | .test_report/ 50 | test-results/ 51 | 52 | ## Docs 53 | docs/_build/ 54 | site/ 55 | -------------------------------------------------------------------------------- /src/euler_maruyama/plotting.py: 
def plot_approximation(Y: np.ndarray, t: np.ndarray, title: str) -> None:
    """Draw every simulated Euler-Maruyama trajectory on a single figure.

    Parameters
    ----------
    Y: np.ndarray
        Simulated trajectories, shape = (number of simulations, number of steps).

    t: np.ndarray
        Time grid shared by all trajectories, shape = (number of steps, ).

    title: str
        Text displayed as the figure title.
    """
    _, axes = plt.subplots(figsize=(7, 5))

    # Y is transposed so that time runs along the first axis and each column
    # (one simulation) is drawn as its own semi-transparent line.
    trajectories = Y.T
    axes.plot(t, trajectories, alpha=0.3)

    axes.set_title(title)
    axes.set_xlabel(r"$t$")
    axes.set_ylabel(r"$Y_t$")

    plt.show()
5 | authors = [ 6 | "Antonio Malpica ", 7 | "Chris Cooling " 8 | ] 9 | readme = "README.md" 10 | packages = [{include = "euler_maruyama", from = "src"}] 11 | 12 | [tool.poetry.dependencies] 13 | python = "^3.9" 14 | numpy = "^1.24.3" 15 | matplotlib = "^3.7.1" 16 | jupyter = "^1.0.0" 17 | joblib = "^1.2.0" 18 | 19 | [tool.poetry.group.dev] 20 | optional = true 21 | 22 | [tool.poetry.group.dev.dependencies] 23 | black = {version = "22.10.*", allow-prereleases = true} 24 | isort = "5.12.*" 25 | pytest = "^7.4.0" 26 | pytest-html = "^3.2.0" 27 | 28 | 29 | [build-system] 30 | requires = ["poetry-core"] 31 | build-backend = "poetry.core.masonry.api" 32 | -------------------------------------------------------------------------------- /.github/workflows/tests_workflow.yaml: -------------------------------------------------------------------------------- 1 | name: test - workflow 2 | 3 | on: 4 | push: 5 | branches: [main] 6 | paths: 7 | - 'src/**' 8 | - 'tests/**' 9 | - 'pyproject.toml' 10 | 11 | jobs: 12 | tests: 13 | name: Test (${{ matrix.python }}) 14 | runs-on: ubuntu-latest 15 | strategy: 16 | matrix: 17 | python: [ "3.9", "3.10", "3.11" ] 18 | container: 19 | image: python:${{ matrix.python }} 20 | steps: 21 | - name: Checkout 22 | uses: actions/checkout@v3 23 | with: 24 | path: main 25 | - name: Install poetry 26 | working-directory: ./main 27 | run: | 28 | pip install pip poetry --upgrade 29 | poetry install --with dev 30 | - name: Code format checking 31 | working-directory: ./main 32 | run: poetry run black . 33 | - name: Imports order checking 34 | working-directory: ./main 35 | run: poetry run isort . 
36 | - name: Tests 37 | working-directory: ./main 38 | run: poetry run pytest tests/ -vv 39 | -------------------------------------------------------------------------------- /LICENSE.md: -------------------------------------------------------------------------------- 1 | BSD 3-Clause License 2 | 3 | Copyright (c) 2022, Imperial College London 4 | All rights reserved. 5 | 6 | Redistribution and use in source and binary forms, with or without 7 | modification, are permitted provided that the following conditions are met: 8 | 9 | 1. Redistributions of source code must retain the above copyright notice, this 10 | list of conditions and the following disclaimer. 11 | 12 | 2. Redistributions in binary form must reproduce the above copyright notice, 13 | this list of conditions and the following disclaimer in the documentation 14 | and/or other materials provided with the distribution. 15 | 16 | 3. Neither the name of the copyright holder nor the names of its 17 | contributors may be used to endorse or promote products derived from 18 | this software without specific prior written permission. 19 | 20 | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" 21 | AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 22 | IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE 23 | DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE 24 | FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 25 | DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR 26 | SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER 27 | CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, 28 | OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 29 | OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
@pytest.fixture(scope="module")
def X_input():
    """Random column of 20 X_t samples shared by every test in this module."""
    return np.random.randn(20, 1)


@pytest.fixture(scope="module")
def t_input():
    """Time value shared by every test in this module."""
    return 10


def test_LinearDrift(X_input, t_input):
    """LinearDrift returns a*t for every sample, whatever the value of X."""
    a = 2.5
    drift = LinearDrift(a=a)

    expected_output = np.ones_like(X_input) * t_input * a
    output = drift.get_value(X=X_input, t=t_input)

    np.testing.assert_array_equal(output, expected_output)


def test_MeanReversionDrift(X_input, t_input):
    """MeanReversionDrift returns theta*(mean - X) element-wise."""
    theta, mean = 0.2, 1
    drift = MeanReversionDrift(theta=theta, mean=mean)

    expected_output = theta * (mean - X_input)
    output = drift.get_value(X=X_input, t=t_input)

    np.testing.assert_array_equal(output, expected_output)


def test_ConstantDiffusion(X_input, t_input):
    """ConstantDiffusion returns b for every sample."""
    b = 0.1
    diffusion = ConstantDiffusion(b=b)

    expected_output = np.ones_like(X_input) * b
    output = diffusion.get_value(X=X_input, t=t_input)

    np.testing.assert_array_equal(output, expected_output)


def test_MultiplicativeNoiseDiffusion(X_input, t_input):
    """MultiplicativeNoiseDiffusion returns b*X element-wise."""
    b = 0.5
    diffusion = MultiplicativeNoiseDiffusion(b=b)

    expected_output = X_input * b
    output = diffusion.get_value(X=X_input, t=t_input)

    np.testing.assert_array_equal(output, expected_output)
-------------------------------------------------------------------------------- /mkdocs.yml: -------------------------------------------------------------------------------- 1 | site_name: ReCoDE Euler-Maruyama 2 | 3 | # Steps to follow on GitHub to publish your mkdocs site: 4 | # 1. Create a new branch called gh-pages 5 | # 2. Ensure GitHub Pages is enabled for your repository, Settings>Pages> Enable. 6 | # Make sure that Source is set to `gh-pages` and `/(root)`. Save this setting. 7 | # 3. Ensure that on GitHub workflows have read and write access to your repository 8 | # Settings>Actions>General>Workflow permissions, tick `Read and write permissions` 9 | # and save this setting. 10 | # Change this to the name of your repo 11 | repo_url: https://github.com/ImperialCollegeLondon/ReCoDe-Euler-Maruyama 12 | edit_uri: tree/main/docs/ 13 | 14 | theme: 15 | name: material 16 | custom_dir: docs 17 | 18 | icon: 19 | logo: logos/iclogo 20 | favicon: assets/iclogo.png 21 | font: 22 | text: Roboto 23 | code: Roboto Mono 24 | palette: 25 | - scheme: default 26 | toggle: 27 | icon: material/toggle-switch 28 | name: Switch to dark mode 29 | - scheme: slate 30 | toggle: 31 | icon: material/toggle-switch-off-outline 32 | name: Switch to light mode 33 | 34 | # SPA behaviour 35 | features: 36 | - navigation.instant 37 | - navigation.top 38 | - toc.follow 39 | - content.code.annotate 40 | extra: 41 | homepage: https://imperialcollegelondon.github.io/ReCoDE-home/ 42 | 43 | # Add here all the plugins you want to use. 44 | # Don't forget to add them in requirements.txt as well. 
45 | plugins: 46 | - tags 47 | - search 48 | - include-markdown # https://github.com/mondeja/mkdocs-include-markdown-plugin 49 | - mkdocs-jupyter 50 | 51 | # Set settings for markdown extensions 52 | markdown_extensions: 53 | - meta 54 | - mdx_math: 55 | enable_dollar_delimiter: True 56 | - pymdownx.highlight: 57 | anchor_linenums: false 58 | - pymdownx.inlinehilite 59 | - pymdownx.snippets 60 | - pymdownx.superfences 61 | 62 | # Render math in mkdocs 63 | extra_javascript: 64 | - https://cdn.mathjax.org/mathjax/latest/MathJax.js?config=TeX-AMS_HTML 65 | -------------------------------------------------------------------------------- /tests/test_parallel_euler_maruyama.py: -------------------------------------------------------------------------------- 1 | import numpy as np 2 | import pytest 3 | 4 | from euler_maruyama import ConstantDiffusion, LinearDrift, ParallelEulerMaruyama 5 | 6 | 7 | @pytest.fixture(scope="function") 8 | def parallel_em(): 9 | 10 | linear_drift = LinearDrift(a=2) 11 | constant_diffusion = ConstantDiffusion(b=0.5) 12 | 13 | em = ParallelEulerMaruyama( 14 | t_0=0, 15 | t_n=2, 16 | n_steps=500, 17 | X_0=1.0, 18 | drift=linear_drift, 19 | diffusion=constant_diffusion, 20 | n_sim=1000, 21 | n_jobs=4, 22 | ) 23 | 24 | return em 25 | 26 | 27 | def test_n_jobs(parallel_em): 28 | 29 | assert parallel_em.n_jobs == 4 30 | 31 | parallel_em.n_jobs = 2 32 | assert parallel_em.n_jobs == 2 33 | 34 | with pytest.raises(ValueError) as ex_info: 35 | parallel_em.n_jobs = -5 36 | 37 | assert ex_info.value.args[0] == "Number of batches must be positive." 
def test_num_sim_batch(parallel_em):
    """Check how the simulations are split into per-job batches.

    When the split is uneven, the batches of size ``n_sim // n_jobs`` come
    first and the ``n_sim % n_jobs`` batches holding one extra simulation
    come last.
    """
    batches = parallel_em._num_sim_batch()

    assert batches == [250] * 4

    parallel_em.n_jobs = 3

    new_batches = parallel_em._num_sim_batch()

    assert new_batches == [333] * (3 - 1) + [334] * 1

    parallel_em.n_jobs = 7

    new_batches_2 = parallel_em._num_sim_batch()

    assert new_batches_2 == [142] * (7 - 6) + [143] * 6


def test_numerical_approximation(parallel_em):
    """Check shape, initial condition and terminal moments of the parallel solution.

    For dX_t = a*t dt + b dW_t the exact terminal moments are
    E[X_T] = X_0 + a*(T^2 - t_0^2)/2 and Std[X_T] = b*sqrt(T - t_0).
    """
    Y = parallel_em.compute_numerical_approximation()

    assert Y.shape == (parallel_em.n_sim, parallel_em.n_steps + 1)

    expected_Y_0 = np.ones(parallel_em.n_sim) * parallel_em._X_0
    np.testing.assert_array_equal(Y[:, 0], expected_Y_0)

    # Read the parameters from the solver instead of hard-coding them, so the
    # expectations stay valid if the fixture changes.
    a = parallel_em._drift.a
    b = parallel_em._diffusion.b
    t_0, t_n = parallel_em._t_0, parallel_em._t_n

    # The drift a*t is integrated over [t_0, t_n]. A shortcut such as
    # "t_n * 2" only matches this for a = 2, t_0 = 0 and t_n = 2.
    expected_mean_Y_t = parallel_em._X_0 + a * (t_n**2 - t_0**2) / 2
    mean_Y_t = np.mean(Y[:, -1])
    assert expected_mean_Y_t == pytest.approx(mean_Y_t, 0.1)

    expected_std_Y_t = b * np.sqrt(t_n - t_0)
    std_Y_t = np.std(Y[:, -1])
    assert expected_std_Y_t == pytest.approx(std_Y_t, 0.1)


@pytest.fixture(scope="function")
def em():
    """Build a fresh serial solver (linear drift, constant diffusion) for each test."""
    linear_drift = LinearDrift(a=2)
    constant_diffusion = ConstantDiffusion(b=0.5)

    em = EulerMaruyama(
        t_0=0,
        t_n=2,
        n_steps=500,
        X_0=1.0,
        drift=linear_drift,
        diffusion=constant_diffusion,
        n_sim=1000,
    )

    return em


def test_discretisation(em):
    """The time grid and step must match ``np.linspace`` over [t_0, t_n]."""
    expected_t, expected_delta = np.linspace(
        em._t_0, em._t_n, em.n_steps + 1, retstep=True
    )
    np.testing.assert_array_equal(em.t, expected_t)
    assert em.delta == expected_delta
def test_n_sim(em):
    """The ``n_sim`` property can be read and updated, and rejects negative values."""
    assert em.n_sim == 1000

    em.n_sim = 10

    assert em.n_sim == 10

    with pytest.raises(ValueError) as ex_info:
        em.n_sim = -10

    assert ex_info.value.args[0] == "Number of simulations must be positive."


def test_n_steps(em):
    """Changing ``n_steps`` must also refresh the time grid and the step length."""
    assert em.n_steps == 500

    em.n_steps = 10

    assert em.n_steps == 10
    expected_t, expected_delta = np.linspace(em._t_0, em._t_n, 10 + 1, retstep=True)
    np.testing.assert_array_equal(em.t, expected_t)
    assert em.delta == expected_delta


def test_allocate_Y(em):
    """The allocated array has one row per simulation and starts at X_0."""
    Y = em._allocate_Y(dim=em.n_sim)

    assert Y.shape == (em.n_sim, em.n_steps + 1)

    expected_Y_0 = np.ones(em.n_sim) * em._X_0
    np.testing.assert_array_equal(Y[:, 0], expected_Y_0)


def test_numerical_approximation(em):
    """Check shape, initial condition and terminal moments of the solution.

    For dX_t = a*t dt + b dW_t the exact terminal moments are
    E[X_T] = X_0 + a*(T^2 - t_0^2)/2 and Std[X_T] = b*sqrt(T - t_0).
    """
    Y = em.compute_numerical_approximation()

    assert Y.shape == (em.n_sim, em.n_steps + 1)

    expected_Y_0 = np.ones(em.n_sim) * em._X_0
    np.testing.assert_array_equal(Y[:, 0], expected_Y_0)

    # Read the parameters from the solver instead of hard-coding them, so the
    # expectations stay valid if the fixture changes.
    a = em._drift.a
    b = em._diffusion.b
    t_0, t_n = em._t_0, em._t_n

    # The drift a*t is integrated over [t_0, t_n]. A shortcut such as
    # "t_n * 2" only matches this for a = 2, t_0 = 0 and t_n = 2.
    expected_mean_Y_t = em._X_0 + a * (t_n**2 - t_0**2) / 2
    mean_Y_t = np.mean(Y[:, -1])
    assert expected_mean_Y_t == pytest.approx(mean_Y_t, 0.1)

    expected_std_Y_t = b * np.sqrt(t_n - t_0)
    std_Y_t = np.std(Y[:, -1])
    assert expected_std_Y_t == pytest.approx(std_Y_t, 0.1)
class ParallelEulerMaruyama(EulerMaruyama):
    """Class to perform the numerical solution of a Stochastic Differential Equation (SDE) through the Euler-Maruyama method
    using parallel computation.

    The simulations are split into ``n_jobs`` batches that are solved
    concurrently with joblib and then stacked into a single array.

    Parameters
    ----------
    t_0: float
        Initial time.

    t_n: float
        Final time.

    n_steps: int
        Number of time steps to discretise the time interval [t_0, t_n].

    X_0: float
        Initial condition of the SDE.

    drift: Coefficient
        Drift (mu) coefficient of the SDE.

    diffusion: Coefficient
        Diffusion (sigma) coefficient of the SDE.

    n_sim: int
        Number of simulated approximations.

    n_jobs: int
        Number of batches to compute in parallel. Must be positive.

    Attributes
    ----------
    _t_0: float
        Initial time.

    _t_n: float
        Final time.

    _n_steps: int
        Number of time steps to discretise the time interval [t_0, t_n].

    _X_0: float
        Initial condition of the SDE.

    _drift: Coefficient
        Drift (mu) coefficient of the SDE.

    _diffusion: Coefficient
        Diffusion (sigma) coefficient of the SDE.

    _n_sim: int
        Number of simulated approximations.

    _n_jobs: int
        Number of batches to compute in parallel.

    delta: float
        Length of the time step.

    t: np.ndarray
        Array containing the time steps values, shape: (n_steps+1,).

    Y: np.ndarray
        Array containing the approximated solution of the SDE, shape: (n_sim, n_steps+1).

    Raises
    ------
    ValueError
        If ``n_jobs`` is not positive.

    Methods
    -------
    compute_numerical_approximation
    """

    def __init__(
        self,
        t_0: float,
        t_n: float,
        n_steps: int,
        X_0: float,
        drift: Coefficient,
        diffusion: Coefficient,
        n_sim: int,
        n_jobs: int,
    ):
        super().__init__(
            t_0=t_0,
            t_n=t_n,
            n_steps=n_steps,
            X_0=X_0,
            drift=drift,
            diffusion=diffusion,
            n_sim=n_sim,
        )
        # Assign through the property setter so that a non-positive n_jobs is
        # rejected here with a clear message. Otherwise n_jobs=0 would only
        # fail later with a ZeroDivisionError in _num_sim_batch, and a negative
        # value would silently produce an empty list of batches.
        self.n_jobs = n_jobs

    @property
    def n_jobs(self) -> int:
        """Number of batches computed in parallel."""
        return self._n_jobs

    @n_jobs.setter
    def n_jobs(self, value: int) -> None:
        """Change the number of batches.

        Parameters
        ----------
        value: int
            Number of batches.

        Raises
        ------
        ValueError
            If ``value`` is not positive.
        """
        if not value > 0:
            raise ValueError("Number of batches must be positive.")
        self._n_jobs = value

    def _num_sim_batch(self) -> list[int]:
        """Calculate the number of simulations within each batch for parallel computation.

        The ``n_sim`` simulations are divided as evenly as possible: the
        ``n_sim % n_jobs`` trailing batches each hold one extra simulation.

        Returns
        -------
        batches: list[int]
            List containing the number of simulations to include in each batch.
        """
        batch_size, remainder = divmod(self._n_sim, self._n_jobs)

        smaller_batches = [batch_size] * (self._n_jobs - remainder)
        larger_batches = [batch_size + 1] * remainder

        return smaller_batches + larger_batches

    def compute_numerical_approximation(self) -> np.ndarray:
        """Compute the EM approximation for all simulated trajectories using parallel computing.

        Each batch is handed to ``_solve_numerical_approximation``, which is
        not defined in this class (presumably inherited from EulerMaruyama).
        The per-batch results are concatenated along the simulation axis.

        Returns
        -------
        Y: np.ndarray
            Array containing the approximated solution of the SDE, shape: (n_sim, n_steps+1).
        """
        batch_sizes = self._num_sim_batch()

        batch_results = Parallel(n_jobs=self._n_jobs)(
            delayed(self._solve_numerical_approximation)(dim=batch_dim)
            for batch_dim in batch_sizes
        )

        # Stack the batches row-wise so that every simulation is one row of Y.
        self.Y = np.concatenate(batch_results, axis=0)

        return self.Y
class Coefficient(ABC):
    """Common interface shared by the drift and diffusion coefficients of an SDE.

    Methods
    -------
    get_value
    plot_X_sample
    plot_t_sample
    """

    def __init__(self):
        pass

    @abstractmethod
    def get_value(self, X: np.ndarray, t: float) -> np.ndarray:
        raise NotImplementedError

    @staticmethod
    def _show_curve(abscissa: np.ndarray, values: np.ndarray, x_label: str) -> None:
        """Plot the coefficient values against the given abscissa and show the figure."""
        _, axes = plt.subplots(figsize=(7, 5))

        axes.plot(abscissa, values)

        axes.set_xlabel(x_label)
        axes.set_ylabel(r"Coefficient value")

        plt.show()

    def plot_X_sample(self) -> None:
        """Plot the coefficient value at t = 0 for 100 values of X between 0 and 10."""
        values = np.zeros(100)
        grid = np.linspace(0, 10, 100)
        # The coefficient is evaluated one sample at a time, each X being
        # wrapped in a 0-d array.
        for idx, x_value in enumerate(grid):
            values[idx] = self.get_value(X=np.array(x_value), t=0)

        self._show_curve(grid, values, r"$X$")

    def plot_t_sample(self) -> None:
        """Plot the coefficient value at X = 1 for 100 values of t between 0 and 1."""
        values = np.zeros(100)
        grid = np.linspace(0, 1, 100)
        for idx, t_value in enumerate(grid):
            values[idx] = self.get_value(X=np.array(1.0), t=t_value)

        self._show_curve(grid, values, r"$t$")


class LinearDrift(Coefficient):
    """Drift that grows linearly in time:

        mu(X_t, t) = a*t

    where a is a real-valued parameter.

    Parameters
    ----------
    a: float
        The linear coefficient of the drift.

    Methods
    -------
    get_value
    """

    def __init__(self, a: float):
        super().__init__()
        self.a = a

    def get_value(self, X: np.ndarray, t: float) -> np.ndarray:
        """Evaluate the linear drift mu(X_t, t) = a*t.

        Parameters
        ----------
        X: np.ndarray
            The X_t values, shape = (number of simulations, )

        t: float
            The time value.

        Returns
        -------
        np.ndarray
            The linear drift coefficient values, shape = (number of simulations, )
        """
        # X only provides the shape of the output; its values are not used.
        ones = np.ones_like(X)
        return ones * self.a * t


class MeanReversionDrift(Coefficient):
    """Drift that pulls the process back towards an equilibrium value:

        mu(X_t, t) = theta*(mean - X_t)

    where theta and mean are real-valued parameters.

    Parameters
    ----------
    theta: float
        The speed of reversion.

    mean: float
        The equilibrium value.

    Methods
    -------
    get_value
    """

    def __init__(self, theta: float, mean: float):
        super().__init__()
        self.theta = theta
        self.mean = mean

    def get_value(self, X: np.ndarray, t: float) -> np.ndarray:
        """Evaluate the mean-reversion drift mu(X_t, t) = theta*(mean - X_t).

        Parameters
        ----------
        X: np.ndarray
            The X_t values, shape = (number of simulations, )

        t: float
            The time value (not used by this coefficient).

        Returns
        -------
        np.ndarray
            The mean-reversion drift coefficient values, shape = (number of simulations, )
        """
        distance_to_mean = self.mean - X
        return self.theta * distance_to_mean


class ConstantDiffusion(Coefficient):
    """Diffusion that is the same for every state and time:

        sigma(X_t, t) = b

    where b is a real-valued parameter.

    Parameters
    ----------
    b: float
        The constant diffusion value.

    Methods
    -------
    get_value
    """

    def __init__(self, b: float):
        super().__init__()
        self.b = b

    def get_value(self, X: np.ndarray, t: float) -> np.ndarray:
        """Evaluate the constant diffusion sigma(X_t, t) = b.

        Parameters
        ----------
        X: np.ndarray
            The X_t values, shape = (number of simulations, )

        t: float
            The time value (not used by this coefficient).

        Returns
        -------
        np.ndarray
            The constant diffusion coefficient values, shape = (number of simulations, )
        """
        # X only provides the shape of the output; its values are not used.
        ones = np.ones_like(X)
        return ones * self.b


class MultiplicativeNoiseDiffusion(Coefficient):
    """Diffusion proportional to the current state:

        sigma(X_t, t) = b*X_t

    where b is a real-valued parameter.

    Parameters
    ----------
    b: float
        The amplitude of the multiplicative noise.

    Methods
    -------
    get_value
    """

    def __init__(self, b: float):
        super().__init__()
        self.b = b

    def get_value(self, X: np.ndarray, t: float) -> np.ndarray:
        """Evaluate the multiplicative noise-like diffusion sigma(X_t, t) = b*X_t.

        Parameters
        ----------
        X: np.ndarray
            The X_t values, shape = (number of simulations, )

        t: float
            The time value (not used by this coefficient).

        Returns
        -------
        np.ndarray
            The multiplicative noise-like diffusion coefficient values, shape = (number of simulations, )
        """
        amplitude = self.b
        return amplitude * X
Being able to numerically solve an SDE 10 | is essential for these fields, especially if there is no closed-form solution. This project provides an 11 | object-oriented implementation of the EM method. Throughout the project, we emphasise the benefits that 12 | class encapsulation provides in terms of code modularity and re-usability. 13 | 14 | ## Learning Outcomes 15 | This project is designed for Master's and Ph.D. students who have basic Python knowledge and need to solve SDEs 16 | for their research projects. After going through this project, students will: 17 | 18 | 1. Understand how to solve an SDE using the EM method. 19 | 2. Learn to encapsulate the EM method code into a Python class. 20 | 3. Explore how to parallelise the code to improve solution speed. 21 | 22 | 23 | ## Requirements 24 | 25 | ### System 26 | 27 | | Program | Version | 28 | |------------------------------------------------------------|---------| 29 | | [Git](https://git-scm.com/) | >= 2.41 | 30 | | [Python](https://www.python.org/downloads/) | >= 3.9 | 31 | 32 | ### Dependencies 33 | 34 | | Packages | Version | 35 | |--------------------------------------------------------|-----------| 36 | | [poetry](https://python-poetry.org/docs/) | >= 1.4.* | 37 | | [numpy](https://numpy.org/doc/stable/) | >= 1.24.* | 38 | | [matplotlib](https://matplotlib.org/stable/index.html) | >= 3.7.* | 39 | | [jupyter](http://jupyter.org/install) | >= 1.0.* | 40 | | [joblib](https://joblib.readthedocs.io/en/stable/) | >= 1.2.* | 41 | 42 | ## Project Structure 43 | ```bash 44 | . 
45 | ├── .github/workflows 46 | │ └── tests_workflow.yaml 47 | ├── docs 48 | │ ├── 1-Introduction.ipynb 49 | │ ├── 2-Probability-Distributions.ipynb 50 | │ ├── 3-Euler-Maruyama-Method.ipynb 51 | │ ├── 4-Euler-Maruyama-Class.ipynb 52 | │ └── 5-Parallel-Euler-Maruyama-Class.ipynb 53 | ├── src 54 | │ └── euler_maruyama 55 | │ ├── __init__.py 56 | │ ├── coefficients.py 57 | │ ├── euler_maruyama.py 58 | │ └── parallel_euler_maruyama.py 59 | ├── tests 60 | │ ├── test_coefficients.py 61 | │ ├── test_euler_maruyama.py 62 | │ └── test_parallel_euler_maruyama.py 63 | ├── .gitignore 64 | ├── poetry.lock 65 | ├── poetry.toml 66 | ├── pyproject.toml 67 | ├── README.md 68 | └── requirements.txt 69 | ``` 70 | 71 | ## Getting Started 72 | 73 | You can read the Jupyter notebooks non-interactively on Github. Click [here](https://github.com/ImperialCollegeLondon/ReCoDe_Euler_Maruyama/tree/main/docs) 74 | to view the collection of Jupyter notebooks located in the ``docs`` folder. However, for an improved experience, we suggest cloning the Github repository and running the Jupyter notebooks on your local 75 | machine. To assist you in setting up the project locally, we provide a list of steps: 76 | 77 | ### 1. Clone the repository 78 | 79 | After installing `git` on your local machine, you can run the following command in a terminal: 80 | 81 | ```bash 82 | git clone https://github.com/ImperialCollegeLondon/ReCoDe_Euler_Maruyama.git euler-maruyama 83 | cd euler-maruyama 84 | ``` 85 | 86 | ### 2. Install poetry 87 | 88 | Once you have downloaded a `Python` version, you need to install `poetry`. 89 | `Poetry` is a dependency management and packaging tool for `Python` projects that simplifies the process of managing dependencies and distributing packages. 90 | It allows you to define project dependencies in a `pyproject.toml` file and provides commands to install, update, and remove dependencies. 
91 | The main advantages of `poetry` include dependency resolution to ensure consistent environments, the management of virtual environments for isolation and simplified package publishing. 92 | It streamlines the development workflow and facilitates collaboration by providing a unified and straightforward approach to managing dependencies in `Python` projects. 93 | You can find more information in its [documentation](https://python-poetry.org/). 94 | Our main focus here is to use `poetry` to install the project and its dependencies locally. 95 | 96 | ```bash 97 | pip install poetry 98 | ``` 99 | 100 | You can check that `poetry` has been successfully installed by running: 101 | 102 | ```bash 103 | poetry --version 104 | Poetry (version 1.4.0) 105 | ``` 106 | 107 | 108 | ### 3. Install the project 109 | 110 | Now, we need to install the project and its requirements. You can run the following command in the folder 111 | where you downloaded the Github repository: 112 | 113 | ```bash 114 | poetry install 115 | ``` 116 | 117 | This command creates a virtual environment in the same folder you are working in, as specified by the 118 | `poetry.toml` configuration file of the project. Then, the package requirements are installed and 119 | finally, the project is installed locally with the name `euler-maruyama` version (0.1.0). 120 | 121 | ### 4. Activate the local environment 122 | 123 | Run the following command to activate the local environment you created in the previous step: 124 | 125 | ```bash 126 | poetry shell 127 | ``` 128 | 129 | ### 5. Launch the Jupyter notebooks 130 | 131 | You can run this command to launch the Jupyter notebook: 132 | 133 | ```bash 134 | jupyter notebook 135 | ``` 136 | 137 | Now, you can explore and experiment with the different notebook examples we have prepared to help you 138 | understand this project. 139 | 140 | ### 6. 
class EulerMaruyama:
    """Numerically solve a Stochastic Differential Equation (SDE) with the Euler-Maruyama method.

    Considering a SDE of the form: dX_t = mu(X_t, t)dt + sigma(X_t, t)dW_t, the solution of this SDE over
    the time interval [t_0, t_n] can be approximated as follows:

        Y_{n+1} = Y_n + mu(Y_n, tau_n)(tau_{n+1} - tau_n) + sigma(Y_n, tau_n)(W_{tau_{n+1}} - W_{tau_n})

    with initial condition Y_0 = X_0 and where the time interval is discretised:

        t_0 = tau_0 < tau_1 < ... < tau_n = t_n

    with Delta_t = tau_{n+1} - tau_n = (t_n - t_0) / n and DeltaW_n = (W_{tau_{n+1}} - W_{tau_n}) ~ N(0, Delta_t)
    because W_t is a Wiener process, so-called Brownian motion.

    Parameters
    ----------
    t_0: float
        Initial time.

    t_n: float
        Final time.

    n_steps: int
        Number of time steps to discretise the time interval [t_0, t_n]. Must be positive.

    X_0: float
        Initial condition of the SDE.

    drift: Coefficient
        Drift (mu) coefficient of the SDE. Only its ``get_value(X=..., t=...)`` method is used.

    diffusion: Coefficient
        Diffusion (sigma) coefficient of the SDE. Only its ``get_value(X=..., t=...)`` method is used.

    n_sim: int
        Number of simulated approximations. Must be positive.

    Raises
    ------
    ValueError
        If ``n_steps`` or ``n_sim`` is not positive (same checks as the property setters).

    Attributes
    ----------
    _t_0: float
        Initial time.

    _t_n: float
        Final time.

    _n_steps: int
        Number of time steps to discretise the time interval [t_0, t_n].

    _X_0: float
        Initial condition of the SDE.

    _drift: Coefficient
        Drift (mu) coefficient of the SDE.

    _diffusion: Coefficient
        Diffusion (sigma) coefficient of the SDE.

    _n_sim: int
        Number of simulated approximations.

    delta: float
        Length of the time step.

    t: np.ndarray
        Array containing the time steps values, shape: (n_steps+1,).

    Y: np.ndarray
        Array containing the approximated solution of the SDE, shape: (n_sim, n_steps+1).
        It is ``None`` until ``compute_numerical_approximation`` has been called.

    Methods
    -------
    compute_numerical_approximation
    """

    def __init__(
        self,
        t_0: float,
        t_n: float,
        n_steps: int,
        X_0: float,
        drift: Coefficient,
        diffusion: Coefficient,
        n_sim: int,
    ):
        self._t_0 = t_0
        self._t_n = t_n

        self._X_0 = X_0

        self._drift = drift
        self._diffusion = diffusion

        self.Y = None

        # Go through the property setters so the constructor enforces the same
        # positivity checks as later re-assignment. The n_steps setter also
        # builds the time grid, so it must run after _t_0 and _t_n are set.
        self.n_sim = n_sim
        self.n_steps = n_steps

    @property
    def n_sim(self):
        """Number of simulated approximations."""
        return self._n_sim

    @n_sim.setter
    def n_sim(self, value: int):
        """Change the number of simulations.

        Parameters
        ----------
        value: int
            Number of simulations.

        Raises
        ------
        ValueError
            If ``value`` is not positive.
        """
        if not value > 0:
            raise ValueError("Number of simulations must be positive.")
        self._n_sim = value

    @property
    def n_steps(self):
        """Number of time steps of the discretisation."""
        return self._n_steps

    @n_steps.setter
    def n_steps(self, value: int):
        """Change the number of time steps attribute and recalculate the discretisation.

        Parameters
        ----------
        value: int
            Number of time steps.

        Raises
        ------
        ValueError
            If ``value`` is not positive.
        """
        if not value > 0:
            raise ValueError("Number of steps must be positive.")
        self._n_steps = value
        self._compute_discretisation()

    def _compute_discretisation(self) -> None:
        """Calculate time steps and time delta."""
        # retstep=True makes linspace also return the spacing between samples.
        self.t, self.delta = np.linspace(
            self._t_0, self._t_n, self._n_steps + 1, retstep=True
        )

    def _allocate_Y(self, dim: int) -> np.ndarray:
        """Allocate an array for the approximated solution.

        Parameters
        ----------
        dim: int
            Number of simulations, dimension 0 of Y.

        Returns
        -------
        Y: np.ndarray
            Zero-filled array of shape (dim, n_steps+1) whose first column is X_0.
        """
        Y = np.zeros((dim, self._n_steps + 1), dtype=float)
        Y[:, 0] = self._X_0  # broadcast the initial condition to every trajectory
        return Y

    def _solve_numerical_approximation(self, dim: int) -> np.ndarray:
        """Solve the EM approximation for the given number of simulated trajectories.

        Parameters
        ----------
        dim: int
            The number of simulations, dimension 0 of Y.

        Returns
        -------
        Y: np.ndarray
            Array containing the approximated solution of the SDE, shape (dim, n_steps+1).
        """
        Y = self._allocate_Y(dim=dim)
        for n in range(self._n_steps):
            tau_n = self.t[n]
            Y_n = Y[:, n]

            mu = self._drift.get_value(X=Y_n, t=tau_n)
            sigma = self._diffusion.get_value(X=Y_n, t=tau_n)

            # Brownian increments ~ N(0, delta): standard deviation is sqrt(delta).
            # Samples are drawn from NumPy's global random state.
            dW = np.random.normal(loc=0, scale=np.sqrt(self.delta), size=dim)

            # Compute next step of the EM scheme
            Y[:, n + 1] = Y_n + mu * self.delta + sigma * dW

        return Y

    def compute_numerical_approximation(self) -> np.ndarray:
        """Compute the EM approximation for all simulated trajectories.

        The result is also stored in the ``Y`` attribute.

        Returns
        -------
        Y: np.ndarray
            Array containing the approximated solution of the SDE, shape (n_sim, n_steps+1).
        """
        self.Y = self._solve_numerical_approximation(dim=self._n_sim)
        return self.Y
The Parallel Euler-Maruyama class](#parallel-em-class)" 23 | ] 24 | }, 25 | { 26 | "cell_type": "markdown", 27 | "id": "85003ff3", 28 | "metadata": {}, 29 | "source": [ 30 | "\n", 31 | "### A. Parallel computation: the joblib package\n", 32 | "\n", 33 | "Parallel computing refers to the technique of executing several computational tasks simultaneously, dividing the required workload across multiple cores. The presence of multiple cores in modern laptops, and the availability of High Performance Computing (HPC) resources (such as [those at Imperial](https://www.imperial.ac.uk/computational-methods/hpc/)) enables parallel processing, where different cores can handle separate tasks. By relying on this core multiplicity, parallel computation can significantly speed up computations that can be divided into independent parts. By harnessing the power of parallel processing, parallel computing enables faster execution times, improved performance, and the ability to handle larger and more complex computations. To learn more about parallel computing in Python, you can refer to the following link: [Python Concurrency - What is Parallelism?](https://realpython.com/python-concurrency/#what-is-parallelism). 
Please note that the linked resource covers additional topics beyond the scope of this project.\n", 34 | "\n", 35 | "With the following code, you can check the number of CPU cores in your local machine:" 36 | ] 37 | }, 38 | { 39 | "cell_type": "code", 40 | "execution_count": 1, 41 | "id": "59c6dc46", 42 | "metadata": {}, 43 | "outputs": [ 44 | { 45 | "name": "stdout", 46 | "output_type": "stream", 47 | "text": [ 48 | "Number of CPU cores: 10\n" 49 | ] 50 | } 51 | ], 52 | "source": [ 53 | "import joblib\n", 54 | "\n", 55 | "num_cores = joblib.cpu_count()\n", 56 | "print(\"Number of CPU cores:\", num_cores)" 57 | ] 58 | }, 59 | { 60 | "cell_type": "markdown", 61 | "id": "66fbd222", 62 | "metadata": {}, 63 | "source": [ 64 | "Here, we have introduced the Python `joblib` package, which simplifies and automates parallel computing tasks. It provides easy-to-use functions and utilities for distributing tasks across multiple cores, without requiring intricate low-level coding. `joblib` offers a high-level interface for parallel computing, making it accessible and convenient for users who want to leverage the power of parallel processing without dealing with the complexities of threading or multiprocessing in Python. You can check the `joblib` documentation in this [link](https://joblib.readthedocs.io/en/stable/).\n", 65 | "\n", 66 | "\n", 67 | "To illustrate the advantages of parallel computing, we show a simple example using the `joblib` package. Through this example, we demonstrate how parallel processing can significantly reduce computation time yielding an equivalent result." 
68 | ] 69 | }, 70 | { 71 | "cell_type": "code", 72 | "execution_count": 2, 73 | "id": "d888dc3c", 74 | "metadata": {}, 75 | "outputs": [], 76 | "source": [ 77 | "# Import required functions from joblib\n", 78 | "from joblib import Parallel, delayed\n", 79 | "import time\n", 80 | "\n", 81 | "def process_data(data):\n", 82 | " time.sleep(1) # this line waits for 1s to simulate the behaviour of a time-consuming task \n", 83 | " result = data * 2\n", 84 | " return result" 85 | ] 86 | }, 87 | { 88 | "cell_type": "code", 89 | "execution_count": 3, 90 | "id": "08b7e7df", 91 | "metadata": {}, 92 | "outputs": [], 93 | "source": [ 94 | "# Compute a sequential processing: all calculations are done in 1 single core\n", 95 | "start_time = time.time()\n", 96 | "results_seq = [process_data(data) for data in range(10)]\n", 97 | "end_time = time.time()\n", 98 | "seq_time = end_time - start_time" 99 | ] 100 | }, 101 | { 102 | "cell_type": "code", 103 | "execution_count": 4, 104 | "id": "d858535b", 105 | "metadata": {}, 106 | "outputs": [], 107 | "source": [ 108 | "# Compute a parallel processing: all calculations are split into 4 cores. \n", 109 | "start_time = time.time()\n", 110 | "# This is the joblib implementation to send all elements of the for loop into distinct cores\n", 111 | "# The cores are specified with the n_job parameter. 
Here, we specify 4 cores.\n", 112 | "results_parallel = Parallel(n_jobs=4)(delayed(process_data)(data) for data in range(10))\n", 113 | "end_time = time.time()\n", 114 | "parallel_time = end_time - start_time" 115 | ] 116 | }, 117 | { 118 | "cell_type": "code", 119 | "execution_count": 5, 120 | "id": "2c52a2ba", 121 | "metadata": {}, 122 | "outputs": [ 123 | { 124 | "name": "stdout", 125 | "output_type": "stream", 126 | "text": [ 127 | "Sequential Results: [0, 2, 4, 6, 8, 10, 12, 14, 16, 18] in 10.03 s\n", 128 | "Parallel Results: [0, 2, 4, 6, 8, 10, 12, 14, 16, 18] in 3.56 s\n" 129 | ] 130 | } 131 | ], 132 | "source": [ 133 | "# Check results\n", 134 | "print(f\"Sequential Results: {results_seq} in {seq_time:.2f} s\" )\n", 135 | "print(f\"Parallel Results: {results_parallel} in {parallel_time:.2f} s\")" 136 | ] 137 | }, 138 | { 139 | "cell_type": "markdown", 140 | "id": "4993f80a", 141 | "metadata": {}, 142 | "source": [ 143 | "By using 4 cores, we reduce the computation time by roughly 65% (from 10.03 s to 3.56 s)! Now, let us try different values of `n_jobs` to see the effect on the computation time." 
144 | ] 145 | }, 146 | { 147 | "cell_type": "code", 148 | "execution_count": 6, 149 | "id": "57b9bc16", 150 | "metadata": {}, 151 | "outputs": [ 152 | { 153 | "name": "stdout", 154 | "output_type": "stream", 155 | "text": [ 156 | "Parallel Results with n_jobs=1: [0, 2, 4, 6, 8, 10, 12, 14, 16, 18] in 10.05 s\n" 157 | ] 158 | } 159 | ], 160 | "source": [ 161 | "# n_jobs=1 means no parallel computation\n", 162 | "start_time = time.time()\n", 163 | "results_parallel = Parallel(n_jobs=1)(delayed(process_data)(data) for data in range(10))\n", 164 | "end_time = time.time()\n", 165 | "parallel_time = end_time - start_time\n", 166 | "\n", 167 | "print(f\"Parallel Results with n_jobs=1: {results_parallel} in {parallel_time:.2f} s\")" 168 | ] 169 | }, 170 | { 171 | "cell_type": "code", 172 | "execution_count": 7, 173 | "id": "b8e5526e", 174 | "metadata": {}, 175 | "outputs": [ 176 | { 177 | "name": "stdout", 178 | "output_type": "stream", 179 | "text": [ 180 | "Parallel Results with n_jobs=2: [0, 2, 4, 6, 8, 10, 12, 14, 16, 18] in 5.54 s\n" 181 | ] 182 | } 183 | ], 184 | "source": [ 185 | "# 2 cores \n", 186 | "start_time = time.time()\n", 187 | "results_parallel = Parallel(n_jobs=2)(delayed(process_data)(data) for data in range(10))\n", 188 | "end_time = time.time()\n", 189 | "parallel_time = end_time - start_time\n", 190 | "\n", 191 | "print(f\"Parallel Results with n_jobs=2: {results_parallel} in {parallel_time:.2f} s\")" 192 | ] 193 | }, 194 | { 195 | "cell_type": "code", 196 | "execution_count": 8, 197 | "id": "bcd3561d", 198 | "metadata": {}, 199 | "outputs": [ 200 | { 201 | "name": "stdout", 202 | "output_type": "stream", 203 | "text": [ 204 | "Parallel Results with n_jobs=6: [0, 2, 4, 6, 8, 10, 12, 14, 16, 18] in 2.61 s\n" 205 | ] 206 | } 207 | ], 208 | "source": [ 209 | "# 6 cores\n", 210 | "start_time = time.time()\n", 211 | "results_parallel = Parallel(n_jobs=6)(delayed(process_data)(data) for data in range(10))\n", 212 | "end_time = time.time()\n", 213 | 
"parallel_time = end_time - start_time\n", 214 | "\n", 215 | "print(f\"Parallel Results with n_jobs=6: {results_parallel} in {parallel_time:.2f} s\")" 216 | ] 217 | }, 218 | { 219 | "cell_type": "code", 220 | "execution_count": 9, 221 | "id": "8a43beeb", 222 | "metadata": {}, 223 | "outputs": [ 224 | { 225 | "name": "stdout", 226 | "output_type": "stream", 227 | "text": [ 228 | "Parallel Results with n_jobs=10: [0, 2, 4, 6, 8, 10, 12, 14, 16, 18] in 1.51 s\n" 229 | ] 230 | } 231 | ], 232 | "source": [ 233 | "# 10 cores\n", 234 | "# Note that if your laptop has less cores, setting this to 10 would be equivalent to setting maximum number of cores\n", 235 | "start_time = time.time()\n", 236 | "results_parallel = Parallel(n_jobs=10)(delayed(process_data)(data) for data in range(10))\n", 237 | "end_time = time.time()\n", 238 | "parallel_time = end_time - start_time\n", 239 | "\n", 240 | "print(f\"Parallel Results with n_jobs=10: {results_parallel} in {parallel_time:.2f} s\")" 241 | ] 242 | }, 243 | { 244 | "cell_type": "markdown", 245 | "id": "a75adce1", 246 | "metadata": {}, 247 | "source": [ 248 | "`n_jobs=10` yields the minimum time elapsed in this particular example. This result is specific of this simple example, since we can allocate each element of the for loop into a different core. This ensures that the workload is evenly distributed across the cores, processing `process_data` only once in each core. The optimal value of `n_jobs` will depend on the specific task at hand." 249 | ] 250 | }, 251 | { 252 | "cell_type": "markdown", 253 | "id": "fc2baed4", 254 | "metadata": {}, 255 | "source": [ 256 | "\n", 257 | "### B. The Parallel Euler-Maruyama class\n", 258 | "\n", 259 | "Once we have explained parallel computing and how to use the `joblib` package, we introduce a new class `ParallelEulerMaruyama` in the `src/euler_maruyama/parallel_euler_maruyama.py` file. 
This class replicates the functionality of the `EulerMaruyama` class and provides parallel computation of the numerical approximation. We achieve this functionality by relying on class inheritance. Therefore, `ParallelEulerMaruyama` is a child class of `EulerMaruyama`:\n", 260 | "\n", 261 | "```python\n", 262 | "from .euler_maruyama import EulerMaruyama\n", 263 | "\n", 264 | "class ParallelEulerMaruyama(EulerMaruyama):\n", 265 | "```\n", 266 | "\n", 267 | "By doing so, `ParallelEulerMaruyama` has the same attributes and methods as `EulerMaruyama`. Now, our aim is to modify the `compute_numerical_approximation` method to include parallel computing. If we define a new method called `compute_numerical_approximation` in the `ParallelEulerMaruyama` class, we are overriding this method. Overriding a method redefines the implementation of the parent class. When a method is overridden, the child class provides a different implementation of the method, replacing the logic inherited from the parent class. By overriding a method, we can redefine the behavior of a particular method for a specific child class, allowing it to have its own unique functionality while still inheriting other characteristics from the parent class.\n", 268 | "\n", 269 | "```python\n", 270 | "from .euler_maruyama import EulerMaruyama\n", 271 | "\n", 272 | "class ParallelEulerMaruyama(EulerMaruyama):\n", 273 | "\n", 274 | " # __init__ and some code ...\n", 275 | "\n", 276 | " def compute_numerical_approximation(self) -> np.ndarray:\n", 277 | " # a distinct implementation from compute_numerical_approximation of EulerMaruyama\n", 278 | "```\n", 279 | "\n", 280 | "The `EulerMaruyama` class performs the numerical solution for all simulated trajectories simultaneously. By using `numpy` vectorisation, the method `_solve_numerical_approximation` efficiently updates the numerical approximation across all time steps for the specified number (`dim`) of simulated trajectories. 
This is precisely the reason for implementing the method `compute_numerical_approximation` in the `EulerMaruyama` class as follows:\n", 281 | "\n", 282 | "```python\n", 283 | "def compute_numerical_approximation(self) -> np.ndarray:\n", 284 | " self.Y = self._solve_numerical_approximation(dim=self._n_sim) # we are solving for all _n_sim simulations \n", 285 | " return self.Y\n", 286 | "```\n", 287 | "\n", 288 | "On the other hand, we would like to split all specified simulations `_n_sim` into different batches and compute each batch in a different core. To achieve this, we use the parallel computing approach we described in the previous section. Therefore, we need to define a number of batches and split the number of simulations `_n_sim` into different batches. The number of batches is specified in the class constructor with `n_jobs`, which follows a property pattern. The `_num_sim_batch` method then calculates the number of simulations that should be in each batch:\n", 289 | "\n", 290 | "```python\n", 291 | "def _num_sim_batch(self) -> list[int]:\n", 292 | " batch_size = self._n_sim // self._n_jobs\n", 293 | " remainder = self._n_sim % self._n_jobs\n", 294 | "\n", 295 | " batches = [batch_size] * (self._n_jobs - remainder) + [batch_size + 1] * remainder\n", 296 | "\n", 297 | " return batches\n", 298 | "```\n", 299 | "\n", 300 | "For example, for `_n_sim=1234` and `_n_jobs=3`, `_num_sim_batch` returns: `[411, 411, 412]`. 
We can use the result of `_num_sim_batch` inside the `compute_numerical_approximation` of `ParallelEulerMaruyama`:\n", 301 | "\n", 302 | "```python\n", 303 | "def compute_numerical_approximation(self) -> np.ndarray:\n", 304 | " Y_dim_batch_list = self._num_sim_batch()\n", 305 | "\n", 306 | " Y = Parallel(n_jobs=self._n_jobs)(\n", 307 | " delayed(self._solve_numerical_approximation)(dim=Y_dim) for Y_dim in Y_dim_batch_list\n", 308 | " )\n", 309 | "\n", 310 | " self.Y = np.concatenate(Y, axis=0)\n", 311 | "\n", 312 | " return self.Y\n", 313 | "```\n", 314 | "\n", 315 | "We have our parallel computation of the EM method! We will solve a particular SDE with different parameters to see the advantage of using parallel processing. " 316 | ] 317 | }, 318 | { 319 | "cell_type": "code", 320 | "execution_count": 10, 321 | "id": "7ea39e06", 322 | "metadata": {}, 323 | "outputs": [], 324 | "source": [ 325 | "import sys\n", 326 | " \n", 327 | "# we include outside folders in path\n", 328 | "sys.path.append('..')\n", 329 | "\n", 330 | "from src.euler_maruyama import ConstantDiffusion, EulerMaruyama, LinearDrift, ParallelEulerMaruyama" 331 | ] 332 | }, 333 | { 334 | "cell_type": "code", 335 | "execution_count": 11, 336 | "id": "74eccf81", 337 | "metadata": {}, 338 | "outputs": [], 339 | "source": [ 340 | "linear_drift = LinearDrift(a=1) # drift (mu) = 1*t\n", 341 | "constant_diffusion = ConstantDiffusion(b=2.5) # diffusion (sigma) = 2.5 " 342 | ] 343 | }, 344 | { 345 | "cell_type": "markdown", 346 | "id": "d85afd8b", 347 | "metadata": {}, 348 | "source": [ 349 | "We start with the simple example of `n_steps=100` and `n_sim=1_000`." 
350 | ] 351 | }, 352 | { 353 | "cell_type": "code", 354 | "execution_count": 12, 355 | "id": "26aea349", 356 | "metadata": {}, 357 | "outputs": [], 358 | "source": [ 359 | "em = EulerMaruyama(t_0=0, \n", 360 | " t_n=2, \n", 361 | " n_steps=100, \n", 362 | " X_0=1, \n", 363 | " drift=linear_drift, \n", 364 | " diffusion=constant_diffusion, \n", 365 | " n_sim=1_000)" 366 | ] 367 | }, 368 | { 369 | "cell_type": "code", 370 | "execution_count": 13, 371 | "id": "7d5838f8", 372 | "metadata": {}, 373 | "outputs": [], 374 | "source": [ 375 | "start_time = time.time()\n", 376 | "results_seq_em = em.compute_numerical_approximation()\n", 377 | "end_time = time.time()\n", 378 | "seq_em_time = end_time - start_time" 379 | ] 380 | }, 381 | { 382 | "cell_type": "markdown", 383 | "id": "3761d20b", 384 | "metadata": {}, 385 | "source": [ 386 | "And we try with `n_jobs=2`" 387 | ] 388 | }, 389 | { 390 | "cell_type": "code", 391 | "execution_count": 14, 392 | "id": "4d3093b5", 393 | "metadata": {}, 394 | "outputs": [], 395 | "source": [ 396 | "parallel_em = ParallelEulerMaruyama(t_0=0, \n", 397 | " t_n=2, \n", 398 | " n_steps=100, \n", 399 | " X_0=1, \n", 400 | " drift=linear_drift, \n", 401 | " diffusion=constant_diffusion, \n", 402 | " n_sim=1_000, \n", 403 | " n_jobs=2)" 404 | ] 405 | }, 406 | { 407 | "cell_type": "code", 408 | "execution_count": 15, 409 | "id": "f7d92a2d", 410 | "metadata": {}, 411 | "outputs": [], 412 | "source": [ 413 | "start_time = time.time()\n", 414 | "results_parallel_em = parallel_em.compute_numerical_approximation()\n", 415 | "end_time = time.time()\n", 416 | "parallel_em_time = end_time - start_time" 417 | ] 418 | }, 419 | { 420 | "cell_type": "code", 421 | "execution_count": 16, 422 | "id": "2b44d004", 423 | "metadata": {}, 424 | "outputs": [ 425 | { 426 | "name": "stdout", 427 | "output_type": "stream", 428 | "text": [ 429 | "Time elapsed in EulerMaruyama class: 0.02 s\n", 430 | "Time elapsed in ParallelEulerMaruyama class with n_jobs=2: 0.82 s\n" 431 
| ] 432 | } 433 | ], 434 | "source": [ 435 | "print(f\"Time elapsed in EulerMaruyama class: {seq_em_time:.2f} s\")\n", 436 | "print(f\"Time elapsed in ParallelEulerMaruyama class with n_jobs={parallel_em.n_jobs}: {parallel_em_time:.2f} s\")" 437 | ] 438 | }, 439 | { 440 | "cell_type": "markdown", 441 | "id": "a904a086", 442 | "metadata": {}, 443 | "source": [ 444 | "It seems that for this simple and reduced example `numpy` vectorisation is faster than parallel processing. This is because setting up the parallel processing run with `joblib` and the recombination of the arrays with `numpy.concatenate` introduces extra work, which slows down the code. For relatively small tasks this more than offsets the gains made in the parallelisation of the task.\n", 445 | "\n", 446 | "Let us try another number of `n_jobs`:" 447 | ] 448 | }, 449 | { 450 | "cell_type": "code", 451 | "execution_count": 17, 452 | "id": "53579c62", 453 | "metadata": {}, 454 | "outputs": [ 455 | { 456 | "name": "stdout", 457 | "output_type": "stream", 458 | "text": [ 459 | "Time elapsed in ParallelEulerMaruyama class with n_jobs=5: 0.90 s\n" 460 | ] 461 | } 462 | ], 463 | "source": [ 464 | "parallel_em.n_jobs = 5\n", 465 | "start_time = time.time()\n", 466 | "results_parallel_em = parallel_em.compute_numerical_approximation()\n", 467 | "end_time = time.time()\n", 468 | "parallel_em_time = end_time - start_time\n", 469 | "print(f\"Time elapsed in ParallelEulerMaruyama class with n_jobs={parallel_em.n_jobs}: {parallel_em_time:.2f} s\")" 470 | ] 471 | }, 472 | { 473 | "cell_type": "code", 474 | "execution_count": 18, 475 | "id": "88ac7fa0", 476 | "metadata": {}, 477 | "outputs": [ 478 | { 479 | "name": "stdout", 480 | "output_type": "stream", 481 | "text": [ 482 | "Time elapsed in ParallelEulerMaruyama class with n_jobs=10: 1.22 s\n" 483 | ] 484 | } 485 | ], 486 | "source": [ 487 | "parallel_em.n_jobs = 10\n", 488 | "start_time = time.time()\n", 489 | "results_parallel_em = 
parallel_em.compute_numerical_approximation()\n", 490 | "end_time = time.time()\n", 491 | "parallel_em_time = end_time - start_time\n", 492 | "print(f\"Time elapsed in ParallelEulerMaruyama class with n_jobs={parallel_em.n_jobs}: {parallel_em_time:.2f} s\")" 493 | ] 494 | }, 495 | { 496 | "cell_type": "markdown", 497 | "id": "eb12de46", 498 | "metadata": {}, 499 | "source": [ 500 | "No value of `n_jobs` improves the performance of `ParallelEulerMaruyama` over the sequential-style `EulerMaruyama` class. The reason is that the number of steps and the number of simulations are so small that it takes more time to prepare the parallel processing than to process everything in a single core.\n", 501 | "\n", 502 | "Now, let us try to increase the number of simulations to `n_sim=1_000_000`:" 503 | ] 504 | }, 505 | { 506 | "cell_type": "code", 507 | "execution_count": 19, 508 | "id": "b540af61", 509 | "metadata": {}, 510 | "outputs": [], 511 | "source": [ 512 | "em = EulerMaruyama(t_0=0, \n", 513 | " t_n=2, \n", 514 | " n_steps=100, \n", 515 | " X_0=1, \n", 516 | " drift=linear_drift, \n", 517 | " diffusion=constant_diffusion, \n", 518 | " n_sim=1_000_000)" 519 | ] 520 | }, 521 | { 522 | "cell_type": "code", 523 | "execution_count": 20, 524 | "id": "6fd1b824", 525 | "metadata": {}, 526 | "outputs": [], 527 | "source": [ 528 | "start_time = time.time()\n", 529 | "results_seq_em = em.compute_numerical_approximation()\n", 530 | "end_time = time.time()\n", 531 | "seq_em_time = end_time - start_time" 532 | ] 533 | }, 534 | { 535 | "cell_type": "code", 536 | "execution_count": 21, 537 | "id": "7b1ff8ae", 538 | "metadata": {}, 539 | "outputs": [], 540 | "source": [ 541 | "parallel_em = ParallelEulerMaruyama(t_0=0, \n", 542 | " t_n=2, \n", 543 | " n_steps=100, \n", 544 | " X_0=1, \n", 545 | " drift=linear_drift, \n", 546 | " diffusion=constant_diffusion, \n", 547 | " n_sim=1_000_000, \n", 548 | " n_jobs=2)" 549 | ] 550 | }, 551 | { 552 | "cell_type": "code", 553 | 
"execution_count": 22, 554 | "id": "bcf6bfe1", 555 | "metadata": {}, 556 | "outputs": [], 557 | "source": [ 558 | "start_time = time.time()\n", 559 | "results_parallel_em = parallel_em.compute_numerical_approximation()\n", 560 | "end_time = time.time()\n", 561 | "parallel_em_time = end_time - start_time" 562 | ] 563 | }, 564 | { 565 | "cell_type": "code", 566 | "execution_count": 23, 567 | "id": "9d41ec01", 568 | "metadata": {}, 569 | "outputs": [ 570 | { 571 | "name": "stdout", 572 | "output_type": "stream", 573 | "text": [ 574 | "Time elapsed in EulerMaruyama class: 3.96 s\n", 575 | "Time elapsed in ParallelEulerMaruyama class with n_jobs=2: 4.33 s\n" 576 | ] 577 | } 578 | ], 579 | "source": [ 580 | "print(f\"Time elapsed in EulerMaruyama class: {seq_em_time:.2f} s\")\n", 581 | "print(f\"Time elapsed in ParallelEulerMaruyama class with n_jobs={parallel_em.n_jobs}: {parallel_em_time:.2f} s\")" 582 | ] 583 | }, 584 | { 585 | "cell_type": "markdown", 586 | "id": "2ff56e78", 587 | "metadata": {}, 588 | "source": [ 589 | "Still not working... Let us try all possible values of `n_jobs` from 1 (sequential processing) to 10 and plot the result:" 590 | ] 591 | }, 592 | { 593 | "cell_type": "code", 594 | "execution_count": 26, 595 | "id": "1dda2d42", 596 | "metadata": {}, 597 | "outputs": [], 598 | "source": [ 599 | "parallel_results = []\n", 600 | "n_jobs_values = range(1, 11)\n", 601 | "for i in n_jobs_values:\n", 602 | " parallel_em.n_jobs = i\n", 603 | " \n", 604 | " start_time = time.time()\n", 605 | " results_parallel_em = parallel_em.compute_numerical_approximation()\n", 606 | " end_time = time.time()\n", 607 | " parallel_em_time = end_time - start_time\n", 608 | " \n", 609 | " parallel_results.append(parallel_em_time)" 610 | ] 611 | }, 612 | { 613 | "cell_type": "code", 614 | "execution_count": 27, 615 | "id": "65dc2da0", 616 | "metadata": {}, 617 | "outputs": [ 618 | { 619 | "data": { 620 | "image/png": "", 621 | "text/plain": [ 622 | "
" 623 | ] 624 | }, 625 | "metadata": {}, 626 | "output_type": "display_data" 627 | } 628 | ], 629 | "source": [ 630 | "import matplotlib.pyplot as plt\n", 631 | "\n", 632 | "fig, ax = plt.subplots(figsize=(10, 7))\n", 633 | "\n", 634 | "ax.scatter(n_jobs_values, parallel_results, label=\"ParallelEulerMaruyama\", color=\"red\")\n", 635 | "ax.axhline(y=seq_em_time, label=\"EulerMaruyama\")\n", 636 | "\n", 637 | "ax.set_xticks(n_jobs_values)\n", 638 | "\n", 639 | "ax.set_xlabel(\"n_jobs parameter (Number of cores)\")\n", 640 | "ax.set_ylabel(\"time elapsed [s]\")\n", 641 | "ax.set_title(\"Time to compute 1000000 simulations of the EM method\")\n", 642 | "\n", 643 | "ax.legend(loc=0)\n", 644 | "\n", 645 | "plt.show()" 646 | ] 647 | }, 648 | { 649 | "cell_type": "markdown", 650 | "id": "1ab62140", 651 | "metadata": {}, 652 | "source": [ 653 | "In this simple example encompassing 1,000,000 simulations of the EM method, parallel processing shows improved performance over numpy vectorization when using more than three cores. Compared to the earlier case where we performed 1,000 simulations, the task is much larger. This means we save quite a lot of time through parallelising it, which more than offsets the additional time taken to set up the parallel processing jobs and recombine the array at the end. This sort of pattern is fairly typical of parallel programming - it will tend to slow down smaller tasks, but may speed up larger tasks." 
654 | ] 655 | } 656 | ], 657 | "metadata": { 658 | "kernelspec": { 659 | "display_name": "Python 3 (ipykernel)", 660 | "language": "python", 661 | "name": "python3" 662 | }, 663 | "language_info": { 664 | "codemirror_mode": { 665 | "name": "ipython", 666 | "version": 3 667 | }, 668 | "file_extension": ".py", 669 | "mimetype": "text/x-python", 670 | "name": "python", 671 | "nbconvert_exporter": "python", 672 | "pygments_lexer": "ipython3", 673 | "version": "3.9.7" 674 | } 675 | }, 676 | "nbformat": 4, 677 | "nbformat_minor": 5 678 | } 679 | --------------------------------------------------------------------------------